We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent fc0e041 commit dd1fde5 — Copy full SHA for dd1fde5
ggml/src/ggml-sycl/flash-attn/flash-attn-sycl.cpp
@@ -59,7 +59,6 @@ void ggml_sycl_op_flash_attn(ggml_backend_sycl_context & ctx, ggml_tensor * dst)
59
stream->fill(l_d, 0.0f, N);
60
stream->fill(m_d, -std::numeric_limits<float>::infinity(), N);
61
stream->fill(dst_d, 0.0f, N * d);
62
- stream->wait();
63
64
for (int j = 0; j < Tc; ++j) {
65
stream->submit([&](sycl::handler & cgh) {
0 commit comments