We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 5377edd · commit 171a0e2 · Copy full SHA for 171a0e2
paddle/fluid/operators/gru_op.cc
@@ -276,6 +276,7 @@ class GRUCPUKernel : public framework::OpKernel<T> {
276
context.Attr<std::string>("gate_activation"));
277
278
#ifdef PADDLE_WITH_MKLML
279
+ // use MKL packed to speed up GEMM
280
if (FLAGS_paddle_num_threads >= 4) {
281
auto blas = math::GetBlas<DeviceContext, T>(dev_ctx);
282
T* packed_gate = blas.GEMM_ALLOC(CblasBMatrix, 1 /*height of C*/,
0 commit comments