Skip to content

Commit cfc5c3d

Browse files
committed
cpu: gemm: check for nocopy on sequential mode
The nocopy check should run even in single-threaded mode (nthr == 1), so it is now performed before falling back to the sequential gemm_kernel_driver call.
1 parent 0125f28 commit cfc5c3d

File tree

1 file changed

+5
-5
lines changed

1 file changed

+5
-5
lines changed

src/cpu/gemm/gemm_driver.cpp

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -1322,11 +1322,6 @@ static mkldnn_status_t gemm_threading_driver(
1322 1322   }
1323 1323   get_omp_thread_count<c_type>(arg->m, arg->n, arg->k, &nthr);
1324 1324
1325      - if (nthr == 1) {
1326      - return gemm_kernel_driver(arg->m, arg->n, arg->k, arg->a, arg->b,
1327      - arg->c, arg->co, arg);
1328      - }
1329      -
1330 1325   if ((data_traits<a_type>::data_type == data_type::f32) &&
1331 1326   nocopy_checker(nthr, arg->transa, arg->transb, arg->m, arg->n,
1332 1327   arg->k, arg->lda, arg->ldb, arg->ldc))
@@ -1336,6 +1331,11 @@ static mkldnn_status_t gemm_threading_driver(
1336 1331   (float *) arg->b, arg->ldb,
1337 1332   arg->beta, (float *) arg->c, arg->ldc, NULL);
1338 1333
     1334 + if (nthr == 1) {
     1335 + return gemm_kernel_driver(
     1336 + arg->m, arg->n, arg->k, arg->a, arg->b, arg->c, arg->co, arg);
     1337 + }
     1338 +
1339 1339   mkldnn_status_t *results = (mkldnn_status_t *) malloc(
1340 1340   sizeof(*results) * nthr * CACHE_LINE_SIZE, PAGE_4K);
1341 1341
0 commit comments

Comments
 (0)