1 file changed: +9 -3 lines changed
Original file line number | Diff line number | Diff line change
@@ -321,7 +321,9 @@ void exhaustive_L2sqr_blas_default_impl(
321321 ip_block.get (),
322322 &nyi);
323323 }
324- #pragma omp parallel for
324+ // Commented out - causes significant GOMP barrier overhead.
325+ // #pragma omp parallel for
326+ //
325327 for (int64_t i = i0; i < i1; i++) {
326328 float * ip_line = ip_block.get () + (i - i0) * (j1 - j0);
327329
@@ -423,7 +425,9 @@ void exhaustive_L2sqr_blas_cmax_avx2(
423425 ip_block.get (),
424426 &nyi);
425427 }
426- #pragma omp parallel for
428+ // Commented out - causes significant GOMP barrier overhead.
429+ // #pragma omp parallel for
430+ //
427431 for (int64_t i = i0; i < i1; i++) {
428432 float * ip_line = ip_block.get () + (i - i0) * (j1 - j0);
429433
@@ -633,7 +637,9 @@ void exhaustive_L2sqr_blas_cmax_sve(
633637 ip_block.get (),
634638 &nyi);
635639 }
636- #pragma omp parallel for
640+ // Commented out - causes significant GOMP barrier overhead.
641+ // #pragma omp parallel for
642+ //
637643 for (int64_t i = i0; i < i1; i++) {
638644 const size_t count = j1 - j0;
639645 float * ip_line = ip_block.get () + (i - i0) * count;
You can’t perform that action at this time.
0 commit comments