Skip to content

Commit d5611f3

Browse files
committed
Fix significant GOMP barrier overhead in exhaustive_L2sqr_blas.
Signed-off-by: Mulugeta Mammo <[email protected]>
1 parent 3de200f commit d5611f3

File tree

1 file changed

+9
-3
lines changed

1 file changed

+9
-3
lines changed

faiss/utils/distances.cpp

Lines changed: 9 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -321,7 +321,9 @@ void exhaustive_L2sqr_blas_default_impl(
321 321    ip_block.get(),
322 322    &nyi);
323 323    }
324     -  #pragma omp parallel for
    324 +  // Commented out - causes significant GOMP barrier overhead.
    325 +  // #pragma omp parallel for
    326 +  //
325 327    for (int64_t i = i0; i < i1; i++) {
326 328    float* ip_line = ip_block.get() + (i - i0) * (j1 - j0);
327 329

@@ -423,7 +425,9 @@ void exhaustive_L2sqr_blas_cmax_avx2(
423 425    ip_block.get(),
424 426    &nyi);
425 427    }
426     -  #pragma omp parallel for
    428 +  // Commented out - causes significant GOMP barrier overhead.
    429 +  // #pragma omp parallel for
    430 +  //
427 431    for (int64_t i = i0; i < i1; i++) {
428 432    float* ip_line = ip_block.get() + (i - i0) * (j1 - j0);
429 433

@@ -633,7 +637,9 @@ void exhaustive_L2sqr_blas_cmax_sve(
633 637    ip_block.get(),
634 638    &nyi);
635 639    }
636     -  #pragma omp parallel for
    640 +  // Commented out - causes significant GOMP barrier overhead.
    641 +  // #pragma omp parallel for
    642 +  //
637 643    for (int64_t i = i0; i < i1; i++) {
638 644    const size_t count = j1 - j0;
639 645    float* ip_line = ip_block.get() + (i - i0) * count;

0 commit comments

Comments
 (0)