Skip to content

Commit d19425b

Browse files
author
Roman Dubtsov
committed
cpu: conv: 4fma: fix a threading bug
1 parent f0d6ba0 commit d19425b

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

src/cpu/jit_avx512_common_convolution.cpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -700,7 +700,7 @@ void jit_avx512_common_convolution_bwd_weights_t::balance() {
700 700   nthr_g_ = 1;
701 701   nthr_oc_b_ = 1;
702 702   nthr_ic_b_ = nstl::min(j.nb_ic, max_threads);
703     - nthr_mb_ = max_threads / nthr_ic_b_;
    703 + nthr_mb_ = nstl::min(max_threads / nthr_ic_b_, j.mb);
704 704   nthr_ = nthr_mb_ * nthr_oc_b_ * nthr_ic_b_ * nthr_g_;
705 705   return;
706 706   }

0 commit comments

Comments
 (0)