Skip to content

Commit 27fa272

Browse files
committed
*refactoring of SynetConvolution16bNhwcSpecV0 class (part 2).
1 parent 39930a3 commit 27fa272

File tree

2 files changed

+4
-0
lines changed

2 files changed

+4
-0
lines changed

src/Simd/SimdBaseSynetConvolution16bNhwcSpecV0.cpp

+3
Original file line number | Diff line number | Diff line change
@@ -64,7 +64,10 @@ namespace Simd
6464
a.srcH = p.srcH + p.padY + p.padH;
6565
a.srcW = p.srcW + p.padX + p.padW;
6666
a.dstC = AlignHi(p.dstC, a.F);
67+
a.padV = Simd::Max(p.padY, p.padH);
68+
a.padH = Simd::Max(p.padX, p.padW);
6769
a.K = p.kernelX * p.kernelY;
70+
a.padE = (a.srcW + a.padH) * a.padV + a.microC*a.F;
6871

6972
a.macroC = Simd::RestrictRange(AlignLo(L1 / a.microD / a.K / 2, a.microC), a.microC, a.srcC);
7073
a.macroO = a.macroC * a.K / a.microC;

src/Simd/SimdSynetConvolution16b.h

+1
Original file line number | Diff line number | Diff line change
@@ -176,6 +176,7 @@ namespace Simd
176176
struct AlgParam
177177
{
178178
size_t batch, srcC, srcH, srcW, dstC, K;
179+
size_t padV, padH, padE;
179180
size_t F, microD, microS, microC;
180181
size_t macroD, macroH, macroC, numH, macroO;
181182
size_t bufS, bufD, elem;

0 commit comments

Comments
 (0)