Skip to content

Instantly share code, notes, and snippets.

@emfomenk
Created November 1, 2017 17:14
Show Gist options
  • Save emfomenk/d0ac0cccef7df32ac81d539e1874c45c to your computer and use it in GitHub Desktop.
Save emfomenk/d0ac0cccef7df32ac81d539e1874c45c to your computer and use it in GitHub Desktop.
diff --git a/src/cpu/jit_avx512_common_conv_kernel.cpp b/src/cpu/jit_avx512_common_conv_kernel.cpp
index 6414495..7104423 100644
--- a/src/cpu/jit_avx512_common_conv_kernel.cpp
+++ b/src/cpu/jit_avx512_common_conv_kernel.cpp
@@ -2672,12 +2672,14 @@ bool jit_avx512_common_conv_bwd_weights_kernel_f32::flat_4ops_compute() {
}
for (int ow = 0; ow < j.ow; ow += 4) {
- for (int _ow = ow; _ow < ow + 4; ++_ow) {
+ for (int _ow = ow; /*_ow < ow + 4*/; ++_ow) {
auto vdst = zmm_dst(_ow);
if (_ow < j.ow)
vmovups(vdst, addr_dst(_ow));
else
vpxord(vdst, vdst, vdst);
+
+ if (_ow >= ow + 4) break;
}
for (int kh = 0; kh < kh_step; ++kh) {
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment.