Created
August 9, 2017 09:37
-
-
Save rsdubtso/4c2bb282ddd9c0018ce4c9909a561181 to your computer and use it in GitHub Desktop.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
From 48e0f053bd21363211b8901582c07952fed025f8 Mon Sep 17 00:00:00 2001 | |
From: Roman Dubtsov <roman.s.dubtsov@intel.com> | |
Date: Wed, 9 Aug 2017 12:35:23 +0300 | |
Subject: cpu: pooling: generate proper movups when zeroing diff_src | |
--- | |
src/cpu/jit_uni_pool_kernel_f32.cpp | 2 +- | |
1 file changed, 1 insertion(+), 1 deletion(-) | |
diff --git a/src/cpu/jit_uni_pool_kernel_f32.cpp b/src/cpu/jit_uni_pool_kernel_f32.cpp | |
index 44ba23af..5d26bb5b 100644 | |
--- a/src/cpu/jit_uni_pool_kernel_f32.cpp | |
+++ b/src/cpu/jit_uni_pool_kernel_f32.cpp | |
@@ -367,7 +367,7 @@ void jit_uni_pool_kernel_f32<isa>::maybe_zero_diff_src() { | |
{ | |
const int dim = jpp.iw * jpp.c_block * sizeof(float); | |
for (int i = 0; i < dim; i += cpu_isa_traits<isa>::vlen) | |
- vmovups(ptr[reg_input + reg_off + i], vzero); | |
+ uni_vmovups(ptr[reg_input + reg_off + i], vzero); | |
add(reg_off, dim); | |
cmp(reg_off, jpp.ih * dim); | |
jl(l_zero, T_NEAR); | |
-- | |
2.12.2 | |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment