projects
/
platform
/
upstream
/
opencv.git
/ commitdiff
commit
grep
author
committer
pickaxe
?
search:
re
summary
|
shortlog
|
log
|
commit
| commitdiff |
tree
raw
|
patch
| inline |
side by side
(parent:
ecbec72
)
Neon optimization of cv::scaleAdd (CV_32F)
author
Ilya Lavrenov
<ilya.lavrenov@itseez.com>
Tue, 23 Sep 2014 17:14:42 +0000
(21:14 +0400)
committer
Ilya Lavrenov
<ilya.lavrenov@itseez.com>
Tue, 23 Sep 2014 17:16:29 +0000
(21:16 +0400)
modules/core/src/matmul.cpp
patch
|
blob
|
history
diff --git
a/modules/core/src/matmul.cpp
b/modules/core/src/matmul.cpp
index
7819a15
..
c5ce6d0
100644
(file)
--- a/
modules/core/src/matmul.cpp
+++ b/
modules/core/src/matmul.cpp
@@
-2102,6
+2102,16
@@
static void scaleAdd_32f(const float* src1, const float* src2, float* dst,
}
}
else
+#elif CV_NEON
+ if (true)
+ {
+ for ( ; i <= len - 4; i += 4)
+ {
+ float32x4_t v_src1 = vld1q_f32(src1 + i), v_src2 = vld1q_f32(src2 + i);
+ vst1q_f32(dst + i, vaddq_f32(vmulq_n_f32(v_src1, alpha), v_src2));
+ }
+ }
+ else
#endif
//vz why do we need unroll here?
for( ; i <= len - 4; i += 4 )