x86/float_dsp: zero extend offset from ff_scalarproduct_float_sse
author James Almer <jamrial@gmail.com>
Fri, 8 Jan 2016 15:08:56 +0000 (12:08 -0300)
committer James Almer <jamrial@gmail.com>
Fri, 8 Jan 2016 17:02:47 +0000 (14:02 -0300)
Reviewed-by: Christophe Gisquet <christophe.gisquet@gmail.com>
Signed-off-by: James Almer <jamrial@gmail.com>
(cherry picked from commit dc79824deb6ac0ce236589c618744b33629201cd)

libavutil/x86/float_dsp.asm

index ec3d22b..c4484a2 100644 (file)
@@ -332,10 +332,10 @@ VECTOR_FMUL_REVERSE
 ; float scalarproduct_float_sse(const float *v1, const float *v2, int len)
 INIT_XMM sse
 cglobal scalarproduct_float, 3,3,2, v1, v2, offset
+    shl   offsetd, 2
+    add       v1q, offsetq
+    add       v2q, offsetq
     neg   offsetq
-    shl   offsetq, 2
-    sub       v1q, offsetq
-    sub       v2q, offsetq
     xorps    xmm0, xmm0
 .loop:
     movaps   xmm1, [v1q+offsetq]