Skip to content

Commit 0fbc7a2

Browse files
committed
x86/float_dsp: remove usage of integer instructions
1 parent 96cbaaa commit 0fbc7a2

File tree

1 file changed, with 7 additions (+7) and 7 deletions (-7).

libavutil/x86/float_dsp.asm

Lines changed: 7 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -243,8 +243,8 @@ cglobal vector_dmul_scalar, 4,4,3, dst, src, mul, len
243243
.loop:
244244
mulpd m1, m0, [srcq+lenq ]
245245
mulpd m2, m0, [srcq+lenq+mmsize]
246-
mova [dstq+lenq ], m1
247-
mova [dstq+lenq+mmsize], m2
246+
movaps [dstq+lenq ], m1
247+
movaps [dstq+lenq+mmsize], m2
248248
sub lenq, 2*mmsize
249249
jge .loop
250250
REP_RET
@@ -363,14 +363,14 @@ VECTOR_FMUL_ADD
363363
%macro VECTOR_FMUL_REVERSE 0
364364
cglobal vector_fmul_reverse, 4,4,2, dst, src0, src1, len
365365
%if cpuflag(avx2)
366-
mova m2, [pd_reverse]
366+
movaps m2, [pd_reverse]
367367
%endif
368368
lea lenq, [lend*4 - 2*mmsize]
369369
ALIGN 16
370370
.loop:
371371
%if cpuflag(avx2)
372-
vpermd m0, m2, [src1q]
373-
vpermd m1, m2, [src1q+mmsize]
372+
vpermps m0, m2, [src1q]
373+
vpermps m1, m2, [src1q+mmsize]
374374
%elif cpuflag(avx)
375375
vmovaps xmm0, [src1q + 16]
376376
vinsertf128 m0, m0, [src1q], 1
@@ -386,8 +386,8 @@ ALIGN 16
386386
%endif
387387
mulps m0, m0, [src0q + lenq + mmsize]
388388
mulps m1, m1, [src0q + lenq]
389-
mova [dstq + lenq + mmsize], m0
390-
mova [dstq + lenq], m1
389+
movaps [dstq + lenq + mmsize], m0
390+
movaps [dstq + lenq], m1
391391
add src1q, 2*mmsize
392392
sub lenq, 2*mmsize
393393
jge .loop

0 commit comments

Comments
 (0)