[FFmpeg-devel] [PATCH] x86/scale_avx2: Change asm indent from 2 to 4 spaces.
James Almer
jamrial at gmail.com
Thu Dec 16 18:43:03 EET 2021
On 12/16/2021 1:27 PM, Alan Kelly wrote:
> ---
> libswscale/x86/scale_avx2.asm | 96 +++++++++++++++++------------------
> 1 file changed, 48 insertions(+), 48 deletions(-)
>
> diff --git a/libswscale/x86/scale_avx2.asm b/libswscale/x86/scale_avx2.asm
> index 2cd7e968d3..eb472db12f 100644
> --- a/libswscale/x86/scale_avx2.asm
> +++ b/libswscale/x86/scale_avx2.asm
> @@ -45,63 +45,63 @@ SECTION .text
>
> %macro SCALE_FUNC 1
> cglobal hscale8to15_%1, 7, 9, 16, pos0, dst, w, srcmem, filter, fltpos, fltsize, count, inner
> - pxor m0, m0
> - mova m15, [swizzle]
> - mov countq, $0
> - movsxd wq, wd
> + pxor m0, m0
> + mova m15, [swizzle]
> + mov countq, $0
> + movsxd wq, wd
> %ifidn %1, X4
> - mova m14, [four]
> - shr fltsized, 2
> + mova m14, [four]
> + shr fltsized, 2
> %endif
> .loop:
> - movu m1, [fltposq]
> - movu m2, [fltposq+32]
> + movu m1, [fltposq]
> + movu m2, [fltposq+32]
> %ifidn %1, X4
> - pxor m9, m9
> - pxor m10, m10
> - pxor m11, m11
> - pxor m12, m12
> - mov innerq, $0
> + pxor m9, m9
> + pxor m10, m10
> + pxor m11, m11
> + pxor m12, m12
> + mov innerq, $0
> .innerloop:
> %endif
> - vpcmpeqd m13, m13
> - vpgatherdd m3,[srcmemq + m1], m13
> - vpcmpeqd m13, m13
> - vpgatherdd m4,[srcmemq + m2], m13
> - vpunpcklbw m5, m3, m0
> - vpunpckhbw m6, m3, m0
> - vpunpcklbw m7, m4, m0
> - vpunpckhbw m8, m4, m0
> - vpmaddwd m5, m5, [filterq]
> - vpmaddwd m6, m6, [filterq + 32]
> - vpmaddwd m7, m7, [filterq + 64]
> - vpmaddwd m8, m8, [filterq + 96]
> - add filterq, $80
> + vpcmpeqd m13, m13
> + vpgatherdd m3,[srcmemq + m1], m13
> + vpcmpeqd m13, m13
> + vpgatherdd m4,[srcmemq + m2], m13
> + vpunpcklbw m5, m3, m0
> + vpunpckhbw m6, m3, m0
> + vpunpcklbw m7, m4, m0
> + vpunpckhbw m8, m4, m0
> + vpmaddwd m5, m5, [filterq]
> + vpmaddwd m6, m6, [filterq + 32]
> + vpmaddwd m7, m7, [filterq + 64]
> + vpmaddwd m8, m8, [filterq + 96]
> + add filterq, $80
> %ifidn %1, X4
> - paddd m9, m5
> - paddd m10, m6
> - paddd m11, m7
> - paddd m12, m8
> - paddd m1, m14
> - paddd m2, m14
> - add innerq, $1
> - cmp innerq, fltsizeq
> - jl .innerloop
> - vphaddd m5, m9, m10
> - vphaddd m6, m11, m12
> + paddd m9, m5
> + paddd m10, m6
> + paddd m11, m7
> + paddd m12, m8
> + paddd m1, m14
> + paddd m2, m14
> + add innerq, $1
> + cmp innerq, fltsizeq
> + jl .innerloop
> + vphaddd m5, m9, m10
> + vphaddd m6, m11, m12
> %else
> - vphaddd m5, m5, m6
> - vphaddd m6, m7, m8
> + vphaddd m5, m5, m6
> + vphaddd m6, m7, m8
> %endif
> - vpsrad m5, 7
> - vpsrad m6, 7
> - vpackssdw m5, m5, m6
> - vpermd m5, m15, m5
> - vmovdqu [dstq + countq * 2], m5
> - add fltposq, $40
> - add countq, $10
> - cmp countq, wq
> - jl .loop
> + vpsrad m5, 7
> + vpsrad m6, 7
> + vpackssdw m5, m5, m6
> + vpermd m5, m15, m5
> + vmovdqu [dstq + countq * 2], m5
> + add fltposq, $40
> + add countq, $10
> + cmp countq, wq
> + jl .loop
> REP_RET
> %endmacro
Applied, thanks.
More information about the ffmpeg-devel mailing list