[FFmpeg-cvslog] proresdsp: Optimize series of padds out
Michael Niedermayer
git at videolan.org
Wed Oct 12 22:27:35 CEST 2011
ffmpeg | branch: master | Michael Niedermayer <michaelni at gmx.at> | Wed Oct 12 21:59:44 2011 +0200| [370d7ef2c7a9d00ee885da7ff5dec1b879b33650] | committer: Michael Niedermayer
proresdsp: Optimize series of padds out
Signed-off-by: Michael Niedermayer <michaelni at gmx.at>
> http://git.videolan.org/gitweb.cgi/ffmpeg.git/?a=commit;h=370d7ef2c7a9d00ee885da7ff5dec1b879b33650
---
libavcodec/x86/proresdsp.asm | 13 ++-----------
1 files changed, 2 insertions(+), 11 deletions(-)
diff --git a/libavcodec/x86/proresdsp.asm b/libavcodec/x86/proresdsp.asm
index 324e7f6..5e2004f 100644
--- a/libavcodec/x86/proresdsp.asm
+++ b/libavcodec/x86/proresdsp.asm
@@ -49,9 +49,9 @@ w5_min_w1: times 4 dw W5sh2, -W1sh2
w5_plus_w7: times 4 dw W5sh2, +W7sh2
w7_min_w5: times 4 dw W7sh2, -W5sh2
row_round: times 8 dw (1<<14)
+pw_88: times 8 dw 0x2008
cextern pw_4
-cextern pw_8
cextern pw_512
cextern pw_1019
@@ -93,7 +93,7 @@ section .text align=16
; a2 -= W6 * row[2];
; a3 -= W2 * row[2];
%ifidn %1, col
- paddw m10,[pw_8]
+ paddw m10,[pw_88]
%endif
SBUTTERFLY3 wd, 0, 1, 10, 8 ; { row[0], row[2] }[0-3]/[4-7]
%ifidn %1, row
@@ -269,17 +269,8 @@ cglobal prores_idct_put_10_%1, 4, 4, %2
IDCT_1D col, 18, %1
; clip/store
- mova m6, [pw_512]
mova m3, [pw_4]
mova m5, [pw_1019]
- paddw m8, m6
- paddw m0, m6
- paddw m1, m6
- paddw m2, m6
- paddw m4, m6
- paddw m11, m6
- paddw m9, m6
- paddw m10, m6
pmaxsw m8, m3
pmaxsw m0, m3
pmaxsw m1, m3
More information about the ffmpeg-cvslog mailing list