[FFmpeg-devel] [PATCH] x86/intreadwrite: add SSE2 optimized AV_COPY128U
James Almer
jamrial at gmail.com
Thu Jul 25 19:20:07 EEST 2024
Signed-off-by: James Almer <jamrial at gmail.com>
---
libavutil/x86/intreadwrite.h | 7 +++++++
1 file changed, 7 insertions(+)
diff --git a/libavutil/x86/intreadwrite.h b/libavutil/x86/intreadwrite.h
index 65cc6b39a1..c92b75ed12 100644
--- a/libavutil/x86/intreadwrite.h
+++ b/libavutil/x86/intreadwrite.h
@@ -37,6 +37,13 @@ static av_always_inline void AV_COPY128(void *d, const void *s)
     _mm_store_si128((__m128i *)d, tmp);
 }
 
+#define AV_COPY128U AV_COPY128U
+static av_always_inline void AV_COPY128U(void *d, const void *s)
+{
+    __m128i tmp = _mm_loadu_si128((const __m128i *)s);
+    _mm_storeu_si128((__m128i *)d, tmp);
+}
+
 #define AV_ZERO128 AV_ZERO128
 static av_always_inline void AV_ZERO128(void *d)
 {
--
2.45.2
More information about the ffmpeg-devel mailing list