diff mbox series

[FFmpeg-devel] x86/intreadwrite: add SSE2 optimized AV_COPY128U

Message ID 20240725162007.2048-1-jamrial@gmail.com
State New
Headers show
Series [FFmpeg-devel] x86/intreadwrite: add SSE2 optimized AV_COPY128U | expand

Checks

Context Check Description
andriy/make_x86 success Make finished
andriy/make_fate_x86 success Make fate finished

Commit Message

James Almer July 25, 2024, 4:20 p.m. UTC
Signed-off-by: James Almer <jamrial@gmail.com>
---
 libavutil/x86/intreadwrite.h | 7 +++++++
 1 file changed, 7 insertions(+)
diff mbox series

Patch

diff --git a/libavutil/x86/intreadwrite.h b/libavutil/x86/intreadwrite.h
index 65cc6b39a1..c92b75ed12 100644
--- a/libavutil/x86/intreadwrite.h
+++ b/libavutil/x86/intreadwrite.h
@@ -37,6 +37,13 @@  static av_always_inline void AV_COPY128(void *d, const void *s)
     _mm_store_si128((__m128i *)d, tmp);
 }
 
+#define AV_COPY128U AV_COPY128U /* NOTE(review): self-define, presumably so #ifndef fallbacks elsewhere are skipped -- confirm */
+static av_always_inline void AV_COPY128U(void *d, const void *s) /* copy 128 bits (16 bytes) from s to d */
+{
+    __m128i tmp = _mm_loadu_si128((const __m128i *)s); /* loadu: 128-bit load with no alignment requirement on s */
+    _mm_storeu_si128((__m128i *)d, tmp); /* storeu: 128-bit store with no alignment requirement on d */
+}
+
 #define AV_ZERO128 AV_ZERO128
 static av_always_inline void AV_ZERO128(void *d)
 {