diff mbox series

[FFmpeg-devel] avutil/aarch64: add AV_COPY128 and AV_ZERO128 macros

Message ID 20240821232455.238469-3-ramiro.polla@gmail.com
State New
Headers show
Series [FFmpeg-devel] avutil/aarch64: add AV_COPY128 and AV_ZERO128 macros | expand

Checks

Context Check Description
yinshiyou/make_loongarch64 success Make finished
yinshiyou/make_fate_loongarch64 success Make fate finished
andriy/make_x86 success Make finished
andriy/make_fate_x86 success Make fate finished

Commit Message

Ramiro Polla Aug. 21, 2024, 11:24 p.m. UTC
---
 libavutil/aarch64/intreadwrite.h | 42 ++++++++++++++++++++++++++++++++
 libavutil/intreadwrite.h         |  4 ++-
 2 files changed, 45 insertions(+), 1 deletion(-)
 create mode 100644 libavutil/aarch64/intreadwrite.h

Comments

Martin Storsjö Aug. 22, 2024, 11:57 a.m. UTC | #1
On Thu, 22 Aug 2024, Ramiro Polla wrote:

> ---
> libavutil/aarch64/intreadwrite.h | 42 ++++++++++++++++++++++++++++++++
> libavutil/intreadwrite.h         |  4 ++-
> 2 files changed, 45 insertions(+), 1 deletion(-)
> create mode 100644 libavutil/aarch64/intreadwrite.h
>
> diff --git a/libavutil/aarch64/intreadwrite.h b/libavutil/aarch64/intreadwrite.h
> new file mode 100644
> index 0000000000..4ce2d64987
> --- /dev/null
> +++ b/libavutil/aarch64/intreadwrite.h
> @@ -0,0 +1,42 @@
> +/*
> + * This file is part of FFmpeg.
> + *
> + * FFmpeg is free software; you can redistribute it and/or
> + * modify it under the terms of the GNU Lesser General Public
> + * License as published by the Free Software Foundation; either
> + * version 2.1 of the License, or (at your option) any later version.
> + *
> + * FFmpeg is distributed in the hope that it will be useful,
> + * but WITHOUT ANY WARRANTY; without even the implied warranty of
> + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
> + * Lesser General Public License for more details.
> + *
> + * You should have received a copy of the GNU Lesser General Public
> + * License along with FFmpeg; if not, write to the Free Software
> + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
> + */
> +
> +#ifndef AVUTIL_AARCH64_INTREADWRITE_H
> +#define AVUTIL_AARCH64_INTREADWRITE_H
> +
> +#if HAVE_INTRINSICS_NEON
> +
> +#include <arm_neon.h>
> +
> +#define AV_COPY128 AV_COPY128
> +static av_always_inline void AV_COPY128(void *d, const void *s)
> +{
> +    uint8x16_t tmp = vld1q_u8((const uint8_t *)s);
> +    vst1q_u8((uint8_t *)d, tmp);
> +}
> +
> +#define AV_ZERO128 AV_ZERO128
> +static av_always_inline void AV_ZERO128(void *d)
> +{
> +    uint8x16_t zero = vdupq_n_u8(0);
> +    vst1q_u8((uint8_t *)d, zero);
> +}
> +
> +#endif /* HAVE_INTRINSICS_NEON */
> +
> +#endif /* AVUTIL_AARCH64_INTREADWRITE_H */
> diff --git a/libavutil/intreadwrite.h b/libavutil/intreadwrite.h
> index 120bdbc8f0..ffd15a1502 100644
> --- a/libavutil/intreadwrite.h
> +++ b/libavutil/intreadwrite.h
> @@ -64,7 +64,9 @@ typedef union {
>
> #include "config.h"
>
> -#if ARCH_MIPS
> +#if ARCH_AARCH64
> +#   include "aarch64/intreadwrite.h"
> +#elif ARCH_MIPS
> #   include "mips/intreadwrite.h"
> #elif ARCH_PPC
> #   include "ppc/intreadwrite.h"
> -- 
> 2.39.2

LGTM, this seems like a valid use case for intrinsics.

// Martin
Ramiro Polla Aug. 26, 2024, 8:28 a.m. UTC | #2
On Thu, Aug 22, 2024 at 2:06 PM Martin Storsjö <martin@martin.st> wrote:
> On Thu, 22 Aug 2024, Ramiro Polla wrote:
>
> > ---
> > libavutil/aarch64/intreadwrite.h | 42 ++++++++++++++++++++++++++++++++
> > libavutil/intreadwrite.h         |  4 ++-
> > 2 files changed, 45 insertions(+), 1 deletion(-)
> > create mode 100644 libavutil/aarch64/intreadwrite.h
> >
> > diff --git a/libavutil/aarch64/intreadwrite.h b/libavutil/aarch64/intreadwrite.h
> > new file mode 100644
> > index 0000000000..4ce2d64987
> > --- /dev/null
> > +++ b/libavutil/aarch64/intreadwrite.h
> > @@ -0,0 +1,42 @@
> > +/*
> > + * This file is part of FFmpeg.
> > + *
> > + * FFmpeg is free software; you can redistribute it and/or
> > + * modify it under the terms of the GNU Lesser General Public
> > + * License as published by the Free Software Foundation; either
> > + * version 2.1 of the License, or (at your option) any later version.
> > + *
> > + * FFmpeg is distributed in the hope that it will be useful,
> > + * but WITHOUT ANY WARRANTY; without even the implied warranty of
> > + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
> > + * Lesser General Public License for more details.
> > + *
> > + * You should have received a copy of the GNU Lesser General Public
> > + * License along with FFmpeg; if not, write to the Free Software
> > + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
> > + */
> > +
> > +#ifndef AVUTIL_AARCH64_INTREADWRITE_H
> > +#define AVUTIL_AARCH64_INTREADWRITE_H
> > +
> > +#if HAVE_INTRINSICS_NEON
> > +
> > +#include <arm_neon.h>
> > +
> > +#define AV_COPY128 AV_COPY128
> > +static av_always_inline void AV_COPY128(void *d, const void *s)
> > +{
> > +    uint8x16_t tmp = vld1q_u8((const uint8_t *)s);
> > +    vst1q_u8((uint8_t *)d, tmp);
> > +}
> > +
> > +#define AV_ZERO128 AV_ZERO128
> > +static av_always_inline void AV_ZERO128(void *d)
> > +{
> > +    uint8x16_t zero = vdupq_n_u8(0);
> > +    vst1q_u8((uint8_t *)d, zero);
> > +}
> > +
> > +#endif /* HAVE_INTRINSICS_NEON */
> > +
> > +#endif /* AVUTIL_AARCH64_INTREADWRITE_H */
> > diff --git a/libavutil/intreadwrite.h b/libavutil/intreadwrite.h
> > index 120bdbc8f0..ffd15a1502 100644
> > --- a/libavutil/intreadwrite.h
> > +++ b/libavutil/intreadwrite.h
> > @@ -64,7 +64,9 @@ typedef union {
> >
> > #include "config.h"
> >
> > -#if ARCH_MIPS
> > +#if ARCH_AARCH64
> > +#   include "aarch64/intreadwrite.h"
> > +#elif ARCH_MIPS
> > #   include "mips/intreadwrite.h"
> > #elif ARCH_PPC
> > #   include "ppc/intreadwrite.h"
> > --
> > 2.39.2
>
> LGTM, this seems like a valid use case for intrinsics.

Thanks. Pushed.
diff mbox series

Patch

diff --git a/libavutil/aarch64/intreadwrite.h b/libavutil/aarch64/intreadwrite.h
new file mode 100644
index 0000000000..4ce2d64987
--- /dev/null
+++ b/libavutil/aarch64/intreadwrite.h
@@ -0,0 +1,42 @@ 
+/*
+ * This file is part of FFmpeg.
+ *
+ * FFmpeg is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Lesser General Public
+ * License as published by the Free Software Foundation; either
+ * version 2.1 of the License, or (at your option) any later version.
+ *
+ * FFmpeg is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+ * Lesser General Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public
+ * License along with FFmpeg; if not, write to the Free Software
+ * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
+ */
+
+#ifndef AVUTIL_AARCH64_INTREADWRITE_H
+#define AVUTIL_AARCH64_INTREADWRITE_H
+
+#if HAVE_INTRINSICS_NEON
+
+#include <arm_neon.h>
+
+#define AV_COPY128 AV_COPY128
+static av_always_inline void AV_COPY128(void *d, const void *s)
+{
+    uint8x16_t tmp = vld1q_u8((const uint8_t *)s);
+    vst1q_u8((uint8_t *)d, tmp);
+}
+
+#define AV_ZERO128 AV_ZERO128
+static av_always_inline void AV_ZERO128(void *d)
+{
+    uint8x16_t zero = vdupq_n_u8(0);
+    vst1q_u8((uint8_t *)d, zero);
+}
+
+#endif /* HAVE_INTRINSICS_NEON */
+
+#endif /* AVUTIL_AARCH64_INTREADWRITE_H */
diff --git a/libavutil/intreadwrite.h b/libavutil/intreadwrite.h
index 120bdbc8f0..ffd15a1502 100644
--- a/libavutil/intreadwrite.h
+++ b/libavutil/intreadwrite.h
@@ -64,7 +64,9 @@  typedef union {
 
 #include "config.h"
 
-#if ARCH_MIPS
+#if ARCH_AARCH64
+#   include "aarch64/intreadwrite.h"
+#elif ARCH_MIPS
 #   include "mips/intreadwrite.h"
 #elif ARCH_PPC
 #   include "ppc/intreadwrite.h"