Git Inbox Mirror of the ffmpeg-devel mailing list - see https://ffmpeg.org/mailman/listinfo/ffmpeg-devel
 help / color / mirror / Atom feed
From: remi@remlab.net
To: ffmpeg-devel@ffmpeg.org
Subject: [FFmpeg-devel] [PATCH 03/29] lavc/audiodsp: RISC-V F vector_clipf
Date: Thu, 22 Sep 2022 21:37:00 +0300
Message-ID: <20220922183726.38624-3-remi@remlab.net> (raw)
In-Reply-To: <12078904.O9o76ZdvQC@basile.remlab.net>

From: Rémi Denis-Courmont <remi@remlab.net>

RV64G supports MIN & MAX instructions natively only on floating point
registers, not general purpose ones. The latter would require the Zbb
extension. Due to that, it is actually faster to perform the clipping
"properly" in FPU.

Benchmarks on SiFive U74-MC (courtesy of Shanghai StarFive Tech):
audiodsp.vector_clipf_c: 29551.5
audiodsp.vector_clipf_rvf: 17871.0

Also tried unrolling with 2 or 8 elements but it gets worse either way.
---
 libavcodec/audiodsp.c            |  2 ++
 libavcodec/audiodsp.h            |  1 +
 libavcodec/riscv/Makefile        |  2 ++
 libavcodec/riscv/audiodsp_init.c | 33 +++++++++++++++++++++
 libavcodec/riscv/audiodsp_rvf.S  | 49 ++++++++++++++++++++++++++++++++
 5 files changed, 87 insertions(+)
 create mode 100644 libavcodec/riscv/Makefile
 create mode 100644 libavcodec/riscv/audiodsp_init.c
 create mode 100644 libavcodec/riscv/audiodsp_rvf.S

diff --git a/libavcodec/audiodsp.c b/libavcodec/audiodsp.c
index ff43e87dce..eba6e809fd 100644
--- a/libavcodec/audiodsp.c
+++ b/libavcodec/audiodsp.c
@@ -113,6 +113,8 @@ av_cold void ff_audiodsp_init(AudioDSPContext *c)
     ff_audiodsp_init_arm(c);
 #elif ARCH_PPC
     ff_audiodsp_init_ppc(c);
+#elif ARCH_RISCV
+    ff_audiodsp_init_riscv(c);
 #elif ARCH_X86
     ff_audiodsp_init_x86(c);
 #endif
diff --git a/libavcodec/audiodsp.h b/libavcodec/audiodsp.h
index aa6fa7898b..485b512839 100644
--- a/libavcodec/audiodsp.h
+++ b/libavcodec/audiodsp.h
@@ -55,6 +55,7 @@ typedef struct AudioDSPContext {
 void ff_audiodsp_init(AudioDSPContext *c);
 void ff_audiodsp_init_arm(AudioDSPContext *c);
 void ff_audiodsp_init_ppc(AudioDSPContext *c);
+void ff_audiodsp_init_riscv(AudioDSPContext *c);
 void ff_audiodsp_init_x86(AudioDSPContext *c);
 
 #endif /* AVCODEC_AUDIODSP_H */
diff --git a/libavcodec/riscv/Makefile b/libavcodec/riscv/Makefile
new file mode 100644
index 0000000000..414a9e9bd8
--- /dev/null
+++ b/libavcodec/riscv/Makefile
@@ -0,0 +1,2 @@
+OBJS-$(CONFIG_AUDIODSP) += riscv/audiodsp_init.o \
+                           riscv/audiodsp_rvf.o
diff --git a/libavcodec/riscv/audiodsp_init.c b/libavcodec/riscv/audiodsp_init.c
new file mode 100644
index 0000000000..c5842815d6
--- /dev/null
+++ b/libavcodec/riscv/audiodsp_init.c
@@ -0,0 +1,33 @@
+/*
+ * Copyright © 2022 Rémi Denis-Courmont.
+ *
+ * This file is part of FFmpeg.
+ *
+ * FFmpeg is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Lesser General Public
+ * License as published by the Free Software Foundation; either
+ * version 2.1 of the License, or (at your option) any later version.
+ *
+ * FFmpeg is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+ * Lesser General Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public
+ * License along with FFmpeg; if not, write to the Free Software
+ * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
+ */
+
+#include "libavutil/attributes.h"
+#include "libavutil/cpu.h"
+#include "libavcodec/audiodsp.h"
+
+void ff_vector_clipf_rvf(float *dst, const float *src, int len, float min, float max); /* defined in riscv/audiodsp_rvf.S, added by this same patch */
+
+av_cold void ff_audiodsp_init_riscv(AudioDSPContext *c) /* RISC-V hook: overrides entries of *c when the matching CPU flag is present */
+{
+    int flags = av_get_cpu_flags(); /* feature bitmask as returned by libavutil/cpu.h */
+
+    if (flags & AV_CPU_FLAG_RVF) /* override only when the RVF flag bit is set; otherwise *c is left untouched */
+        c->vector_clipf = ff_vector_clipf_rvf; /* point vector_clipf at the assembly routine declared above */
+}
diff --git a/libavcodec/riscv/audiodsp_rvf.S b/libavcodec/riscv/audiodsp_rvf.S
new file mode 100644
index 0000000000..2ec8a11691
--- /dev/null
+++ b/libavcodec/riscv/audiodsp_rvf.S
@@ -0,0 +1,49 @@
+/*
+ * Copyright © 2022 Rémi Denis-Courmont.
+ *
+ * This file is part of FFmpeg.
+ *
+ * FFmpeg is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Lesser General Public
+ * License as published by the Free Software Foundation; either
+ * version 2.1 of the License, or (at your option) any later version.
+ *
+ * FFmpeg is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+ * Lesser General Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public
+ * License along with FFmpeg; if not, write to the Free Software
+ * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
+ */
+
+#include "libavutil/riscv/asm.S"
+
+func ff_vector_clipf_rvf, f /* clamp floats read from (a1) and write them to (a0); NOTE(review): per the C prototype and the standard RISC-V calling convention this is presumably a0=dst, a1=src, a2=len, fa0=min, fa1=max */
+NOHWF   fmv.w.x fa0, a3 /* copy the raw bits of a3 into fa0; NOHWF is presumably active only when float arguments arrive in integer registers -- confirm in libavutil/riscv/asm.S */
+NOHWF   fmv.w.x fa1, a4 /* likewise a4 -> fa1 */
+1: /* loop body: four consecutive 32-bit floats per iteration, loads and arithmetic interleaved */
+        flw     ft0,   (a1) /* load element 0 */
+        flw     ft1,  4(a1) /* load element 1 */
+        fmax.s  ft0, ft0, fa0 /* ft0 = max(ft0, fa0): apply the lower bound */
+        flw     ft2,  8(a1) /* load element 2 */
+        fmax.s  ft1, ft1, fa0 /* lower bound on element 1 */
+        flw     ft3, 12(a1) /* load element 3 */
+        fmax.s  ft2, ft2, fa0 /* lower bound on element 2 */
+        addi    a2, a2, -4 /* four elements accounted for */
+        fmax.s  ft3, ft3, fa0 /* lower bound on element 3 */
+        addi    a1, a1, 16 /* advance the source pointer by 4 * 4 bytes */
+        fmin.s  ft0, ft0, fa1 /* ft0 = min(ft0, fa1): apply the upper bound */
+        fmin.s  ft1, ft1, fa1 /* upper bound on element 1 */
+        fsw     ft0,   (a0) /* store element 0 */
+        fmin.s  ft2, ft2, fa1 /* upper bound on element 2 */
+        fsw     ft1,  4(a0) /* store element 1 */
+        fmin.s  ft3, ft3, fa1 /* upper bound on element 3 */
+        fsw     ft2,  8(a0) /* store element 2 */
+        fsw     ft3, 12(a0) /* store element 3 */
+        addi    a0, a0, 16 /* advance the destination pointer by 4 * 4 bytes */
+        bnez    a2, 1b /* repeat until a2 is exactly 0; there is no pre-check or tail, so the count is expected to be a positive multiple of 4 -- NOTE(review): confirm callers guarantee this */
+
+        ret /* no return value is set up before returning (the prototype is void) */
+endfunc
-- 
2.37.2

_______________________________________________
ffmpeg-devel mailing list
ffmpeg-devel@ffmpeg.org
https://ffmpeg.org/mailman/listinfo/ffmpeg-devel

To unsubscribe, visit link above, or email
ffmpeg-devel-request@ffmpeg.org with subject "unsubscribe".

  parent reply	other threads:[~2022-09-22 18:37 UTC|newest]

Thread overview: 31+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2022-09-22 18:37 [FFmpeg-devel] [PATCHv4 00/29] RISC-V CPU extensions Rémi Denis-Courmont
2022-09-22 18:36 ` [FFmpeg-devel] [PATCH 01/29] lavu/cpu: detect RISC-V base extensions remi
2022-09-22 18:36 ` [FFmpeg-devel] [PATCH 02/29] lavu/riscv: initial common header for assembler macros remi
2022-09-22 18:37 ` remi [this message]
2022-09-22 18:37 ` [FFmpeg-devel] [PATCH 04/29] lavc/pixblockdsp: RISC-V I get_pixels remi
2022-09-22 18:37 ` [FFmpeg-devel] [PATCH 05/29] lavu/cpu: CPU flags for the RISC-V Vector extension remi
2022-09-22 18:37 ` [FFmpeg-devel] [PATCH 06/29] configure: probe " remi
2022-09-23 14:57   ` Rémi Denis-Courmont
2022-09-22 18:37 ` [FFmpeg-devel] [PATCH 07/29] lavu/floatdsp: RISC-V V vector_fmul_scalar remi
2022-09-22 18:37 ` [FFmpeg-devel] [PATCH 08/29] lavu/floatdsp: RISC-V V vector_dmul_scalar remi
2022-09-22 18:37 ` [FFmpeg-devel] [PATCH 09/29] lavu/floatdsp: RISC-V V vector_fmul remi
2022-09-22 18:37 ` [FFmpeg-devel] [PATCH 10/29] lavu/floatdsp: RISC-V V vector_dmul remi
2022-09-22 18:37 ` [FFmpeg-devel] [PATCH 11/29] lavu/floatdsp: RISC-V V vector_fmac_scalar remi
2022-09-22 18:37 ` [FFmpeg-devel] [PATCH 12/29] lavu/floatdsp: RISC-V V vector_dmac_scalar remi
2022-09-22 18:37 ` [FFmpeg-devel] [PATCH 13/29] lavu/floatdsp: RISC-V V vector_fmul_add remi
2022-09-22 18:37 ` [FFmpeg-devel] [PATCH 14/29] lavu/floatdsp: RISC-V V butterflies_float remi
2022-09-22 18:37 ` [FFmpeg-devel] [PATCH 15/29] lavu/floatdsp: RISC-V V vector_fmul_reversed remi
2022-09-22 18:37 ` [FFmpeg-devel] [PATCH 16/29] lavu/floatdsp: RISC-V V vector_fmul_window remi
2022-09-22 18:37 ` [FFmpeg-devel] [PATCH 17/29] lavu/floatdsp: RISC-V V scalarproduct_float remi
2022-09-22 18:37 ` [FFmpeg-devel] [PATCH 18/29] lavu/fixeddsp: RISC-V V butterflies_fixed remi
2022-09-22 18:37 ` [FFmpeg-devel] [PATCH 19/29] lavc/audiodsp: RISC-V V vector_clip_int32 remi
2022-09-22 18:37 ` [FFmpeg-devel] [PATCH 20/29] lavc/audiodsp: RISC-V V vector_clipf remi
2022-09-22 18:37 ` [FFmpeg-devel] [PATCH 21/29] lavc/audiodsp: RISC-V V scalarproduct_int16 remi
2022-09-22 18:37 ` [FFmpeg-devel] [PATCH 22/29] lavc/fmtconvert: RISC-V V int32_to_float_fmul_scalar remi
2022-09-22 18:37 ` [FFmpeg-devel] [PATCH 23/29] lavc/fmtconvert: RISC-V V int32_to_float_fmul_array8 remi
2022-09-22 18:37 ` [FFmpeg-devel] [PATCH 24/29] lavc/vorbisdsp: RISC-V V inverse_coupling remi
2022-09-22 18:37 ` [FFmpeg-devel] [PATCH 25/29] lavc/aacpsdsp: RISC-V V add_squares remi
2022-09-22 18:37 ` [FFmpeg-devel] [PATCH 26/29] lavc/aacpsdsp: RISC-V V mul_pair_single remi
2022-09-22 18:37 ` [FFmpeg-devel] [PATCH 27/29] lavc/aacpsdsp: RISC-V V hybrid_analysis remi
2022-09-22 18:37 ` [FFmpeg-devel] [PATCH 28/29] lavc/aacpsdsp: RISC-V V hybrid_analysis_ileave remi
2022-09-22 18:37 ` [FFmpeg-devel] [PATCH 29/29] lavc/aacpsdsp: RISC-V V hybrid_synthesis_deint remi

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=20220922183726.38624-3-remi@remlab.net \
    --to=remi@remlab.net \
    --cc=ffmpeg-devel@ffmpeg.org \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link

Git Inbox Mirror of the ffmpeg-devel mailing list - see https://ffmpeg.org/mailman/listinfo/ffmpeg-devel

This inbox may be cloned and mirrored by anyone:

	git clone --mirror https://master.gitmailbox.com/ffmpegdev/0 ffmpegdev/git/0.git

	# If you have public-inbox 1.1+ installed, you may
	# initialize and index your mirror using the following commands:
	public-inbox-init -V2 ffmpegdev ffmpegdev/ https://master.gitmailbox.com/ffmpegdev \
		ffmpegdev@gitmailbox.com
	public-inbox-index ffmpegdev

Example config snippet for mirrors.


AGPL code for this site: git clone https://public-inbox.org/public-inbox.git