Git Inbox Mirror of the ffmpeg-devel mailing list - see https://ffmpeg.org/mailman/listinfo/ffmpeg-devel
 help / color / mirror / Atom feed
* [FFmpeg-devel] [PATCH] avcodec/x86/audiodsp: add scalarproduct avx2
@ 2022-09-12 18:29 Paul B Mahol
  2022-09-12 18:39 ` James Almer
  2022-09-13  9:25 ` Paul B Mahol
  0 siblings, 2 replies; 6+ messages in thread
From: Paul B Mahol @ 2022-09-12 18:29 UTC (permalink / raw)
  To: FFmpeg development discussions and patches

[-- Attachment #1: Type: text/plain, Size: 40 bytes --]

Patch attached.

How to get more speed?

[-- Attachment #2: 0001-avcodec-x86-audiodsp-add-scalarproduct-avx2.patch --]
[-- Type: text/x-patch, Size: 2187 bytes --]

From 55eb5a18b4bf029f52f9d9108a750c576ba780ee Mon Sep 17 00:00:00 2001
From: Paul B Mahol <onemda@gmail.com>
Date: Mon, 12 Sep 2022 18:53:31 +0200
Subject: [PATCH] avcodec/x86/audiodsp: add scalarproduct avx2

Signed-off-by: Paul B Mahol <onemda@gmail.com>
---
 libavcodec/x86/audiodsp.asm    | 24 ++++++++++++++++++++++++
 libavcodec/x86/audiodsp_init.c |  6 ++++++
 2 files changed, 30 insertions(+)

diff --git a/libavcodec/x86/audiodsp.asm b/libavcodec/x86/audiodsp.asm
index b604b0443c..55051f6aa7 100644
--- a/libavcodec/x86/audiodsp.asm
+++ b/libavcodec/x86/audiodsp.asm
@@ -44,6 +44,30 @@ cglobal scalarproduct_int16, 3,3,3, v1, v2, order
     movd   eax, m2
     RET
 
+INIT_YMM avx2                                ; AVX2 variant: returns in eax the 32-bit sum of v1[i]*v2[i] over int16 inputs
+cglobal scalarproduct_int16, 3,4,3, v1, v2, order, offset ; 3 args (v1, v2, order); offset is a 4th scratch GPR; 3 vector regs declared
+    xor offsetq, offsetq                     ; offset = 0 (byte index into both arrays); NOTE(review): xor offsetd, offsetd would be the shorter idiom
+    add orderd, orderd                       ; order *= 2: int16 element count -> byte length
+    pxor    m1, m1                           ; m1 = running accumulator, cleared
+    cmp orderd, 32                           ; fewer than 32 bytes (16 elements)?
+    jl   .l16                                ; yes: take the single 16-byte path (signed compare)
+.loop:                                       ; do-while: body always runs at least once
+    movu    m0, [v1q + offsetq]              ; unaligned load of one full vector from v1
+    pmaddwd m0, [v2q + offsetq]              ; multiply int16 pairs, add adjacent products into 32-bit lanes
+    paddd   m1, m0                           ; accumulate the 32-bit partial sums
+    add     offsetq, mmsize                  ; advance by one vector (mmsize is presumably 32 under INIT_YMM; confirm in x86inc)
+    cmp     offsetq, orderq                  ; NOTE(review): a byte length not a multiple of mmsize makes the last pass read past the end; presumably callers keep order a multiple of 16 (confirm)
+    jl .loop                                 ; continue while offset < byte length
+    HADDD   m1, m0                           ; macro defined outside this view; presumably horizontal dword sum into the low lane, m0 as scratch
+    movd   eax, xm1                          ; return value = low 32 bits of the accumulator
+    RET
+.l16:                                        ; reached only from the initial check, so offsetq is still 0 here
+    movu    xm0, [v1q + offsetq]             ; single 16-byte (8 element) load from v1
+    pmaddwd xm0, [v2q + offsetq]             ; same multiply-add, on 128 bits only
+    paddd   xm1, xm0                         ; m1 was cleared above, so this just copies the partial sums
+    HADDD  xm1, xm0                          ; NOTE(review): this path always processes exactly 8 elements, whatever order (< 16) was passed; confirm intent
+    movd   eax, xm1                          ; return value = low 32 bits of the accumulator
+    RET
 
 ;-----------------------------------------------------------------------------
 ; void ff_vector_clip_int32(int32_t *dst, const int32_t *src, int32_t min,
diff --git a/libavcodec/x86/audiodsp_init.c b/libavcodec/x86/audiodsp_init.c
index aa5e43e570..77d5948442 100644
--- a/libavcodec/x86/audiodsp_init.c
+++ b/libavcodec/x86/audiodsp_init.c
@@ -24,6 +24,9 @@
 #include "libavutil/x86/cpu.h"
 #include "libavcodec/audiodsp.h"
 
+int32_t ff_scalarproduct_int16_avx2(const int16_t *v1, const int16_t *v2,
+                                    int order);
+
 int32_t ff_scalarproduct_int16_sse2(const int16_t *v1, const int16_t *v2,
                                     int order);
 
@@ -53,4 +56,7 @@ av_cold void ff_audiodsp_init_x86(AudioDSPContext *c)
 
     if (EXTERNAL_SSE4(cpu_flags))
         c->vector_clip_int32 = ff_vector_clip_int32_sse4;
+
+    if (EXTERNAL_AVX2(cpu_flags))
+        c->scalarproduct_int16 = ff_scalarproduct_int16_avx2;
 }
-- 
2.37.2


[-- Attachment #3: Type: text/plain, Size: 251 bytes --]

_______________________________________________
ffmpeg-devel mailing list
ffmpeg-devel@ffmpeg.org
https://ffmpeg.org/mailman/listinfo/ffmpeg-devel

To unsubscribe, visit link above, or email
ffmpeg-devel-request@ffmpeg.org with subject "unsubscribe".

^ permalink raw reply	[flat|nested] 6+ messages in thread

end of thread, other threads:[~2022-09-13  9:35 UTC | newest]

Thread overview: 6+ messages (download: mbox.gz / follow: Atom feed)
-- links below jump to the message on this page --
2022-09-12 18:29 [FFmpeg-devel] [PATCH] avcodec/x86/audiodsp: add scalarproduct avx2 Paul B Mahol
2022-09-12 18:39 ` James Almer
2022-09-12 19:00   ` James Almer
2022-09-13  9:25 ` Paul B Mahol
2022-09-13  9:28   ` Andreas Rheinhardt
2022-09-13  9:35   ` Paul B Mahol

Git Inbox Mirror of the ffmpeg-devel mailing list - see https://ffmpeg.org/mailman/listinfo/ffmpeg-devel

This inbox may be cloned and mirrored by anyone:

	git clone --mirror https://master.gitmailbox.com/ffmpegdev/0 ffmpegdev/git/0.git

	# If you have public-inbox 1.1+ installed, you may
	# initialize and index your mirror using the following commands:
	public-inbox-init -V2 ffmpegdev ffmpegdev/ https://master.gitmailbox.com/ffmpegdev \
		ffmpegdev@gitmailbox.com
	public-inbox-index ffmpegdev

Example config snippet for mirrors.


AGPL code for this site: git clone https://public-inbox.org/public-inbox.git