From: wenbin.chen-at-intel.com@ffmpeg.org
To: ffmpeg-devel@ffmpeg.org
Subject: [FFmpeg-devel] [PATCH 2/2] libavfilter/vf_dnn_detect: Add two outputs ssd support
Date: Wed, 27 Dec 2023 12:16:58 +0800
Message-ID: <20231227041658.392174-2-wenbin.chen@intel.com> (raw)
In-Reply-To: <20231227041658.392174-1-wenbin.chen@intel.com>
From: Wenbin Chen <wenbin.chen@intel.com>
For this kind of model, we can directly use its output as final result
just like ssd model. The difference is that it splits output into two
tensors. [x_min, y_min, x_max, y_max, confidence] and [lable_id].
Model example refer to: https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/intel/person-detection-0106
Signed-off-by: Wenbin Chen <wenbin.chen@intel.com>
---
libavfilter/vf_dnn_detect.c | 64 +++++++++++++++++++++++++++++--------
1 file changed, 50 insertions(+), 14 deletions(-)
diff --git a/libavfilter/vf_dnn_detect.c b/libavfilter/vf_dnn_detect.c
index 88865c8a8e..249cbba0f7 100644
--- a/libavfilter/vf_dnn_detect.c
+++ b/libavfilter/vf_dnn_detect.c
@@ -359,24 +359,48 @@ static int dnn_detect_post_proc_yolov3(AVFrame *frame, DNNData *output,
return 0;
}
-static int dnn_detect_post_proc_ssd(AVFrame *frame, DNNData *output, AVFilterContext *filter_ctx)
+static int dnn_detect_post_proc_ssd(AVFrame *frame, DNNData *output, int nb_outputs,
+ AVFilterContext *filter_ctx)
{
DnnDetectContext *ctx = filter_ctx->priv;
float conf_threshold = ctx->confidence;
- int proposal_count = output->height;
- int detect_size = output->width;
- float *detections = output->data;
+ int proposal_count = 0;
+ int detect_size = 0;
+ float *detections = NULL, *labels = NULL;
int nb_bboxes = 0;
AVDetectionBBoxHeader *header;
AVDetectionBBox *bbox;
-
- if (output->width != 7) {
+ int scale_w = ctx->scale_width;
+ int scale_h = ctx->scale_height;
+
+ if (nb_outputs == 1 && output->width == 7) {
+ proposal_count = output->height;
+ detect_size = output->width;
+ detections = output->data;
+ } else if (nb_outputs == 2 && output[0].width == 5) {
+ proposal_count = output[0].height;
+ detect_size = output[0].width;
+ detections = output[0].data;
+ labels = output[1].data;
+ } else if (nb_outputs == 2 && output[1].width == 5) {
+ proposal_count = output[1].height;
+ detect_size = output[1].width;
+ detections = output[1].data;
+ labels = output[0].data;
+ } else {
av_log(filter_ctx, AV_LOG_ERROR, "Model output shape doesn't match ssd requirement.\n");
return AVERROR(EINVAL);
}
+ if (proposal_count == 0)
+ return 0;
+
for (int i = 0; i < proposal_count; ++i) {
- float conf = detections[i * detect_size + 2];
+ float conf;
+ if (nb_outputs == 1)
+ conf = detections[i * detect_size + 2];
+ else
+ conf = detections[i * detect_size + 4];
if (conf < conf_threshold) {
continue;
}
@@ -398,12 +422,24 @@ static int dnn_detect_post_proc_ssd(AVFrame *frame, DNNData *output, AVFilterCon
for (int i = 0; i < proposal_count; ++i) {
int av_unused image_id = (int)detections[i * detect_size + 0];
- int label_id = (int)detections[i * detect_size + 1];
- float conf = detections[i * detect_size + 2];
- float x0 = detections[i * detect_size + 3];
- float y0 = detections[i * detect_size + 4];
- float x1 = detections[i * detect_size + 5];
- float y1 = detections[i * detect_size + 6];
+ int label_id;
+ float conf, x0, y0, x1, y1;
+
+ if (nb_outputs == 1) {
+ label_id = (int)detections[i * detect_size + 1];
+ conf = detections[i * detect_size + 2];
+ x0 = detections[i * detect_size + 3];
+ y0 = detections[i * detect_size + 4];
+ x1 = detections[i * detect_size + 5];
+ y1 = detections[i * detect_size + 6];
+ } else {
+ label_id = (int)labels[i];
+ x0 = detections[i * detect_size] / scale_w;
+ y0 = detections[i * detect_size + 1] / scale_h;
+ x1 = detections[i * detect_size + 2] / scale_w;
+ y1 = detections[i * detect_size + 3] / scale_h;
+ conf = detections[i * detect_size + 4];
+ }
if (conf < conf_threshold) {
continue;
@@ -447,7 +483,7 @@ static int dnn_detect_post_proc_ov(AVFrame *frame, DNNData *output, int nb_outpu
switch (ctx->model_type) {
case DDMT_SSD:
- ret = dnn_detect_post_proc_ssd(frame, output, filter_ctx);
+ ret = dnn_detect_post_proc_ssd(frame, output, nb_outputs, filter_ctx);
if (ret < 0)
return ret;
break;
--
2.34.1
_______________________________________________
ffmpeg-devel mailing list
ffmpeg-devel@ffmpeg.org
https://ffmpeg.org/mailman/listinfo/ffmpeg-devel
To unsubscribe, visit link above, or email
ffmpeg-devel-request@ffmpeg.org with subject "unsubscribe".
next prev parent reply other threads:[~2023-12-27 4:17 UTC|newest]
Thread overview: 3+ messages / expand[flat|nested] mbox.gz Atom feed top
2023-12-27 4:16 [FFmpeg-devel] [PATCH 1/2] libavfilter/dnn_backend_openvino: Add dynamic output support wenbin.chen-at-intel.com
2023-12-27 4:16 ` wenbin.chen-at-intel.com [this message]
2023-12-29 10:37 ` Guo, Yejun
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=20231227041658.392174-2-wenbin.chen@intel.com \
--to=wenbin.chen-at-intel.com@ffmpeg.org \
--cc=ffmpeg-devel@ffmpeg.org \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Git Inbox Mirror of the ffmpeg-devel mailing list - see https://ffmpeg.org/mailman/listinfo/ffmpeg-devel
This inbox may be cloned and mirrored by anyone:
git clone --mirror https://master.gitmailbox.com/ffmpegdev/0 ffmpegdev/git/0.git
# If you have public-inbox 1.1+ installed, you may
# initialize and index your mirror using the following commands:
public-inbox-init -V2 ffmpegdev ffmpegdev/ https://master.gitmailbox.com/ffmpegdev \
ffmpegdev@gitmailbox.com
public-inbox-index ffmpegdev
Example config snippet for mirrors.
AGPL code for this site: git clone https://public-inbox.org/public-inbox.git