Git Inbox Mirror of the ffmpeg-devel mailing list - see https://ffmpeg.org/mailman/listinfo/ffmpeg-devel
 help / color / mirror / Atom feed
* [FFmpeg-devel] [PATCH 1/6] vulkan_decode: generalize handling of slice offsets/nb
@ 2025-03-31  2:37 Lynne
  2025-03-31  2:37 ` [FFmpeg-devel] [PATCH 2/6] vulkan_decode: only create sequence params in end_frame Lynne
                   ` (4 more replies)
  0 siblings, 5 replies; 6+ messages in thread
From: Lynne @ 2025-03-31  2:37 UTC (permalink / raw)
  To: ffmpeg-devel; +Cc: Lynne

This allows for the upcoming refactor.
---
 libavcodec/vulkan_av1.c    |  6 +++---
 libavcodec/vulkan_decode.c | 23 ++++++-----------------
 libavcodec/vulkan_decode.h |  5 +++--
 libavcodec/vulkan_ffv1.c   | 22 ++++++++--------------
 libavcodec/vulkan_h264.c   |  9 +++------
 libavcodec/vulkan_hevc.c   |  6 +++---
 6 files changed, 26 insertions(+), 45 deletions(-)

diff --git a/libavcodec/vulkan_av1.c b/libavcodec/vulkan_av1.c
index ccb88004b5..13df24a44b 100644
--- a/libavcodec/vulkan_av1.c
+++ b/libavcodec/vulkan_av1.c
@@ -577,9 +577,7 @@ static int vk_av1_decode_slice(AVCodecContext *avctx,
 
         err = ff_vk_decode_add_slice(avctx, vp,
                                      data + s->tile_group_info[i].tile_offset,
-                                     s->tile_group_info[i].tile_size, 0,
-                                     &ap->av1_pic_info.tileCount,
-                                     &ap->av1_pic_info.pTileOffsets);
+                                     s->tile_group_info[i].tile_size, 0);
         if (err < 0)
             return err;
     }
@@ -616,6 +614,8 @@ static int vk_av1_end_frame(AVCodecContext *avctx)
     }
 #endif
 
+    ap->av1_pic_info.pTileOffsets = vp->slice_offsets;
+    ap->av1_pic_info.tileCount = vp->nb_slices;
     if (!ap->av1_pic_info.tileCount)
         return 0;
 
diff --git a/libavcodec/vulkan_decode.c b/libavcodec/vulkan_decode.c
index 93aa0ce5b3..48a206e3c0 100644
--- a/libavcodec/vulkan_decode.c
+++ b/libavcodec/vulkan_decode.c
@@ -249,33 +249,23 @@ int ff_vk_decode_prepare_frame_sdr(FFVulkanDecodeContext *dec, AVFrame *pic,
 }
 
 int ff_vk_decode_add_slice(AVCodecContext *avctx, FFVulkanDecodePicture *vp,
-                           const uint8_t *data, size_t size, int add_startcode,
-                           uint32_t *nb_slices, const uint32_t **offsets)
+                           const uint8_t *data, size_t size, int add_startcode)
 {
     FFVulkanDecodeContext *dec = avctx->internal->hwaccel_priv_data;
     FFVulkanDecodeShared *ctx = dec->shared_ctx;
 
     static const uint8_t startcode_prefix[3] = { 0x0, 0x0, 0x1 };
     const size_t startcode_len = add_startcode ? sizeof(startcode_prefix) : 0;
-    const int nb = nb_slices ? *nb_slices : 0;
     uint8_t *slices;
-    uint32_t *slice_off;
     FFVkBuffer *vkbuf;
 
     size_t new_size = vp->slices_size + startcode_len + size +
                       ctx->caps.minBitstreamBufferSizeAlignment;
     new_size = FFALIGN(new_size, ctx->caps.minBitstreamBufferSizeAlignment);
 
-    if (offsets) {
-        slice_off = av_fast_realloc(dec->slice_off, &dec->slice_off_max,
-                                    (nb + 1)*sizeof(slice_off));
-        if (!slice_off)
-            return AVERROR(ENOMEM);
-
-        *offsets = dec->slice_off = slice_off;
-
-        slice_off[nb] = vp->slices_size;
-    }
+    /* Should never happen */
+    if (vp->nb_slices > FF_ARRAY_ELEMS(vp->slice_offsets))
+        return AVERROR(EINVAL);
 
     vkbuf = vp->slices_buf ? (FFVkBuffer *)vp->slices_buf->data : NULL;
     if (!vkbuf || vkbuf->size < new_size) {
@@ -321,9 +311,8 @@ int ff_vk_decode_add_slice(AVCodecContext *avctx, FFVulkanDecodePicture *vp,
     /* Slice data */
     memcpy(slices + vp->slices_size + startcode_len, data, size);
 
-    if (nb_slices)
-        *nb_slices = nb + 1;
-
+    vp->slice_offsets[vp->nb_slices] = vp->slices_size;
+    vp->nb_slices = vp->nb_slices + 1;
     vp->slices_size += startcode_len + size;
 
     return 0;
diff --git a/libavcodec/vulkan_decode.h b/libavcodec/vulkan_decode.h
index cbd22b3591..4bd755c1f6 100644
--- a/libavcodec/vulkan_decode.h
+++ b/libavcodec/vulkan_decode.h
@@ -110,6 +110,8 @@ typedef struct FFVulkanDecodePicture {
     /* Slice data */
     AVBufferRef                    *slices_buf;
     size_t                          slices_size;
+    uint32_t                        slice_offsets[1024];
+    uint32_t                        nb_slices;
 
     /* Vulkan functions needed for destruction, as no other context is guaranteed to exist */
     PFN_vkWaitSemaphores            wait_semaphores;
@@ -158,8 +160,7 @@ int ff_vk_decode_prepare_frame_sdr(FFVulkanDecodeContext *dec, AVFrame *pic,
  * Add slice data to frame.
  */
 int ff_vk_decode_add_slice(AVCodecContext *avctx, FFVulkanDecodePicture *vp,
-                           const uint8_t *data, size_t size, int add_startcode,
-                           uint32_t *nb_slices, const uint32_t **offsets);
+                           const uint8_t *data, size_t size, int add_startcode);
 
 /**
  * Decode a frame.
diff --git a/libavcodec/vulkan_ffv1.c b/libavcodec/vulkan_ffv1.c
index 17bfc943d4..7eb51b0dab 100644
--- a/libavcodec/vulkan_ffv1.c
+++ b/libavcodec/vulkan_ffv1.c
@@ -55,8 +55,6 @@ typedef struct FFv1VulkanDecodePicture {
     uint32_t max_context_count;
 
     AVBufferRef *slice_offset_buf;
-    uint32_t    *slice_offset;
-    int          slice_num;
 
     AVBufferRef *slice_status_buf;
     int crc_checked;
@@ -163,8 +161,6 @@ static int vk_ffv1_start_frame(AVCodecContext          *avctx,
     int is_rgb = !(f->colorspace == 0 && sw_format != AV_PIX_FMT_YA8) &&
                  !(sw_format == AV_PIX_FMT_YA8);
 
-    fp->slice_num = 0;
-
     for (int i = 0; i < f->quant_table_count; i++)
         fp->max_context_count = FFMAX(f->context_count[i], fp->max_context_count);
 
@@ -278,22 +274,20 @@ static int vk_ffv1_decode_slice(AVCodecContext *avctx,
 
     if (ctx->s.extensions & FF_VK_EXT_EXTERNAL_HOST_MEMORY) {
         FFVkBuffer *slices_buf = (FFVkBuffer *)vp->slices_buf->data;
-        AV_WN32(slice_offset->mapped_mem + (2*fp->slice_num + 0)*sizeof(uint32_t),
+        AV_WN32(slice_offset->mapped_mem + (2*vp->nb_slices + 0)*sizeof(uint32_t),
                 data - slices_buf->mapped_mem);
-        AV_WN32(slice_offset->mapped_mem + (2*fp->slice_num + 1)*sizeof(uint32_t),
+        AV_WN32(slice_offset->mapped_mem + (2*vp->nb_slices + 1)*sizeof(uint32_t),
                 size);
 
-        fp->slice_num++;
+        vp->nb_slices++;
     } else {
-        int err = ff_vk_decode_add_slice(avctx, vp, data, size, 0,
-                                         &fp->slice_num,
-                                         (const uint32_t **)&fp->slice_offset);
+        int err = ff_vk_decode_add_slice(avctx, vp, data, size, 0);
         if (err < 0)
             return err;
 
-        AV_WN32(slice_offset->mapped_mem + (2*(fp->slice_num - 1) + 0)*sizeof(uint32_t),
-                fp->slice_offset[fp->slice_num - 1]);
-        AV_WN32(slice_offset->mapped_mem + (2*(fp->slice_num - 1) + 1)*sizeof(uint32_t),
+        AV_WN32(slice_offset->mapped_mem + (2*(vp->nb_slices - 1) + 0)*sizeof(uint32_t),
+                vp->slice_offsets[vp->nb_slices - 1]);
+        AV_WN32(slice_offset->mapped_mem + (2*(vp->nb_slices - 1) + 1)*sizeof(uint32_t),
                 size);
     }
 
@@ -1280,7 +1274,7 @@ static void vk_ffv1_free_frame_priv(AVRefStructOpaque _hwctx, void *data)
 
     if (fp->crc_checked) {
         FFVkBuffer *slice_status = (FFVkBuffer *)fp->slice_status_buf->data;
-        for (int i = 0; i < fp->slice_num; i++) {
+        for (int i = 0; i < vp->nb_slices; i++) {
             uint32_t crc_res;
             crc_res = AV_RN32(slice_status->mapped_mem + i*sizeof(uint32_t));
             if (crc_res != 0)
diff --git a/libavcodec/vulkan_h264.c b/libavcodec/vulkan_h264.c
index 73aaed7f6a..af37e0800b 100644
--- a/libavcodec/vulkan_h264.c
+++ b/libavcodec/vulkan_h264.c
@@ -491,9 +491,7 @@ static int vk_h264_decode_slice(AVCodecContext *avctx,
     H264VulkanDecodePicture *hp = h->cur_pic_ptr->hwaccel_picture_private;
     FFVulkanDecodePicture *vp = &hp->vp;
 
-    int err = ff_vk_decode_add_slice(avctx, vp, data, size, 1,
-                                     &hp->h264_pic_info.sliceCount,
-                                     &hp->h264_pic_info.pSliceOffsets);
+    int err = ff_vk_decode_add_slice(avctx, vp, data, size, 1);
     if (err < 0)
         return err;
 
@@ -541,12 +539,11 @@ static int vk_h264_end_frame(AVCodecContext *avctx)
     }
 #endif
 
+    hp->h264_pic_info.pSliceOffsets = vp->slice_offsets;
+    hp->h264_pic_info.sliceCount = vp->nb_slices;
     if (!hp->h264_pic_info.sliceCount)
         return 0;
 
-    if (!vp->slices_buf)
-        return AVERROR(EINVAL);
-
     if (!dec->session_params &&
         !(ctx->s.extensions & FF_VK_EXT_VIDEO_MAINTENANCE_2)) {
         int err = vk_h264_create_params(avctx, &dec->session_params);
diff --git a/libavcodec/vulkan_hevc.c b/libavcodec/vulkan_hevc.c
index e4a946ae0d..e95f554756 100644
--- a/libavcodec/vulkan_hevc.c
+++ b/libavcodec/vulkan_hevc.c
@@ -842,9 +842,7 @@ static int vk_hevc_decode_slice(AVCodecContext *avctx,
     HEVCVulkanDecodePicture *hp = h->cur_frame->hwaccel_picture_private;
     FFVulkanDecodePicture *vp = &hp->vp;
 
-    int err = ff_vk_decode_add_slice(avctx, vp, data, size, 1,
-                                     &hp->h265_pic_info.sliceSegmentCount,
-                                     &hp->h265_pic_info.pSliceSegmentOffsets);
+    int err = ff_vk_decode_add_slice(avctx, vp, data, size, 1);
     if (err < 0)
         return err;
 
@@ -898,6 +896,8 @@ static int vk_hevc_end_frame(AVCodecContext *avctx)
     }
 #endif
 
+    hp->h265_pic_info.pSliceSegmentOffsets = vp->slice_offsets;
+    hp->h265_pic_info.sliceSegmentCount = vp->nb_slices;
     if (!hp->h265_pic_info.sliceSegmentCount)
         return 0;
 
-- 
2.49.0
_______________________________________________
ffmpeg-devel mailing list
ffmpeg-devel@ffmpeg.org
https://ffmpeg.org/mailman/listinfo/ffmpeg-devel

To unsubscribe, visit link above, or email
ffmpeg-devel-request@ffmpeg.org with subject "unsubscribe".

^ permalink raw reply	[flat|nested] 6+ messages in thread

* [FFmpeg-devel] [PATCH 2/6] vulkan_decode: only create sequence params in end_frame
  2025-03-31  2:37 [FFmpeg-devel] [PATCH 1/6] vulkan_decode: generalize handling of slice offsets/nb Lynne
@ 2025-03-31  2:37 ` Lynne
  2025-03-31  2:37 ` [FFmpeg-devel] [PATCH 3/6] vulkan_decode: move temporary Vulkan structs into each codec Lynne
                   ` (3 subsequent siblings)
  4 siblings, 0 replies; 6+ messages in thread
From: Lynne @ 2025-03-31  2:37 UTC (permalink / raw)
  To: ffmpeg-devel; +Cc: Lynne

We tried to create sequence params in both start_frame and end_frame.
This was redundant.

Just always create them in end_frame.
---
 libavcodec/vulkan_av1.c  | 8 --------
 libavcodec/vulkan_h264.c | 9 ---------
 libavcodec/vulkan_hevc.c | 9 ---------
 3 files changed, 26 deletions(-)

diff --git a/libavcodec/vulkan_av1.c b/libavcodec/vulkan_av1.c
index 13df24a44b..115db8badb 100644
--- a/libavcodec/vulkan_av1.c
+++ b/libavcodec/vulkan_av1.c
@@ -254,7 +254,6 @@ static int vk_av1_start_frame(AVCodecContext          *avctx,
     AV1DecContext *s = avctx->priv_data;
     const AV1Frame *pic = &s->cur_frame;
     FFVulkanDecodeContext *dec = avctx->internal->hwaccel_priv_data;
-    FFVulkanDecodeShared *ctx = dec->shared_ctx;
 
     AV1VulkanDecodePicture *ap = pic->hwaccel_picture_private;
     FFVulkanDecodePicture *vp = &ap->vp;
@@ -269,13 +268,6 @@ static int vk_av1_start_frame(AVCodecContext          *avctx,
                                                          STD_VIDEO_AV1_FRAME_RESTORATION_TYPE_WIENER,
                                                          STD_VIDEO_AV1_FRAME_RESTORATION_TYPE_SGRPROJ };
 
-    if (!dec->session_params &&
-        !(ctx->s.extensions & FF_VK_EXT_VIDEO_MAINTENANCE_2)) {
-        err = vk_av1_create_params(avctx, &dec->session_params, ap);
-        if (err < 0)
-            return err;
-    }
-
     if (!ap->frame_id_set) {
         unsigned slot_idx = 0;
         for (unsigned i = 0; i < 32; i++) {
diff --git a/libavcodec/vulkan_h264.c b/libavcodec/vulkan_h264.c
index af37e0800b..d950c6948f 100644
--- a/libavcodec/vulkan_h264.c
+++ b/libavcodec/vulkan_h264.c
@@ -366,20 +366,11 @@ static int vk_h264_start_frame(AVCodecContext          *avctx,
     int err;
     int dpb_slot_index = 0;
     H264Context *h = avctx->priv_data;
-    FFVulkanDecodeContext *dec = avctx->internal->hwaccel_priv_data;
-    FFVulkanDecodeShared *ctx = dec->shared_ctx;
 
     H264Picture *pic = h->cur_pic_ptr;
     H264VulkanDecodePicture *hp = pic->hwaccel_picture_private;
     FFVulkanDecodePicture *vp = &hp->vp;
 
-    if (!dec->session_params &&
-        !(ctx->s.extensions & FF_VK_EXT_VIDEO_MAINTENANCE_2)) {
-        err = vk_h264_create_params(avctx, &dec->session_params);
-        if (err < 0)
-            return err;
-    }
-
     /* Fill in main slot */
     dpb_slot_index = 0;
     for (unsigned slot = 0; slot < H264_MAX_PICTURE_COUNT; slot++) {
diff --git a/libavcodec/vulkan_hevc.c b/libavcodec/vulkan_hevc.c
index e95f554756..bc43591e19 100644
--- a/libavcodec/vulkan_hevc.c
+++ b/libavcodec/vulkan_hevc.c
@@ -716,8 +716,6 @@ static int vk_hevc_start_frame(AVCodecContext          *avctx,
     int err;
     HEVCContext *h = avctx->priv_data;
     HEVCLayerContext *l = &h->layers[h->cur_layer];
-    FFVulkanDecodeContext *dec = avctx->internal->hwaccel_priv_data;
-    FFVulkanDecodeShared *ctx = dec->shared_ctx;
 
     HEVCFrame *pic = h->cur_frame;
     HEVCVulkanDecodePicture *hp = pic->hwaccel_picture_private;
@@ -726,13 +724,6 @@ static int vk_hevc_start_frame(AVCodecContext          *avctx,
     const HEVCSPS *sps = pps->sps;
     int nb_refs = 0;
 
-    if (!dec->session_params &&
-        !(ctx->s.extensions & FF_VK_EXT_VIDEO_MAINTENANCE_2)) {
-        err = vk_hevc_create_params(avctx, &dec->session_params);
-        if (err < 0)
-            return err;
-    }
-
     hp->h265pic = (StdVideoDecodeH265PictureInfo) {
         .flags = (StdVideoDecodeH265PictureInfoFlags) {
             .IrapPicFlag = IS_IRAP(h),
-- 
2.49.0
_______________________________________________
ffmpeg-devel mailing list
ffmpeg-devel@ffmpeg.org
https://ffmpeg.org/mailman/listinfo/ffmpeg-devel

To unsubscribe, visit link above, or email
ffmpeg-devel-request@ffmpeg.org with subject "unsubscribe".

^ permalink raw reply	[flat|nested] 6+ messages in thread

* [FFmpeg-devel] [PATCH 3/6] vulkan_decode: move temporary Vulkan structs into each codec
  2025-03-31  2:37 [FFmpeg-devel] [PATCH 1/6] vulkan_decode: generalize handling of slice offsets/nb Lynne
  2025-03-31  2:37 ` [FFmpeg-devel] [PATCH 2/6] vulkan_decode: only create sequence params in end_frame Lynne
@ 2025-03-31  2:37 ` Lynne
  2025-03-31  2:37 ` [FFmpeg-devel] [PATCH 4/6] vulkan_decode: add a generic start_frame function Lynne
                   ` (2 subsequent siblings)
  4 siblings, 0 replies; 6+ messages in thread
From: Lynne @ 2025-03-31  2:37 UTC (permalink / raw)
  To: ffmpeg-devel; +Cc: Lynne

Required for next refactor.
---
 libavcodec/vulkan_av1.c    | 30 +++++++++++++++++++++---------
 libavcodec/vulkan_decode.c | 20 ++++++++++----------
 libavcodec/vulkan_decode.h | 13 +------------
 libavcodec/vulkan_h264.c   | 32 ++++++++++++++++++++++----------
 libavcodec/vulkan_hevc.c   | 28 ++++++++++++++++++++--------
 5 files changed, 74 insertions(+), 49 deletions(-)

diff --git a/libavcodec/vulkan_av1.c b/libavcodec/vulkan_av1.c
index 115db8badb..c4ae0bb2ab 100644
--- a/libavcodec/vulkan_av1.c
+++ b/libavcodec/vulkan_av1.c
@@ -66,6 +66,17 @@ typedef struct AV1VulkanDecodePicture {
     StdVideoDecodeAV1ReferenceInfo      std_refs  [AV1_NUM_REF_FRAMES];
     VkVideoDecodeAV1DpbSlotInfoKHR      vkav1_refs[AV1_NUM_REF_FRAMES];
 
+    /* Current picture */
+    VkVideoPictureResourceInfoKHR   ref;
+    VkVideoReferenceSlotInfoKHR     ref_slot;
+
+    /* Picture refs. H264 has the maximum number of refs (36) of any supported codec. */
+    VkVideoPictureResourceInfoKHR   refs     [36];
+    VkVideoReferenceSlotInfoKHR     ref_slots[36];
+
+    /* Main decoding struct */
+    VkVideoDecodeInfoKHR            decode_info;
+
     uint8_t frame_id_set;
     uint8_t frame_id;
     uint8_t ref_frame_sign_bias_mask;
@@ -295,7 +306,7 @@ static int vk_av1_start_frame(AVCodecContext          *avctx,
             continue;
 
         for (int j = 0; j < ref_count; j++) {
-            if (vp->ref_slots[j].slotIndex == hp->frame_id) {
+            if (ap->ref_slots[j].slotIndex == hp->frame_id) {
                 found = 1;
                 break;
             }
@@ -303,8 +314,8 @@ static int vk_av1_start_frame(AVCodecContext          *avctx,
         if (found)
             continue;
 
-        err = vk_av1_fill_pict(avctx, &ap->ref_src[ref_count], &vp->ref_slots[ref_count],
-                               &vp->refs[ref_count], &ap->std_refs[ref_count], &ap->vkav1_refs[ref_count],
+        err = vk_av1_fill_pict(avctx, &ap->ref_src[ref_count], &ap->ref_slots[ref_count],
+                               &ap->refs[ref_count], &ap->std_refs[ref_count], &ap->vkav1_refs[ref_count],
                                ref_frame, 0, 0, ref_frame->order_hints);
         if (err < 0)
             return err;
@@ -312,7 +323,7 @@ static int vk_av1_start_frame(AVCodecContext          *avctx,
         ref_count++;
     }
 
-    err = vk_av1_fill_pict(avctx, NULL, &vp->ref_slot, &vp->ref,
+    err = vk_av1_fill_pict(avctx, NULL, &ap->ref_slot, &ap->ref,
                            &ap->std_ref,
                            &ap->vkav1_ref,
                            pic, 1, apply_grain, NULL);
@@ -339,13 +350,13 @@ static int vk_av1_start_frame(AVCodecContext          *avctx,
             ap->av1_pic_info.referenceNameSlotIndices[i] = hp->frame_id;
     }
 
-    vp->decode_info = (VkVideoDecodeInfoKHR) {
+    ap->decode_info = (VkVideoDecodeInfoKHR) {
         .sType = VK_STRUCTURE_TYPE_VIDEO_DECODE_INFO_KHR,
         .pNext = &ap->av1_pic_info,
         .flags = 0x0,
-        .pSetupReferenceSlot = &vp->ref_slot,
+        .pSetupReferenceSlot = &ap->ref_slot,
         .referenceSlotCount = ref_count,
-        .pReferenceSlots = vp->ref_slots,
+        .pReferenceSlots = ap->ref_slots,
         .dstPictureResource = (VkVideoPictureResourceInfoKHR) {
             .sType = VK_STRUCTURE_TYPE_VIDEO_PICTURE_RESOURCE_INFO_KHR,
             .codedOffset = (VkOffset2D){ 0, 0 },
@@ -618,7 +629,7 @@ static int vk_av1_end_frame(AVCodecContext *avctx)
             return err;
     }
 
-    for (int i = 0; i < vp->decode_info.referenceSlotCount; i++) {
+    for (int i = 0; i < ap->decode_info.referenceSlotCount; i++) {
         const AV1Frame *rp = ap->ref_src[i];
         AV1VulkanDecodePicture *rhp = rp->hwaccel_picture_private;
 
@@ -629,7 +640,8 @@ static int vk_av1_end_frame(AVCodecContext *avctx)
     av_log(avctx, AV_LOG_VERBOSE, "Decoding frame, %"SIZE_SPECIFIER" bytes, %i tiles\n",
            vp->slices_size, ap->av1_pic_info.tileCount);
 
-    return ff_vk_decode_frame(avctx, pic->f, vp, rav, rvp);
+    return ff_vk_decode_frame(avctx, &ap->decode_info,
+                              pic->f, vp, rav, rvp);
 }
 
 static void vk_av1_free_frame_priv(AVRefStructOpaque _hwctx, void *data)
diff --git a/libavcodec/vulkan_decode.c b/libavcodec/vulkan_decode.c
index 48a206e3c0..058efe3037 100644
--- a/libavcodec/vulkan_decode.c
+++ b/libavcodec/vulkan_decode.c
@@ -354,7 +354,7 @@ void ff_vk_decode_flush(AVCodecContext *avctx)
     ff_vk_exec_submit(&ctx->s, exec);
 }
 
-int ff_vk_decode_frame(AVCodecContext *avctx,
+int ff_vk_decode_frame(AVCodecContext *avctx, VkVideoDecodeInfoKHR *decode_info,
                        AVFrame *pic,    FFVulkanDecodePicture *vp,
                        AVFrame *rpic[], FFVulkanDecodePicture *rvkp[])
 {
@@ -379,8 +379,8 @@ int ff_vk_decode_frame(AVCodecContext *avctx,
         .videoSessionParameters = dec->session_params ?
                                   *((VkVideoSessionParametersKHR *)dec->session_params->data) :
                                   VK_NULL_HANDLE,
-        .referenceSlotCount = vp->decode_info.referenceSlotCount,
-        .pReferenceSlots = vp->decode_info.pReferenceSlots,
+        .referenceSlotCount = decode_info->referenceSlotCount,
+        .pReferenceSlots = decode_info->pReferenceSlots,
     };
     VkVideoEndCodingInfoKHR decode_end = {
         .sType = VK_STRUCTURE_TYPE_VIDEO_END_CODING_INFO_KHR,
@@ -396,7 +396,7 @@ int ff_vk_decode_frame(AVCodecContext *avctx,
     /* The current decoding reference has to be bound as an inactive reference */
     VkVideoReferenceSlotInfoKHR *cur_vk_ref;
     cur_vk_ref = (void *)&decode_start.pReferenceSlots[decode_start.referenceSlotCount];
-    cur_vk_ref[0] = vp->ref_slot;
+    cur_vk_ref[0] = *decode_info->pSetupReferenceSlot;
     cur_vk_ref[0].slotIndex = -1;
     decode_start.referenceSlotCount++;
 
@@ -420,9 +420,9 @@ int ff_vk_decode_frame(AVCodecContext *avctx,
         }
     }
 
-    vp->decode_info.srcBuffer       = sd_buf->buf;
-    vp->decode_info.srcBufferOffset = 0;
-    vp->decode_info.srcBufferRange  = data_size;
+    decode_info->srcBuffer       = sd_buf->buf;
+    decode_info->srcBufferOffset = 0;
+    decode_info->srcBufferRange  = data_size;
 
     /* Start command buffer recording */
     err = ff_vk_exec_start(&ctx->s, exec);
@@ -488,7 +488,7 @@ int ff_vk_decode_frame(AVCodecContext *avctx,
     if (!layered_dpb) {
         /* All references (apart from the current) for non-layered refs */
 
-        for (int i = 0; i < vp->decode_info.referenceSlotCount; i++) {
+        for (int i = 0; i < decode_info->referenceSlotCount; i++) {
             AVFrame *ref_frame = rpic[i];
             FFVulkanDecodePicture *rvp = rvkp[i];
             AVFrame *ref = rvp->dpb_frame ? rvp->dpb_frame : ref_frame;
@@ -533,7 +533,7 @@ int ff_vk_decode_frame(AVCodecContext *avctx,
                                         &img_bar[nb_img_bar], &nb_img_bar);
             }
         }
-    } else if (vp->decode_info.referenceSlotCount ||
+    } else if (decode_info->referenceSlotCount ||
                vp->view.out[0] != vp->view.ref[0]) {
         /* Single barrier for a single layered ref */
         err = ff_vk_exec_add_dep_frame(&ctx->s, exec, ctx->common.layered_frame,
@@ -553,7 +553,7 @@ int ff_vk_decode_frame(AVCodecContext *avctx,
 
     /* Start, use parameters, decode and end decoding */
     vk->CmdBeginVideoCodingKHR(cmd_buf, &decode_start);
-    vk->CmdDecodeVideoKHR(cmd_buf, &vp->decode_info);
+    vk->CmdDecodeVideoKHR(cmd_buf, decode_info);
     vk->CmdEndVideoCodingKHR(cmd_buf, &decode_end);
 
     /* End recording and submit for execution */
diff --git a/libavcodec/vulkan_decode.h b/libavcodec/vulkan_decode.h
index 4bd755c1f6..6c3e1486b0 100644
--- a/libavcodec/vulkan_decode.h
+++ b/libavcodec/vulkan_decode.h
@@ -96,17 +96,6 @@ typedef struct FFVulkanDecodePicture {
     VkSemaphore                     sem;
     uint64_t                        sem_value;
 
-    /* Current picture */
-    VkVideoPictureResourceInfoKHR   ref;
-    VkVideoReferenceSlotInfoKHR     ref_slot;
-
-    /* Picture refs. H264 has the maximum number of refs (36) of any supported codec. */
-    VkVideoPictureResourceInfoKHR   refs     [36];
-    VkVideoReferenceSlotInfoKHR     ref_slots[36];
-
-    /* Main decoding struct */
-    VkVideoDecodeInfoKHR            decode_info;
-
     /* Slice data */
     AVBufferRef                    *slices_buf;
     size_t                          slices_size;
@@ -165,7 +154,7 @@ int ff_vk_decode_add_slice(AVCodecContext *avctx, FFVulkanDecodePicture *vp,
 /**
  * Decode a frame.
  */
-int ff_vk_decode_frame(AVCodecContext *avctx,
+int ff_vk_decode_frame(AVCodecContext *avctx, VkVideoDecodeInfoKHR *decode_info,
                        AVFrame *pic,    FFVulkanDecodePicture *vp,
                        AVFrame *rpic[], FFVulkanDecodePicture *rvkp[]);
 
diff --git a/libavcodec/vulkan_h264.c b/libavcodec/vulkan_h264.c
index d950c6948f..71a9c06801 100644
--- a/libavcodec/vulkan_h264.c
+++ b/libavcodec/vulkan_h264.c
@@ -47,6 +47,17 @@ typedef struct H264VulkanDecodePicture {
     /* Current picture (contd.) */
     StdVideoDecodeH264PictureInfo   h264pic;
     VkVideoDecodeH264PictureInfoKHR h264_pic_info;
+
+    /* Current picture */
+    VkVideoPictureResourceInfoKHR   ref;
+    VkVideoReferenceSlotInfoKHR     ref_slot;
+
+    /* Picture refs. H264 has the maximum number of refs (36) of any supported codec. */
+    VkVideoPictureResourceInfoKHR   refs     [36];
+    VkVideoReferenceSlotInfoKHR     ref_slots[36];
+
+    /* Main decoding struct */
+    VkVideoDecodeInfoKHR            decode_info;
 } H264VulkanDecodePicture;
 
 const static int h264_scaling_list8_order[] = { 0, 3, 1, 4, 2, 5 };
@@ -380,7 +391,7 @@ static int vk_h264_start_frame(AVCodecContext          *avctx,
         }
     }
 
-    err = vk_h264_fill_pict(avctx, NULL, &vp->ref_slot, &vp->ref,
+    err = vk_h264_fill_pict(avctx, NULL, &hp->ref_slot, &hp->ref,
                             &hp->vkh264_ref, &hp->h264_ref, pic, 1,
                             h->DPB[dpb_slot_index].field_picture,
                             h->DPB[dpb_slot_index].reference,
@@ -397,8 +408,8 @@ static int vk_h264_start_frame(AVCodecContext          *avctx,
                 break;
             }
         }
-        err = vk_h264_fill_pict(avctx, &hp->ref_src[i], &vp->ref_slots[i],
-                                &vp->refs[i], &hp->vkh264_refs[i],
+        err = vk_h264_fill_pict(avctx, &hp->ref_src[i], &hp->ref_slots[i],
+                                &hp->refs[i], &hp->vkh264_refs[i],
                                 &hp->h264_refs[i], h->short_ref[i], 0,
                                 h->DPB[dpb_slot_index].field_picture,
                                 h->DPB[dpb_slot_index].reference,
@@ -420,8 +431,8 @@ static int vk_h264_start_frame(AVCodecContext          *avctx,
                 break;
             }
         }
-        err = vk_h264_fill_pict(avctx, &hp->ref_src[i], &vp->ref_slots[i],
-                                &vp->refs[i], &hp->vkh264_refs[i],
+        err = vk_h264_fill_pict(avctx, &hp->ref_src[i], &hp->ref_slots[i],
+                                &hp->refs[i], &hp->vkh264_refs[i],
                                 &hp->h264_refs[i], h->long_ref[r], 0,
                                 h->DPB[dpb_slot_index].field_picture,
                                 h->DPB[dpb_slot_index].reference,
@@ -454,13 +465,13 @@ static int vk_h264_start_frame(AVCodecContext          *avctx,
         .pStdPictureInfo = &hp->h264pic,
     };
 
-    vp->decode_info = (VkVideoDecodeInfoKHR) {
+    hp->decode_info = (VkVideoDecodeInfoKHR) {
         .sType = VK_STRUCTURE_TYPE_VIDEO_DECODE_INFO_KHR,
         .pNext = &hp->h264_pic_info,
         .flags = 0x0,
-        .pSetupReferenceSlot = &vp->ref_slot,
+        .pSetupReferenceSlot = &hp->ref_slot,
         .referenceSlotCount = h->short_ref_count + h->long_ref_count,
-        .pReferenceSlots = vp->ref_slots,
+        .pReferenceSlots = hp->ref_slots,
         .dstPictureResource = (VkVideoPictureResourceInfoKHR) {
             .sType = VK_STRUCTURE_TYPE_VIDEO_PICTURE_RESOURCE_INFO_KHR,
             .codedOffset = (VkOffset2D){ 0, 0 },
@@ -545,7 +556,7 @@ static int vk_h264_end_frame(AVCodecContext *avctx)
         hp->h264pic.pic_parameter_set_id = pic->pps->pps_id;
     }
 
-    for (int i = 0; i < vp->decode_info.referenceSlotCount; i++) {
+    for (int i = 0; i < hp->decode_info.referenceSlotCount; i++) {
         H264Picture *rp = hp->ref_src[i];
         H264VulkanDecodePicture *rhp = rp->hwaccel_picture_private;
 
@@ -556,7 +567,8 @@ static int vk_h264_end_frame(AVCodecContext *avctx)
     av_log(avctx, AV_LOG_VERBOSE, "Decoding frame, %"SIZE_SPECIFIER" bytes, %i slices\n",
            vp->slices_size, hp->h264_pic_info.sliceCount);
 
-    return ff_vk_decode_frame(avctx, pic->f, vp, rav, rvp);
+    return ff_vk_decode_frame(avctx, &hp->decode_info,
+                              pic->f, vp, rav, rvp);
 }
 
 static void vk_h264_free_frame_priv(AVRefStructOpaque _hwctx, void *data)
diff --git a/libavcodec/vulkan_hevc.c b/libavcodec/vulkan_hevc.c
index bc43591e19..e83f8346a0 100644
--- a/libavcodec/vulkan_hevc.c
+++ b/libavcodec/vulkan_hevc.c
@@ -127,6 +127,17 @@ typedef struct HEVCVulkanDecodePicture {
     /* Current picture (contd.) */
     StdVideoDecodeH265PictureInfo   h265pic;
     VkVideoDecodeH265PictureInfoKHR h265_pic_info;
+
+    /* Current picture */
+    VkVideoPictureResourceInfoKHR   ref;
+    VkVideoReferenceSlotInfoKHR     ref_slot;
+
+    /* Picture refs. H264 has the maximum number of refs (36) of any supported codec. */
+    VkVideoPictureResourceInfoKHR   refs     [36];
+    VkVideoReferenceSlotInfoKHR     ref_slots[36];
+
+    /* Main decoding struct */
+    VkVideoDecodeInfoKHR            decode_info;
 } HEVCVulkanDecodePicture;
 
 static int vk_hevc_fill_pict(AVCodecContext *avctx, HEVCFrame **ref_src,
@@ -749,7 +760,7 @@ static int vk_hevc_start_frame(AVCodecContext          *avctx,
             continue;
 
         if (ref == pic) {
-            err = vk_hevc_fill_pict(avctx, NULL, &vp->ref_slot, &vp->ref,
+            err = vk_hevc_fill_pict(avctx, NULL, &hp->ref_slot, &hp->ref,
                                     &hp->vkh265_ref, &hp->h265_ref, pic, 1, i);
             if (err < 0)
                 return err;
@@ -757,8 +768,8 @@ static int vk_hevc_start_frame(AVCodecContext          *avctx,
             continue;
         }
 
-        err = vk_hevc_fill_pict(avctx, &hp->ref_src[idx], &vp->ref_slots[idx],
-                                &vp->refs[idx], &hp->vkh265_refs[idx],
+        err = vk_hevc_fill_pict(avctx, &hp->ref_src[idx], &hp->ref_slots[idx],
+                                &hp->refs[idx], &hp->vkh265_refs[idx],
                                 &hp->h265_refs[idx], (HEVCFrame *)ref, 0, i);
         if (err < 0)
             return err;
@@ -806,13 +817,13 @@ static int vk_hevc_start_frame(AVCodecContext          *avctx,
         .sliceSegmentCount = 0,
     };
 
-    vp->decode_info = (VkVideoDecodeInfoKHR) {
+    hp->decode_info = (VkVideoDecodeInfoKHR) {
         .sType = VK_STRUCTURE_TYPE_VIDEO_DECODE_INFO_KHR,
         .pNext = &hp->h265_pic_info,
         .flags = 0x0,
-        .pSetupReferenceSlot = &vp->ref_slot,
+        .pSetupReferenceSlot = &hp->ref_slot,
         .referenceSlotCount = nb_refs,
-        .pReferenceSlots = vp->ref_slots,
+        .pReferenceSlots = hp->ref_slots,
         .dstPictureResource = (VkVideoPictureResourceInfoKHR) {
             .sType = VK_STRUCTURE_TYPE_VIDEO_PICTURE_RESOURCE_INFO_KHR,
             .codedOffset = (VkOffset2D){ 0, 0 },
@@ -915,7 +926,7 @@ static int vk_hevc_end_frame(AVCodecContext *avctx)
         hp->h265pic.pps_pic_parameter_set_id = pps->pps_id;
     }
 
-    for (int i = 0; i < vp->decode_info.referenceSlotCount; i++) {
+    for (int i = 0; i < hp->decode_info.referenceSlotCount; i++) {
         HEVCVulkanDecodePicture *rfhp = hp->ref_src[i]->hwaccel_picture_private;
         rav[i] = hp->ref_src[i]->f;
         rvp[i] = &rfhp->vp;
@@ -924,7 +935,8 @@ static int vk_hevc_end_frame(AVCodecContext *avctx)
     av_log(avctx, AV_LOG_VERBOSE, "Decoding frame, %"SIZE_SPECIFIER" bytes, %i slices\n",
            vp->slices_size, hp->h265_pic_info.sliceSegmentCount);
 
-    return ff_vk_decode_frame(avctx, pic->f, vp, rav, rvp);
+    return ff_vk_decode_frame(avctx, &hp->decode_info,
+                              pic->f, vp, rav, rvp);
 }
 
 static void vk_hevc_free_frame_priv(AVRefStructOpaque _hwctx, void *data)
-- 
2.49.0
_______________________________________________
ffmpeg-devel mailing list
ffmpeg-devel@ffmpeg.org
https://ffmpeg.org/mailman/listinfo/ffmpeg-devel

To unsubscribe, visit link above, or email
ffmpeg-devel-request@ffmpeg.org with subject "unsubscribe".

^ permalink raw reply	[flat|nested] 6+ messages in thread

* [FFmpeg-devel] [PATCH 4/6] vulkan_decode: add a generic start_frame function
  2025-03-31  2:37 [FFmpeg-devel] [PATCH 1/6] vulkan_decode: generalize handling of slice offsets/nb Lynne
  2025-03-31  2:37 ` [FFmpeg-devel] [PATCH 2/6] vulkan_decode: only create sequence params in end_frame Lynne
  2025-03-31  2:37 ` [FFmpeg-devel] [PATCH 3/6] vulkan_decode: move temporary Vulkan structs into each codec Lynne
@ 2025-03-31  2:37 ` Lynne
  2025-03-31  2:37 ` [FFmpeg-devel] [PATCH 5/6] vulkan_h264: make all temporary structs temporary Lynne
  2025-03-31  2:37 ` [FFmpeg-devel] [PATCH 6/6] vulkan_hevc: " Lynne
  4 siblings, 0 replies; 6+ messages in thread
From: Lynne @ 2025-03-31  2:37 UTC (permalink / raw)
  To: ffmpeg-devel; +Cc: Lynne

---
 libavcodec/vulkan_decode.c | 38 ++++++++++++++++++++++++++++++++++----
 libavcodec/vulkan_decode.h |  6 ++++++
 2 files changed, 40 insertions(+), 4 deletions(-)

diff --git a/libavcodec/vulkan_decode.c b/libavcodec/vulkan_decode.c
index 058efe3037..893f8fca3d 100644
--- a/libavcodec/vulkan_decode.c
+++ b/libavcodec/vulkan_decode.c
@@ -151,8 +151,6 @@ int ff_vk_decode_prepare_frame(FFVulkanDecodeContext *dec, AVFrame *pic,
     int err;
     FFVulkanDecodeShared *ctx = dec->shared_ctx;
 
-    vkpic->slices_size = 0;
-
     /* If the decoder made a blank frame to make up for a missing ref, or the
      * frame is the current frame so it's missing one, create a re-representation */
     if (vkpic->view.ref[0])
@@ -209,8 +207,6 @@ int ff_vk_decode_prepare_frame_sdr(FFVulkanDecodeContext *dec, AVFrame *pic,
     FFVulkanDecodeShared *ctx = dec->shared_ctx;
     AVHWFramesContext *frames = (AVHWFramesContext *)pic->hw_frames_ctx->data;
 
-    vkpic->slices_size = 0;
-
     if (vkpic->view.ref[0])
         return 0;
 
@@ -248,6 +244,31 @@ int ff_vk_decode_prepare_frame_sdr(FFVulkanDecodeContext *dec, AVFrame *pic,
     return 0;
 }
 
+int ff_vk_decode_start_frame(AVCodecContext *avctx, FFVulkanDecodePicture *vp,
+                             const AVBufferRef *buffer_ref, int complete)
+{
+    int err;
+    FFVulkanDecodeContext *dec = avctx->internal->hwaccel_priv_data;
+    FFVulkanDecodeShared *ctx = dec->shared_ctx;
+
+    vp->nb_slices = 0;
+    vp->slices_size = 0;
+
+    /* Host map the input slices data if supported */
+    if (complete && ctx->s.extensions & FF_VK_EXT_EXTERNAL_HOST_MEMORY) {
+        err = ff_vk_host_map_buffer(&ctx->s, &vp->slices_buf, buffer_ref->data,
+                                    buffer_ref,
+                                    DECODER_IS_SDR(avctx->codec_id) ?
+                                    (VK_BUFFER_USAGE_STORAGE_BUFFER_BIT |
+                                     VK_BUFFER_USAGE_SHADER_DEVICE_ADDRESS_BIT) :
+                                    VK_BUFFER_USAGE_VIDEO_DECODE_SRC_BIT_KHR);
+        if (err < 0)
+            return err;
+    }
+
+    return 0;
+}
+
 int ff_vk_decode_add_slice(AVCodecContext *avctx, FFVulkanDecodePicture *vp,
                            const uint8_t *data, size_t size, int add_startcode)
 {
@@ -268,6 +289,15 @@ int ff_vk_decode_add_slice(AVCodecContext *avctx, FFVulkanDecodePicture *vp,
         return AVERROR(EINVAL);
 
     vkbuf = vp->slices_buf ? (FFVkBuffer *)vp->slices_buf->data : NULL;
+
+    /* Buffer exists, and is a single complete host-mapped buffer. */
+    if (vkbuf && vkbuf->host_ref) {
+        vp->slice_offsets[vp->nb_slices] = vp->slices_size;
+        vp->nb_slices = vp->nb_slices + 1;
+        vp->slices_size += startcode_len + size;
+        return 0;
+    }
+
     if (!vkbuf || vkbuf->size < new_size) {
         int err;
         AVBufferRef *new_ref;
diff --git a/libavcodec/vulkan_decode.h b/libavcodec/vulkan_decode.h
index 6c3e1486b0..103be09943 100644
--- a/libavcodec/vulkan_decode.h
+++ b/libavcodec/vulkan_decode.h
@@ -145,6 +145,12 @@ int ff_vk_decode_prepare_frame_sdr(FFVulkanDecodeContext *dec, AVFrame *pic,
                                    FFVulkanDecodePicture *vkpic, int is_current,
                                    enum FFVkShaderRepFormat rep_fmt, int alloc_dpb);
 
+/**
+ * Generic start_frame function.
+ */
+int ff_vk_decode_start_frame(AVCodecContext *avctx, FFVulkanDecodePicture *vp,
+                             const AVBufferRef *buffer_ref, int complete);
+
 /**
  * Add slice data to frame.
  */
-- 
2.49.0
_______________________________________________
ffmpeg-devel mailing list
ffmpeg-devel@ffmpeg.org
https://ffmpeg.org/mailman/listinfo/ffmpeg-devel

To unsubscribe, visit link above, or email
ffmpeg-devel-request@ffmpeg.org with subject "unsubscribe".

^ permalink raw reply	[flat|nested] 6+ messages in thread

* [FFmpeg-devel] [PATCH 5/6] vulkan_h264: make all temporary structs temporary
  2025-03-31  2:37 [FFmpeg-devel] [PATCH 1/6] vulkan_decode: generalize handling of slice offsets/nb Lynne
                   ` (2 preceding siblings ...)
  2025-03-31  2:37 ` [FFmpeg-devel] [PATCH 4/6] vulkan_decode: add a generic start_frame function Lynne
@ 2025-03-31  2:37 ` Lynne
  2025-03-31  2:37 ` [FFmpeg-devel] [PATCH 6/6] vulkan_hevc: " Lynne
  4 siblings, 0 replies; 6+ messages in thread
From: Lynne @ 2025-03-31  2:37 UTC (permalink / raw)
  To: ffmpeg-devel; +Cc: Lynne

This commit moves all temporary structs used for decoding out
of the common picture header and onto stack.
---
 libavcodec/vulkan_decode.c |   1 +
 libavcodec/vulkan_decode.h |   3 +
 libavcodec/vulkan_h264.c   | 322 +++++++++++++++++++------------------
 3 files changed, 168 insertions(+), 158 deletions(-)

diff --git a/libavcodec/vulkan_decode.c b/libavcodec/vulkan_decode.c
index 893f8fca3d..5505fbda28 100644
--- a/libavcodec/vulkan_decode.c
+++ b/libavcodec/vulkan_decode.c
@@ -253,6 +253,7 @@ int ff_vk_decode_start_frame(AVCodecContext *avctx, FFVulkanDecodePicture *vp,
 
     vp->nb_slices = 0;
     vp->slices_size = 0;
+    vp->intra_pic_flag = 1;
 
     /* Host map the input slices data if supported */
     if (complete && ctx->s.extensions & FF_VK_EXT_EXTERNAL_HOST_MEMORY) {
diff --git a/libavcodec/vulkan_decode.h b/libavcodec/vulkan_decode.h
index 103be09943..5b14d962f2 100644
--- a/libavcodec/vulkan_decode.h
+++ b/libavcodec/vulkan_decode.h
@@ -105,6 +105,9 @@ typedef struct FFVulkanDecodePicture {
     /* Vulkan functions needed for destruction, as no other context is guaranteed to exist */
     PFN_vkWaitSemaphores            wait_semaphores;
     PFN_vkDestroyImageView          destroy_image_view;
+
+    /* Codec specific */
+    int intra_pic_flag; /* Only used by H264 */
 } FFVulkanDecodePicture;
 
 /**
diff --git a/libavcodec/vulkan_h264.c b/libavcodec/vulkan_h264.c
index 71a9c06801..e697583ba9 100644
--- a/libavcodec/vulkan_h264.c
+++ b/libavcodec/vulkan_h264.c
@@ -32,99 +32,8 @@ const FFVulkanDecodeDescriptor ff_vk_dec_h264_desc = {
     },
 };
 
-typedef struct H264VulkanDecodePicture {
-    FFVulkanDecodePicture           vp;
-
-    /* Current picture */
-    StdVideoDecodeH264ReferenceInfo h264_ref;
-    VkVideoDecodeH264DpbSlotInfoKHR vkh264_ref;
-
-    /* Picture refs */
-    H264Picture                    *ref_src    [H264_MAX_PICTURE_COUNT];
-    StdVideoDecodeH264ReferenceInfo h264_refs  [H264_MAX_PICTURE_COUNT];
-    VkVideoDecodeH264DpbSlotInfoKHR vkh264_refs[H264_MAX_PICTURE_COUNT];
-
-    /* Current picture (contd.) */
-    StdVideoDecodeH264PictureInfo   h264pic;
-    VkVideoDecodeH264PictureInfoKHR h264_pic_info;
-
-    /* Current picture */
-    VkVideoPictureResourceInfoKHR   ref;
-    VkVideoReferenceSlotInfoKHR     ref_slot;
-
-    /* Picture refs. H264 has the maximum number of refs (36) of any supported codec. */
-    VkVideoPictureResourceInfoKHR   refs     [36];
-    VkVideoReferenceSlotInfoKHR     ref_slots[36];
-
-    /* Main decoding struct */
-    VkVideoDecodeInfoKHR            decode_info;
-} H264VulkanDecodePicture;
-
 const static int h264_scaling_list8_order[] = { 0, 3, 1, 4, 2, 5 };
 
-static int vk_h264_fill_pict(AVCodecContext *avctx, H264Picture **ref_src,
-                             VkVideoReferenceSlotInfoKHR *ref_slot,       /* Main structure */
-                             VkVideoPictureResourceInfoKHR *ref,          /* Goes in ^ */
-                             VkVideoDecodeH264DpbSlotInfoKHR *vkh264_ref, /* Goes in ^ */
-                             StdVideoDecodeH264ReferenceInfo *h264_ref,   /* Goes in ^ */
-                             H264Picture *pic, int is_current,
-                             int is_field, int picture_structure,
-                             int dpb_slot_index)
-{
-    FFVulkanDecodeContext *dec = avctx->internal->hwaccel_priv_data;
-    FFVulkanDecodeShared *ctx = dec->shared_ctx;
-    H264VulkanDecodePicture *hp = pic->hwaccel_picture_private;
-    FFVulkanDecodePicture *vkpic = &hp->vp;
-
-    int err = ff_vk_decode_prepare_frame(dec, pic->f, vkpic, is_current,
-                                         dec->dedicated_dpb);
-    if (err < 0)
-        return err;
-
-    *h264_ref = (StdVideoDecodeH264ReferenceInfo) {
-        .FrameNum = pic->long_ref ? pic->pic_id : pic->frame_num,
-        .PicOrderCnt = { pic->field_poc[0], pic->field_poc[1] },
-        .flags = (StdVideoDecodeH264ReferenceInfoFlags) {
-            .top_field_flag    = is_field ? !!(picture_structure & PICT_TOP_FIELD)    : 0,
-            .bottom_field_flag = is_field ? !!(picture_structure & PICT_BOTTOM_FIELD) : 0,
-            .used_for_long_term_reference = pic->reference && pic->long_ref,
-            /*
-             * flags.is_non_existing is used to indicate whether the picture is marked as
-             * “non-existing” as defined in section 8.2.5.2 of the ITU-T H.264 Specification;
-             * 8.2.5.2 Decoding process for gaps in frame_num
-             * corresponds to the code in h264_slice.c:h264_field_start,
-             * which sets the invalid_gap flag when decoding.
-             */
-            .is_non_existing = pic->invalid_gap,
-        },
-    };
-
-    *vkh264_ref = (VkVideoDecodeH264DpbSlotInfoKHR) {
-        .sType = VK_STRUCTURE_TYPE_VIDEO_DECODE_H264_DPB_SLOT_INFO_KHR,
-        .pStdReferenceInfo = h264_ref,
-    };
-
-    *ref = (VkVideoPictureResourceInfoKHR) {
-        .sType = VK_STRUCTURE_TYPE_VIDEO_PICTURE_RESOURCE_INFO_KHR,
-        .codedOffset = (VkOffset2D){ 0, 0 },
-        .codedExtent = (VkExtent2D){ pic->f->width, pic->f->height },
-        .baseArrayLayer = ctx->common.layered_dpb ? dpb_slot_index : 0,
-        .imageViewBinding = vkpic->view.ref[0],
-    };
-
-    *ref_slot = (VkVideoReferenceSlotInfoKHR) {
-        .sType = VK_STRUCTURE_TYPE_VIDEO_REFERENCE_SLOT_INFO_KHR,
-        .pNext = vkh264_ref,
-        .slotIndex = dpb_slot_index,
-        .pPictureResource = ref,
-    };
-
-    if (ref_src)
-        *ref_src = pic;
-
-    return 0;
-}
-
 static StdVideoH264LevelIdc convert_to_vk_level_idc(int level_idc)
 {
     switch (level_idc) {
@@ -369,18 +278,124 @@ static int vk_h264_create_params(AVCodecContext *avctx, AVBufferRef **buf)
     return 0;
 }
 
+static int vk_h264_fill_pict(AVCodecContext *avctx, H264Picture **ref_src,
+                             VkVideoReferenceSlotInfoKHR *ref_slot,       /* Main structure */
+                             VkVideoPictureResourceInfoKHR *ref,          /* Goes in ^ */
+                             VkVideoDecodeH264DpbSlotInfoKHR *vkh264_ref, /* Goes in ^ */
+                             StdVideoDecodeH264ReferenceInfo *h264_ref,   /* Goes in ^ */
+                             H264Picture *pic, int is_current,
+                             int is_field, int picture_structure,
+                             int dpb_slot_index)
+{
+    FFVulkanDecodeContext *dec = avctx->internal->hwaccel_priv_data;
+    FFVulkanDecodeShared *ctx = dec->shared_ctx;
+    FFVulkanDecodePicture *vkpic = pic->hwaccel_picture_private;
+
+    int err = ff_vk_decode_prepare_frame(dec, pic->f, vkpic, is_current,
+                                         dec->dedicated_dpb);
+    if (err < 0)
+        return err;
+
+    *h264_ref = (StdVideoDecodeH264ReferenceInfo) {
+        .FrameNum = pic->long_ref ? pic->pic_id : pic->frame_num,
+        .PicOrderCnt = { pic->field_poc[0], pic->field_poc[1] },
+        .flags = (StdVideoDecodeH264ReferenceInfoFlags) {
+            .top_field_flag    = is_field ? !!(picture_structure & PICT_TOP_FIELD)    : 0,
+            .bottom_field_flag = is_field ? !!(picture_structure & PICT_BOTTOM_FIELD) : 0,
+            .used_for_long_term_reference = pic->reference && pic->long_ref,
+            /*
+             * flags.is_non_existing is used to indicate whether the picture is marked as
+             * “non-existing” as defined in section 8.2.5.2 of the ITU-T H.264 Specification;
+             * 8.2.5.2 Decoding process for gaps in frame_num
+             * corresponds to the code in h264_slice.c:h264_field_start,
+             * which sets the invalid_gap flag when decoding.
+             */
+            .is_non_existing = pic->invalid_gap,
+        },
+    };
+
+    *vkh264_ref = (VkVideoDecodeH264DpbSlotInfoKHR) {
+        .sType = VK_STRUCTURE_TYPE_VIDEO_DECODE_H264_DPB_SLOT_INFO_KHR,
+        .pStdReferenceInfo = h264_ref,
+    };
+
+    *ref = (VkVideoPictureResourceInfoKHR) {
+        .sType = VK_STRUCTURE_TYPE_VIDEO_PICTURE_RESOURCE_INFO_KHR,
+        .codedOffset = (VkOffset2D){ 0, 0 },
+        .codedExtent = (VkExtent2D){ pic->f->width, pic->f->height },
+        .baseArrayLayer = ctx->common.layered_dpb ? dpb_slot_index : 0,
+        .imageViewBinding = vkpic->view.ref[0],
+    };
+
+    *ref_slot = (VkVideoReferenceSlotInfoKHR) {
+        .sType = VK_STRUCTURE_TYPE_VIDEO_REFERENCE_SLOT_INFO_KHR,
+        .pNext = vkh264_ref,
+        .slotIndex = dpb_slot_index,
+        .pPictureResource = ref,
+    };
+
+    if (ref_src)
+        *ref_src = pic;
+
+    return 0;
+}
+
 static int vk_h264_start_frame(AVCodecContext          *avctx,
                                av_unused const AVBufferRef *buffer_ref,
                                av_unused const uint8_t *buffer,
                                av_unused uint32_t       size)
+{
+    const H264Context *h = avctx->priv_data;
+    H264Picture *pic = h->cur_pic_ptr;
+    FFVulkanDecodePicture *vp = pic->hwaccel_picture_private;
+
+    return ff_vk_decode_start_frame(avctx, vp, buffer_ref, 0);
+}
+
+typedef struct H264VulkanDecodeParams {
+    /* Current picture */
+    StdVideoDecodeH264ReferenceInfo h264_ref;
+    VkVideoDecodeH264DpbSlotInfoKHR vkh264_ref;
+
+    /* Picture refs */
+    H264Picture                    *ref_src    [H264_MAX_PICTURE_COUNT];
+    StdVideoDecodeH264ReferenceInfo h264_refs  [H264_MAX_PICTURE_COUNT];
+    VkVideoDecodeH264DpbSlotInfoKHR vkh264_refs[H264_MAX_PICTURE_COUNT];
+
+    /* Current picture (contd.) */
+    StdVideoDecodeH264PictureInfo   h264pic;
+    VkVideoDecodeH264PictureInfoKHR h264_pic_info;
+
+    /* Current picture */
+    VkVideoPictureResourceInfoKHR   ref;
+    VkVideoReferenceSlotInfoKHR     ref_slot;
+
+    /* Picture refs. H264 has the maximum number of refs (36) of any supported codec. */
+    VkVideoPictureResourceInfoKHR   refs     [36];
+    VkVideoReferenceSlotInfoKHR     ref_slots[36];
+
+    /* Maintenance 2 */
+#ifdef VK_KHR_video_maintenance2
+    StdVideoH264ScalingLists vksps_scaling;
+    StdVideoH264HrdParameters vksps_vui_header;
+    StdVideoH264SequenceParameterSetVui vksps_vui;
+    StdVideoH264SequenceParameterSet vksps;
+    StdVideoH264ScalingLists vkpps_scaling;
+    StdVideoH264PictureParameterSet vkpps;
+    VkVideoDecodeH264InlineSessionParametersInfoKHR h264_params;
+#endif
+
+    /* Main decoding struct */
+    VkVideoDecodeInfoKHR            decode_info;
+} H264VulkanDecodeParams;
+
+static int vk_h264_fill_params(AVCodecContext *avctx, FFVulkanDecodePicture *vp,
+                               H264VulkanDecodeParams *hp)
 {
     int err;
     int dpb_slot_index = 0;
     H264Context *h = avctx->priv_data;
-
     H264Picture *pic = h->cur_pic_ptr;
-    H264VulkanDecodePicture *hp = pic->hwaccel_picture_private;
-    FFVulkanDecodePicture *vp = &hp->vp;
 
     /* Fill in main slot */
     dpb_slot_index = 0;
@@ -445,13 +460,13 @@ static int vk_h264_start_frame(AVCodecContext          *avctx,
     hp->h264pic = (StdVideoDecodeH264PictureInfo) {
         .seq_parameter_set_id = pic->pps->sps_id,
         .pic_parameter_set_id = pic->pps->pps_id,
-        .frame_num = 0,  /* Set later */
-        .idr_pic_id = 0, /* Set later */
+        .frame_num = h->slice_ctx[0].frame_num,
+        .idr_pic_id = h->slice_ctx[0].idr_pic_id,
         .PicOrderCnt[0] = pic->field_poc[0],
         .PicOrderCnt[1] = pic->field_poc[1],
         .flags = (StdVideoDecodeH264PictureInfoFlags) {
+            .is_intra = vp->intra_pic_flag,
             .field_pic_flag = FIELD_PICTURE(h),
-            .is_intra = 1, /* Set later */
             .IdrPicFlag = h->picture_idr,
             .bottom_field_flag = h->picture_structure != PICT_FRAME &&
                                  h->picture_structure & PICT_BOTTOM_FIELD,
@@ -463,6 +478,8 @@ static int vk_h264_start_frame(AVCodecContext          *avctx,
     hp->h264_pic_info = (VkVideoDecodeH264PictureInfoKHR) {
         .sType = VK_STRUCTURE_TYPE_VIDEO_DECODE_H264_PICTURE_INFO_KHR,
         .pStdPictureInfo = &hp->h264pic,
+        .pSliceOffsets = vp->slice_offsets,
+        .sliceCount = vp->nb_slices,
     };
 
     hp->decode_info = (VkVideoDecodeInfoKHR) {
@@ -484,100 +501,89 @@ static int vk_h264_start_frame(AVCodecContext          *avctx,
     return 0;
 }
 
-static int vk_h264_decode_slice(AVCodecContext *avctx,
-                                const uint8_t  *data,
-                                uint32_t        size)
-{
-    const H264Context *h = avctx->priv_data;
-    const H264SliceContext *sl  = &h->slice_ctx[0];
-    H264VulkanDecodePicture *hp = h->cur_pic_ptr->hwaccel_picture_private;
-    FFVulkanDecodePicture *vp = &hp->vp;
-
-    int err = ff_vk_decode_add_slice(avctx, vp, data, size, 1);
-    if (err < 0)
-        return err;
-
-    hp->h264pic.frame_num = sl->frame_num;
-    hp->h264pic.idr_pic_id = sl->idr_pic_id;
-
-    /* Frame is only intra of all slices are marked as intra */
-    if (sl->slice_type != AV_PICTURE_TYPE_I && sl->slice_type != AV_PICTURE_TYPE_SI)
-        hp->h264pic.flags.is_intra = 0;
-
-    return 0;
-}
-
 static int vk_h264_end_frame(AVCodecContext *avctx)
 {
+    int err;
     const H264Context *h = avctx->priv_data;
     FFVulkanDecodeContext *dec = avctx->internal->hwaccel_priv_data;
     FFVulkanDecodeShared *ctx = dec->shared_ctx;
 
     H264Picture *pic = h->cur_pic_ptr;
-    H264VulkanDecodePicture *hp = pic->hwaccel_picture_private;
-    FFVulkanDecodePicture *vp = &hp->vp;
+    FFVulkanDecodePicture *vp = pic->hwaccel_picture_private;
     FFVulkanDecodePicture *rvp[H264_MAX_PICTURE_COUNT] = { 0 };
     AVFrame *rav[H264_MAX_PICTURE_COUNT] = { 0 };
 
-#ifdef VK_KHR_video_maintenance2
-    StdVideoH264ScalingLists vksps_scaling;
-    StdVideoH264HrdParameters vksps_vui_header;
-    StdVideoH264SequenceParameterSetVui vksps_vui;
-    StdVideoH264SequenceParameterSet vksps;
-    StdVideoH264ScalingLists vkpps_scaling;
-    StdVideoH264PictureParameterSet vkpps;
-    VkVideoDecodeH264InlineSessionParametersInfoKHR h264_params;
+    H264VulkanDecodeParams hp = { 0 };
+
+    if (!vp->nb_slices)
+        return 0;
+
+    err = vk_h264_fill_params(avctx, vp, &hp);
+    if (err < 0)
+        return err;
 
+#ifdef VK_KHR_video_maintenance2
     if (ctx->s.extensions & FF_VK_EXT_VIDEO_MAINTENANCE_2) {
-        set_sps(h->ps.sps, &vksps_scaling,
-                &vksps_vui_header, &vksps_vui, &vksps);
-        set_pps(h->ps.pps, h->ps.sps, &vkpps_scaling, &vkpps);
-        h264_params = (VkVideoDecodeH264InlineSessionParametersInfoKHR) {
+        set_sps(h->ps.sps, &hp.vksps_scaling,
+                &hp.vksps_vui_header, &hp.vksps_vui, &hp.vksps);
+        set_pps(h->ps.pps, h->ps.sps, &hp.vkpps_scaling, &hp.vkpps);
+        hp.h264_params = (VkVideoDecodeH264InlineSessionParametersInfoKHR) {
             .sType = VK_STRUCTURE_TYPE_VIDEO_DECODE_H264_INLINE_SESSION_PARAMETERS_INFO_KHR,
-            .pStdSPS = &vksps,
-            .pStdPPS = &vkpps,
+            .pStdSPS = &hp.vksps,
+            .pStdPPS = &hp.vkpps,
         };
-        hp->h264_pic_info.pNext = &h264_params;
-    }
+        hp.h264_pic_info.pNext = &hp.h264_params;
+    } else
 #endif
 
-    hp->h264_pic_info.pSliceOffsets = vp->slice_offsets;
-    hp->h264_pic_info.sliceCount = vp->nb_slices;
-    if (!hp->h264_pic_info.sliceCount)
-        return 0;
-
-    if (!dec->session_params &&
-        !(ctx->s.extensions & FF_VK_EXT_VIDEO_MAINTENANCE_2)) {
+    if (!dec->session_params) {
         int err = vk_h264_create_params(avctx, &dec->session_params);
         if (err < 0)
             return err;
 
-        hp->h264pic.seq_parameter_set_id = pic->pps->sps_id;
-        hp->h264pic.pic_parameter_set_id = pic->pps->pps_id;
+        hp.h264pic.seq_parameter_set_id = pic->pps->sps_id;
+        hp.h264pic.pic_parameter_set_id = pic->pps->pps_id;
     }
 
-    for (int i = 0; i < hp->decode_info.referenceSlotCount; i++) {
-        H264Picture *rp = hp->ref_src[i];
-        H264VulkanDecodePicture *rhp = rp->hwaccel_picture_private;
-
-        rvp[i] = &rhp->vp;
-        rav[i] = hp->ref_src[i]->f;
+    for (int i = 0; i < hp.decode_info.referenceSlotCount; i++) {
+        H264Picture *rp = hp.ref_src[i];
+        rvp[i] = rp->hwaccel_picture_private;
+        rav[i] = hp.ref_src[i]->f;
     }
 
     av_log(avctx, AV_LOG_VERBOSE, "Decoding frame, %"SIZE_SPECIFIER" bytes, %i slices\n",
-           vp->slices_size, hp->h264_pic_info.sliceCount);
+           vp->slices_size, hp.h264_pic_info.sliceCount);
 
-    return ff_vk_decode_frame(avctx, &hp->decode_info,
+    return ff_vk_decode_frame(avctx, &hp.decode_info,
                               pic->f, vp, rav, rvp);
 }
 
+static int vk_h264_decode_slice(AVCodecContext *avctx,
+                                const uint8_t  *data,
+                                uint32_t        size)
+{
+    const H264Context *h = avctx->priv_data;
+    const H264SliceContext *sl  = &h->slice_ctx[0];
+    FFVulkanDecodePicture *vp = h->cur_pic_ptr->hwaccel_picture_private;
+
+    int err = ff_vk_decode_add_slice(avctx, vp, data, size, 1);
+    if (err < 0)
+        return err;
+
+    /* Frame is only intra of all slices are marked as intra */
+    if (sl->slice_type != AV_PICTURE_TYPE_I && sl->slice_type != AV_PICTURE_TYPE_SI)
+        vp->intra_pic_flag = 0;
+
+    return 0;
+}
+
 static void vk_h264_free_frame_priv(AVRefStructOpaque _hwctx, void *data)
 {
     AVHWDeviceContext *hwctx = _hwctx.nc;
-    H264VulkanDecodePicture *hp = data;
+    FFVulkanDecodePicture *vp = data;
 
     /* Free frame resources, this also destroys the session parameters. */
-    ff_vk_decode_free_frame(hwctx, &hp->vp);
+    ff_vk_decode_free_frame(hwctx, vp);
 }
 
 const FFHWAccel ff_h264_vulkan_hwaccel = {
@@ -589,7 +595,7 @@ const FFHWAccel ff_h264_vulkan_hwaccel = {
     .decode_slice          = &vk_h264_decode_slice,
     .end_frame             = &vk_h264_end_frame,
     .free_frame_priv       = &vk_h264_free_frame_priv,
-    .frame_priv_data_size  = sizeof(H264VulkanDecodePicture),
+    .frame_priv_data_size  = sizeof(FFVulkanDecodePicture),
     .init                  = &ff_vk_decode_init,
     .update_thread_context = &ff_vk_update_thread_context,
     .decode_params         = &ff_vk_params_invalidate,
-- 
2.49.0
_______________________________________________
ffmpeg-devel mailing list
ffmpeg-devel@ffmpeg.org
https://ffmpeg.org/mailman/listinfo/ffmpeg-devel

To unsubscribe, visit link above, or email
ffmpeg-devel-request@ffmpeg.org with subject "unsubscribe".

^ permalink raw reply	[flat|nested] 6+ messages in thread

* [FFmpeg-devel] [PATCH 6/6] vulkan_hevc: make all temporary structs temporary
  2025-03-31  2:37 [FFmpeg-devel] [PATCH 1/6] vulkan_decode: generalize handling of slice offsets/nb Lynne
                   ` (3 preceding siblings ...)
  2025-03-31  2:37 ` [FFmpeg-devel] [PATCH 5/6] vulkan_h264: make all temporary structs temporary Lynne
@ 2025-03-31  2:37 ` Lynne
  4 siblings, 0 replies; 6+ messages in thread
From: Lynne @ 2025-03-31  2:37 UTC (permalink / raw)
  To: ffmpeg-devel; +Cc: Lynne

---
 libavcodec/vulkan_hevc.c | 291 ++++++++++++++++++++-------------------
 1 file changed, 150 insertions(+), 141 deletions(-)

diff --git a/libavcodec/vulkan_hevc.c b/libavcodec/vulkan_hevc.c
index e83f8346a0..baf8b0c3fd 100644
--- a/libavcodec/vulkan_hevc.c
+++ b/libavcodec/vulkan_hevc.c
@@ -112,85 +112,6 @@ static int alloc_hevc_header_structs(FFVulkanDecodeContext *s,
     return 0;
 }
 
-typedef struct HEVCVulkanDecodePicture {
-    FFVulkanDecodePicture           vp;
-
-    /* Current picture */
-    StdVideoDecodeH265ReferenceInfo h265_ref;
-    VkVideoDecodeH265DpbSlotInfoKHR vkh265_ref;
-
-    /* Picture refs */
-    HEVCFrame                      *ref_src    [HEVC_MAX_REFS];
-    StdVideoDecodeH265ReferenceInfo h265_refs  [HEVC_MAX_REFS];
-    VkVideoDecodeH265DpbSlotInfoKHR vkh265_refs[HEVC_MAX_REFS];
-
-    /* Current picture (contd.) */
-    StdVideoDecodeH265PictureInfo   h265pic;
-    VkVideoDecodeH265PictureInfoKHR h265_pic_info;
-
-    /* Current picture */
-    VkVideoPictureResourceInfoKHR   ref;
-    VkVideoReferenceSlotInfoKHR     ref_slot;
-
-    /* Picture refs. H264 has the maximum number of refs (36) of any supported codec. */
-    VkVideoPictureResourceInfoKHR   refs     [36];
-    VkVideoReferenceSlotInfoKHR     ref_slots[36];
-
-    /* Main decoding struct */
-    VkVideoDecodeInfoKHR            decode_info;
-} HEVCVulkanDecodePicture;
-
-static int vk_hevc_fill_pict(AVCodecContext *avctx, HEVCFrame **ref_src,
-                             VkVideoReferenceSlotInfoKHR *ref_slot,       /* Main structure */
-                             VkVideoPictureResourceInfoKHR *ref,          /* Goes in ^ */
-                             VkVideoDecodeH265DpbSlotInfoKHR *vkh265_ref, /* Goes in ^ */
-                             StdVideoDecodeH265ReferenceInfo *h265_ref,   /* Goes in ^ */
-                             HEVCFrame *pic, int is_current, int pic_id)
-{
-    FFVulkanDecodeContext *dec = avctx->internal->hwaccel_priv_data;
-    FFVulkanDecodeShared *ctx = dec->shared_ctx;
-    HEVCVulkanDecodePicture *hp = pic->hwaccel_picture_private;
-    FFVulkanDecodePicture *vkpic = &hp->vp;
-
-    int err = ff_vk_decode_prepare_frame(dec, pic->f, vkpic, is_current,
-                                         dec->dedicated_dpb);
-    if (err < 0)
-        return err;
-
-    *h265_ref = (StdVideoDecodeH265ReferenceInfo) {
-        .flags = (StdVideoDecodeH265ReferenceInfoFlags) {
-            .used_for_long_term_reference = pic->flags & HEVC_FRAME_FLAG_LONG_REF,
-            .unused_for_reference = 0,
-        },
-        .PicOrderCntVal = pic->poc,
-    };
-
-    *vkh265_ref = (VkVideoDecodeH265DpbSlotInfoKHR) {
-        .sType = VK_STRUCTURE_TYPE_VIDEO_DECODE_H265_DPB_SLOT_INFO_KHR,
-        .pStdReferenceInfo = h265_ref,
-    };
-
-    *ref = (VkVideoPictureResourceInfoKHR) {
-        .sType = VK_STRUCTURE_TYPE_VIDEO_PICTURE_RESOURCE_INFO_KHR,
-        .codedOffset = (VkOffset2D){ 0, 0 },
-        .codedExtent = (VkExtent2D){ pic->f->width, pic->f->height },
-        .baseArrayLayer = ctx->common.layered_dpb ? pic_id : 0,
-        .imageViewBinding = vkpic->view.ref[0],
-    };
-
-    *ref_slot = (VkVideoReferenceSlotInfoKHR) {
-        .sType = VK_STRUCTURE_TYPE_VIDEO_REFERENCE_SLOT_INFO_KHR,
-        .pNext = vkh265_ref,
-        .slotIndex = pic_id,
-        .pPictureResource = ref,
-    };
-
-    if (ref_src)
-        *ref_src = pic;
-
-    return 0;
-}
-
 static void copy_scaling_list(const ScalingList *sl, StdVideoH265ScalingLists *vksl)
 {
     for (int i = 0; i < STD_VIDEO_H265_SCALING_LIST_4X4_NUM_LISTS; i++) {
@@ -719,18 +640,114 @@ static int vk_hevc_create_params(AVCodecContext *avctx, AVBufferRef **buf)
     return 0;
 }
 
+static int vk_hevc_fill_pict(AVCodecContext *avctx, HEVCFrame **ref_src,
+                             VkVideoReferenceSlotInfoKHR *ref_slot,       /* Main structure */
+                             VkVideoPictureResourceInfoKHR *ref,          /* Goes in ^ */
+                             VkVideoDecodeH265DpbSlotInfoKHR *vkh265_ref, /* Goes in ^ */
+                             StdVideoDecodeH265ReferenceInfo *h265_ref,   /* Goes in ^ */
+                             HEVCFrame *pic, int is_current, int pic_id)
+{
+    FFVulkanDecodeContext *dec = avctx->internal->hwaccel_priv_data;
+    FFVulkanDecodeShared *ctx = dec->shared_ctx;
+    FFVulkanDecodePicture *vkpic = pic->hwaccel_picture_private;
+
+    int err = ff_vk_decode_prepare_frame(dec, pic->f, vkpic, is_current,
+                                         dec->dedicated_dpb);
+    if (err < 0)
+        return err;
+
+    *h265_ref = (StdVideoDecodeH265ReferenceInfo) {
+        .flags = (StdVideoDecodeH265ReferenceInfoFlags) {
+            .used_for_long_term_reference = pic->flags & HEVC_FRAME_FLAG_LONG_REF,
+            .unused_for_reference = 0,
+        },
+        .PicOrderCntVal = pic->poc,
+    };
+
+    *vkh265_ref = (VkVideoDecodeH265DpbSlotInfoKHR) {
+        .sType = VK_STRUCTURE_TYPE_VIDEO_DECODE_H265_DPB_SLOT_INFO_KHR,
+        .pStdReferenceInfo = h265_ref,
+    };
+
+    *ref = (VkVideoPictureResourceInfoKHR) {
+        .sType = VK_STRUCTURE_TYPE_VIDEO_PICTURE_RESOURCE_INFO_KHR,
+        .codedOffset = (VkOffset2D){ 0, 0 },
+        .codedExtent = (VkExtent2D){ pic->f->width, pic->f->height },
+        .baseArrayLayer = ctx->common.layered_dpb ? pic_id : 0,
+        .imageViewBinding = vkpic->view.ref[0],
+    };
+
+    *ref_slot = (VkVideoReferenceSlotInfoKHR) {
+        .sType = VK_STRUCTURE_TYPE_VIDEO_REFERENCE_SLOT_INFO_KHR,
+        .pNext = vkh265_ref,
+        .slotIndex = pic_id,
+        .pPictureResource = ref,
+    };
+
+    if (ref_src)
+        *ref_src = pic;
+
+    return 0;
+}
+
 static int vk_hevc_start_frame(AVCodecContext          *avctx,
                                av_unused const AVBufferRef *buffer_ref,
                                av_unused const uint8_t *buffer,
                                av_unused uint32_t       size)
+{
+    const HEVCContext *h = avctx->priv_data;
+    HEVCFrame *pic = h->cur_frame;
+    FFVulkanDecodePicture *vp = pic->hwaccel_picture_private;
+
+    return ff_vk_decode_start_frame(avctx, vp, buffer_ref, 0);
+}
+
+typedef struct HEVCVulkanDecodeParams {
+    /* Current picture */
+    StdVideoDecodeH265ReferenceInfo h265_ref;
+    VkVideoDecodeH265DpbSlotInfoKHR vkh265_ref;
+
+    /* Picture refs */
+    HEVCFrame                      *ref_src    [HEVC_MAX_REFS];
+    StdVideoDecodeH265ReferenceInfo h265_refs  [HEVC_MAX_REFS];
+    VkVideoDecodeH265DpbSlotInfoKHR vkh265_refs[HEVC_MAX_REFS];
+
+    /* Current picture (contd.) */
+    StdVideoDecodeH265PictureInfo   h265pic;
+    VkVideoDecodeH265PictureInfoKHR h265_pic_info;
+
+    /* Current picture */
+    VkVideoPictureResourceInfoKHR   ref;
+    VkVideoReferenceSlotInfoKHR     ref_slot;
+
+    /* Picture refs. H264 has the maximum number of refs (36) of any supported codec. */
+    VkVideoPictureResourceInfoKHR   refs     [36];
+    VkVideoReferenceSlotInfoKHR     ref_slots[36];
+
+    /* Maintenance 2 */
+#ifdef VK_KHR_video_maintenance2
+    HEVCHeaderPPS vkpps_p;
+    StdVideoH265PictureParameterSet vkpps;
+    HEVCHeaderSPS vksps_p;
+    StdVideoH265SequenceParameterSet vksps;
+    HEVCHeaderVPSSet vkvps_ps[HEVC_MAX_SUB_LAYERS];
+    HEVCHeaderVPS vkvps_p;
+    StdVideoH265VideoParameterSet vkvps;
+    VkVideoDecodeH265InlineSessionParametersInfoKHR h265_params;
+#endif
+
+    /* Main decoding struct */
+    VkVideoDecodeInfoKHR            decode_info;
+} HEVCVulkanDecodeParams;
+
+static int vk_hevc_fill_params(AVCodecContext *avctx, FFVulkanDecodePicture *vp,
+                               HEVCVulkanDecodeParams *hp)
 {
     int err;
     HEVCContext *h = avctx->priv_data;
     HEVCLayerContext *l = &h->layers[h->cur_layer];
 
     HEVCFrame *pic = h->cur_frame;
-    HEVCVulkanDecodePicture *hp = pic->hwaccel_picture_private;
-    FFVulkanDecodePicture *vp = &hp->vp;
     const HEVCPPS *pps = h->pps;
     const HEVCSPS *sps = pps->sps;
     int nb_refs = 0;
@@ -814,7 +831,8 @@ static int vk_hevc_start_frame(AVCodecContext          *avctx,
     hp->h265_pic_info = (VkVideoDecodeH265PictureInfoKHR) {
         .sType = VK_STRUCTURE_TYPE_VIDEO_DECODE_H265_PICTURE_INFO_KHR,
         .pStdPictureInfo = &hp->h265pic,
-        .sliceSegmentCount = 0,
+        .pSliceSegmentOffsets = vp->slice_offsets,
+        .sliceSegmentCount = vp->nb_slices,
     };
 
     hp->decode_info = (VkVideoDecodeInfoKHR) {
@@ -836,21 +854,6 @@ static int vk_hevc_start_frame(AVCodecContext          *avctx,
     return 0;
 }
 
-static int vk_hevc_decode_slice(AVCodecContext *avctx,
-                                const uint8_t  *data,
-                                uint32_t        size)
-{
-    const HEVCContext *h = avctx->priv_data;
-    HEVCVulkanDecodePicture *hp = h->cur_frame->hwaccel_picture_private;
-    FFVulkanDecodePicture *vp = &hp->vp;
-
-    int err = ff_vk_decode_add_slice(avctx, vp, data, size, 1);
-    if (err < 0)
-        return err;
-
-    return 0;
-}
-
 static int vk_hevc_end_frame(AVCodecContext *avctx)
 {
     const HEVCContext *h = avctx->priv_data;
@@ -858,53 +861,46 @@ static int vk_hevc_end_frame(AVCodecContext *avctx)
     FFVulkanDecodeShared *ctx = dec->shared_ctx;
 
     HEVCFrame *pic = h->cur_frame;
-    HEVCVulkanDecodePicture *hp = pic->hwaccel_picture_private;
-    FFVulkanDecodePicture *vp = &hp->vp;
+    FFVulkanDecodePicture *vp = pic->hwaccel_picture_private;
     FFVulkanDecodePicture *rvp[HEVC_MAX_REFS] = { 0 };
     AVFrame *rav[HEVC_MAX_REFS] = { 0 };
     int err;
 
+    HEVCVulkanDecodeParams hp = { 0 };
+
     const HEVCPPS *pps = h->pps;
     const HEVCSPS *sps = pps->sps;
 
-#ifdef VK_KHR_video_maintenance2
-    HEVCHeaderPPS vkpps_p;
-    StdVideoH265PictureParameterSet vkpps;
-    HEVCHeaderSPS vksps_p;
-    StdVideoH265SequenceParameterSet vksps;
-    HEVCHeaderVPSSet vkvps_ps[HEVC_MAX_SUB_LAYERS];
-    HEVCHeaderVPS vkvps_p;
-    StdVideoH265VideoParameterSet vkvps;
-    VkVideoDecodeH265InlineSessionParametersInfoKHR h265_params;
+    if (!vp->nb_slices)
+        return 0;
 
+    err = vk_hevc_fill_params(avctx, vp, &hp);
+    if (err < 0)
+        return err;
+
+#ifdef VK_KHR_video_maintenance2
     if (ctx->s.extensions & FF_VK_EXT_VIDEO_MAINTENANCE_2) {
-        set_pps(pps, sps, &vkpps_p.scaling, &vkpps, &vkpps_p.pal);
-        set_sps(sps, pps->sps_id, &vksps_p.scaling, &vksps_p.vui_header,
-                &vksps_p.vui, &vksps, vksps_p.nal_hdr,
-                vksps_p.vcl_hdr, &vksps_p.ptl, &vksps_p.dpbm,
-                &vksps_p.pal, vksps_p.str, &vksps_p.ltr);
+        set_pps(pps, sps, &hp.vkpps_p.scaling, &hp.vkpps, &hp.vkpps_p.pal);
+        set_sps(sps, pps->sps_id, &hp.vksps_p.scaling, &hp.vksps_p.vui_header,
+                &hp.vksps_p.vui, &hp.vksps, hp.vksps_p.nal_hdr,
+                hp.vksps_p.vcl_hdr, &hp.vksps_p.ptl, &hp.vksps_p.dpbm,
+                &hp.vksps_p.pal, hp.vksps_p.str, &hp.vksps_p.ltr);
 
-        vkvps_p.sls = vkvps_ps;
-        set_vps(sps->vps, &vkvps, &vkvps_p.ptl, &vkvps_p.dpbm,
-                vkvps_p.hdr, vkvps_p.sls);
+        hp.vkvps_p.sls = hp.vkvps_ps;
+        set_vps(sps->vps, &hp.vkvps, &hp.vkvps_p.ptl, &hp.vkvps_p.dpbm,
+                hp.vkvps_p.hdr, hp.vkvps_p.sls);
 
-        h265_params = (VkVideoDecodeH265InlineSessionParametersInfoKHR) {
+        hp.h265_params = (VkVideoDecodeH265InlineSessionParametersInfoKHR) {
             .sType = VK_STRUCTURE_TYPE_VIDEO_DECODE_H265_INLINE_SESSION_PARAMETERS_INFO_KHR,
-            .pStdSPS = &vksps,
-            .pStdPPS = &vkpps,
-            .pStdVPS = &vkvps,
+            .pStdSPS = &hp.vksps,
+            .pStdPPS = &hp.vkpps,
+            .pStdVPS = &hp.vkvps,
         };
-        hp->h265_pic_info.pNext = &h265_params;
-    }
+        hp.h265_pic_info.pNext = &hp.h265_params;
+    } else
 #endif
 
-    hp->h265_pic_info.pSliceSegmentOffsets = vp->slice_offsets;
-    hp->h265_pic_info.sliceSegmentCount = vp->nb_slices;
-    if (!hp->h265_pic_info.sliceSegmentCount)
-        return 0;
-
-    if (!dec->session_params &&
-        !(ctx->s.extensions & FF_VK_EXT_VIDEO_MAINTENANCE_2)) {
+    if (!dec->session_params) {
         if (!pps) {
             unsigned int pps_id = h->sh.pps_id;
             if (pps_id < HEVC_MAX_PPS_COUNT && h->ps.pps_list[pps_id] != NULL)
@@ -921,31 +917,44 @@ static int vk_hevc_end_frame(AVCodecContext *avctx)
         if (err < 0)
             return err;
 
-        hp->h265pic.sps_video_parameter_set_id = sps->vps_id;
-        hp->h265pic.pps_seq_parameter_set_id = pps->sps_id;
-        hp->h265pic.pps_pic_parameter_set_id = pps->pps_id;
+        hp.h265pic.sps_video_parameter_set_id = sps->vps_id;
+        hp.h265pic.pps_seq_parameter_set_id = pps->sps_id;
+        hp.h265pic.pps_pic_parameter_set_id = pps->pps_id;
     }
 
-    for (int i = 0; i < hp->decode_info.referenceSlotCount; i++) {
-        HEVCVulkanDecodePicture *rfhp = hp->ref_src[i]->hwaccel_picture_private;
-        rav[i] = hp->ref_src[i]->f;
-        rvp[i] = &rfhp->vp;
+    for (int i = 0; i < hp.decode_info.referenceSlotCount; i++) {
+        rav[i] = hp.ref_src[i]->f;
+        rvp[i] = hp.ref_src[i]->hwaccel_picture_private;
     }
 
     av_log(avctx, AV_LOG_VERBOSE, "Decoding frame, %"SIZE_SPECIFIER" bytes, %i slices\n",
-           vp->slices_size, hp->h265_pic_info.sliceSegmentCount);
+           vp->slices_size, hp.h265_pic_info.sliceSegmentCount);
 
-    return ff_vk_decode_frame(avctx, &hp->decode_info,
+    return ff_vk_decode_frame(avctx, &hp.decode_info,
                               pic->f, vp, rav, rvp);
 }
 
+static int vk_hevc_decode_slice(AVCodecContext *avctx,
+                                const uint8_t  *data,
+                                uint32_t        size)
+{
+    const HEVCContext *h = avctx->priv_data;
+    FFVulkanDecodePicture *vp = h->cur_frame->hwaccel_picture_private;
+
+    int err = ff_vk_decode_add_slice(avctx, vp, data, size, 1);
+    if (err < 0)
+        return err;
+
+    return 0;
+}
+
 static void vk_hevc_free_frame_priv(AVRefStructOpaque _hwctx, void *data)
 {
     AVHWDeviceContext *hwctx = _hwctx.nc;
-    HEVCVulkanDecodePicture *hp = data;
+    FFVulkanDecodePicture *vp = data;
 
     /* Free frame resources */
-    ff_vk_decode_free_frame(hwctx, &hp->vp);
+    ff_vk_decode_free_frame(hwctx, vp);
 }
 
 const FFHWAccel ff_hevc_vulkan_hwaccel = {
@@ -957,7 +966,7 @@ const FFHWAccel ff_hevc_vulkan_hwaccel = {
     .decode_slice          = &vk_hevc_decode_slice,
     .end_frame             = &vk_hevc_end_frame,
     .free_frame_priv       = &vk_hevc_free_frame_priv,
-    .frame_priv_data_size  = sizeof(HEVCVulkanDecodePicture),
+    .frame_priv_data_size  = sizeof(FFVulkanDecodePicture),
     .init                  = &ff_vk_decode_init,
     .update_thread_context = &ff_vk_update_thread_context,
     .decode_params         = &ff_vk_params_invalidate,
-- 
2.49.0
_______________________________________________
ffmpeg-devel mailing list
ffmpeg-devel@ffmpeg.org
https://ffmpeg.org/mailman/listinfo/ffmpeg-devel

To unsubscribe, visit link above, or email
ffmpeg-devel-request@ffmpeg.org with subject "unsubscribe".

^ permalink raw reply	[flat|nested] 6+ messages in thread

end of thread, other threads:[~2025-03-31  2:39 UTC | newest]

Thread overview: 6+ messages (download: mbox.gz / follow: Atom feed)
-- links below jump to the message on this page --
2025-03-31  2:37 [FFmpeg-devel] [PATCH 1/6] vulkan_decode: generalize handling of slice offsets/nb Lynne
2025-03-31  2:37 ` [FFmpeg-devel] [PATCH 2/6] vulkan_decode: only create sequence params in end_frame Lynne
2025-03-31  2:37 ` [FFmpeg-devel] [PATCH 3/6] vulkan_decode: move temporary Vulkan structs into each codec Lynne
2025-03-31  2:37 ` [FFmpeg-devel] [PATCH 4/6] vulkan_decode: add a generic start_frame function Lynne
2025-03-31  2:37 ` [FFmpeg-devel] [PATCH 5/6] vulkan_h264: make all temporary structs temporary Lynne
2025-03-31  2:37 ` [FFmpeg-devel] [PATCH 6/6] vulkan_hevc: " Lynne

Git Inbox Mirror of the ffmpeg-devel mailing list - see https://ffmpeg.org/mailman/listinfo/ffmpeg-devel

This inbox may be cloned and mirrored by anyone:

	git clone --mirror https://master.gitmailbox.com/ffmpegdev/0 ffmpegdev/git/0.git

	# If you have public-inbox 1.1+ installed, you may
	# initialize and index your mirror using the following commands:
	public-inbox-init -V2 ffmpegdev ffmpegdev/ https://master.gitmailbox.com/ffmpegdev \
		ffmpegdev@gitmailbox.com
	public-inbox-index ffmpegdev

Example config snippet for mirrors.


AGPL code for this site: git clone https://public-inbox.org/public-inbox.git