* [FFmpeg-devel] [PATCH 1/6] vulkan_decode: generalize handling of slice offsets/nb
@ 2025-03-31 2:37 Lynne
2025-03-31 2:37 ` [FFmpeg-devel] [PATCH 2/6] vulkan_decode: only create sequence params in end_frame Lynne
` (4 more replies)
0 siblings, 5 replies; 6+ messages in thread
From: Lynne @ 2025-03-31 2:37 UTC (permalink / raw)
To: ffmpeg-devel; +Cc: Lynne
This allows for the upcoming refactor.
---
libavcodec/vulkan_av1.c | 6 +++---
libavcodec/vulkan_decode.c | 23 ++++++-----------------
libavcodec/vulkan_decode.h | 5 +++--
libavcodec/vulkan_ffv1.c | 22 ++++++++--------------
libavcodec/vulkan_h264.c | 9 +++------
libavcodec/vulkan_hevc.c | 6 +++---
6 files changed, 26 insertions(+), 45 deletions(-)
diff --git a/libavcodec/vulkan_av1.c b/libavcodec/vulkan_av1.c
index ccb88004b5..13df24a44b 100644
--- a/libavcodec/vulkan_av1.c
+++ b/libavcodec/vulkan_av1.c
@@ -577,9 +577,7 @@ static int vk_av1_decode_slice(AVCodecContext *avctx,
err = ff_vk_decode_add_slice(avctx, vp,
data + s->tile_group_info[i].tile_offset,
- s->tile_group_info[i].tile_size, 0,
- &ap->av1_pic_info.tileCount,
- &ap->av1_pic_info.pTileOffsets);
+ s->tile_group_info[i].tile_size, 0);
if (err < 0)
return err;
}
@@ -616,6 +614,8 @@ static int vk_av1_end_frame(AVCodecContext *avctx)
}
#endif
+ ap->av1_pic_info.pTileOffsets = vp->slice_offsets;
+ ap->av1_pic_info.tileCount = vp->nb_slices;
if (!ap->av1_pic_info.tileCount)
return 0;
diff --git a/libavcodec/vulkan_decode.c b/libavcodec/vulkan_decode.c
index 93aa0ce5b3..48a206e3c0 100644
--- a/libavcodec/vulkan_decode.c
+++ b/libavcodec/vulkan_decode.c
@@ -249,33 +249,23 @@ int ff_vk_decode_prepare_frame_sdr(FFVulkanDecodeContext *dec, AVFrame *pic,
}
int ff_vk_decode_add_slice(AVCodecContext *avctx, FFVulkanDecodePicture *vp,
- const uint8_t *data, size_t size, int add_startcode,
- uint32_t *nb_slices, const uint32_t **offsets)
+ const uint8_t *data, size_t size, int add_startcode)
{
FFVulkanDecodeContext *dec = avctx->internal->hwaccel_priv_data;
FFVulkanDecodeShared *ctx = dec->shared_ctx;
static const uint8_t startcode_prefix[3] = { 0x0, 0x0, 0x1 };
const size_t startcode_len = add_startcode ? sizeof(startcode_prefix) : 0;
- const int nb = nb_slices ? *nb_slices : 0;
uint8_t *slices;
- uint32_t *slice_off;
FFVkBuffer *vkbuf;
size_t new_size = vp->slices_size + startcode_len + size +
ctx->caps.minBitstreamBufferSizeAlignment;
new_size = FFALIGN(new_size, ctx->caps.minBitstreamBufferSizeAlignment);
- if (offsets) {
- slice_off = av_fast_realloc(dec->slice_off, &dec->slice_off_max,
- (nb + 1)*sizeof(slice_off));
- if (!slice_off)
- return AVERROR(ENOMEM);
-
- *offsets = dec->slice_off = slice_off;
-
- slice_off[nb] = vp->slices_size;
- }
+ /* Should never happen */
+ if (vp->nb_slices > FF_ARRAY_ELEMS(vp->slice_offsets))
+ return AVERROR(EINVAL);
vkbuf = vp->slices_buf ? (FFVkBuffer *)vp->slices_buf->data : NULL;
if (!vkbuf || vkbuf->size < new_size) {
@@ -321,9 +311,8 @@ int ff_vk_decode_add_slice(AVCodecContext *avctx, FFVulkanDecodePicture *vp,
/* Slice data */
memcpy(slices + vp->slices_size + startcode_len, data, size);
- if (nb_slices)
- *nb_slices = nb + 1;
-
+ vp->slice_offsets[vp->nb_slices] = vp->slices_size;
+ vp->nb_slices = vp->nb_slices + 1;
vp->slices_size += startcode_len + size;
return 0;
diff --git a/libavcodec/vulkan_decode.h b/libavcodec/vulkan_decode.h
index cbd22b3591..4bd755c1f6 100644
--- a/libavcodec/vulkan_decode.h
+++ b/libavcodec/vulkan_decode.h
@@ -110,6 +110,8 @@ typedef struct FFVulkanDecodePicture {
/* Slice data */
AVBufferRef *slices_buf;
size_t slices_size;
+ uint32_t slice_offsets[1024];
+ uint32_t nb_slices;
/* Vulkan functions needed for destruction, as no other context is guaranteed to exist */
PFN_vkWaitSemaphores wait_semaphores;
@@ -158,8 +160,7 @@ int ff_vk_decode_prepare_frame_sdr(FFVulkanDecodeContext *dec, AVFrame *pic,
* Add slice data to frame.
*/
int ff_vk_decode_add_slice(AVCodecContext *avctx, FFVulkanDecodePicture *vp,
- const uint8_t *data, size_t size, int add_startcode,
- uint32_t *nb_slices, const uint32_t **offsets);
+ const uint8_t *data, size_t size, int add_startcode);
/**
* Decode a frame.
diff --git a/libavcodec/vulkan_ffv1.c b/libavcodec/vulkan_ffv1.c
index 17bfc943d4..7eb51b0dab 100644
--- a/libavcodec/vulkan_ffv1.c
+++ b/libavcodec/vulkan_ffv1.c
@@ -55,8 +55,6 @@ typedef struct FFv1VulkanDecodePicture {
uint32_t max_context_count;
AVBufferRef *slice_offset_buf;
- uint32_t *slice_offset;
- int slice_num;
AVBufferRef *slice_status_buf;
int crc_checked;
@@ -163,8 +161,6 @@ static int vk_ffv1_start_frame(AVCodecContext *avctx,
int is_rgb = !(f->colorspace == 0 && sw_format != AV_PIX_FMT_YA8) &&
!(sw_format == AV_PIX_FMT_YA8);
- fp->slice_num = 0;
-
for (int i = 0; i < f->quant_table_count; i++)
fp->max_context_count = FFMAX(f->context_count[i], fp->max_context_count);
@@ -278,22 +274,20 @@ static int vk_ffv1_decode_slice(AVCodecContext *avctx,
if (ctx->s.extensions & FF_VK_EXT_EXTERNAL_HOST_MEMORY) {
FFVkBuffer *slices_buf = (FFVkBuffer *)vp->slices_buf->data;
- AV_WN32(slice_offset->mapped_mem + (2*fp->slice_num + 0)*sizeof(uint32_t),
+ AV_WN32(slice_offset->mapped_mem + (2*vp->nb_slices + 0)*sizeof(uint32_t),
data - slices_buf->mapped_mem);
- AV_WN32(slice_offset->mapped_mem + (2*fp->slice_num + 1)*sizeof(uint32_t),
+ AV_WN32(slice_offset->mapped_mem + (2*vp->nb_slices + 1)*sizeof(uint32_t),
size);
- fp->slice_num++;
+ vp->nb_slices++;
} else {
- int err = ff_vk_decode_add_slice(avctx, vp, data, size, 0,
- &fp->slice_num,
- (const uint32_t **)&fp->slice_offset);
+ int err = ff_vk_decode_add_slice(avctx, vp, data, size, 0);
if (err < 0)
return err;
- AV_WN32(slice_offset->mapped_mem + (2*(fp->slice_num - 1) + 0)*sizeof(uint32_t),
- fp->slice_offset[fp->slice_num - 1]);
- AV_WN32(slice_offset->mapped_mem + (2*(fp->slice_num - 1) + 1)*sizeof(uint32_t),
+ AV_WN32(slice_offset->mapped_mem + (2*(vp->nb_slices - 1) + 0)*sizeof(uint32_t),
+ vp->slice_offsets[vp->nb_slices - 1]);
+ AV_WN32(slice_offset->mapped_mem + (2*(vp->nb_slices - 1) + 1)*sizeof(uint32_t),
size);
}
@@ -1280,7 +1274,7 @@ static void vk_ffv1_free_frame_priv(AVRefStructOpaque _hwctx, void *data)
if (fp->crc_checked) {
FFVkBuffer *slice_status = (FFVkBuffer *)fp->slice_status_buf->data;
- for (int i = 0; i < fp->slice_num; i++) {
+ for (int i = 0; i < vp->nb_slices; i++) {
uint32_t crc_res;
crc_res = AV_RN32(slice_status->mapped_mem + i*sizeof(uint32_t));
if (crc_res != 0)
diff --git a/libavcodec/vulkan_h264.c b/libavcodec/vulkan_h264.c
index 73aaed7f6a..af37e0800b 100644
--- a/libavcodec/vulkan_h264.c
+++ b/libavcodec/vulkan_h264.c
@@ -491,9 +491,7 @@ static int vk_h264_decode_slice(AVCodecContext *avctx,
H264VulkanDecodePicture *hp = h->cur_pic_ptr->hwaccel_picture_private;
FFVulkanDecodePicture *vp = &hp->vp;
- int err = ff_vk_decode_add_slice(avctx, vp, data, size, 1,
- &hp->h264_pic_info.sliceCount,
- &hp->h264_pic_info.pSliceOffsets);
+ int err = ff_vk_decode_add_slice(avctx, vp, data, size, 1);
if (err < 0)
return err;
@@ -541,12 +539,11 @@ static int vk_h264_end_frame(AVCodecContext *avctx)
}
#endif
+ hp->h264_pic_info.pSliceOffsets = vp->slice_offsets;
+ hp->h264_pic_info.sliceCount = vp->nb_slices;
if (!hp->h264_pic_info.sliceCount)
return 0;
- if (!vp->slices_buf)
- return AVERROR(EINVAL);
-
if (!dec->session_params &&
!(ctx->s.extensions & FF_VK_EXT_VIDEO_MAINTENANCE_2)) {
int err = vk_h264_create_params(avctx, &dec->session_params);
diff --git a/libavcodec/vulkan_hevc.c b/libavcodec/vulkan_hevc.c
index e4a946ae0d..e95f554756 100644
--- a/libavcodec/vulkan_hevc.c
+++ b/libavcodec/vulkan_hevc.c
@@ -842,9 +842,7 @@ static int vk_hevc_decode_slice(AVCodecContext *avctx,
HEVCVulkanDecodePicture *hp = h->cur_frame->hwaccel_picture_private;
FFVulkanDecodePicture *vp = &hp->vp;
- int err = ff_vk_decode_add_slice(avctx, vp, data, size, 1,
- &hp->h265_pic_info.sliceSegmentCount,
- &hp->h265_pic_info.pSliceSegmentOffsets);
+ int err = ff_vk_decode_add_slice(avctx, vp, data, size, 1);
if (err < 0)
return err;
@@ -898,6 +896,8 @@ static int vk_hevc_end_frame(AVCodecContext *avctx)
}
#endif
+ hp->h265_pic_info.pSliceSegmentOffsets = vp->slice_offsets;
+ hp->h265_pic_info.sliceSegmentCount = vp->nb_slices;
if (!hp->h265_pic_info.sliceSegmentCount)
return 0;
--
2.49.0
_______________________________________________
ffmpeg-devel mailing list
ffmpeg-devel@ffmpeg.org
https://ffmpeg.org/mailman/listinfo/ffmpeg-devel
To unsubscribe, visit link above, or email
ffmpeg-devel-request@ffmpeg.org with subject "unsubscribe".
^ permalink raw reply [flat|nested] 6+ messages in thread
* [FFmpeg-devel] [PATCH 2/6] vulkan_decode: only create sequence params in end_frame
2025-03-31 2:37 [FFmpeg-devel] [PATCH 1/6] vulkan_decode: generalize handling of slice offsets/nb Lynne
@ 2025-03-31 2:37 ` Lynne
2025-03-31 2:37 ` [FFmpeg-devel] [PATCH 3/6] vulkan_decode: move temporary Vulkan structs into each codec Lynne
` (3 subsequent siblings)
4 siblings, 0 replies; 6+ messages in thread
From: Lynne @ 2025-03-31 2:37 UTC (permalink / raw)
To: ffmpeg-devel; +Cc: Lynne
We tried to create sequence params in both start_frame and end_frame.
This was redundant.
Just always create them in end_frame.
---
libavcodec/vulkan_av1.c | 8 --------
libavcodec/vulkan_h264.c | 9 ---------
libavcodec/vulkan_hevc.c | 9 ---------
3 files changed, 26 deletions(-)
diff --git a/libavcodec/vulkan_av1.c b/libavcodec/vulkan_av1.c
index 13df24a44b..115db8badb 100644
--- a/libavcodec/vulkan_av1.c
+++ b/libavcodec/vulkan_av1.c
@@ -254,7 +254,6 @@ static int vk_av1_start_frame(AVCodecContext *avctx,
AV1DecContext *s = avctx->priv_data;
const AV1Frame *pic = &s->cur_frame;
FFVulkanDecodeContext *dec = avctx->internal->hwaccel_priv_data;
- FFVulkanDecodeShared *ctx = dec->shared_ctx;
AV1VulkanDecodePicture *ap = pic->hwaccel_picture_private;
FFVulkanDecodePicture *vp = &ap->vp;
@@ -269,13 +268,6 @@ static int vk_av1_start_frame(AVCodecContext *avctx,
STD_VIDEO_AV1_FRAME_RESTORATION_TYPE_WIENER,
STD_VIDEO_AV1_FRAME_RESTORATION_TYPE_SGRPROJ };
- if (!dec->session_params &&
- !(ctx->s.extensions & FF_VK_EXT_VIDEO_MAINTENANCE_2)) {
- err = vk_av1_create_params(avctx, &dec->session_params, ap);
- if (err < 0)
- return err;
- }
-
if (!ap->frame_id_set) {
unsigned slot_idx = 0;
for (unsigned i = 0; i < 32; i++) {
diff --git a/libavcodec/vulkan_h264.c b/libavcodec/vulkan_h264.c
index af37e0800b..d950c6948f 100644
--- a/libavcodec/vulkan_h264.c
+++ b/libavcodec/vulkan_h264.c
@@ -366,20 +366,11 @@ static int vk_h264_start_frame(AVCodecContext *avctx,
int err;
int dpb_slot_index = 0;
H264Context *h = avctx->priv_data;
- FFVulkanDecodeContext *dec = avctx->internal->hwaccel_priv_data;
- FFVulkanDecodeShared *ctx = dec->shared_ctx;
H264Picture *pic = h->cur_pic_ptr;
H264VulkanDecodePicture *hp = pic->hwaccel_picture_private;
FFVulkanDecodePicture *vp = &hp->vp;
- if (!dec->session_params &&
- !(ctx->s.extensions & FF_VK_EXT_VIDEO_MAINTENANCE_2)) {
- err = vk_h264_create_params(avctx, &dec->session_params);
- if (err < 0)
- return err;
- }
-
/* Fill in main slot */
dpb_slot_index = 0;
for (unsigned slot = 0; slot < H264_MAX_PICTURE_COUNT; slot++) {
diff --git a/libavcodec/vulkan_hevc.c b/libavcodec/vulkan_hevc.c
index e95f554756..bc43591e19 100644
--- a/libavcodec/vulkan_hevc.c
+++ b/libavcodec/vulkan_hevc.c
@@ -716,8 +716,6 @@ static int vk_hevc_start_frame(AVCodecContext *avctx,
int err;
HEVCContext *h = avctx->priv_data;
HEVCLayerContext *l = &h->layers[h->cur_layer];
- FFVulkanDecodeContext *dec = avctx->internal->hwaccel_priv_data;
- FFVulkanDecodeShared *ctx = dec->shared_ctx;
HEVCFrame *pic = h->cur_frame;
HEVCVulkanDecodePicture *hp = pic->hwaccel_picture_private;
@@ -726,13 +724,6 @@ static int vk_hevc_start_frame(AVCodecContext *avctx,
const HEVCSPS *sps = pps->sps;
int nb_refs = 0;
- if (!dec->session_params &&
- !(ctx->s.extensions & FF_VK_EXT_VIDEO_MAINTENANCE_2)) {
- err = vk_hevc_create_params(avctx, &dec->session_params);
- if (err < 0)
- return err;
- }
-
hp->h265pic = (StdVideoDecodeH265PictureInfo) {
.flags = (StdVideoDecodeH265PictureInfoFlags) {
.IrapPicFlag = IS_IRAP(h),
--
2.49.0
_______________________________________________
ffmpeg-devel mailing list
ffmpeg-devel@ffmpeg.org
https://ffmpeg.org/mailman/listinfo/ffmpeg-devel
To unsubscribe, visit link above, or email
ffmpeg-devel-request@ffmpeg.org with subject "unsubscribe".
^ permalink raw reply [flat|nested] 6+ messages in thread
* [FFmpeg-devel] [PATCH 3/6] vulkan_decode: move temporary Vulkan structs into each codec
2025-03-31 2:37 [FFmpeg-devel] [PATCH 1/6] vulkan_decode: generalize handling of slice offsets/nb Lynne
2025-03-31 2:37 ` [FFmpeg-devel] [PATCH 2/6] vulkan_decode: only create sequence params in end_frame Lynne
@ 2025-03-31 2:37 ` Lynne
2025-03-31 2:37 ` [FFmpeg-devel] [PATCH 4/6] vulkan_decode: add a generic start_frame function Lynne
` (2 subsequent siblings)
4 siblings, 0 replies; 6+ messages in thread
From: Lynne @ 2025-03-31 2:37 UTC (permalink / raw)
To: ffmpeg-devel; +Cc: Lynne
Required for next refactor.
---
libavcodec/vulkan_av1.c | 30 +++++++++++++++++++++---------
libavcodec/vulkan_decode.c | 20 ++++++++++----------
libavcodec/vulkan_decode.h | 13 +------------
libavcodec/vulkan_h264.c | 32 ++++++++++++++++++++++----------
libavcodec/vulkan_hevc.c | 28 ++++++++++++++++++++--------
5 files changed, 74 insertions(+), 49 deletions(-)
diff --git a/libavcodec/vulkan_av1.c b/libavcodec/vulkan_av1.c
index 115db8badb..c4ae0bb2ab 100644
--- a/libavcodec/vulkan_av1.c
+++ b/libavcodec/vulkan_av1.c
@@ -66,6 +66,17 @@ typedef struct AV1VulkanDecodePicture {
StdVideoDecodeAV1ReferenceInfo std_refs [AV1_NUM_REF_FRAMES];
VkVideoDecodeAV1DpbSlotInfoKHR vkav1_refs[AV1_NUM_REF_FRAMES];
+ /* Current picture */
+ VkVideoPictureResourceInfoKHR ref;
+ VkVideoReferenceSlotInfoKHR ref_slot;
+
+ /* Picture refs. H264 has the maximum number of refs (36) of any supported codec. */
+ VkVideoPictureResourceInfoKHR refs [36];
+ VkVideoReferenceSlotInfoKHR ref_slots[36];
+
+ /* Main decoding struct */
+ VkVideoDecodeInfoKHR decode_info;
+
uint8_t frame_id_set;
uint8_t frame_id;
uint8_t ref_frame_sign_bias_mask;
@@ -295,7 +306,7 @@ static int vk_av1_start_frame(AVCodecContext *avctx,
continue;
for (int j = 0; j < ref_count; j++) {
- if (vp->ref_slots[j].slotIndex == hp->frame_id) {
+ if (ap->ref_slots[j].slotIndex == hp->frame_id) {
found = 1;
break;
}
@@ -303,8 +314,8 @@ static int vk_av1_start_frame(AVCodecContext *avctx,
if (found)
continue;
- err = vk_av1_fill_pict(avctx, &ap->ref_src[ref_count], &vp->ref_slots[ref_count],
- &vp->refs[ref_count], &ap->std_refs[ref_count], &ap->vkav1_refs[ref_count],
+ err = vk_av1_fill_pict(avctx, &ap->ref_src[ref_count], &ap->ref_slots[ref_count],
+ &ap->refs[ref_count], &ap->std_refs[ref_count], &ap->vkav1_refs[ref_count],
ref_frame, 0, 0, ref_frame->order_hints);
if (err < 0)
return err;
@@ -312,7 +323,7 @@ static int vk_av1_start_frame(AVCodecContext *avctx,
ref_count++;
}
- err = vk_av1_fill_pict(avctx, NULL, &vp->ref_slot, &vp->ref,
+ err = vk_av1_fill_pict(avctx, NULL, &ap->ref_slot, &ap->ref,
&ap->std_ref,
&ap->vkav1_ref,
pic, 1, apply_grain, NULL);
@@ -339,13 +350,13 @@ static int vk_av1_start_frame(AVCodecContext *avctx,
ap->av1_pic_info.referenceNameSlotIndices[i] = hp->frame_id;
}
- vp->decode_info = (VkVideoDecodeInfoKHR) {
+ ap->decode_info = (VkVideoDecodeInfoKHR) {
.sType = VK_STRUCTURE_TYPE_VIDEO_DECODE_INFO_KHR,
.pNext = &ap->av1_pic_info,
.flags = 0x0,
- .pSetupReferenceSlot = &vp->ref_slot,
+ .pSetupReferenceSlot = &ap->ref_slot,
.referenceSlotCount = ref_count,
- .pReferenceSlots = vp->ref_slots,
+ .pReferenceSlots = ap->ref_slots,
.dstPictureResource = (VkVideoPictureResourceInfoKHR) {
.sType = VK_STRUCTURE_TYPE_VIDEO_PICTURE_RESOURCE_INFO_KHR,
.codedOffset = (VkOffset2D){ 0, 0 },
@@ -618,7 +629,7 @@ static int vk_av1_end_frame(AVCodecContext *avctx)
return err;
}
- for (int i = 0; i < vp->decode_info.referenceSlotCount; i++) {
+ for (int i = 0; i < ap->decode_info.referenceSlotCount; i++) {
const AV1Frame *rp = ap->ref_src[i];
AV1VulkanDecodePicture *rhp = rp->hwaccel_picture_private;
@@ -629,7 +640,8 @@ static int vk_av1_end_frame(AVCodecContext *avctx)
av_log(avctx, AV_LOG_VERBOSE, "Decoding frame, %"SIZE_SPECIFIER" bytes, %i tiles\n",
vp->slices_size, ap->av1_pic_info.tileCount);
- return ff_vk_decode_frame(avctx, pic->f, vp, rav, rvp);
+ return ff_vk_decode_frame(avctx, &ap->decode_info,
+ pic->f, vp, rav, rvp);
}
static void vk_av1_free_frame_priv(AVRefStructOpaque _hwctx, void *data)
diff --git a/libavcodec/vulkan_decode.c b/libavcodec/vulkan_decode.c
index 48a206e3c0..058efe3037 100644
--- a/libavcodec/vulkan_decode.c
+++ b/libavcodec/vulkan_decode.c
@@ -354,7 +354,7 @@ void ff_vk_decode_flush(AVCodecContext *avctx)
ff_vk_exec_submit(&ctx->s, exec);
}
-int ff_vk_decode_frame(AVCodecContext *avctx,
+int ff_vk_decode_frame(AVCodecContext *avctx, VkVideoDecodeInfoKHR *decode_info,
AVFrame *pic, FFVulkanDecodePicture *vp,
AVFrame *rpic[], FFVulkanDecodePicture *rvkp[])
{
@@ -379,8 +379,8 @@ int ff_vk_decode_frame(AVCodecContext *avctx,
.videoSessionParameters = dec->session_params ?
*((VkVideoSessionParametersKHR *)dec->session_params->data) :
VK_NULL_HANDLE,
- .referenceSlotCount = vp->decode_info.referenceSlotCount,
- .pReferenceSlots = vp->decode_info.pReferenceSlots,
+ .referenceSlotCount = decode_info->referenceSlotCount,
+ .pReferenceSlots = decode_info->pReferenceSlots,
};
VkVideoEndCodingInfoKHR decode_end = {
.sType = VK_STRUCTURE_TYPE_VIDEO_END_CODING_INFO_KHR,
@@ -396,7 +396,7 @@ int ff_vk_decode_frame(AVCodecContext *avctx,
/* The current decoding reference has to be bound as an inactive reference */
VkVideoReferenceSlotInfoKHR *cur_vk_ref;
cur_vk_ref = (void *)&decode_start.pReferenceSlots[decode_start.referenceSlotCount];
- cur_vk_ref[0] = vp->ref_slot;
+ cur_vk_ref[0] = *decode_info->pSetupReferenceSlot;
cur_vk_ref[0].slotIndex = -1;
decode_start.referenceSlotCount++;
@@ -420,9 +420,9 @@ int ff_vk_decode_frame(AVCodecContext *avctx,
}
}
- vp->decode_info.srcBuffer = sd_buf->buf;
- vp->decode_info.srcBufferOffset = 0;
- vp->decode_info.srcBufferRange = data_size;
+ decode_info->srcBuffer = sd_buf->buf;
+ decode_info->srcBufferOffset = 0;
+ decode_info->srcBufferRange = data_size;
/* Start command buffer recording */
err = ff_vk_exec_start(&ctx->s, exec);
@@ -488,7 +488,7 @@ int ff_vk_decode_frame(AVCodecContext *avctx,
if (!layered_dpb) {
/* All references (apart from the current) for non-layered refs */
- for (int i = 0; i < vp->decode_info.referenceSlotCount; i++) {
+ for (int i = 0; i < decode_info->referenceSlotCount; i++) {
AVFrame *ref_frame = rpic[i];
FFVulkanDecodePicture *rvp = rvkp[i];
AVFrame *ref = rvp->dpb_frame ? rvp->dpb_frame : ref_frame;
@@ -533,7 +533,7 @@ int ff_vk_decode_frame(AVCodecContext *avctx,
&img_bar[nb_img_bar], &nb_img_bar);
}
}
- } else if (vp->decode_info.referenceSlotCount ||
+ } else if (decode_info->referenceSlotCount ||
vp->view.out[0] != vp->view.ref[0]) {
/* Single barrier for a single layered ref */
err = ff_vk_exec_add_dep_frame(&ctx->s, exec, ctx->common.layered_frame,
@@ -553,7 +553,7 @@ int ff_vk_decode_frame(AVCodecContext *avctx,
/* Start, use parameters, decode and end decoding */
vk->CmdBeginVideoCodingKHR(cmd_buf, &decode_start);
- vk->CmdDecodeVideoKHR(cmd_buf, &vp->decode_info);
+ vk->CmdDecodeVideoKHR(cmd_buf, decode_info);
vk->CmdEndVideoCodingKHR(cmd_buf, &decode_end);
/* End recording and submit for execution */
diff --git a/libavcodec/vulkan_decode.h b/libavcodec/vulkan_decode.h
index 4bd755c1f6..6c3e1486b0 100644
--- a/libavcodec/vulkan_decode.h
+++ b/libavcodec/vulkan_decode.h
@@ -96,17 +96,6 @@ typedef struct FFVulkanDecodePicture {
VkSemaphore sem;
uint64_t sem_value;
- /* Current picture */
- VkVideoPictureResourceInfoKHR ref;
- VkVideoReferenceSlotInfoKHR ref_slot;
-
- /* Picture refs. H264 has the maximum number of refs (36) of any supported codec. */
- VkVideoPictureResourceInfoKHR refs [36];
- VkVideoReferenceSlotInfoKHR ref_slots[36];
-
- /* Main decoding struct */
- VkVideoDecodeInfoKHR decode_info;
-
/* Slice data */
AVBufferRef *slices_buf;
size_t slices_size;
@@ -165,7 +154,7 @@ int ff_vk_decode_add_slice(AVCodecContext *avctx, FFVulkanDecodePicture *vp,
/**
* Decode a frame.
*/
-int ff_vk_decode_frame(AVCodecContext *avctx,
+int ff_vk_decode_frame(AVCodecContext *avctx, VkVideoDecodeInfoKHR *decode_info,
AVFrame *pic, FFVulkanDecodePicture *vp,
AVFrame *rpic[], FFVulkanDecodePicture *rvkp[]);
diff --git a/libavcodec/vulkan_h264.c b/libavcodec/vulkan_h264.c
index d950c6948f..71a9c06801 100644
--- a/libavcodec/vulkan_h264.c
+++ b/libavcodec/vulkan_h264.c
@@ -47,6 +47,17 @@ typedef struct H264VulkanDecodePicture {
/* Current picture (contd.) */
StdVideoDecodeH264PictureInfo h264pic;
VkVideoDecodeH264PictureInfoKHR h264_pic_info;
+
+ /* Current picture */
+ VkVideoPictureResourceInfoKHR ref;
+ VkVideoReferenceSlotInfoKHR ref_slot;
+
+ /* Picture refs. H264 has the maximum number of refs (36) of any supported codec. */
+ VkVideoPictureResourceInfoKHR refs [36];
+ VkVideoReferenceSlotInfoKHR ref_slots[36];
+
+ /* Main decoding struct */
+ VkVideoDecodeInfoKHR decode_info;
} H264VulkanDecodePicture;
const static int h264_scaling_list8_order[] = { 0, 3, 1, 4, 2, 5 };
@@ -380,7 +391,7 @@ static int vk_h264_start_frame(AVCodecContext *avctx,
}
}
- err = vk_h264_fill_pict(avctx, NULL, &vp->ref_slot, &vp->ref,
+ err = vk_h264_fill_pict(avctx, NULL, &hp->ref_slot, &hp->ref,
&hp->vkh264_ref, &hp->h264_ref, pic, 1,
h->DPB[dpb_slot_index].field_picture,
h->DPB[dpb_slot_index].reference,
@@ -397,8 +408,8 @@ static int vk_h264_start_frame(AVCodecContext *avctx,
break;
}
}
- err = vk_h264_fill_pict(avctx, &hp->ref_src[i], &vp->ref_slots[i],
- &vp->refs[i], &hp->vkh264_refs[i],
+ err = vk_h264_fill_pict(avctx, &hp->ref_src[i], &hp->ref_slots[i],
+ &hp->refs[i], &hp->vkh264_refs[i],
&hp->h264_refs[i], h->short_ref[i], 0,
h->DPB[dpb_slot_index].field_picture,
h->DPB[dpb_slot_index].reference,
@@ -420,8 +431,8 @@ static int vk_h264_start_frame(AVCodecContext *avctx,
break;
}
}
- err = vk_h264_fill_pict(avctx, &hp->ref_src[i], &vp->ref_slots[i],
- &vp->refs[i], &hp->vkh264_refs[i],
+ err = vk_h264_fill_pict(avctx, &hp->ref_src[i], &hp->ref_slots[i],
+ &hp->refs[i], &hp->vkh264_refs[i],
&hp->h264_refs[i], h->long_ref[r], 0,
h->DPB[dpb_slot_index].field_picture,
h->DPB[dpb_slot_index].reference,
@@ -454,13 +465,13 @@ static int vk_h264_start_frame(AVCodecContext *avctx,
.pStdPictureInfo = &hp->h264pic,
};
- vp->decode_info = (VkVideoDecodeInfoKHR) {
+ hp->decode_info = (VkVideoDecodeInfoKHR) {
.sType = VK_STRUCTURE_TYPE_VIDEO_DECODE_INFO_KHR,
.pNext = &hp->h264_pic_info,
.flags = 0x0,
- .pSetupReferenceSlot = &vp->ref_slot,
+ .pSetupReferenceSlot = &hp->ref_slot,
.referenceSlotCount = h->short_ref_count + h->long_ref_count,
- .pReferenceSlots = vp->ref_slots,
+ .pReferenceSlots = hp->ref_slots,
.dstPictureResource = (VkVideoPictureResourceInfoKHR) {
.sType = VK_STRUCTURE_TYPE_VIDEO_PICTURE_RESOURCE_INFO_KHR,
.codedOffset = (VkOffset2D){ 0, 0 },
@@ -545,7 +556,7 @@ static int vk_h264_end_frame(AVCodecContext *avctx)
hp->h264pic.pic_parameter_set_id = pic->pps->pps_id;
}
- for (int i = 0; i < vp->decode_info.referenceSlotCount; i++) {
+ for (int i = 0; i < hp->decode_info.referenceSlotCount; i++) {
H264Picture *rp = hp->ref_src[i];
H264VulkanDecodePicture *rhp = rp->hwaccel_picture_private;
@@ -556,7 +567,8 @@ static int vk_h264_end_frame(AVCodecContext *avctx)
av_log(avctx, AV_LOG_VERBOSE, "Decoding frame, %"SIZE_SPECIFIER" bytes, %i slices\n",
vp->slices_size, hp->h264_pic_info.sliceCount);
- return ff_vk_decode_frame(avctx, pic->f, vp, rav, rvp);
+ return ff_vk_decode_frame(avctx, &hp->decode_info,
+ pic->f, vp, rav, rvp);
}
static void vk_h264_free_frame_priv(AVRefStructOpaque _hwctx, void *data)
diff --git a/libavcodec/vulkan_hevc.c b/libavcodec/vulkan_hevc.c
index bc43591e19..e83f8346a0 100644
--- a/libavcodec/vulkan_hevc.c
+++ b/libavcodec/vulkan_hevc.c
@@ -127,6 +127,17 @@ typedef struct HEVCVulkanDecodePicture {
/* Current picture (contd.) */
StdVideoDecodeH265PictureInfo h265pic;
VkVideoDecodeH265PictureInfoKHR h265_pic_info;
+
+ /* Current picture */
+ VkVideoPictureResourceInfoKHR ref;
+ VkVideoReferenceSlotInfoKHR ref_slot;
+
+ /* Picture refs. H264 has the maximum number of refs (36) of any supported codec. */
+ VkVideoPictureResourceInfoKHR refs [36];
+ VkVideoReferenceSlotInfoKHR ref_slots[36];
+
+ /* Main decoding struct */
+ VkVideoDecodeInfoKHR decode_info;
} HEVCVulkanDecodePicture;
static int vk_hevc_fill_pict(AVCodecContext *avctx, HEVCFrame **ref_src,
@@ -749,7 +760,7 @@ static int vk_hevc_start_frame(AVCodecContext *avctx,
continue;
if (ref == pic) {
- err = vk_hevc_fill_pict(avctx, NULL, &vp->ref_slot, &vp->ref,
+ err = vk_hevc_fill_pict(avctx, NULL, &hp->ref_slot, &hp->ref,
&hp->vkh265_ref, &hp->h265_ref, pic, 1, i);
if (err < 0)
return err;
@@ -757,8 +768,8 @@ static int vk_hevc_start_frame(AVCodecContext *avctx,
continue;
}
- err = vk_hevc_fill_pict(avctx, &hp->ref_src[idx], &vp->ref_slots[idx],
- &vp->refs[idx], &hp->vkh265_refs[idx],
+ err = vk_hevc_fill_pict(avctx, &hp->ref_src[idx], &hp->ref_slots[idx],
+ &hp->refs[idx], &hp->vkh265_refs[idx],
&hp->h265_refs[idx], (HEVCFrame *)ref, 0, i);
if (err < 0)
return err;
@@ -806,13 +817,13 @@ static int vk_hevc_start_frame(AVCodecContext *avctx,
.sliceSegmentCount = 0,
};
- vp->decode_info = (VkVideoDecodeInfoKHR) {
+ hp->decode_info = (VkVideoDecodeInfoKHR) {
.sType = VK_STRUCTURE_TYPE_VIDEO_DECODE_INFO_KHR,
.pNext = &hp->h265_pic_info,
.flags = 0x0,
- .pSetupReferenceSlot = &vp->ref_slot,
+ .pSetupReferenceSlot = &hp->ref_slot,
.referenceSlotCount = nb_refs,
- .pReferenceSlots = vp->ref_slots,
+ .pReferenceSlots = hp->ref_slots,
.dstPictureResource = (VkVideoPictureResourceInfoKHR) {
.sType = VK_STRUCTURE_TYPE_VIDEO_PICTURE_RESOURCE_INFO_KHR,
.codedOffset = (VkOffset2D){ 0, 0 },
@@ -915,7 +926,7 @@ static int vk_hevc_end_frame(AVCodecContext *avctx)
hp->h265pic.pps_pic_parameter_set_id = pps->pps_id;
}
- for (int i = 0; i < vp->decode_info.referenceSlotCount; i++) {
+ for (int i = 0; i < hp->decode_info.referenceSlotCount; i++) {
HEVCVulkanDecodePicture *rfhp = hp->ref_src[i]->hwaccel_picture_private;
rav[i] = hp->ref_src[i]->f;
rvp[i] = &rfhp->vp;
@@ -924,7 +935,8 @@ static int vk_hevc_end_frame(AVCodecContext *avctx)
av_log(avctx, AV_LOG_VERBOSE, "Decoding frame, %"SIZE_SPECIFIER" bytes, %i slices\n",
vp->slices_size, hp->h265_pic_info.sliceSegmentCount);
- return ff_vk_decode_frame(avctx, pic->f, vp, rav, rvp);
+ return ff_vk_decode_frame(avctx, &hp->decode_info,
+ pic->f, vp, rav, rvp);
}
static void vk_hevc_free_frame_priv(AVRefStructOpaque _hwctx, void *data)
--
2.49.0
_______________________________________________
ffmpeg-devel mailing list
ffmpeg-devel@ffmpeg.org
https://ffmpeg.org/mailman/listinfo/ffmpeg-devel
To unsubscribe, visit link above, or email
ffmpeg-devel-request@ffmpeg.org with subject "unsubscribe".
^ permalink raw reply [flat|nested] 6+ messages in thread
* [FFmpeg-devel] [PATCH 4/6] vulkan_decode: add a generic start_frame function
2025-03-31 2:37 [FFmpeg-devel] [PATCH 1/6] vulkan_decode: generalize handling of slice offsets/nb Lynne
2025-03-31 2:37 ` [FFmpeg-devel] [PATCH 2/6] vulkan_decode: only create sequence params in end_frame Lynne
2025-03-31 2:37 ` [FFmpeg-devel] [PATCH 3/6] vulkan_decode: move temporary Vulkan structs into each codec Lynne
@ 2025-03-31 2:37 ` Lynne
2025-03-31 2:37 ` [FFmpeg-devel] [PATCH 5/6] vulkan_h264: make all temporary structs temporary Lynne
2025-03-31 2:37 ` [FFmpeg-devel] [PATCH 6/6] vulkan_hevc: " Lynne
4 siblings, 0 replies; 6+ messages in thread
From: Lynne @ 2025-03-31 2:37 UTC (permalink / raw)
To: ffmpeg-devel; +Cc: Lynne
---
libavcodec/vulkan_decode.c | 38 ++++++++++++++++++++++++++++++++++----
libavcodec/vulkan_decode.h | 6 ++++++
2 files changed, 40 insertions(+), 4 deletions(-)
diff --git a/libavcodec/vulkan_decode.c b/libavcodec/vulkan_decode.c
index 058efe3037..893f8fca3d 100644
--- a/libavcodec/vulkan_decode.c
+++ b/libavcodec/vulkan_decode.c
@@ -151,8 +151,6 @@ int ff_vk_decode_prepare_frame(FFVulkanDecodeContext *dec, AVFrame *pic,
int err;
FFVulkanDecodeShared *ctx = dec->shared_ctx;
- vkpic->slices_size = 0;
-
/* If the decoder made a blank frame to make up for a missing ref, or the
* frame is the current frame so it's missing one, create a re-representation */
if (vkpic->view.ref[0])
@@ -209,8 +207,6 @@ int ff_vk_decode_prepare_frame_sdr(FFVulkanDecodeContext *dec, AVFrame *pic,
FFVulkanDecodeShared *ctx = dec->shared_ctx;
AVHWFramesContext *frames = (AVHWFramesContext *)pic->hw_frames_ctx->data;
- vkpic->slices_size = 0;
-
if (vkpic->view.ref[0])
return 0;
@@ -248,6 +244,31 @@ int ff_vk_decode_prepare_frame_sdr(FFVulkanDecodeContext *dec, AVFrame *pic,
return 0;
}
+int ff_vk_decode_start_frame(AVCodecContext *avctx, FFVulkanDecodePicture *vp,
+ const AVBufferRef *buffer_ref, int complete)
+{
+ int err;
+ FFVulkanDecodeContext *dec = avctx->internal->hwaccel_priv_data;
+ FFVulkanDecodeShared *ctx = dec->shared_ctx;
+
+ vp->nb_slices = 0;
+ vp->slices_size = 0;
+
+ /* Host map the input slices data if supported */
+ if (complete && ctx->s.extensions & FF_VK_EXT_EXTERNAL_HOST_MEMORY) {
+ err = ff_vk_host_map_buffer(&ctx->s, &vp->slices_buf, buffer_ref->data,
+ buffer_ref,
+ DECODER_IS_SDR(avctx->codec_id) ?
+ (VK_BUFFER_USAGE_STORAGE_BUFFER_BIT |
+ VK_BUFFER_USAGE_SHADER_DEVICE_ADDRESS_BIT) :
+ VK_BUFFER_USAGE_VIDEO_DECODE_SRC_BIT_KHR);
+ if (err < 0)
+ return err;
+ }
+
+ return 0;
+}
+
int ff_vk_decode_add_slice(AVCodecContext *avctx, FFVulkanDecodePicture *vp,
const uint8_t *data, size_t size, int add_startcode)
{
@@ -268,6 +289,15 @@ int ff_vk_decode_add_slice(AVCodecContext *avctx, FFVulkanDecodePicture *vp,
return AVERROR(EINVAL);
vkbuf = vp->slices_buf ? (FFVkBuffer *)vp->slices_buf->data : NULL;
+
+ /* Buffer exists, and is a single complete host-mapped buffer. */
+ if (vkbuf && vkbuf->host_ref) {
+ vp->slice_offsets[vp->nb_slices] = vp->slices_size;
+ vp->nb_slices = vp->nb_slices + 1;
+ vp->slices_size += startcode_len + size;
+ return 0;
+ }
+
if (!vkbuf || vkbuf->size < new_size) {
int err;
AVBufferRef *new_ref;
diff --git a/libavcodec/vulkan_decode.h b/libavcodec/vulkan_decode.h
index 6c3e1486b0..103be09943 100644
--- a/libavcodec/vulkan_decode.h
+++ b/libavcodec/vulkan_decode.h
@@ -145,6 +145,12 @@ int ff_vk_decode_prepare_frame_sdr(FFVulkanDecodeContext *dec, AVFrame *pic,
FFVulkanDecodePicture *vkpic, int is_current,
enum FFVkShaderRepFormat rep_fmt, int alloc_dpb);
+/**
+ * Generic start_frame function.
+ */
+int ff_vk_decode_start_frame(AVCodecContext *avctx, FFVulkanDecodePicture *vp,
+ const AVBufferRef *buffer_ref, int complete);
+
/**
* Add slice data to frame.
*/
--
2.49.0
_______________________________________________
ffmpeg-devel mailing list
ffmpeg-devel@ffmpeg.org
https://ffmpeg.org/mailman/listinfo/ffmpeg-devel
To unsubscribe, visit link above, or email
ffmpeg-devel-request@ffmpeg.org with subject "unsubscribe".
^ permalink raw reply [flat|nested] 6+ messages in thread
* [FFmpeg-devel] [PATCH 5/6] vulkan_h264: make all temporary structs temporary
2025-03-31 2:37 [FFmpeg-devel] [PATCH 1/6] vulkan_decode: generalize handling of slice offsets/nb Lynne
` (2 preceding siblings ...)
2025-03-31 2:37 ` [FFmpeg-devel] [PATCH 4/6] vulkan_decode: add a generic start_frame function Lynne
@ 2025-03-31 2:37 ` Lynne
2025-03-31 2:37 ` [FFmpeg-devel] [PATCH 6/6] vulkan_hevc: " Lynne
4 siblings, 0 replies; 6+ messages in thread
From: Lynne @ 2025-03-31 2:37 UTC (permalink / raw)
To: ffmpeg-devel; +Cc: Lynne
This commit moves all temporary structs used for decoding out
of the common picture header and onto stack.
---
libavcodec/vulkan_decode.c | 1 +
libavcodec/vulkan_decode.h | 3 +
libavcodec/vulkan_h264.c | 322 +++++++++++++++++++------------------
3 files changed, 168 insertions(+), 158 deletions(-)
diff --git a/libavcodec/vulkan_decode.c b/libavcodec/vulkan_decode.c
index 893f8fca3d..5505fbda28 100644
--- a/libavcodec/vulkan_decode.c
+++ b/libavcodec/vulkan_decode.c
@@ -253,6 +253,7 @@ int ff_vk_decode_start_frame(AVCodecContext *avctx, FFVulkanDecodePicture *vp,
vp->nb_slices = 0;
vp->slices_size = 0;
+ vp->intra_pic_flag = 1;
/* Host map the input slices data if supported */
if (complete && ctx->s.extensions & FF_VK_EXT_EXTERNAL_HOST_MEMORY) {
diff --git a/libavcodec/vulkan_decode.h b/libavcodec/vulkan_decode.h
index 103be09943..5b14d962f2 100644
--- a/libavcodec/vulkan_decode.h
+++ b/libavcodec/vulkan_decode.h
@@ -105,6 +105,9 @@ typedef struct FFVulkanDecodePicture {
/* Vulkan functions needed for destruction, as no other context is guaranteed to exist */
PFN_vkWaitSemaphores wait_semaphores;
PFN_vkDestroyImageView destroy_image_view;
+
+ /* Codec specific */
+ int intra_pic_flag; /* Only used by H264 */
} FFVulkanDecodePicture;
/**
diff --git a/libavcodec/vulkan_h264.c b/libavcodec/vulkan_h264.c
index 71a9c06801..e697583ba9 100644
--- a/libavcodec/vulkan_h264.c
+++ b/libavcodec/vulkan_h264.c
@@ -32,99 +32,8 @@ const FFVulkanDecodeDescriptor ff_vk_dec_h264_desc = {
},
};
-typedef struct H264VulkanDecodePicture {
- FFVulkanDecodePicture vp;
-
- /* Current picture */
- StdVideoDecodeH264ReferenceInfo h264_ref;
- VkVideoDecodeH264DpbSlotInfoKHR vkh264_ref;
-
- /* Picture refs */
- H264Picture *ref_src [H264_MAX_PICTURE_COUNT];
- StdVideoDecodeH264ReferenceInfo h264_refs [H264_MAX_PICTURE_COUNT];
- VkVideoDecodeH264DpbSlotInfoKHR vkh264_refs[H264_MAX_PICTURE_COUNT];
-
- /* Current picture (contd.) */
- StdVideoDecodeH264PictureInfo h264pic;
- VkVideoDecodeH264PictureInfoKHR h264_pic_info;
-
- /* Current picture */
- VkVideoPictureResourceInfoKHR ref;
- VkVideoReferenceSlotInfoKHR ref_slot;
-
- /* Picture refs. H264 has the maximum number of refs (36) of any supported codec. */
- VkVideoPictureResourceInfoKHR refs [36];
- VkVideoReferenceSlotInfoKHR ref_slots[36];
-
- /* Main decoding struct */
- VkVideoDecodeInfoKHR decode_info;
-} H264VulkanDecodePicture;
-
const static int h264_scaling_list8_order[] = { 0, 3, 1, 4, 2, 5 };
-static int vk_h264_fill_pict(AVCodecContext *avctx, H264Picture **ref_src,
- VkVideoReferenceSlotInfoKHR *ref_slot, /* Main structure */
- VkVideoPictureResourceInfoKHR *ref, /* Goes in ^ */
- VkVideoDecodeH264DpbSlotInfoKHR *vkh264_ref, /* Goes in ^ */
- StdVideoDecodeH264ReferenceInfo *h264_ref, /* Goes in ^ */
- H264Picture *pic, int is_current,
- int is_field, int picture_structure,
- int dpb_slot_index)
-{
- FFVulkanDecodeContext *dec = avctx->internal->hwaccel_priv_data;
- FFVulkanDecodeShared *ctx = dec->shared_ctx;
- H264VulkanDecodePicture *hp = pic->hwaccel_picture_private;
- FFVulkanDecodePicture *vkpic = &hp->vp;
-
- int err = ff_vk_decode_prepare_frame(dec, pic->f, vkpic, is_current,
- dec->dedicated_dpb);
- if (err < 0)
- return err;
-
- *h264_ref = (StdVideoDecodeH264ReferenceInfo) {
- .FrameNum = pic->long_ref ? pic->pic_id : pic->frame_num,
- .PicOrderCnt = { pic->field_poc[0], pic->field_poc[1] },
- .flags = (StdVideoDecodeH264ReferenceInfoFlags) {
- .top_field_flag = is_field ? !!(picture_structure & PICT_TOP_FIELD) : 0,
- .bottom_field_flag = is_field ? !!(picture_structure & PICT_BOTTOM_FIELD) : 0,
- .used_for_long_term_reference = pic->reference && pic->long_ref,
- /*
- * flags.is_non_existing is used to indicate whether the picture is marked as
- * “non-existing” as defined in section 8.2.5.2 of the ITU-T H.264 Specification;
- * 8.2.5.2 Decoding process for gaps in frame_num
- * corresponds to the code in h264_slice.c:h264_field_start,
- * which sets the invalid_gap flag when decoding.
- */
- .is_non_existing = pic->invalid_gap,
- },
- };
-
- *vkh264_ref = (VkVideoDecodeH264DpbSlotInfoKHR) {
- .sType = VK_STRUCTURE_TYPE_VIDEO_DECODE_H264_DPB_SLOT_INFO_KHR,
- .pStdReferenceInfo = h264_ref,
- };
-
- *ref = (VkVideoPictureResourceInfoKHR) {
- .sType = VK_STRUCTURE_TYPE_VIDEO_PICTURE_RESOURCE_INFO_KHR,
- .codedOffset = (VkOffset2D){ 0, 0 },
- .codedExtent = (VkExtent2D){ pic->f->width, pic->f->height },
- .baseArrayLayer = ctx->common.layered_dpb ? dpb_slot_index : 0,
- .imageViewBinding = vkpic->view.ref[0],
- };
-
- *ref_slot = (VkVideoReferenceSlotInfoKHR) {
- .sType = VK_STRUCTURE_TYPE_VIDEO_REFERENCE_SLOT_INFO_KHR,
- .pNext = vkh264_ref,
- .slotIndex = dpb_slot_index,
- .pPictureResource = ref,
- };
-
- if (ref_src)
- *ref_src = pic;
-
- return 0;
-}
-
static StdVideoH264LevelIdc convert_to_vk_level_idc(int level_idc)
{
switch (level_idc) {
@@ -369,18 +278,124 @@ static int vk_h264_create_params(AVCodecContext *avctx, AVBufferRef **buf)
return 0;
}
+static int vk_h264_fill_pict(AVCodecContext *avctx, H264Picture **ref_src,
+ VkVideoReferenceSlotInfoKHR *ref_slot, /* Main structure */
+ VkVideoPictureResourceInfoKHR *ref, /* Goes in ^ */
+ VkVideoDecodeH264DpbSlotInfoKHR *vkh264_ref, /* Goes in ^ */
+ StdVideoDecodeH264ReferenceInfo *h264_ref, /* Goes in ^ */
+ H264Picture *pic, int is_current,
+ int is_field, int picture_structure,
+ int dpb_slot_index)
+{
+ FFVulkanDecodeContext *dec = avctx->internal->hwaccel_priv_data;
+ FFVulkanDecodeShared *ctx = dec->shared_ctx;
+ FFVulkanDecodePicture *vkpic = pic->hwaccel_picture_private;
+
+ int err = ff_vk_decode_prepare_frame(dec, pic->f, vkpic, is_current,
+ dec->dedicated_dpb);
+ if (err < 0)
+ return err;
+
+ *h264_ref = (StdVideoDecodeH264ReferenceInfo) {
+ .FrameNum = pic->long_ref ? pic->pic_id : pic->frame_num,
+ .PicOrderCnt = { pic->field_poc[0], pic->field_poc[1] },
+ .flags = (StdVideoDecodeH264ReferenceInfoFlags) {
+ .top_field_flag = is_field ? !!(picture_structure & PICT_TOP_FIELD) : 0,
+ .bottom_field_flag = is_field ? !!(picture_structure & PICT_BOTTOM_FIELD) : 0,
+ .used_for_long_term_reference = pic->reference && pic->long_ref,
+ /*
+ * flags.is_non_existing is used to indicate whether the picture is marked as
+ * “non-existing” as defined in section 8.2.5.2 of the ITU-T H.264 Specification;
+ * 8.2.5.2 Decoding process for gaps in frame_num
+ * corresponds to the code in h264_slice.c:h264_field_start,
+ * which sets the invalid_gap flag when decoding.
+ */
+ .is_non_existing = pic->invalid_gap,
+ },
+ };
+
+ *vkh264_ref = (VkVideoDecodeH264DpbSlotInfoKHR) {
+ .sType = VK_STRUCTURE_TYPE_VIDEO_DECODE_H264_DPB_SLOT_INFO_KHR,
+ .pStdReferenceInfo = h264_ref,
+ };
+
+ *ref = (VkVideoPictureResourceInfoKHR) {
+ .sType = VK_STRUCTURE_TYPE_VIDEO_PICTURE_RESOURCE_INFO_KHR,
+ .codedOffset = (VkOffset2D){ 0, 0 },
+ .codedExtent = (VkExtent2D){ pic->f->width, pic->f->height },
+ .baseArrayLayer = ctx->common.layered_dpb ? dpb_slot_index : 0,
+ .imageViewBinding = vkpic->view.ref[0],
+ };
+
+ *ref_slot = (VkVideoReferenceSlotInfoKHR) {
+ .sType = VK_STRUCTURE_TYPE_VIDEO_REFERENCE_SLOT_INFO_KHR,
+ .pNext = vkh264_ref,
+ .slotIndex = dpb_slot_index,
+ .pPictureResource = ref,
+ };
+
+ if (ref_src)
+ *ref_src = pic;
+
+ return 0;
+}
+
static int vk_h264_start_frame(AVCodecContext *avctx,
av_unused const AVBufferRef *buffer_ref,
av_unused const uint8_t *buffer,
av_unused uint32_t size)
+{
+ const H264Context *h = avctx->priv_data;
+ H264Picture *pic = h->cur_pic_ptr;
+ FFVulkanDecodePicture *vp = pic->hwaccel_picture_private;
+
+ return ff_vk_decode_start_frame(avctx, vp, buffer_ref, 0);
+}
+
+typedef struct H264VulkanDecodeParams {
+ /* Current picture */
+ StdVideoDecodeH264ReferenceInfo h264_ref;
+ VkVideoDecodeH264DpbSlotInfoKHR vkh264_ref;
+
+ /* Picture refs */
+ H264Picture *ref_src [H264_MAX_PICTURE_COUNT];
+ StdVideoDecodeH264ReferenceInfo h264_refs [H264_MAX_PICTURE_COUNT];
+ VkVideoDecodeH264DpbSlotInfoKHR vkh264_refs[H264_MAX_PICTURE_COUNT];
+
+ /* Current picture (contd.) */
+ StdVideoDecodeH264PictureInfo h264pic;
+ VkVideoDecodeH264PictureInfoKHR h264_pic_info;
+
+ /* Current picture */
+ VkVideoPictureResourceInfoKHR ref;
+ VkVideoReferenceSlotInfoKHR ref_slot;
+
+ /* Picture refs. H264 has the maximum number of refs (36) of any supported codec. */
+ VkVideoPictureResourceInfoKHR refs [36];
+ VkVideoReferenceSlotInfoKHR ref_slots[36];
+
+ /* Maintenance 2 */
+#ifdef VK_KHR_video_maintenance2
+ StdVideoH264ScalingLists vksps_scaling;
+ StdVideoH264HrdParameters vksps_vui_header;
+ StdVideoH264SequenceParameterSetVui vksps_vui;
+ StdVideoH264SequenceParameterSet vksps;
+ StdVideoH264ScalingLists vkpps_scaling;
+ StdVideoH264PictureParameterSet vkpps;
+ VkVideoDecodeH264InlineSessionParametersInfoKHR h264_params;
+#endif
+
+ /* Main decoding struct */
+ VkVideoDecodeInfoKHR decode_info;
+} H264VulkanDecodeParams;
+
+static int vk_h264_fill_params(AVCodecContext *avctx, FFVulkanDecodePicture *vp,
+ H264VulkanDecodeParams *hp)
{
int err;
int dpb_slot_index = 0;
H264Context *h = avctx->priv_data;
-
H264Picture *pic = h->cur_pic_ptr;
- H264VulkanDecodePicture *hp = pic->hwaccel_picture_private;
- FFVulkanDecodePicture *vp = &hp->vp;
/* Fill in main slot */
dpb_slot_index = 0;
@@ -445,13 +460,13 @@ static int vk_h264_start_frame(AVCodecContext *avctx,
hp->h264pic = (StdVideoDecodeH264PictureInfo) {
.seq_parameter_set_id = pic->pps->sps_id,
.pic_parameter_set_id = pic->pps->pps_id,
- .frame_num = 0, /* Set later */
- .idr_pic_id = 0, /* Set later */
+ .frame_num = h->slice_ctx[0].frame_num,
+ .idr_pic_id = h->slice_ctx[0].idr_pic_id,
.PicOrderCnt[0] = pic->field_poc[0],
.PicOrderCnt[1] = pic->field_poc[1],
.flags = (StdVideoDecodeH264PictureInfoFlags) {
+ .is_intra = vp->intra_pic_flag,
.field_pic_flag = FIELD_PICTURE(h),
- .is_intra = 1, /* Set later */
.IdrPicFlag = h->picture_idr,
.bottom_field_flag = h->picture_structure != PICT_FRAME &&
h->picture_structure & PICT_BOTTOM_FIELD,
@@ -463,6 +478,8 @@ static int vk_h264_start_frame(AVCodecContext *avctx,
hp->h264_pic_info = (VkVideoDecodeH264PictureInfoKHR) {
.sType = VK_STRUCTURE_TYPE_VIDEO_DECODE_H264_PICTURE_INFO_KHR,
.pStdPictureInfo = &hp->h264pic,
+ .pSliceOffsets = vp->slice_offsets,
+ .sliceCount = vp->nb_slices,
};
hp->decode_info = (VkVideoDecodeInfoKHR) {
@@ -484,100 +501,89 @@ static int vk_h264_start_frame(AVCodecContext *avctx,
return 0;
}
-static int vk_h264_decode_slice(AVCodecContext *avctx,
- const uint8_t *data,
- uint32_t size)
-{
- const H264Context *h = avctx->priv_data;
- const H264SliceContext *sl = &h->slice_ctx[0];
- H264VulkanDecodePicture *hp = h->cur_pic_ptr->hwaccel_picture_private;
- FFVulkanDecodePicture *vp = &hp->vp;
-
- int err = ff_vk_decode_add_slice(avctx, vp, data, size, 1);
- if (err < 0)
- return err;
-
- hp->h264pic.frame_num = sl->frame_num;
- hp->h264pic.idr_pic_id = sl->idr_pic_id;
-
- /* Frame is only intra of all slices are marked as intra */
- if (sl->slice_type != AV_PICTURE_TYPE_I && sl->slice_type != AV_PICTURE_TYPE_SI)
- hp->h264pic.flags.is_intra = 0;
-
- return 0;
-}
-
static int vk_h264_end_frame(AVCodecContext *avctx)
{
+ int err;
const H264Context *h = avctx->priv_data;
FFVulkanDecodeContext *dec = avctx->internal->hwaccel_priv_data;
FFVulkanDecodeShared *ctx = dec->shared_ctx;
H264Picture *pic = h->cur_pic_ptr;
- H264VulkanDecodePicture *hp = pic->hwaccel_picture_private;
- FFVulkanDecodePicture *vp = &hp->vp;
+ FFVulkanDecodePicture *vp = pic->hwaccel_picture_private;
FFVulkanDecodePicture *rvp[H264_MAX_PICTURE_COUNT] = { 0 };
AVFrame *rav[H264_MAX_PICTURE_COUNT] = { 0 };
-#ifdef VK_KHR_video_maintenance2
- StdVideoH264ScalingLists vksps_scaling;
- StdVideoH264HrdParameters vksps_vui_header;
- StdVideoH264SequenceParameterSetVui vksps_vui;
- StdVideoH264SequenceParameterSet vksps;
- StdVideoH264ScalingLists vkpps_scaling;
- StdVideoH264PictureParameterSet vkpps;
- VkVideoDecodeH264InlineSessionParametersInfoKHR h264_params;
+ H264VulkanDecodeParams hp = { 0 };
+
+ if (!vp->nb_slices)
+ return 0;
+
+ err = vk_h264_fill_params(avctx, vp, &hp);
+ if (err < 0)
+ return err;
+#ifdef VK_KHR_video_maintenance2
if (ctx->s.extensions & FF_VK_EXT_VIDEO_MAINTENANCE_2) {
- set_sps(h->ps.sps, &vksps_scaling,
- &vksps_vui_header, &vksps_vui, &vksps);
- set_pps(h->ps.pps, h->ps.sps, &vkpps_scaling, &vkpps);
- h264_params = (VkVideoDecodeH264InlineSessionParametersInfoKHR) {
+ set_sps(h->ps.sps, &hp.vksps_scaling,
+ &hp.vksps_vui_header, &hp.vksps_vui, &hp.vksps);
+ set_pps(h->ps.pps, h->ps.sps, &hp.vkpps_scaling, &hp.vkpps);
+ hp.h264_params = (VkVideoDecodeH264InlineSessionParametersInfoKHR) {
.sType = VK_STRUCTURE_TYPE_VIDEO_DECODE_H264_INLINE_SESSION_PARAMETERS_INFO_KHR,
- .pStdSPS = &vksps,
- .pStdPPS = &vkpps,
+ .pStdSPS = &hp.vksps,
+ .pStdPPS = &hp.vkpps,
};
- hp->h264_pic_info.pNext = &h264_params;
- }
+ hp.h264_pic_info.pNext = &hp.h264_params;
+ } else
#endif
- hp->h264_pic_info.pSliceOffsets = vp->slice_offsets;
- hp->h264_pic_info.sliceCount = vp->nb_slices;
- if (!hp->h264_pic_info.sliceCount)
- return 0;
-
- if (!dec->session_params &&
- !(ctx->s.extensions & FF_VK_EXT_VIDEO_MAINTENANCE_2)) {
+ if (!dec->session_params) {
int err = vk_h264_create_params(avctx, &dec->session_params);
if (err < 0)
return err;
- hp->h264pic.seq_parameter_set_id = pic->pps->sps_id;
- hp->h264pic.pic_parameter_set_id = pic->pps->pps_id;
+ hp.h264pic.seq_parameter_set_id = pic->pps->sps_id;
+ hp.h264pic.pic_parameter_set_id = pic->pps->pps_id;
}
- for (int i = 0; i < hp->decode_info.referenceSlotCount; i++) {
- H264Picture *rp = hp->ref_src[i];
- H264VulkanDecodePicture *rhp = rp->hwaccel_picture_private;
-
- rvp[i] = &rhp->vp;
- rav[i] = hp->ref_src[i]->f;
+ for (int i = 0; i < hp.decode_info.referenceSlotCount; i++) {
+ H264Picture *rp = hp.ref_src[i];
+ rvp[i] = rp->hwaccel_picture_private;
+ rav[i] = hp.ref_src[i]->f;
}
av_log(avctx, AV_LOG_VERBOSE, "Decoding frame, %"SIZE_SPECIFIER" bytes, %i slices\n",
- vp->slices_size, hp->h264_pic_info.sliceCount);
+ vp->slices_size, hp.h264_pic_info.sliceCount);
- return ff_vk_decode_frame(avctx, &hp->decode_info,
+ return ff_vk_decode_frame(avctx, &hp.decode_info,
pic->f, vp, rav, rvp);
}
+static int vk_h264_decode_slice(AVCodecContext *avctx,
+ const uint8_t *data,
+ uint32_t size)
+{
+ const H264Context *h = avctx->priv_data;
+ const H264SliceContext *sl = &h->slice_ctx[0];
+ FFVulkanDecodePicture *vp = h->cur_pic_ptr->hwaccel_picture_private;
+
+ int err = ff_vk_decode_add_slice(avctx, vp, data, size, 1);
+ if (err < 0)
+ return err;
+
+ /* Frame is only intra of all slices are marked as intra */
+ if (sl->slice_type != AV_PICTURE_TYPE_I && sl->slice_type != AV_PICTURE_TYPE_SI)
+ vp->intra_pic_flag = 0;
+
+ return 0;
+}
+
static void vk_h264_free_frame_priv(AVRefStructOpaque _hwctx, void *data)
{
AVHWDeviceContext *hwctx = _hwctx.nc;
- H264VulkanDecodePicture *hp = data;
+ FFVulkanDecodePicture *vp = data;
/* Free frame resources, this also destroys the session parameters. */
- ff_vk_decode_free_frame(hwctx, &hp->vp);
+ ff_vk_decode_free_frame(hwctx, vp);
}
const FFHWAccel ff_h264_vulkan_hwaccel = {
@@ -589,7 +595,7 @@ const FFHWAccel ff_h264_vulkan_hwaccel = {
.decode_slice = &vk_h264_decode_slice,
.end_frame = &vk_h264_end_frame,
.free_frame_priv = &vk_h264_free_frame_priv,
- .frame_priv_data_size = sizeof(H264VulkanDecodePicture),
+ .frame_priv_data_size = sizeof(FFVulkanDecodePicture),
.init = &ff_vk_decode_init,
.update_thread_context = &ff_vk_update_thread_context,
.decode_params = &ff_vk_params_invalidate,
--
2.49.0
_______________________________________________
ffmpeg-devel mailing list
ffmpeg-devel@ffmpeg.org
https://ffmpeg.org/mailman/listinfo/ffmpeg-devel
To unsubscribe, visit link above, or email
ffmpeg-devel-request@ffmpeg.org with subject "unsubscribe".
^ permalink raw reply [flat|nested] 6+ messages in thread
* [FFmpeg-devel] [PATCH 6/6] vulkan_hevc: make all temporary structs temporary
2025-03-31 2:37 [FFmpeg-devel] [PATCH 1/6] vulkan_decode: generalize handling of slice offsets/nb Lynne
` (3 preceding siblings ...)
2025-03-31 2:37 ` [FFmpeg-devel] [PATCH 5/6] vulkan_h264: make all temporary structs temporary Lynne
@ 2025-03-31 2:37 ` Lynne
4 siblings, 0 replies; 6+ messages in thread
From: Lynne @ 2025-03-31 2:37 UTC (permalink / raw)
To: ffmpeg-devel; +Cc: Lynne
---
libavcodec/vulkan_hevc.c | 291 ++++++++++++++++++++-------------------
1 file changed, 150 insertions(+), 141 deletions(-)
diff --git a/libavcodec/vulkan_hevc.c b/libavcodec/vulkan_hevc.c
index e83f8346a0..baf8b0c3fd 100644
--- a/libavcodec/vulkan_hevc.c
+++ b/libavcodec/vulkan_hevc.c
@@ -112,85 +112,6 @@ static int alloc_hevc_header_structs(FFVulkanDecodeContext *s,
return 0;
}
-typedef struct HEVCVulkanDecodePicture {
- FFVulkanDecodePicture vp;
-
- /* Current picture */
- StdVideoDecodeH265ReferenceInfo h265_ref;
- VkVideoDecodeH265DpbSlotInfoKHR vkh265_ref;
-
- /* Picture refs */
- HEVCFrame *ref_src [HEVC_MAX_REFS];
- StdVideoDecodeH265ReferenceInfo h265_refs [HEVC_MAX_REFS];
- VkVideoDecodeH265DpbSlotInfoKHR vkh265_refs[HEVC_MAX_REFS];
-
- /* Current picture (contd.) */
- StdVideoDecodeH265PictureInfo h265pic;
- VkVideoDecodeH265PictureInfoKHR h265_pic_info;
-
- /* Current picture */
- VkVideoPictureResourceInfoKHR ref;
- VkVideoReferenceSlotInfoKHR ref_slot;
-
- /* Picture refs. H264 has the maximum number of refs (36) of any supported codec. */
- VkVideoPictureResourceInfoKHR refs [36];
- VkVideoReferenceSlotInfoKHR ref_slots[36];
-
- /* Main decoding struct */
- VkVideoDecodeInfoKHR decode_info;
-} HEVCVulkanDecodePicture;
-
-static int vk_hevc_fill_pict(AVCodecContext *avctx, HEVCFrame **ref_src,
- VkVideoReferenceSlotInfoKHR *ref_slot, /* Main structure */
- VkVideoPictureResourceInfoKHR *ref, /* Goes in ^ */
- VkVideoDecodeH265DpbSlotInfoKHR *vkh265_ref, /* Goes in ^ */
- StdVideoDecodeH265ReferenceInfo *h265_ref, /* Goes in ^ */
- HEVCFrame *pic, int is_current, int pic_id)
-{
- FFVulkanDecodeContext *dec = avctx->internal->hwaccel_priv_data;
- FFVulkanDecodeShared *ctx = dec->shared_ctx;
- HEVCVulkanDecodePicture *hp = pic->hwaccel_picture_private;
- FFVulkanDecodePicture *vkpic = &hp->vp;
-
- int err = ff_vk_decode_prepare_frame(dec, pic->f, vkpic, is_current,
- dec->dedicated_dpb);
- if (err < 0)
- return err;
-
- *h265_ref = (StdVideoDecodeH265ReferenceInfo) {
- .flags = (StdVideoDecodeH265ReferenceInfoFlags) {
- .used_for_long_term_reference = pic->flags & HEVC_FRAME_FLAG_LONG_REF,
- .unused_for_reference = 0,
- },
- .PicOrderCntVal = pic->poc,
- };
-
- *vkh265_ref = (VkVideoDecodeH265DpbSlotInfoKHR) {
- .sType = VK_STRUCTURE_TYPE_VIDEO_DECODE_H265_DPB_SLOT_INFO_KHR,
- .pStdReferenceInfo = h265_ref,
- };
-
- *ref = (VkVideoPictureResourceInfoKHR) {
- .sType = VK_STRUCTURE_TYPE_VIDEO_PICTURE_RESOURCE_INFO_KHR,
- .codedOffset = (VkOffset2D){ 0, 0 },
- .codedExtent = (VkExtent2D){ pic->f->width, pic->f->height },
- .baseArrayLayer = ctx->common.layered_dpb ? pic_id : 0,
- .imageViewBinding = vkpic->view.ref[0],
- };
-
- *ref_slot = (VkVideoReferenceSlotInfoKHR) {
- .sType = VK_STRUCTURE_TYPE_VIDEO_REFERENCE_SLOT_INFO_KHR,
- .pNext = vkh265_ref,
- .slotIndex = pic_id,
- .pPictureResource = ref,
- };
-
- if (ref_src)
- *ref_src = pic;
-
- return 0;
-}
-
static void copy_scaling_list(const ScalingList *sl, StdVideoH265ScalingLists *vksl)
{
for (int i = 0; i < STD_VIDEO_H265_SCALING_LIST_4X4_NUM_LISTS; i++) {
@@ -719,18 +640,114 @@ static int vk_hevc_create_params(AVCodecContext *avctx, AVBufferRef **buf)
return 0;
}
+static int vk_hevc_fill_pict(AVCodecContext *avctx, HEVCFrame **ref_src,
+ VkVideoReferenceSlotInfoKHR *ref_slot, /* Main structure */
+ VkVideoPictureResourceInfoKHR *ref, /* Goes in ^ */
+ VkVideoDecodeH265DpbSlotInfoKHR *vkh265_ref, /* Goes in ^ */
+ StdVideoDecodeH265ReferenceInfo *h265_ref, /* Goes in ^ */
+ HEVCFrame *pic, int is_current, int pic_id)
+{
+ FFVulkanDecodeContext *dec = avctx->internal->hwaccel_priv_data;
+ FFVulkanDecodeShared *ctx = dec->shared_ctx;
+ FFVulkanDecodePicture *vkpic = pic->hwaccel_picture_private;
+
+ int err = ff_vk_decode_prepare_frame(dec, pic->f, vkpic, is_current,
+ dec->dedicated_dpb);
+ if (err < 0)
+ return err;
+
+ *h265_ref = (StdVideoDecodeH265ReferenceInfo) {
+ .flags = (StdVideoDecodeH265ReferenceInfoFlags) {
+ .used_for_long_term_reference = pic->flags & HEVC_FRAME_FLAG_LONG_REF,
+ .unused_for_reference = 0,
+ },
+ .PicOrderCntVal = pic->poc,
+ };
+
+ *vkh265_ref = (VkVideoDecodeH265DpbSlotInfoKHR) {
+ .sType = VK_STRUCTURE_TYPE_VIDEO_DECODE_H265_DPB_SLOT_INFO_KHR,
+ .pStdReferenceInfo = h265_ref,
+ };
+
+ *ref = (VkVideoPictureResourceInfoKHR) {
+ .sType = VK_STRUCTURE_TYPE_VIDEO_PICTURE_RESOURCE_INFO_KHR,
+ .codedOffset = (VkOffset2D){ 0, 0 },
+ .codedExtent = (VkExtent2D){ pic->f->width, pic->f->height },
+ .baseArrayLayer = ctx->common.layered_dpb ? pic_id : 0,
+ .imageViewBinding = vkpic->view.ref[0],
+ };
+
+ *ref_slot = (VkVideoReferenceSlotInfoKHR) {
+ .sType = VK_STRUCTURE_TYPE_VIDEO_REFERENCE_SLOT_INFO_KHR,
+ .pNext = vkh265_ref,
+ .slotIndex = pic_id,
+ .pPictureResource = ref,
+ };
+
+ if (ref_src)
+ *ref_src = pic;
+
+ return 0;
+}
+
static int vk_hevc_start_frame(AVCodecContext *avctx,
av_unused const AVBufferRef *buffer_ref,
av_unused const uint8_t *buffer,
av_unused uint32_t size)
+{
+ const HEVCContext *h = avctx->priv_data;
+ HEVCFrame *pic = h->cur_frame;
+ FFVulkanDecodePicture *vp = pic->hwaccel_picture_private;
+
+ return ff_vk_decode_start_frame(avctx, vp, buffer_ref, 0);
+}
+
+typedef struct HEVCVulkanDecodeParams {
+ /* Current picture */
+ StdVideoDecodeH265ReferenceInfo h265_ref;
+ VkVideoDecodeH265DpbSlotInfoKHR vkh265_ref;
+
+ /* Picture refs */
+ HEVCFrame *ref_src [HEVC_MAX_REFS];
+ StdVideoDecodeH265ReferenceInfo h265_refs [HEVC_MAX_REFS];
+ VkVideoDecodeH265DpbSlotInfoKHR vkh265_refs[HEVC_MAX_REFS];
+
+ /* Current picture (contd.) */
+ StdVideoDecodeH265PictureInfo h265pic;
+ VkVideoDecodeH265PictureInfoKHR h265_pic_info;
+
+ /* Current picture */
+ VkVideoPictureResourceInfoKHR ref;
+ VkVideoReferenceSlotInfoKHR ref_slot;
+
+ /* Picture refs. H264 has the maximum number of refs (36) of any supported codec. */
+ VkVideoPictureResourceInfoKHR refs [36];
+ VkVideoReferenceSlotInfoKHR ref_slots[36];
+
+ /* Maintenance 2 */
+#ifdef VK_KHR_video_maintenance2
+ HEVCHeaderPPS vkpps_p;
+ StdVideoH265PictureParameterSet vkpps;
+ HEVCHeaderSPS vksps_p;
+ StdVideoH265SequenceParameterSet vksps;
+ HEVCHeaderVPSSet vkvps_ps[HEVC_MAX_SUB_LAYERS];
+ HEVCHeaderVPS vkvps_p;
+ StdVideoH265VideoParameterSet vkvps;
+ VkVideoDecodeH265InlineSessionParametersInfoKHR h265_params;
+#endif
+
+ /* Main decoding struct */
+ VkVideoDecodeInfoKHR decode_info;
+} HEVCVulkanDecodeParams;
+
+static int vk_hevc_fill_params(AVCodecContext *avctx, FFVulkanDecodePicture *vp,
+ HEVCVulkanDecodeParams *hp)
{
int err;
HEVCContext *h = avctx->priv_data;
HEVCLayerContext *l = &h->layers[h->cur_layer];
HEVCFrame *pic = h->cur_frame;
- HEVCVulkanDecodePicture *hp = pic->hwaccel_picture_private;
- FFVulkanDecodePicture *vp = &hp->vp;
const HEVCPPS *pps = h->pps;
const HEVCSPS *sps = pps->sps;
int nb_refs = 0;
@@ -814,7 +831,8 @@ static int vk_hevc_start_frame(AVCodecContext *avctx,
hp->h265_pic_info = (VkVideoDecodeH265PictureInfoKHR) {
.sType = VK_STRUCTURE_TYPE_VIDEO_DECODE_H265_PICTURE_INFO_KHR,
.pStdPictureInfo = &hp->h265pic,
- .sliceSegmentCount = 0,
+ .pSliceSegmentOffsets = vp->slice_offsets,
+ .sliceSegmentCount = vp->nb_slices,
};
hp->decode_info = (VkVideoDecodeInfoKHR) {
@@ -836,21 +854,6 @@ static int vk_hevc_start_frame(AVCodecContext *avctx,
return 0;
}
-static int vk_hevc_decode_slice(AVCodecContext *avctx,
- const uint8_t *data,
- uint32_t size)
-{
- const HEVCContext *h = avctx->priv_data;
- HEVCVulkanDecodePicture *hp = h->cur_frame->hwaccel_picture_private;
- FFVulkanDecodePicture *vp = &hp->vp;
-
- int err = ff_vk_decode_add_slice(avctx, vp, data, size, 1);
- if (err < 0)
- return err;
-
- return 0;
-}
-
static int vk_hevc_end_frame(AVCodecContext *avctx)
{
const HEVCContext *h = avctx->priv_data;
@@ -858,53 +861,46 @@ static int vk_hevc_end_frame(AVCodecContext *avctx)
FFVulkanDecodeShared *ctx = dec->shared_ctx;
HEVCFrame *pic = h->cur_frame;
- HEVCVulkanDecodePicture *hp = pic->hwaccel_picture_private;
- FFVulkanDecodePicture *vp = &hp->vp;
+ FFVulkanDecodePicture *vp = pic->hwaccel_picture_private;
FFVulkanDecodePicture *rvp[HEVC_MAX_REFS] = { 0 };
AVFrame *rav[HEVC_MAX_REFS] = { 0 };
int err;
+ HEVCVulkanDecodeParams hp = { 0 };
+
const HEVCPPS *pps = h->pps;
const HEVCSPS *sps = pps->sps;
-#ifdef VK_KHR_video_maintenance2
- HEVCHeaderPPS vkpps_p;
- StdVideoH265PictureParameterSet vkpps;
- HEVCHeaderSPS vksps_p;
- StdVideoH265SequenceParameterSet vksps;
- HEVCHeaderVPSSet vkvps_ps[HEVC_MAX_SUB_LAYERS];
- HEVCHeaderVPS vkvps_p;
- StdVideoH265VideoParameterSet vkvps;
- VkVideoDecodeH265InlineSessionParametersInfoKHR h265_params;
+ if (!vp->nb_slices)
+ return 0;
+ err = vk_hevc_fill_params(avctx, vp, &hp);
+ if (err < 0)
+ return err;
+
+#ifdef VK_KHR_video_maintenance2
if (ctx->s.extensions & FF_VK_EXT_VIDEO_MAINTENANCE_2) {
- set_pps(pps, sps, &vkpps_p.scaling, &vkpps, &vkpps_p.pal);
- set_sps(sps, pps->sps_id, &vksps_p.scaling, &vksps_p.vui_header,
- &vksps_p.vui, &vksps, vksps_p.nal_hdr,
- vksps_p.vcl_hdr, &vksps_p.ptl, &vksps_p.dpbm,
- &vksps_p.pal, vksps_p.str, &vksps_p.ltr);
+ set_pps(pps, sps, &hp.vkpps_p.scaling, &hp.vkpps, &hp.vkpps_p.pal);
+ set_sps(sps, pps->sps_id, &hp.vksps_p.scaling, &hp.vksps_p.vui_header,
+ &hp.vksps_p.vui, &hp.vksps, hp.vksps_p.nal_hdr,
+ hp.vksps_p.vcl_hdr, &hp.vksps_p.ptl, &hp.vksps_p.dpbm,
+ &hp.vksps_p.pal, hp.vksps_p.str, &hp.vksps_p.ltr);
- vkvps_p.sls = vkvps_ps;
- set_vps(sps->vps, &vkvps, &vkvps_p.ptl, &vkvps_p.dpbm,
- vkvps_p.hdr, vkvps_p.sls);
+ hp.vkvps_p.sls = hp.vkvps_ps;
+ set_vps(sps->vps, &hp.vkvps, &hp.vkvps_p.ptl, &hp.vkvps_p.dpbm,
+ hp.vkvps_p.hdr, hp.vkvps_p.sls);
- h265_params = (VkVideoDecodeH265InlineSessionParametersInfoKHR) {
+ hp.h265_params = (VkVideoDecodeH265InlineSessionParametersInfoKHR) {
.sType = VK_STRUCTURE_TYPE_VIDEO_DECODE_H265_INLINE_SESSION_PARAMETERS_INFO_KHR,
- .pStdSPS = &vksps,
- .pStdPPS = &vkpps,
- .pStdVPS = &vkvps,
+ .pStdSPS = &hp.vksps,
+ .pStdPPS = &hp.vkpps,
+ .pStdVPS = &hp.vkvps,
};
- hp->h265_pic_info.pNext = &h265_params;
- }
+ hp.h265_pic_info.pNext = &hp.h265_params;
+ } else
#endif
- hp->h265_pic_info.pSliceSegmentOffsets = vp->slice_offsets;
- hp->h265_pic_info.sliceSegmentCount = vp->nb_slices;
- if (!hp->h265_pic_info.sliceSegmentCount)
- return 0;
-
- if (!dec->session_params &&
- !(ctx->s.extensions & FF_VK_EXT_VIDEO_MAINTENANCE_2)) {
+ if (!dec->session_params) {
if (!pps) {
unsigned int pps_id = h->sh.pps_id;
if (pps_id < HEVC_MAX_PPS_COUNT && h->ps.pps_list[pps_id] != NULL)
@@ -921,31 +917,44 @@ static int vk_hevc_end_frame(AVCodecContext *avctx)
if (err < 0)
return err;
- hp->h265pic.sps_video_parameter_set_id = sps->vps_id;
- hp->h265pic.pps_seq_parameter_set_id = pps->sps_id;
- hp->h265pic.pps_pic_parameter_set_id = pps->pps_id;
+ hp.h265pic.sps_video_parameter_set_id = sps->vps_id;
+ hp.h265pic.pps_seq_parameter_set_id = pps->sps_id;
+ hp.h265pic.pps_pic_parameter_set_id = pps->pps_id;
}
- for (int i = 0; i < hp->decode_info.referenceSlotCount; i++) {
- HEVCVulkanDecodePicture *rfhp = hp->ref_src[i]->hwaccel_picture_private;
- rav[i] = hp->ref_src[i]->f;
- rvp[i] = &rfhp->vp;
+ for (int i = 0; i < hp.decode_info.referenceSlotCount; i++) {
+ rav[i] = hp.ref_src[i]->f;
+ rvp[i] = hp.ref_src[i]->hwaccel_picture_private;
}
av_log(avctx, AV_LOG_VERBOSE, "Decoding frame, %"SIZE_SPECIFIER" bytes, %i slices\n",
- vp->slices_size, hp->h265_pic_info.sliceSegmentCount);
+ vp->slices_size, hp.h265_pic_info.sliceSegmentCount);
- return ff_vk_decode_frame(avctx, &hp->decode_info,
+ return ff_vk_decode_frame(avctx, &hp.decode_info,
pic->f, vp, rav, rvp);
}
+static int vk_hevc_decode_slice(AVCodecContext *avctx,
+ const uint8_t *data,
+ uint32_t size)
+{
+ const HEVCContext *h = avctx->priv_data;
+ FFVulkanDecodePicture *vp = h->cur_frame->hwaccel_picture_private;
+
+ int err = ff_vk_decode_add_slice(avctx, vp, data, size, 1);
+ if (err < 0)
+ return err;
+
+ return 0;
+}
+
static void vk_hevc_free_frame_priv(AVRefStructOpaque _hwctx, void *data)
{
AVHWDeviceContext *hwctx = _hwctx.nc;
- HEVCVulkanDecodePicture *hp = data;
+ FFVulkanDecodePicture *vp = data;
/* Free frame resources */
- ff_vk_decode_free_frame(hwctx, &hp->vp);
+ ff_vk_decode_free_frame(hwctx, vp);
}
const FFHWAccel ff_hevc_vulkan_hwaccel = {
@@ -957,7 +966,7 @@ const FFHWAccel ff_hevc_vulkan_hwaccel = {
.decode_slice = &vk_hevc_decode_slice,
.end_frame = &vk_hevc_end_frame,
.free_frame_priv = &vk_hevc_free_frame_priv,
- .frame_priv_data_size = sizeof(HEVCVulkanDecodePicture),
+ .frame_priv_data_size = sizeof(FFVulkanDecodePicture),
.init = &ff_vk_decode_init,
.update_thread_context = &ff_vk_update_thread_context,
.decode_params = &ff_vk_params_invalidate,
--
2.49.0
_______________________________________________
ffmpeg-devel mailing list
ffmpeg-devel@ffmpeg.org
https://ffmpeg.org/mailman/listinfo/ffmpeg-devel
To unsubscribe, visit link above, or email
ffmpeg-devel-request@ffmpeg.org with subject "unsubscribe".
^ permalink raw reply [flat|nested] 6+ messages in thread
end of thread, other threads:[~2025-03-31 2:39 UTC | newest]
Thread overview: 6+ messages (download: mbox.gz / follow: Atom feed)
-- links below jump to the message on this page --
2025-03-31 2:37 [FFmpeg-devel] [PATCH 1/6] vulkan_decode: generalize handling of slice offsets/nb Lynne
2025-03-31 2:37 ` [FFmpeg-devel] [PATCH 2/6] vulkan_decode: only create sequence params in end_frame Lynne
2025-03-31 2:37 ` [FFmpeg-devel] [PATCH 3/6] vulkan_decode: move temporary Vulkan structs into each codec Lynne
2025-03-31 2:37 ` [FFmpeg-devel] [PATCH 4/6] vulkan_decode: add a generic start_frame function Lynne
2025-03-31 2:37 ` [FFmpeg-devel] [PATCH 5/6] vulkan_h264: make all temporary structs temporary Lynne
2025-03-31 2:37 ` [FFmpeg-devel] [PATCH 6/6] vulkan_hevc: " Lynne
Git Inbox Mirror of the ffmpeg-devel mailing list - see https://ffmpeg.org/mailman/listinfo/ffmpeg-devel
This inbox may be cloned and mirrored by anyone:
git clone --mirror https://master.gitmailbox.com/ffmpegdev/0 ffmpegdev/git/0.git
# If you have public-inbox 1.1+ installed, you may
# initialize and index your mirror using the following commands:
public-inbox-init -V2 ffmpegdev ffmpegdev/ https://master.gitmailbox.com/ffmpegdev \
ffmpegdev@gitmailbox.com
public-inbox-index ffmpegdev
Example config snippet for mirrors.
AGPL code for this site: git clone https://public-inbox.org/public-inbox.git