From: Lynne <dev@lynne.ee>
To: FFmpeg development discussions and patches <ffmpeg-devel@ffmpeg.org>
Subject: Re: [FFmpeg-devel] [PATCH 55/97] Vulkan patchset part 2 - hwcontext rewrite and filtering
Date: Thu, 11 May 2023 20:55:40 +0200 (CEST)
Message-ID: <NVB9nuj--B-9@lynne.ee> (raw)
In-Reply-To: <168382101862.3843.5076464633158031795@lain.khirnov.net>
May 11, 2023, 18:04 by anton@khirnov.net:
> Quoting Lynne (2023-04-24 17:56:38)
>
>> From b0c429d0d77d1789b6349bc6b296449ae1f8e9da Mon Sep 17 00:00:00 2001
>> From: Lynne <dev@lynne.ee>
>> Date: Tue, 15 Mar 2022 23:00:32 +0100
>> Subject: [PATCH 26/97] hwcontext_vulkan: support threadsafe queue and frame
>> operations
>>
>> ---
>> libavutil/hwcontext_vulkan.c | 176 +++++++++++++++++++++++++----------
>> libavutil/hwcontext_vulkan.h | 40 +++++++-
>> 2 files changed, 167 insertions(+), 49 deletions(-)
>>
>> diff --git a/libavutil/hwcontext_vulkan.c b/libavutil/hwcontext_vulkan.c
>> index 894b4b83f3..b0db59b2d8 100644
>> --- a/libavutil/hwcontext_vulkan.c
>> +++ b/libavutil/hwcontext_vulkan.c
>> @@ -27,6 +27,7 @@
>> #include <dlfcn.h>
>> #endif
>>
>> +#include <pthread.h>
>> #include <unistd.h>
>>
>> #include "config.h"
>> @@ -92,8 +93,10 @@ typedef struct VulkanDevicePriv {
>> VkPhysicalDeviceVulkan13Features device_features_1_3;
>>
>> /* Queues */
>> - uint32_t qfs[5];
>> - int num_qfs;
>> + pthread_mutex_t **qf_mutex;
>> + int nb_tot_qfs;
>> + uint32_t img_qfs[5];
>> + int nb_img_qfs;
>>
>
> This patch would be so much more readable without random renamings.
>
They're not random, the meaning of each variable is different
to what they meant before.
nb_img_qfs is the total number of enabled queue families.
nb_tot_qfs is the total number of queue families listed by the driver.
>> /* Debug callback */
>> VkDebugUtilsMessengerEXT debug_ctx;
>> @@ -127,6 +130,8 @@ typedef struct VulkanFramesPriv {
>> } VulkanFramesPriv;
>>
>> typedef struct AVVkFrameInternal {
>> + pthread_mutex_t update_mutex;
>>
>
> As far as I can see, none of the mutices you're adding here are
> ever destroyed.
>
Fixed.
>> +
>> #if CONFIG_CUDA
>> /* Importing external memory into cuda is really expensive so we keep the
>> * memory imported all the time */
>> @@ -1304,6 +1309,10 @@ static void vulkan_device_free(AVHWDeviceContext *ctx)
>> if (p->libvulkan)
>> dlclose(p->libvulkan);
>>
>> + for (int i = 0; i < p->nb_tot_qfs; i++)
>> + av_freep(&p->qf_mutex[i]);
>> + av_freep(&p->qf_mutex);
>> +
>> RELEASE_PROPS(hwctx->enabled_inst_extensions, hwctx->nb_enabled_inst_extensions);
>> RELEASE_PROPS(hwctx->enabled_dev_extensions, hwctx->nb_enabled_dev_extensions);
>> }
>> @@ -1436,13 +1445,26 @@ end:
>> return err;
>> }
>>
>> +static void lock_queue(AVHWDeviceContext *ctx, int queue_family, int index)
>>
>
> It'd be nice to be consistent with types.
> These are uint32 in vulkan, no?
>
Fixed. Though, they're more closely related to the
number of queue families given in the hwcontext, which
are 32-bit ints.
>> +{
>> + VulkanDevicePriv *p = ctx->internal->priv;
>> + pthread_mutex_lock(&p->qf_mutex[queue_family][index]);
>> +}
>> +
>> +static void unlock_queue(AVHWDeviceContext *ctx, int queue_family, int index)
>> +{
>> + VulkanDevicePriv *p = ctx->internal->priv;
>> + pthread_mutex_unlock(&p->qf_mutex[queue_family][index]);
>> +}
>> +
>> static int vulkan_device_init(AVHWDeviceContext *ctx)
>> {
>> int err;
>> - uint32_t queue_num;
>> + uint32_t qf_num;
>> AVVulkanDeviceContext *hwctx = ctx->hwctx;
>> VulkanDevicePriv *p = ctx->internal->priv;
>> FFVulkanFunctions *vk = &p->vkfn;
>> + VkQueueFamilyProperties *qf;
>> int graph_index, comp_index, tx_index, enc_index, dec_index;
>>
>> /* Set device extension flags */
>> @@ -1481,12 +1503,31 @@ static int vulkan_device_init(AVHWDeviceContext *ctx)
>> p->dev_is_nvidia = (p->props.properties.vendorID == 0x10de);
>> p->dev_is_intel = (p->props.properties.vendorID == 0x8086);
>>
>> - vk->GetPhysicalDeviceQueueFamilyProperties(hwctx->phys_dev, &queue_num, NULL);
>> - if (!queue_num) {
>> + vk->GetPhysicalDeviceQueueFamilyProperties(hwctx->phys_dev, &qf_num, NULL);
>> + if (!qf_num) {
>> av_log(ctx, AV_LOG_ERROR, "Failed to get queues!\n");
>> return AVERROR_EXTERNAL;
>> }
>>
>> + qf = av_malloc_array(qf_num, sizeof(VkQueueFamilyProperties));
>> + if (!qf)
>> + return AVERROR(ENOMEM);
>> +
>> + vk->GetPhysicalDeviceQueueFamilyProperties(hwctx->phys_dev, &qf_num, qf);
>> +
>> + p->qf_mutex = av_mallocz(qf_num*sizeof(*p->qf_mutex));
>>
>
> av_calloc()
>
>> + if (!p->qf_mutex)
>> + return AVERROR(ENOMEM);
>> + p->nb_tot_qfs = qf_num;
>> +
>> + for (int i = 0; i < qf_num; i++) {
>> + p->qf_mutex[i] = av_mallocz(qf[i].queueCount*sizeof(**p->qf_mutex));
>>
>
> av_calloc()
>
>> + if (!p->qf_mutex[i])
>> + return AVERROR(ENOMEM);
>> + for (int j = 0; j < qf[i].queueCount; j++)
>> + pthread_mutex_init(&p->qf_mutex[i][j], NULL);
>>
>
> Should be checked.
>
Fixed all three.
>> + }
>> +
>> graph_index = hwctx->queue_family_index;
>> comp_index = hwctx->queue_family_comp_index;
>> tx_index = hwctx->queue_family_tx_index;
>> @@ -1501,9 +1542,9 @@ static int vulkan_device_init(AVHWDeviceContext *ctx)
>> return AVERROR(EINVAL); \
>> } else if (fidx < 0 || ctx_qf < 0) { \
>> break; \
>> - } else if (ctx_qf >= queue_num) { \
>> + } else if (ctx_qf >= qf_num) { \
>> av_log(ctx, AV_LOG_ERROR, "Invalid %s family index %i (device has %i families)!\n", \
>> - type, ctx_qf, queue_num); \
>> + type, ctx_qf, qf_num); \
>> return AVERROR(EINVAL); \
>> } \
>> \
>> @@ -1520,7 +1561,7 @@ static int vulkan_device_init(AVHWDeviceContext *ctx)
>> tx_index = (ctx_qf == tx_index) ? -1 : tx_index; \
>> enc_index = (ctx_qf == enc_index) ? -1 : enc_index; \
>> dec_index = (ctx_qf == dec_index) ? -1 : dec_index; \
>> - p->qfs[p->num_qfs++] = ctx_qf; \
>> + p->img_qfs[p->nb_img_qfs++] = ctx_qf; \
>> } while (0)
>>
>> CHECK_QUEUE("graphics", 0, graph_index, hwctx->queue_family_index, hwctx->nb_graphics_queues);
>> @@ -1531,6 +1572,11 @@ static int vulkan_device_init(AVHWDeviceContext *ctx)
>>
>> #undef CHECK_QUEUE
>>
>> + if (!hwctx->lock_queue)
>> + hwctx->lock_queue = lock_queue;
>> + if (!hwctx->unlock_queue)
>> + hwctx->unlock_queue = unlock_queue;
>> +
>> /* Get device capabilities */
>> vk->GetPhysicalDeviceMemoryProperties(hwctx->phys_dev, &p->mprops);
>>
>> @@ -1732,9 +1778,6 @@ static void vulkan_free_internal(AVVkFrame *f)
>> {
>> AVVkFrameInternal *internal = f->internal;
>>
>> - if (!internal)
>> - return;
>> -
>> #if CONFIG_CUDA
>> if (internal->cuda_fc_ref) {
>> AVHWFramesContext *cuda_fc = (AVHWFramesContext *)internal->cuda_fc_ref->data;
>> @@ -1923,9 +1966,11 @@ static int prepare_frame(AVHWFramesContext *hwfc, VulkanExecCtx *ectx,
>> uint32_t src_qf, dst_qf;
>> VkImageLayout new_layout;
>> VkAccessFlags new_access;
>> + AVVulkanFramesContext *vkfc = hwfc->hwctx;
>> const int planes = av_pix_fmt_count_planes(hwfc->sw_format);
>> VulkanDevicePriv *p = hwfc->device_ctx->internal->priv;
>> FFVulkanFunctions *vk = &p->vkfn;
>> + AVFrame tmp = { .data[0] = (uint8_t *)frame };
>>
>
> ???
>
This enables us to use the common dependency/dispatch code.
The prepare_frame function is used for both frame initialization
and frame import/export queue family transfer operations.
In the former case, no AVFrame exists yet, so, as this is purely
libavutil code, we create a temporary frame on stack. Otherwise,
we'd need to allocate multiple frames somewhere, one for each
possible command buffer dispatch.
Comment added to commit message.
_______________________________________________
ffmpeg-devel mailing list
ffmpeg-devel@ffmpeg.org
https://ffmpeg.org/mailman/listinfo/ffmpeg-devel
To unsubscribe, visit link above, or email
ffmpeg-devel-request@ffmpeg.org with subject "unsubscribe".
next prev parent reply other threads:[~2023-05-11 18:55 UTC|newest]
Thread overview: 49+ messages / expand[flat|nested] mbox.gz Atom feed top
2023-04-24 15:56 Lynne
2023-04-28 13:28 ` Niklas Haas
[not found] ` <NTnyn9K--3-9@lynne.ee-NTnytIf----9>
2023-05-10 19:10 ` Lynne
2023-05-11 15:36 ` Anton Khirnov
2023-05-11 16:32 ` Lynne
2023-05-11 16:59 ` Anton Khirnov
2023-05-11 16:03 ` Anton Khirnov
2023-05-11 18:55 ` Lynne [this message]
2023-05-16 13:31 ` Anton Khirnov
2023-05-16 14:47 ` Lynne
[not found] ` <NV_0sN0--3-9@lynne.ee-NV_0vMs----9>
2023-05-22 8:26 ` Lynne
[not found] ` <NVyq4UQ--F-9@lynne.ee-NW1ZGRp----9>
2023-05-25 0:31 ` Lynne
[not found] ` <NWFJK4e--3-9@lynne.ee-NWFJONn----9>
2023-05-26 17:52 ` Lynne
2023-05-26 19:19 ` Anton Khirnov
2023-05-26 20:50 ` Lynne
2023-05-11 16:05 ` Anton Khirnov
2023-05-11 16:40 ` Lynne
2023-05-11 17:00 ` Anton Khirnov
2023-05-11 16:06 ` Anton Khirnov
2023-05-11 16:45 ` Lynne
2023-05-11 16:14 ` Anton Khirnov
2023-05-11 16:47 ` Lynne
2023-05-11 17:13 ` Anton Khirnov
2023-05-11 16:15 ` Anton Khirnov
2023-05-11 16:50 ` Lynne
2023-05-11 16:21 ` Anton Khirnov
2023-05-11 18:58 ` Lynne
2023-05-16 13:33 ` Anton Khirnov
2023-05-16 14:41 ` Lynne
2023-05-11 16:29 ` Anton Khirnov
2023-05-11 18:13 ` Lynne
2023-05-16 13:40 ` Anton Khirnov
2023-05-16 14:46 ` Lynne
2023-05-18 8:29 ` Anton Khirnov
2023-05-18 12:28 ` Lynne
2023-05-11 16:34 ` Anton Khirnov
2023-05-11 17:12 ` Lynne
2023-05-11 17:19 ` Anton Khirnov
2023-05-11 16:34 ` Anton Khirnov
2023-05-11 17:16 ` Lynne
2023-05-11 16:40 ` Anton Khirnov
2023-05-11 17:20 ` Lynne
2023-05-11 17:27 ` Anton Khirnov
2023-05-11 19:11 ` Lynne
2023-05-18 8:34 ` [FFmpeg-devel] libavcodec: add Vulkan common video code Anton Khirnov
2023-05-18 11:07 ` Lynne
2023-05-18 8:54 ` [FFmpeg-devel] libavcodec: add Vulkan common video decoding code Anton Khirnov
2023-05-18 12:27 ` Lynne
2023-05-19 12:11 ` [FFmpeg-devel] [PATCH 55/97] Vulkan patchset part 2 - hwcontext rewrite and filtering Leo Izen
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=NVB9nuj--B-9@lynne.ee \
--to=dev@lynne.ee \
--cc=ffmpeg-devel@ffmpeg.org \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Git Inbox Mirror of the ffmpeg-devel mailing list - see https://ffmpeg.org/mailman/listinfo/ffmpeg-devel
This inbox may be cloned and mirrored by anyone:
git clone --mirror https://master.gitmailbox.com/ffmpegdev/0 ffmpegdev/git/0.git
# If you have public-inbox 1.1+ installed, you may
# initialize and index your mirror using the following commands:
public-inbox-init -V2 ffmpegdev ffmpegdev/ https://master.gitmailbox.com/ffmpegdev \
ffmpegdev@gitmailbox.com
public-inbox-index ffmpegdev
Example config snippet for mirrors.
AGPL code for this site: git clone https://public-inbox.org/public-inbox.git