Go to the documentation of this file.
33 .queue_flags = VK_QUEUE_COMPUTE_BIT,
96 VK_BUFFER_USAGE_STORAGE_BUFFER_BIT |
97 VK_BUFFER_USAGE_SHADER_DEVICE_ADDRESS_BIT));
102 VK_BUFFER_USAGE_STORAGE_BUFFER_BIT,
104 VK_MEMORY_PROPERTY_DEVICE_LOCAL_BIT |
105 VK_MEMORY_PROPERTY_HOST_VISIBLE_BIT));
130 if (slices_buf && slices_buf->host_ref && !pp->
slice_num)
138 if (!slices_buf || !slices_buf->host_ref) {
165 VkBufferMemoryBarrier2 buf_bar[2];
166 int nb_img_bar = 0, nb_buf_bar = 0, nb_imgs,
i, err;
180 .slice_data = slice_data->address,
183 .width = avctx->
width,
190 .log2_chroma_w = pix_desc->log2_chroma_w,
196 memcpy(pd.qmat_luma, pr->
qmat_luma,
sizeof(pd.qmat_luma ));
197 memcpy(pd.qmat_chroma, pr->
qmat_chroma,
sizeof(pd.qmat_chroma));
204 VK_PIPELINE_STAGE_2_ALL_COMMANDS_BIT,
205 VK_PIPELINE_STAGE_2_COMPUTE_SHADER_BIT));
215 vkf->
layout[0] = VK_IMAGE_LAYOUT_UNDEFINED;
216 vkf->
access[0] = VK_ACCESS_2_NONE;
223 VK_PIPELINE_STAGE_2_ALL_COMMANDS_BIT,
224 VK_PIPELINE_STAGE_2_CLEAR_BIT,
225 VK_ACCESS_2_TRANSFER_WRITE_BIT,
226 VK_IMAGE_LAYOUT_GENERAL,
227 VK_QUEUE_FAMILY_IGNORED);
229 vk->CmdPipelineBarrier2(exec->
buf, &(VkDependencyInfo) {
230 .sType = VK_STRUCTURE_TYPE_DEPENDENCY_INFO,
231 .pBufferMemoryBarriers = buf_bar,
232 .bufferMemoryBarrierCount = nb_buf_bar,
233 .pImageMemoryBarriers = img_bar,
234 .imageMemoryBarrierCount = nb_img_bar,
236 nb_img_bar = nb_buf_bar = 0;
239 for (
i = 0;
i <
FFMIN(nb_imgs, 3); ++
i) {
240 vk->CmdClearColorImage(exec->
buf, vkf->
img[
i],
241 VK_IMAGE_LAYOUT_GENERAL,
242 &((VkClearColorValue) { 0 }),
243 1, &((VkImageSubresourceRange) {
244 .aspectMask = VK_IMAGE_ASPECT_COLOR_BIT,
254 VK_PIPELINE_STAGE_2_ALL_COMMANDS_BIT,
255 VK_PIPELINE_STAGE_2_COMPUTE_SHADER_BIT,
256 VK_ACCESS_2_SHADER_STORAGE_WRITE_BIT,
257 VK_IMAGE_LAYOUT_GENERAL,
258 VK_QUEUE_FAMILY_IGNORED);
261 ALL_COMMANDS_BIT, NONE_KHR, NONE_KHR,
262 COMPUTE_SHADER_BIT, SHADER_WRITE_BIT, NONE_KHR,
264 vk->CmdPipelineBarrier2(exec->
buf, &(VkDependencyInfo) {
265 .sType = VK_STRUCTURE_TYPE_DEPENDENCY_INFO,
266 .pBufferMemoryBarriers = buf_bar,
267 .bufferMemoryBarrierCount = nb_buf_bar,
268 .pImageMemoryBarriers = img_bar,
269 .imageMemoryBarrierCount = nb_img_bar,
271 nb_img_bar = nb_buf_bar = 0;
278 VK_FORMAT_UNDEFINED);
283 VK_FORMAT_UNDEFINED);
287 VK_IMAGE_LAYOUT_GENERAL,
292 VK_SHADER_STAGE_COMPUTE_BIT,
301 VK_PIPELINE_STAGE_2_COMPUTE_SHADER_BIT,
302 VK_PIPELINE_STAGE_2_COMPUTE_SHADER_BIT,
303 VK_ACCESS_SHADER_READ_BIT | VK_ACCESS_SHADER_WRITE_BIT,
304 VK_IMAGE_LAYOUT_GENERAL,
305 VK_QUEUE_FAMILY_IGNORED);
308 COMPUTE_SHADER_BIT, SHADER_WRITE_BIT, NONE_KHR,
309 COMPUTE_SHADER_BIT, SHADER_READ_BIT, NONE_KHR,
311 vk->CmdPipelineBarrier2(exec->
buf, &(VkDependencyInfo) {
312 .sType = VK_STRUCTURE_TYPE_DEPENDENCY_INFO,
313 .pBufferMemoryBarriers = buf_bar,
314 .bufferMemoryBarrierCount = nb_buf_bar,
315 .pImageMemoryBarriers = img_bar,
316 .imageMemoryBarrierCount = nb_img_bar,
318 nb_img_bar = nb_buf_bar = 0;
325 VK_FORMAT_UNDEFINED);
329 VK_IMAGE_LAYOUT_GENERAL,
334 VK_SHADER_STAGE_COMPUTE_BIT,
347 GLSLC(0,
layout(push_constant, scalar) uniform pushConstants { );
348 GLSLC(1, u8buf slice_data; );
349 GLSLC(1, uint bitstream_size; );
353 GLSLC(1, uint16_t mb_width; );
354 GLSLC(1, uint16_t mb_height; );
355 GLSLC(1, uint16_t slice_width; );
356 GLSLC(1, uint16_t slice_height; );
357 GLSLC(1, uint8_t log2_slice_width; );
358 GLSLC(1, uint8_t log2_chroma_w; );
359 GLSLC(1, uint8_t depth; );
360 GLSLC(1, uint8_t alpha_info; );
361 GLSLC(1, uint8_t bottom_field; );
363 GLSLC(1, uint8_t qmat_luma [8*8]; );
364 GLSLC(1, uint8_t qmat_chroma[8*8]; );
368 VK_SHADER_STAGE_COMPUTE_BIT);
382 void *spv_opaque =
NULL;
385 VK_SHADER_STAGE_COMPUTE_BIT,
386 (
const char *[]) {
"GL_EXT_buffer_reference",
387 "GL_EXT_buffer_reference2" }, 2,
403 .
name =
"slice_offsets_buf",
404 .type = VK_DESCRIPTOR_TYPE_STORAGE_BUFFER,
405 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
406 .mem_quali =
"readonly",
407 .buf_content =
"uint32_t slice_offsets",
408 .buf_elems = max_num_mbs + 1,
411 .name =
"quant_idx_buf",
412 .type = VK_DESCRIPTOR_TYPE_STORAGE_BUFFER,
413 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
414 .mem_quali =
"writeonly",
415 .buf_content =
"uint8_t quant_idx",
416 .buf_elems = max_num_mbs,
420 .type = VK_DESCRIPTOR_TYPE_STORAGE_IMAGE,
424 .mem_quali =
"writeonly",
426 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
457 void *spv_opaque =
NULL;
460 VK_SHADER_STAGE_COMPUTE_BIT,
461 (
const char *[]) {
"GL_EXT_buffer_reference",
462 "GL_EXT_buffer_reference2" }, 2,
476 .
name =
"quant_idx_buf",
477 .type = VK_DESCRIPTOR_TYPE_STORAGE_BUFFER,
478 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
479 .mem_quali =
"readonly",
480 .buf_content =
"uint8_t quant_idx",
481 .buf_elems = max_num_mbs,
485 .type = VK_DESCRIPTOR_TYPE_STORAGE_IMAGE,
490 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
495 GLSLC(0, #define NB_BLOCKS 4*2);
533 int max_num_mbs, err;
537 spv = ff_vk_spirv_init();
580 .
p.
name =
"prores_vulkan",
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
void ff_vk_shader_free(FFVulkanContext *s, FFVulkanShader *shd)
Free a shader.
int ff_vk_shader_init(FFVulkanContext *s, FFVulkanShader *shd, const char *name, VkPipelineStageFlags stage, const char *extensions[], int nb_extensions, int lg_x, int lg_y, int lg_z, uint32_t required_subgroup_size)
Initialize a shader object, with a specific set of extensions, type+bind, local group size,...
static int init_decode_shader(AVCodecContext *avctx, FFVulkanContext *s, FFVkExecPool *pool, FFVkSPIRVCompiler *spv, FFVulkanShader *shd, int max_num_mbs, int interlaced)
int ff_vk_decode_prepare_frame_sdr(FFVulkanDecodeContext *dec, AVFrame *pic, FFVulkanDecodePicture *vkpic, int is_current, enum FFVkShaderRepFormat rep_fmt, int alloc_dpb)
Software-defined decoder version of ff_vk_decode_prepare_frame.
void * hwaccel_picture_private
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
uint8_t * data
The data buffer.
FFVulkanDecodeShared * shared_ctx
RefStruct is an API for creating reference-counted objects with minimal overhead.
AVHWAccel p
The public AVHWAccel.
This structure describes decoded (raw) audio or video data.
static void vk_prores_free_frame_priv(AVRefStructOpaque _hwctx, void *data)
static int vk_prores_end_frame(AVCodecContext *avctx)
const char * ff_source_prores_vld_comp
FFVkExecContext * ff_vk_exec_get(FFVulkanContext *s, FFVkExecPool *pool)
Retrieve an execution pool.
void(* uninit)(struct FFVkSPIRVCompiler **ctx)
int slice_count
number of slices in the current picture
@ AV_PIX_FMT_VULKAN
Vulkan hardware images.
int ff_vk_exec_add_dep_frame(FFVulkanContext *s, FFVkExecContext *e, AVFrame *f, VkPipelineStageFlagBits2 wait_stage, VkPipelineStageFlagBits2 signal_stage)
unsigned slice_mb_width
maximum width of a slice in mb
int av_pix_fmt_count_planes(enum AVPixelFormat pix_fmt)
VkImage img[AV_NUM_DATA_POINTERS]
Vulkan images to which the memory is bound.
void ff_vk_shader_update_img_array(FFVulkanContext *s, FFVkExecContext *e, FFVulkanShader *shd, AVFrame *f, VkImageView *views, int set, int binding, VkImageLayout layout, VkSampler sampler)
Update a descriptor in a buffer with an image array.
void ff_vk_frame_barrier(FFVulkanContext *s, FFVkExecContext *e, AVFrame *pic, VkImageMemoryBarrier2 *bar, int *nb_bar, VkPipelineStageFlags2 src_stage, VkPipelineStageFlags2 dst_stage, VkAccessFlagBits2 new_access, VkImageLayout new_layout, uint32_t new_qf)
#define HWACCEL_CAP_THREAD_SAFE
int ff_vk_shader_register_exec(FFVulkanContext *s, FFVkExecPool *pool, FFVulkanShader *shd)
Register a shader with an exec pool.
int ff_vk_host_map_buffer(FFVulkanContext *s, AVBufferRef **dst, uint8_t *src_data, const AVBufferRef *src_buf, VkBufferUsageFlags usage)
Maps a system RAM buffer into a Vulkan buffer.
int ff_vk_shader_add_descriptor_set(FFVulkanContext *s, FFVulkanShader *shd, FFVulkanDescriptorSetBinding *desc, int nb, int singular, int print_to_shader_only)
Add descriptor to a shader.
This struct aggregates all the (hardware/vendor-specific) "high-level" state, i.e.
static int init_idct_shader(AVCodecContext *avctx, FFVulkanContext *s, FFVkExecPool *pool, FFVkSPIRVCompiler *spv, FFVulkanShader *shd, int max_num_mbs, int interlaced)
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
static int vk_prores_start_frame(AVCodecContext *avctx, const AVBufferRef *buffer_ref, av_unused const uint8_t *buffer, av_unused uint32_t size)
int ff_vk_exec_mirror_sem_value(FFVulkanContext *s, FFVkExecContext *e, VkSemaphore *dst, uint64_t *dst_val, AVFrame *f)
#define AV_CEIL_RSHIFT(a, b)
static int vk_prores_decode_slice(AVCodecContext *avctx, const uint8_t *data, uint32_t size)
int bits_per_raw_sample
Bits per sample/pixel of internal libavcodec pixel/sample format.
int ff_vk_exec_add_dep_buf(FFVulkanContext *s, FFVkExecContext *e, AVBufferRef **deps, int nb_deps, int ref)
Execution dependency management.
static int vk_decode_prores_init(AVCodecContext *avctx)
#define HWACCEL_CAP_ASYNC_SAFE
Header providing the internals of AVHWAccel.
const char * ff_vk_shader_rep_fmt(enum AVPixelFormat pix_fmt, enum FFVkShaderRepFormat rep_fmt)
enum AVPixelFormat sw_format
The pixel format identifying the actual data layout of the hardware frames.
void av_buffer_unref(AVBufferRef **buf)
Free a given reference and automatically free the buffer if there are no more references to it.
void ff_vk_decode_free_frame(AVHWDeviceContext *dev_ctx, FFVulkanDecodePicture *vp)
Free a frame and its state.
struct AVCodecInternal * internal
Private context used for internal data.
void av_buffer_pool_uninit(AVBufferPool **ppool)
Mark the pool as being available for freeing.
int ff_vk_decode_uninit(AVCodecContext *avctx)
Free decoder.
int ff_vk_frame_params(AVCodecContext *avctx, AVBufferRef *hw_frames_ctx)
Initialize hw_frames_ctx with the parameters needed to decode the stream using the parameters from av...
#define ff_vk_buf_barrier(dst, vkb, s_stage, s_access, s_access2, d_stage, d_access, d_access2, offs, bsz)
int(* init)(AVBSFContext *ctx)
VkAccessFlagBits access[AV_NUM_DATA_POINTERS]
Updated after every barrier.
void ff_vk_shader_update_push_const(FFVulkanContext *s, FFVkExecContext *e, FFVulkanShader *shd, VkShaderStageFlagBits stage, int offset, size_t size, void *src)
Update push constant in a shader.
uint32_t slice_offsets_sz
void * hwaccel_priv_data
hwaccel-specific private data
#define AV_NUM_DATA_POINTERS
const char * ff_source_dct_comp
int(* compile_shader)(FFVulkanContext *s, struct FFVkSPIRVCompiler *ctx, FFVulkanShader *shd, uint8_t **data, size_t *size, const char *entrypoint, void **opaque)
#define AVERROR_EXTERNAL
Generic error in an external library.
int ff_vk_shader_update_desc_buffer(FFVulkanContext *s, FFVkExecContext *e, FFVulkanShader *shd, int set, int bind, int elem, FFVkBuffer *buf, VkDeviceSize offset, VkDeviceSize len, VkFormat fmt)
Update a descriptor in a buffer with a buffer.
const FFHWAccel ff_prores_vulkan_hwaccel
const char * name
Name of the hardware accelerated codec.
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel layout
unsigned mb_width
width of the current picture in mb
#define FF_VK_EXT_EXTERNAL_HOST_MEMORY
static void uninit(AVBSFContext *ctx)
struct FFVulkanDecodePicture::@328 view
VkImageView out[AV_NUM_DATA_POINTERS]
int ff_vk_exec_start(FFVulkanContext *s, FFVkExecContext *e)
Start/submit/wait an execution.
#define i(width, name, range_min, range_max)
int ff_vk_shader_link(FFVulkanContext *s, FFVulkanShader *shd, uint8_t *spirv, size_t spirv_len, const char *entrypoint)
Link a shader into an executable.
void(* free_shader)(struct FFVkSPIRVCompiler *ctx, void **opaque)
void ff_vk_exec_bind_shader(FFVulkanContext *s, FFVkExecContext *e, FFVulkanShader *shd)
Bind a shader.
AVBufferRef * hw_frames_ctx
A reference to the AVHWFramesContext describing the input (for encoding) or output (decoding) frames.
This struct describes a set or pool of "hardware" frames (i.e.
const char * ff_source_common_comp
const FFVulkanDecodeDescriptor ff_vk_dec_prores_desc
int ff_vk_decode_add_slice(AVCodecContext *avctx, FFVulkanDecodePicture *vp, const uint8_t *data, size_t size, int add_startcode, uint32_t *nb_slices, const uint32_t **offsets)
Add slice data to frame.
void av_bprintf(AVBPrint *buf, const char *fmt,...)
int ff_vk_shader_add_push_const(FFVulkanShader *shd, int offset, int size, VkShaderStageFlagBits stage)
Add/update push constants for execution.
int frame_type
0 = progressive, 1 = tff, 2 = bff
main external API structure.
static int add_push_data(FFVulkanShader *shd)
the frame and frame reference mechanism is intended to avoid, as much as possible, expensive copies of that data while still allowing the filters to produce correct results The data is stored in buffers represented by AVFrame structures Several references can point to the same frame buffer
the pkt_dts and pkt_pts fields in AVFrame will work as usual Restrictions on codec whose streams don't reset across will not work because their bitstreams cannot be decoded in parallel *The contents of buffers must not be read before as well as code calling up to before the decode process starts Call have update_thread_context() run it in the next thread. Add AV_CODEC_CAP_FRAME_THREADS to the codec capabilities. There will be very little speed gain at this point but it should work. Use ff_thread_get_buffer() (or ff_progress_frame_get_buffer() in case you have inter-frame dependencies and use the ProgressFrame API) to allocate frame buffers. Call ff_progress_frame_report() after some part of the current picture has decoded. A good place to put this is where draw_horiz_band() is called - add this if it isn't called anywhere
AVBufferRef * metadata_buf
int ff_vk_update_thread_context(AVCodecContext *dst, const AVCodecContext *src)
Synchronize the contexts between 2 threads.
int coded_width
Bitstream width / height, may be different from width/height e.g.
VkImageLayout layout[AV_NUM_DATA_POINTERS]
A reference to a data buffer.
const char * ff_source_prores_idct_comp
AVBufferPool * metadata_pool
Descriptor that unambiguously describes how the bits of a pixel are stored in the up to 4 data planes...
static int ff_vk_count_images(AVVkFrame *f)
VkDeviceAddress slice_data
int width
picture width / height.
int ff_vk_exec_submit(FFVulkanContext *s, FFVkExecContext *e)
int ff_vk_decode_init(AVCodecContext *avctx)
Initialize decoder.
enum AVPixelFormat sw_pix_fmt
Nominal unaccelerated pixel format, see AV_PIX_FMT_xxx.
static void vk_decode_prores_uninit(FFVulkanDecodeShared *ctx)
int ff_vk_get_pooled_buffer(FFVulkanContext *ctx, AVBufferPool **buf_pool, AVBufferRef **buf, VkBufferUsageFlags usage, void *create_pNext, size_t size, VkMemoryPropertyFlagBits mem_props)
Initialize a pool and create AVBufferRefs containing FFVkBuffer.
unsigned mb_height
height of the current picture in mb