Go to the documentation of this file.
33 .queue_flags = VK_QUEUE_COMPUTE_BIT,
95 ctx->s.props.properties.limits.minStorageBufferOffsetAlignment);
101 VK_BUFFER_USAGE_STORAGE_BUFFER_BIT |
102 VK_BUFFER_USAGE_SHADER_DEVICE_ADDRESS_BIT));
107 VK_BUFFER_USAGE_STORAGE_BUFFER_BIT,
109 VK_MEMORY_PROPERTY_DEVICE_LOCAL_BIT |
110 VK_MEMORY_PROPERTY_HOST_VISIBLE_BIT));
135 if (slices_buf && slices_buf->host_ref && !pp->
slice_num)
143 if (!slices_buf || !slices_buf->host_ref) {
170 VkBufferMemoryBarrier2 buf_bar[2];
171 int nb_img_bar = 0, nb_buf_bar = 0, nb_imgs,
i, err;
185 .slice_data = slice_data->address,
188 .width = avctx->
width,
195 .log2_chroma_w = pix_desc->log2_chroma_w,
201 memcpy(pd.qmat_luma, pr->
qmat_luma,
sizeof(pd.qmat_luma ));
202 memcpy(pd.qmat_chroma, pr->
qmat_chroma,
sizeof(pd.qmat_chroma));
209 VK_PIPELINE_STAGE_2_ALL_COMMANDS_BIT,
210 VK_PIPELINE_STAGE_2_COMPUTE_SHADER_BIT));
220 vkf->
layout[0] = VK_IMAGE_LAYOUT_UNDEFINED;
221 vkf->
access[0] = VK_ACCESS_2_NONE;
228 VK_PIPELINE_STAGE_2_ALL_COMMANDS_BIT,
229 VK_PIPELINE_STAGE_2_CLEAR_BIT,
230 VK_ACCESS_2_TRANSFER_WRITE_BIT,
231 VK_IMAGE_LAYOUT_GENERAL,
232 VK_QUEUE_FAMILY_IGNORED);
234 vk->CmdPipelineBarrier2(exec->
buf, &(VkDependencyInfo) {
235 .sType = VK_STRUCTURE_TYPE_DEPENDENCY_INFO,
236 .pBufferMemoryBarriers = buf_bar,
237 .bufferMemoryBarrierCount = nb_buf_bar,
238 .pImageMemoryBarriers = img_bar,
239 .imageMemoryBarrierCount = nb_img_bar,
241 nb_img_bar = nb_buf_bar = 0;
244 for (
i = 0;
i <
FFMIN(nb_imgs, 3); ++
i) {
245 vk->CmdClearColorImage(exec->
buf, vkf->
img[
i],
246 VK_IMAGE_LAYOUT_GENERAL,
247 &((VkClearColorValue) { 0 }),
248 1, &((VkImageSubresourceRange) {
249 .aspectMask = VK_IMAGE_ASPECT_COLOR_BIT,
259 VK_PIPELINE_STAGE_2_ALL_COMMANDS_BIT,
260 VK_PIPELINE_STAGE_2_COMPUTE_SHADER_BIT,
261 VK_ACCESS_2_SHADER_STORAGE_WRITE_BIT,
262 VK_IMAGE_LAYOUT_GENERAL,
263 VK_QUEUE_FAMILY_IGNORED);
266 ALL_COMMANDS_BIT, NONE_KHR, NONE_KHR,
267 COMPUTE_SHADER_BIT, SHADER_WRITE_BIT, NONE_KHR,
269 vk->CmdPipelineBarrier2(exec->
buf, &(VkDependencyInfo) {
270 .sType = VK_STRUCTURE_TYPE_DEPENDENCY_INFO,
271 .pBufferMemoryBarriers = buf_bar,
272 .bufferMemoryBarrierCount = nb_buf_bar,
273 .pImageMemoryBarriers = img_bar,
274 .imageMemoryBarrierCount = nb_img_bar,
276 nb_img_bar = nb_buf_bar = 0;
284 VK_FORMAT_UNDEFINED);
290 VK_FORMAT_UNDEFINED);
294 VK_IMAGE_LAYOUT_GENERAL,
299 VK_SHADER_STAGE_COMPUTE_BIT,
308 VK_PIPELINE_STAGE_2_COMPUTE_SHADER_BIT,
309 VK_PIPELINE_STAGE_2_COMPUTE_SHADER_BIT,
310 VK_ACCESS_SHADER_READ_BIT | VK_ACCESS_SHADER_WRITE_BIT,
311 VK_IMAGE_LAYOUT_GENERAL,
312 VK_QUEUE_FAMILY_IGNORED);
315 COMPUTE_SHADER_BIT, SHADER_WRITE_BIT, NONE_KHR,
316 COMPUTE_SHADER_BIT, SHADER_READ_BIT, NONE_KHR,
318 vk->CmdPipelineBarrier2(exec->
buf, &(VkDependencyInfo) {
319 .sType = VK_STRUCTURE_TYPE_DEPENDENCY_INFO,
320 .pBufferMemoryBarriers = buf_bar,
321 .bufferMemoryBarrierCount = nb_buf_bar,
322 .pImageMemoryBarriers = img_bar,
323 .imageMemoryBarrierCount = nb_img_bar,
325 nb_img_bar = nb_buf_bar = 0;
333 VK_FORMAT_UNDEFINED);
337 VK_IMAGE_LAYOUT_GENERAL,
342 VK_SHADER_STAGE_COMPUTE_BIT,
365 VK_SHADER_STAGE_COMPUTE_BIT, sl,
366 (uint32_t []) { 8, 8, 1 }, 0);
369 VK_SHADER_STAGE_COMPUTE_BIT);
373 .
name =
"slice_offsets_buf",
374 .type = VK_DESCRIPTOR_TYPE_STORAGE_BUFFER,
375 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
378 .name =
"quant_idx_buf",
379 .type = VK_DESCRIPTOR_TYPE_STORAGE_BUFFER,
380 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
384 .type = VK_DESCRIPTOR_TYPE_STORAGE_IMAGE,
385 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
413 const double idct_8_scales[8] = {
414 cos(4.0*
M_PI/16.0) / 2.0, cos(1.0*
M_PI/16.0) / 2.0,
415 cos(2.0*
M_PI/16.0) / 2.0, cos(3.0*
M_PI/16.0) / 2.0,
416 cos(4.0*
M_PI/16.0) / 2.0, cos(5.0*
M_PI/16.0) / 2.0,
417 cos(6.0*
M_PI/16.0) / 2.0, cos(7.0*
M_PI/16.0) / 2.0,
419 for (
int i = 0;
i < 64;
i++)
424 VK_SHADER_STAGE_COMPUTE_BIT, sl,
425 (uint32_t []) { 32, 2, 1 }, 0);
428 VK_SHADER_STAGE_COMPUTE_BIT);
432 .
name =
"quant_idx_buf",
433 .type = VK_DESCRIPTOR_TYPE_STORAGE_BUFFER,
434 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
438 .type = VK_DESCRIPTOR_TYPE_STORAGE_IMAGE,
439 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
474 int max_num_mbs, err;
511 .
p.
name =
"prores_vulkan",
Filter design: the word “frame” indicates either a video frame or a group of audio samples, as stored in an AVFrame structure. Format negotiation: query_formats should set, for each input and each output link, the list of supported formats. For video links, that means pixel format. For audio links, that means channel layout and sample format [...]. The lists are not just lists, they are references to shared objects. When the negotiation mechanism computes the intersection of the formats supported at each end of a link, all references to both lists are replaced with a reference to the intersection. And when a single format is eventually chosen for a link amongst the remaining list, all references to the list are updated. That means that if a filter requires that its input and output have the same format amongst a supported list, all it has to do is use a reference to the same list of formats. query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions.
void ff_vk_shader_free(FFVulkanContext *s, FFVulkanShader *shd)
Free a shader.
int ff_vk_decode_prepare_frame_sdr(FFVulkanDecodeContext *dec, AVFrame *pic, FFVulkanDecodePicture *vkpic, int is_current, enum FFVkShaderRepFormat rep_fmt, int alloc_dpb)
Software-defined decoder version of ff_vk_decode_prepare_frame.
void * hwaccel_picture_private
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
uint8_t * data
The data buffer.
FFVulkanDecodeShared * shared_ctx
RefStruct is an API for creating reference-counted objects with minimal overhead.
const unsigned int ff_prores_idct_comp_spv_len
AVHWAccel p
The public AVHWAccel.
This structure describes decoded (raw) audio or video data.
static void vk_prores_free_frame_priv(AVRefStructOpaque _hwctx, void *data)
static int vk_prores_end_frame(AVCodecContext *avctx)
FFVkExecContext * ff_vk_exec_get(FFVulkanContext *s, FFVkExecPool *pool)
Retrieve an execution pool.
#define SPEC_LIST_ADD(name, idx, val_bits, val)
static av_always_inline uint32_t av_float2int(float f)
Reinterpret a float as a 32-bit integer.
int slice_count
number of slices in the current picture
@ AV_PIX_FMT_VULKAN
Vulkan hardware images.
int ff_vk_exec_add_dep_frame(FFVulkanContext *s, FFVkExecContext *e, AVFrame *f, VkPipelineStageFlagBits2 wait_stage, VkPipelineStageFlagBits2 signal_stage)
unsigned slice_mb_width
maximum width of a slice in mb
int av_pix_fmt_count_planes(enum AVPixelFormat pix_fmt)
VkImage img[AV_NUM_DATA_POINTERS]
Vulkan images to which the memory is bound.
const unsigned char ff_prores_vld_comp_spv_data[]
void ff_vk_shader_update_img_array(FFVulkanContext *s, FFVkExecContext *e, FFVulkanShader *shd, AVFrame *f, VkImageView *views, int set, int binding, VkImageLayout layout, VkSampler sampler)
Update a descriptor in a buffer with an image array.
void ff_vk_frame_barrier(FFVulkanContext *s, FFVkExecContext *e, AVFrame *pic, VkImageMemoryBarrier2 *bar, int *nb_bar, VkPipelineStageFlags2 src_stage, VkPipelineStageFlags2 dst_stage, VkAccessFlagBits2 new_access, VkImageLayout new_layout, uint32_t new_qf)
#define HWACCEL_CAP_THREAD_SAFE
int ff_vk_shader_register_exec(FFVulkanContext *s, FFVkExecPool *pool, FFVulkanShader *shd)
Register a shader with an exec pool.
int ff_vk_host_map_buffer(FFVulkanContext *s, AVBufferRef **dst, uint8_t *src_data, const AVBufferRef *src_buf, VkBufferUsageFlags usage)
Maps a system RAM buffer into a Vulkan buffer.
This struct aggregates all the (hardware/vendor-specific) "high-level" state, i.e.
static int vk_prores_start_frame(AVCodecContext *avctx, const AVBufferRef *buffer_ref, av_unused const uint8_t *buffer, av_unused uint32_t size)
int ff_vk_exec_mirror_sem_value(FFVulkanContext *s, FFVkExecContext *e, VkSemaphore *dst, uint64_t *dst_val, AVFrame *f)
static int init_idct_shader(AVCodecContext *avctx, FFVulkanContext *s, FFVkExecPool *pool, FFVulkanShader *shd, int max_num_mbs, int interlaced)
#define AV_CEIL_RSHIFT(a, b)
static int vk_prores_decode_slice(AVCodecContext *avctx, const uint8_t *data, uint32_t size)
int bits_per_raw_sample
Bits per sample/pixel of internal libavcodec pixel/sample format.
int ff_vk_exec_add_dep_buf(FFVulkanContext *s, FFVkExecContext *e, AVBufferRef **deps, int nb_deps, int ref)
Execution dependency management.
static int vk_decode_prores_init(AVCodecContext *avctx)
#define HWACCEL_CAP_ASYNC_SAFE
Header providing the internals of AVHWAccel.
enum AVPixelFormat sw_format
The pixel format identifying the actual data layout of the hardware frames.
void av_buffer_unref(AVBufferRef **buf)
Free a given reference and automatically free the buffer if there are no more references to it.
void ff_vk_decode_free_frame(AVHWDeviceContext *dev_ctx, FFVulkanDecodePicture *vp)
Free a frame and its state.
struct AVCodecInternal * internal
Private context used for internal data.
void av_buffer_pool_uninit(AVBufferPool **ppool)
Mark the pool as being available for freeing.
int ff_vk_decode_uninit(AVCodecContext *avctx)
Free decoder.
int ff_vk_shader_link(FFVulkanContext *s, FFVulkanShader *shd, const char *spirv, size_t spirv_len, const char *entrypoint)
Link a shader into an executable.
#define SPEC_LIST_CREATE(name, max_length, max_size)
const unsigned char ff_prores_idct_comp_spv_data[]
int ff_vk_frame_params(AVCodecContext *avctx, AVBufferRef *hw_frames_ctx)
Initialize hw_frames_ctx with the parameters needed to decode the stream using the parameters from av...
#define ff_vk_buf_barrier(dst, vkb, s_stage, s_access, s_access2, d_stage, d_access, d_access2, offs, bsz)
int(* init)(AVBSFContext *ctx)
VkAccessFlagBits access[AV_NUM_DATA_POINTERS]
Updated after every barrier.
void ff_vk_shader_update_push_const(FFVulkanContext *s, FFVkExecContext *e, FFVulkanShader *shd, VkShaderStageFlagBits stage, int offset, size_t size, void *src)
Update push constant in a shader.
uint32_t slice_offsets_sz
void * hwaccel_priv_data
hwaccel-specific private data
#define AV_NUM_DATA_POINTERS
int ff_vk_shader_update_desc_buffer(FFVulkanContext *s, FFVkExecContext *e, FFVulkanShader *shd, int set, int bind, int elem, FFVkBuffer *buf, VkDeviceSize offset, VkDeviceSize len, VkFormat fmt)
Update a descriptor in a buffer with a buffer.
const FFHWAccel ff_prores_vulkan_hwaccel
const char * name
Name of the hardware accelerated codec.
unsigned mb_width
width of the current picture in mb
#define FF_VK_EXT_EXTERNAL_HOST_MEMORY
static void uninit(AVBSFContext *ctx)
struct FFVulkanDecodePicture::@328 view
VkImageView out[AV_NUM_DATA_POINTERS]
int ff_vk_exec_start(FFVulkanContext *s, FFVkExecContext *e)
Start/submit/wait an execution.
#define i(width, name, range_min, range_max)
const unsigned int ff_prores_vld_comp_spv_len
void ff_vk_exec_bind_shader(FFVulkanContext *s, FFVkExecContext *e, FFVulkanShader *shd)
Bind a shader.
AVBufferRef * hw_frames_ctx
A reference to the AVHWFramesContext describing the input (for encoding) or output (decoding) frames.
uint32_t slice_offsets_off
This struct describes a set or pool of "hardware" frames (i.e.
const FFVulkanDecodeDescriptor ff_vk_dec_prores_desc
int ff_vk_decode_add_slice(AVCodecContext *avctx, FFVulkanDecodePicture *vp, const uint8_t *data, size_t size, int add_startcode, uint32_t *nb_slices, const uint32_t **offsets)
Add slice data to frame.
int ff_vk_shader_add_push_const(FFVulkanShader *shd, int offset, int size, VkShaderStageFlagBits stage)
Add/update push constants for execution.
int frame_type
0 = progressive, 1 = tff, 2 = bff
main external API structure.
int ff_vk_shader_add_descriptor_set(FFVulkanContext *s, FFVulkanShader *shd, const FFVulkanDescriptorSetBinding *desc, int nb, int singular, int print_to_shader_only)
Add descriptor to a shader.
The frame and frame reference mechanism is intended to avoid, as much as possible, expensive copies of that data while still allowing the filters to produce correct results. The data is stored in buffers represented by AVFrame structures. Several references can point to the same frame buffer.
[...] the pkt_dts and pkt_pts fields in AVFrame will work as usual. Restrictions on codec implementations: codecs whose streams don't reset across frames will not work, because their bitstreams cannot be decoded in parallel. The contents of buffers must not be read before [...]. [...] as well as code calling [...], up to before the decode process starts. Call [...]; have update_thread_context() run it in the next thread. Add AV_CODEC_CAP_FRAME_THREADS to the codec capabilities. There will be very little speed gain at this point, but it should work. Use ff_thread_get_buffer() (or ff_progress_frame_get_buffer(), in case you have inter-frame dependencies and use the ProgressFrame API) to allocate frame buffers. Call ff_progress_frame_report() after some part of the current picture has decoded. A good place to put this is where draw_horiz_band() is called - add this if it isn't called anywhere [...]
AVBufferRef * metadata_buf
int ff_vk_update_thread_context(AVCodecContext *dst, const AVCodecContext *src)
Synchronize the contexts between 2 threads.
int coded_width
Bitstream width / height, may be different from width/height e.g.
VkImageLayout layout[AV_NUM_DATA_POINTERS]
A reference to a data buffer.
AVBufferPool * metadata_pool
Descriptor that unambiguously describes how the bits of a pixel are stored in the up to 4 data planes...
static int ff_vk_count_images(AVVkFrame *f)
VkDeviceAddress slice_data
int width
picture width / height.
int ff_vk_exec_submit(FFVulkanContext *s, FFVkExecContext *e)
static int init_decode_shader(AVCodecContext *avctx, FFVulkanContext *s, FFVkExecPool *pool, FFVulkanShader *shd, int max_num_mbs, int interlaced)
int ff_vk_decode_init(AVCodecContext *avctx)
Initialize decoder.
enum AVPixelFormat sw_pix_fmt
Nominal unaccelerated pixel format, see AV_PIX_FMT_xxx.
static void vk_decode_prores_uninit(FFVulkanDecodeShared *ctx)
int ff_vk_shader_load(FFVulkanShader *shd, VkPipelineStageFlags stage, VkSpecializationInfo *spec, uint32_t wg_size[3], uint32_t required_subgroup_size)
Initialize a shader object.
int ff_vk_get_pooled_buffer(FFVulkanContext *ctx, AVBufferPool **buf_pool, AVBufferRef **buf, VkBufferUsageFlags usage, void *create_pNext, size_t size, VkMemoryPropertyFlagBits mem_props)
Initialize a pool and create AVBufferRefs containing FFVkBuffer.
unsigned mb_height
height of the current picture in mb