Go to the documentation of this file.
35 .queue_flags = VK_QUEUE_COMPUTE_BIT,
79 VK_BUFFER_USAGE_STORAGE_BUFFER_BIT |
80 VK_BUFFER_USAGE_SHADER_DEVICE_ADDRESS_BIT);
89 VK_BUFFER_USAGE_STORAGE_BUFFER_BIT |
90 VK_BUFFER_USAGE_SHADER_DEVICE_ADDRESS_BIT,
92 VK_MEMORY_PROPERTY_DEVICE_LOCAL_BIT |
93 VK_MEMORY_PROPERTY_HOST_VISIBLE_BIT);
142 if (slices_buf && slices_buf->host_ref) {
144 data - slices_buf->mapped_mem);
185 VkImageMemoryBarrier2 img_bar[8];
196 VK_PIPELINE_STAGE_2_ALL_COMMANDS_BIT,
197 VK_PIPELINE_STAGE_2_COMPUTE_SHADER_BIT));
210 vkf->
layout[0] = VK_IMAGE_LAYOUT_UNDEFINED;
211 vkf->
access[0] = VK_ACCESS_2_NONE;
214 img_bar, &nb_img_bar,
215 VK_PIPELINE_STAGE_2_ALL_COMMANDS_BIT,
216 VK_PIPELINE_STAGE_2_CLEAR_BIT,
217 VK_ACCESS_2_TRANSFER_WRITE_BIT,
218 VK_IMAGE_LAYOUT_GENERAL,
219 VK_QUEUE_FAMILY_IGNORED);
220 vk->CmdPipelineBarrier2(exec->
buf, &(VkDependencyInfo) {
221 .sType = VK_STRUCTURE_TYPE_DEPENDENCY_INFO,
222 .pImageMemoryBarriers = img_bar,
223 .imageMemoryBarrierCount = nb_img_bar,
229 vk->CmdClearColorImage(exec->
buf, vkf->
img[
i],
230 VK_IMAGE_LAYOUT_GENERAL,
231 &((VkClearColorValue) { 0 }),
232 1, &((VkImageSubresourceRange) {
233 .aspectMask = VK_IMAGE_ASPECT_COLOR_BIT,
240 VK_PIPELINE_STAGE_2_CLEAR_BIT,
241 VK_PIPELINE_STAGE_2_COMPUTE_SHADER_BIT,
242 VK_ACCESS_2_SHADER_STORAGE_WRITE_BIT,
243 VK_IMAGE_LAYOUT_GENERAL,
244 VK_QUEUE_FAMILY_IGNORED);
245 vk->CmdPipelineBarrier2(exec->
buf, &(VkDependencyInfo) {
246 .sType = VK_STRUCTURE_TYPE_DEPENDENCY_INFO,
247 .pImageMemoryBarriers = img_bar,
248 .imageMemoryBarrierCount = nb_img_bar,
256 .log2_chroma_sub = {
desc->log2_chroma_w,
desc->log2_chroma_h },
257 .components =
desc->nb_components,
265 VK_IMAGE_LAYOUT_GENERAL,
270 0, frame_data_buf->size,
271 VK_FORMAT_UNDEFINED);
275 VK_SHADER_STAGE_COMPUTE_BIT,
278 vk->CmdDispatch(exec->
buf,
280 desc->nb_components);
284 VK_PIPELINE_STAGE_2_COMPUTE_SHADER_BIT,
285 VK_PIPELINE_STAGE_2_COMPUTE_SHADER_BIT,
286 VK_ACCESS_2_SHADER_STORAGE_READ_BIT |
287 VK_ACCESS_2_SHADER_STORAGE_WRITE_BIT,
288 VK_IMAGE_LAYOUT_GENERAL,
289 VK_QUEUE_FAMILY_IGNORED);
290 vk->CmdPipelineBarrier2(exec->
buf, &(VkDependencyInfo) {
291 .sType = VK_STRUCTURE_TYPE_DEPENDENCY_INFO,
292 .pImageMemoryBarriers = img_bar,
293 .imageMemoryBarrierCount = nb_img_bar,
301 VK_IMAGE_LAYOUT_GENERAL,
306 0, frame_data_buf->size,
307 VK_FORMAT_UNDEFINED);
311 VK_SHADER_STAGE_COMPUTE_BIT,
316 int idct_cx = 0, idct_by = 0;
318 int sw = (
comp == 0) ? 0 :
desc->log2_chroma_w;
319 int sh = (
comp == 0) ? 0 :
desc->log2_chroma_h;
320 int bx = (avctx->
coded_width + (1 << (3 + sw)) - 1) >> (3 + sw);
321 int by = (avctx->
coded_height + (1 << (3 + sh)) - 1) >> (3 + sh);
322 idct_cx =
FFMAX(idct_cx, (bx + 7) >> 3);
323 idct_by =
FFMAX(idct_by, by);
325 vk->CmdDispatch(exec->
buf, idct_cx, idct_by,
desc->nb_components);
343 (uint32_t []) { 1, 1, 1 }, 0);
345 VK_SHADER_STAGE_COMPUTE_BIT);
350 .type = VK_DESCRIPTOR_TYPE_STORAGE_IMAGE,
352 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
355 .name =
"frame_data_buf",
356 .type = VK_DESCRIPTOR_TYPE_STORAGE_BUFFER,
357 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
382 const double idct_8_scales[8] = {
383 cos(4.0*
M_PI/16.0) / 2.0, cos(1.0*
M_PI/16.0) / 2.0,
384 cos(2.0*
M_PI/16.0) / 2.0, cos(3.0*
M_PI/16.0) / 2.0,
385 cos(4.0*
M_PI/16.0) / 2.0, cos(5.0*
M_PI/16.0) / 2.0,
386 cos(6.0*
M_PI/16.0) / 2.0, cos(7.0*
M_PI/16.0) / 2.0,
388 for (
int i = 0;
i < 64;
i++)
393 (uint32_t []) { 32, 2, 1 }, 0);
395 VK_SHADER_STAGE_COMPUTE_BIT);
400 .type = VK_DESCRIPTOR_TYPE_STORAGE_IMAGE,
401 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
405 .name =
"frame_data_buf",
406 .type = VK_DESCRIPTOR_TYPE_STORAGE_BUFFER,
407 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
475 .
p.
name =
"apv_vulkan",
const FFVulkanDecodeDescriptor ff_vk_dec_apv_desc
AVPixelFormat
Pixel format.
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
void * priv_data
Internal codec-specific data.
void ff_vk_shader_free(FFVulkanContext *s, FFVulkanShader *shd)
Free a shader.
static void comp(unsigned char *dst, ptrdiff_t dst_stride, unsigned char *src, ptrdiff_t src_stride, int add)
int ff_vk_decode_prepare_frame_sdr(FFVulkanDecodeContext *dec, AVFrame *pic, FFVulkanDecodePicture *vkpic, int is_current, enum FFVkShaderRepFormat rep_fmt, int alloc_dpb)
Software-defined decoder version of ff_vk_decode_prepare_frame.
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
uint8_t * data
The data buffer.
FFVulkanDecodeShared * shared_ctx
RefStruct is an API for creating reference-counted objects with minimal overhead.
static int vk_apv_decode_slice(AVCodecContext *avctx, const uint8_t *data, uint32_t size)
AVHWAccel p
The public AVHWAccel.
APVRawTile tile[APV_MAX_TILE_COUNT]
int ff_vk_flush_buffer(FFVulkanContext *s, FFVkBuffer *buf, VkDeviceSize offset, VkDeviceSize mem_size, int flush)
Flush or invalidate a single buffer, with a given size and offset.
FFVkExecContext * ff_vk_exec_get(FFVulkanContext *s, FFVkExecPool *pool)
Retrieve an execution pool.
#define SPEC_LIST_ADD(name, idx, val_bits, val)
static av_always_inline uint32_t av_float2int(float f)
Reinterpret a float as a 32-bit integer.
void ff_vk_exec_bind_shader(FFVulkanContext *s, FFVkExecContext *e, const FFVulkanShader *shd)
Bind a shader.
@ AV_PIX_FMT_VULKAN
Vulkan hardware images.
int ff_vk_exec_add_dep_frame(FFVulkanContext *s, FFVkExecContext *e, AVFrame *f, VkPipelineStageFlagBits2 wait_stage, VkPipelineStageFlagBits2 signal_stage)
APVDerivedTileInfo tile_info
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
int av_pix_fmt_count_planes(enum AVPixelFormat pix_fmt)
VkImage img[AV_NUM_DATA_POINTERS]
Vulkan images to which the memory is bound.
void ff_vk_shader_update_img_array(FFVulkanContext *s, FFVkExecContext *e, FFVulkanShader *shd, AVFrame *f, VkImageView *views, int set, int binding, VkImageLayout layout, VkSampler sampler)
Update a descriptor in a buffer with an image array.
void ff_vk_frame_barrier(FFVulkanContext *s, FFVkExecContext *e, AVFrame *pic, VkImageMemoryBarrier2 *bar, int *nb_bar, VkPipelineStageFlags2 src_stage, VkPipelineStageFlags2 dst_stage, VkAccessFlagBits2 new_access, VkImageLayout new_layout, uint32_t new_qf)
#define HWACCEL_CAP_THREAD_SAFE
int ff_vk_shader_register_exec(FFVulkanContext *s, FFVkExecPool *pool, FFVulkanShader *shd)
Register a shader with an exec pool.
int ff_vk_host_map_buffer(FFVulkanContext *s, AVBufferRef **dst, uint8_t *src_data, const AVBufferRef *src_buf, VkBufferUsageFlags usage)
Maps a system RAM buffer into a Vulkan buffer.
This struct aggregates all the (hardware/vendor-specific) "high-level" state, i.e.
const unsigned int ff_apv_decode_comp_spv_len
static void vk_apv_free_frame_priv(AVRefStructOpaque _hwctx, void *data)
APVRawFrameHeader frame_header
static int init_idct_shader(AVCodecContext *avctx, FFVulkanContext *s, FFVkExecPool *pool, FFVulkanShader *shd)
int ff_vk_exec_mirror_sem_value(FFVulkanContext *s, FFVkExecContext *e, VkSemaphore *dst, uint64_t *dst_val, AVFrame *f)
static int init_decode_shader(AVCodecContext *avctx, FFVulkanContext *s, FFVkExecPool *pool, FFVulkanShader *shd)
static AVFormatContext * ctx
int ff_vk_exec_add_dep_buf(FFVulkanContext *s, FFVkExecContext *e, AVBufferRef **deps, int nb_deps, int ref)
Execution dependency management.
APVRawFrame * cur_raw_frame
AVBufferPool * frame_data_pool
const unsigned char ff_apv_decode_comp_spv_data[]
#define HWACCEL_CAP_ASYNC_SAFE
Header providing the internals of AVHWAccel.
enum AVPixelFormat sw_format
The pixel format identifying the actual data layout of the hardware frames.
void av_buffer_unref(AVBufferRef **buf)
Free a given reference and automatically free the buffer if there are no more references to it.
void ff_vk_decode_free_frame(AVHWDeviceContext *dev_ctx, FFVulkanDecodePicture *vp)
Free a frame and its state.
struct AVCodecInternal * internal
Private context used for internal data.
void av_buffer_pool_uninit(AVBufferPool **ppool)
Mark the pool as being available for freeing.
uint8_t q_matrix[APV_MAX_NUM_COMP][APV_TR_SIZE][APV_TR_SIZE]
int ff_vk_decode_uninit(AVCodecContext *avctx)
Free decoder.
AVBufferRef * frame_data_buf
int ff_vk_shader_link(FFVulkanContext *s, FFVulkanShader *shd, const char *spirv, size_t spirv_len, const char *entrypoint)
Link a shader into an executable.
#define SPEC_LIST_CREATE(name, max_length, max_size)
int ff_vk_frame_params(AVCodecContext *avctx, AVBufferRef *hw_frames_ctx)
Initialize hw_frames_ctx with the parameters needed to decode the stream using the parameters from av...
APVRawTileHeader tile_header
static int vk_decode_apv_init(AVCodecContext *avctx)
static int vk_apv_end_frame(AVCodecContext *avctx)
int(* init)(AVBSFContext *ctx)
const FFHWAccel ff_apv_vulkan_hwaccel
VkAccessFlagBits access[AV_NUM_DATA_POINTERS]
Updated after every barrier.
void ff_vk_shader_update_push_const(FFVulkanContext *s, FFVkExecContext *e, FFVulkanShader *shd, VkShaderStageFlagBits stage, int offset, size_t size, void *src)
Update push constant in a shader.
void * hwaccel_priv_data
hwaccel-specific private data
#define i(width, name, range_min, range_max)
FrameData * frame_data(AVFrame *frame)
Get our auxiliary frame data attached to the frame, allocating it if needed.
int ff_vk_shader_update_desc_buffer(FFVulkanContext *s, FFVkExecContext *e, FFVulkanShader *shd, int set, int bind, int elem, FFVkBuffer *buf, VkDeviceSize offset, VkDeviceSize len, VkFormat fmt)
Update a descriptor in a buffer with a buffer.
const char * name
Name of the hardware accelerated codec.
VkDeviceAddress tile_data
#define FF_VK_EXT_EXTERNAL_HOST_MEMORY
uint16_t row_starts[APV_MAX_TILE_ROWS+1]
static void uninit(AVBSFContext *ctx)
static void vk_decode_apv_uninit(FFVulkanDecodeShared *ctx)
VkImageView out[AV_NUM_DATA_POINTERS]
int ff_vk_exec_start(FFVulkanContext *s, FFVkExecContext *e)
Start/submit/wait an execution.
struct FFVulkanDecodePicture::@340 view
static int vk_apv_start_frame(AVCodecContext *avctx, const AVBufferRef *buffer_ref, av_unused const uint8_t *buffer, av_unused uint32_t size)
const unsigned char ff_apv_idct_comp_spv_data[]
AVBufferRef * hw_frames_ctx
A reference to the AVHWFramesContext describing the input (for encoding) or output (decoding) frames.
This struct describes a set or pool of "hardware" frames (i.e.
int ff_vk_decode_add_slice(AVCodecContext *avctx, FFVulkanDecodePicture *vp, const uint8_t *data, size_t size, int add_startcode, uint32_t *nb_slices, const uint32_t **offsets)
Add slice data to frame.
int ff_vk_shader_add_push_const(FFVulkanShader *shd, int offset, int size, VkShaderStageFlagBits stage)
Add/update push constants for execution.
const unsigned int ff_apv_idct_comp_spv_len
main external API structure.
int ff_vk_shader_add_descriptor_set(FFVulkanContext *s, FFVulkanShader *shd, const FFVulkanDescriptorSetBinding *desc, int nb, int singular, int print_to_shader_only)
Add descriptor to a shader.
the frame and frame reference mechanism is intended to avoid, as much as possible, expensive copies of that data while still allowing the filters to produce correct results The data is stored in buffers represented by AVFrame structures Several references can point to the same frame buffer
the pkt_dts and pkt_pts fields in AVFrame will work as usual Restrictions on codec whose streams don't reset across will not work because their bitstreams cannot be decoded in parallel *The contents of buffers must not be read before as well as code calling up to before the decode process starts Call have update_thread_context() run it in the next thread. Add AV_CODEC_CAP_FRAME_THREADS to the codec capabilities. There will be very little speed gain at this point but it should work. Use ff_thread_get_buffer() (or ff_progress_frame_get_buffer() in case you have inter-frame dependencies and use the ProgressFrame API) to allocate frame buffers. Call ff_progress_frame_report() after some part of the current picture has decoded. A good place to put this is where draw_horiz_band() is called - add this if it isn't called anywhere
uint16_t col_starts[APV_MAX_TILE_COLS+1]
int ff_vk_update_thread_context(AVCodecContext *dst, const AVCodecContext *src)
Synchronize the contexts between 2 threads.
int coded_width
Bitstream width / height, may be different from width/height e.g.
VkImageLayout layout[AV_NUM_DATA_POINTERS]
A reference to a data buffer.
Descriptor that unambiguously describes how the bits of a pixel are stored in the up to 4 data planes...
CodedBitstreamContext * cbc
static int ff_vk_count_images(AVVkFrame *f)
int ff_vk_exec_submit(FFVulkanContext *s, FFVkExecContext *e)
void * hwaccel_picture_private
int ff_vk_decode_init(AVCodecContext *avctx)
Initialize decoder.
int ff_vk_shader_load(FFVulkanShader *shd, VkPipelineStageFlags stage, VkSpecializationInfo *spec, uint32_t wg_size[3], uint32_t required_subgroup_size)
Initialize a shader object.
int ff_vk_get_pooled_buffer(FFVulkanContext *ctx, AVBufferPool **buf_pool, AVBufferRef **buf, VkBufferUsageFlags usage, void *create_pNext, size_t size, VkMemoryPropertyFlagBits mem_props)
Initialize a pool and create AVBufferRefs containing FFVkBuffer.