Go to the documentation of this file.
/* Integer division of a by b with the quotient rounded up (for positive a and b). */
50 #define DIV_UP(a, b) ( ((a) + (b) - 1) / (b) )
/* Round a up to the next multiple of b. The bit-mask form is only correct when
 * b is a power of two. Note that b is evaluated twice. */
51 #define ALIGN_UP(a, b) (((a) + (b) - 1) & ~((b) - 1))
/* Pass a CUDA driver call result x through FF_CUDA_CHECK_DL. The expansion
 * refers to `ctx` and `s`, so both must be in scope wherever this is used. */
55 #define CHECK_CU(x) FF_CUDA_CHECK_DL(ctx, s->hwctx->internal->cuda_dl, x)
58 CUdeviceptr prev, CUdeviceptr cur, CUdeviceptr next,
70 CudaFunctions *cu =
s->hwctx->internal->cuda_dl;
71 CUtexObject tex_prev = 0, tex_cur = 0, tex_next = 0;
73 int skip_spatial_check =
s->yadif.mode&2;
75 void *args[] = { &dst, &tex_prev, &tex_cur, &tex_next,
76 &dst_width, &dst_height, &dst_pitch,
77 &src_width, &src_height, &
parity, &tff,
78 &skip_spatial_check };
80 CUDA_TEXTURE_DESC tex_desc = {
81 .filterMode = CU_TR_FILTER_MODE_POINT,
82 .flags = CU_TRSF_READ_AS_INTEGER,
85 CUDA_RESOURCE_DESC res_desc = {
86 .resType = CU_RESOURCE_TYPE_PITCH2D,
87 .res.pitch2D.format =
format,
89 .res.pitch2D.width = src_width,
90 .res.pitch2D.height = src_height,
91 .res.pitch2D.pitchInBytes = src_pitch,
94 res_desc.res.pitch2D.devPtr = (CUdeviceptr)prev;
95 ret =
CHECK_CU(cu->cuTexObjectCreate(&tex_prev, &res_desc, &tex_desc,
NULL));
99 res_desc.res.pitch2D.devPtr = (CUdeviceptr)cur;
100 ret =
CHECK_CU(cu->cuTexObjectCreate(&tex_cur, &res_desc, &tex_desc,
NULL));
104 res_desc.res.pitch2D.devPtr = (CUdeviceptr)next;
105 ret =
CHECK_CU(cu->cuTexObjectCreate(&tex_next, &res_desc, &tex_desc,
NULL));
112 0,
s->stream, args,
NULL));
116 CHECK_CU(cu->cuTexObjectDestroy(tex_prev));
118 CHECK_CU(cu->cuTexObjectDestroy(tex_cur));
120 CHECK_CU(cu->cuTexObjectDestroy(tex_next));
130 CudaFunctions *cu =
s->hwctx->internal->cuda_dl;
144 if (
comp->plane <
i) {
150 pixel_size = (
comp->depth +
comp->shift) / 8;
152 if (pixel_size > 2 ||
channels > 2) {
156 switch (pixel_size) {
159 format = CU_AD_FORMAT_UNSIGNED_INT8;
163 format = CU_AD_FORMAT_UNSIGNED_INT16;
170 "Deinterlacing plane %d: pixel_size: %d channels: %d\n",
180 (CUdeviceptr)dst->
data[
i],
198 if (
s->hwctx &&
s->cu_module) {
199 CudaFunctions *cu =
s->hwctx->internal->cuda_dl;
200 CHECK_CU(cu->cuCtxPushCurrent(
s->cu_ctx));
201 CHECK_CU(cu->cuModuleUnload(
s->cu_module));
212 s->input_frames =
NULL;
220 if (!
inlink->hw_frames_ctx) {
222 "required to associate the processing device.\n");
227 if (!
s->input_frames_ref) {
249 if (!
s->device_ref) {
255 s->cu_ctx =
s->hwctx->cuda_ctx;
256 s->stream =
s->hwctx->stream;
257 cu =
s->hwctx->internal->cuda_dl;
270 output_frames->
sw_format =
s->input_frames->sw_format;
271 output_frames->
width =
ctx->inputs[0]->w;
272 output_frames->
height =
ctx->inputs[0]->h;
283 "context for output: %d\n",
ret);
312 ret =
CHECK_CU(cu->cuModuleGetFunction(&
s->cu_func_uchar,
s->cu_module,
"yadif_uchar"));
316 ret =
CHECK_CU(cu->cuModuleGetFunction(&
s->cu_func_uchar2,
s->cu_module,
"yadif_uchar2"));
320 ret =
CHECK_CU(cu->cuModuleGetFunction(&
s->cu_func_ushort,
s->cu_module,
"yadif_ushort"));
324 ret =
CHECK_CU(cu->cuModuleGetFunction(&
s->cu_func_ushort2,
s->cu_module,
"yadif_ushort2"));
361 .
name =
"yadif_cuda",
int(* func)(AVBPrint *dst, const char *in, const char *arg)
@ AV_PIX_FMT_CUDA
HW acceleration through CUDA.
AVHWFramesContext * input_frames
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
#define FF_FILTER_FLAG_HWFRAME_AWARE
The filter is aware of hardware frames, and any hardware frame context should not be automatically pr...
static void comp(unsigned char *dst, ptrdiff_t dst_stride, unsigned char *src, ptrdiff_t src_stride, int add)
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
uint8_t * data
The data buffer.
enum AVPixelFormat format
The pixel format identifying the underlying HW surface type.
int ff_cuda_load_module(void *avctx, AVCUDADeviceContext *hwctx, CUmodule *cu_module, const unsigned char *data, const unsigned int length)
Loads a CUDA module and applies any decompression, if necessary.
The exact code depends on how similar the blocks are and how related they are to the and needs to apply these operations to the correct inlink or outlink if there are several Macros are available to factor that when no extra processing is inlink
const AVPixFmtDescriptor * csp
void av_frame_free(AVFrame **frame)
Free the frame and any dynamically allocated objects in it, e.g.
int av_hwframe_ctx_init(AVBufferRef *ref)
Finalize the context before use.
This structure describes decoded (raw) audio or video data.
AVBufferRef * av_hwframe_ctx_alloc(AVBufferRef *device_ref_in)
Allocate an AVHWFramesContext tied to a given device context.
AVBufferRef * av_buffer_ref(const AVBufferRef *buf)
Create a new reference to an AVBuffer.
const char * name
Filter name.
int width
The allocated dimensions of the frames in this pool.
A link between two filters.
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
static int config_input(AVFilterLink *inlink)
CUfunction cu_func_uchar2
A filter pad used for either input or output.
This struct aggregates all the (hardware/vendor-specific) "high-level" state, i.e.
static void filter(AVFilterContext *ctx, AVFrame *dst, int parity, int tff)
#define AV_LOG_TRACE
Extremely verbose debugging, useful for libav* development.
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
static const AVFilterPad deint_cuda_outputs[]
CUfunction cu_func_ushort2
#define AV_CEIL_RSHIFT(a, b)
const unsigned char ff_vf_yadif_cuda_ptx_data[]
static const AVFilterPad deint_cuda_inputs[]
#define av_assert0(cond)
assert() equivalent, that is always enabled.
uint8_t log2_chroma_w
Amount to shift the luma width right to find the chroma width.
#define FILTER_INPUTS(array)
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a link
#define LIBAVUTIL_VERSION_INT
static const AVClass yadif_cuda_class
Describe the class of an AVClass context structure.
enum AVPixelFormat sw_format
The pixel format identifying the actual data layout of the hardware frames.
void av_buffer_unref(AVBufferRef **buf)
Free a given reference and automatically free the buffer if there are no more references to it.
uint8_t nb_components
The number of components each pixel has, (1-4)
Rational number (pair of numerator and denominator).
const char * av_default_item_name(void *ptr)
Return the context name.
static av_cold void deint_cuda_uninit(AVFilterContext *ctx)
@ AV_CLASS_CATEGORY_FILTER
const unsigned int ff_vf_yadif_cuda_ptx_len
const AVOption ff_yadif_options[]
static int config_output(AVFilterLink *link)
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
void(* filter)(AVFilterContext *ctx, AVFrame *dstpic, int parity, int tff)
AVRational time_base
Time base for the timestamps in this frame.
AVBufferRef * input_frames_ref
#define FILTER_SINGLE_PIXFMT(pix_fmt_)
static CUresult call_kernel(AVFilterContext *ctx, CUfunction func, CUdeviceptr prev, CUdeviceptr cur, CUdeviceptr next, CUarray_format format, int channels, int src_width, int src_height, int src_pitch, CUdeviceptr dst, int dst_width, int dst_height, int dst_pitch, int parity, int tff)
#define i(width, name, range_min, range_max)
const char * name
Pad name.
AVCUDADeviceContext * hwctx
This struct describes a set or pool of "hardware" frames (i.e.
This struct is allocated as AVHWDeviceContext.hwctx.
const char * class_name
The name of the class; usually it is the same name as the context structure type to which the AVClass...
const AVFilter ff_vf_yadif_cuda
AVBufferRef * hw_frames_ctx
For hwaccel-format frames, this should be a reference to the AVHWFramesContext describing the frame.
int ff_yadif_request_frame(AVFilterLink *link)
AVComponentDescriptor comp[4]
Parameters that describe how pixels are packed.
AVRational av_mul_q(AVRational b, AVRational c)
Multiply two rationals.
int initial_pool_size
Initial size of the frame pool.
A reference to a data buffer.
#define FILTER_OUTPUTS(array)
#define AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL
Same as AVFILTER_FLAG_SUPPORT_TIMELINE_GENERIC, except that the filter will have its filter_frame() c...
int linesize[AV_NUM_DATA_POINTERS]
For video, a positive or negative value, which is typically indicating the size in bytes of each pict...
CUfunction cu_func_ushort
static av_cold int uninit(AVCodecContext *avctx)
uint8_t log2_chroma_h
Amount to shift the luma height right to find the chroma height.
int ff_yadif_filter_frame(AVFilterLink *link, AVFrame *frame)
int ff_filter_init_hw_frames(AVFilterContext *avctx, AVFilterLink *link, int default_pool_size)
Perform any additional setup required for hardware frames.