Go to the documentation of this file.
/* Integer division of a by b, rounded up (adds b - 1 before dividing). */
46 #define DIV_UP(a, b) ( ((a) + (b) - 1) / (b) )
/* Round a up to a multiple of b using a bit mask; the mask form is only
 * correct when b is a power of two. */
47 #define ALIGN_UP(a, b) (((a) + (b) - 1) & ~((b) - 1))
/* Forward x to FF_CUDA_CHECK_DL together with ctx and
 * s->hwctx->internal->cuda_dl; both `ctx` and `s` must be in scope at the
 * point of use. */
51 #define CHECK_CU(x) FF_CUDA_CHECK_DL(ctx, s->hwctx->internal->cuda_dl, x)
54 CUdeviceptr prev, CUdeviceptr cur, CUdeviceptr next,
66 CudaFunctions *cu =
s->hwctx->internal->cuda_dl;
67 CUtexObject tex_prev = 0, tex_cur = 0, tex_next = 0;
69 int skip_spatial_check =
s->yadif.mode&2;
71 void *
args[] = { &dst, &tex_prev, &tex_cur, &tex_next,
73 &src_width, &src_height, &
parity, &tff,
74 &skip_spatial_check };
76 CUDA_TEXTURE_DESC tex_desc = {
77 .filterMode = CU_TR_FILTER_MODE_POINT,
78 .flags = CU_TRSF_READ_AS_INTEGER,
81 CUDA_RESOURCE_DESC res_desc = {
82 .resType = CU_RESOURCE_TYPE_PITCH2D,
83 .res.pitch2D.format =
format,
85 .res.pitch2D.width = src_width,
86 .res.pitch2D.height = src_height,
90 res_desc.res.pitch2D.devPtr = (CUdeviceptr)prev;
91 ret =
CHECK_CU(cu->cuTexObjectCreate(&tex_prev, &res_desc, &tex_desc,
NULL));
95 res_desc.res.pitch2D.devPtr = (CUdeviceptr)cur;
96 ret =
CHECK_CU(cu->cuTexObjectCreate(&tex_cur, &res_desc, &tex_desc,
NULL));
100 res_desc.res.pitch2D.devPtr = (CUdeviceptr)next;
101 ret =
CHECK_CU(cu->cuTexObjectCreate(&tex_next, &res_desc, &tex_desc,
NULL));
112 CHECK_CU(cu->cuTexObjectDestroy(tex_prev));
114 CHECK_CU(cu->cuTexObjectDestroy(tex_cur));
116 CHECK_CU(cu->cuTexObjectDestroy(tex_next));
126 CudaFunctions *cu =
s->hwctx->internal->cuda_dl;
140 if (
comp->plane <
i) {
146 pixel_size = (
comp->depth +
comp->shift) / 8;
148 if (pixel_size > 2 ||
channels > 2) {
152 switch (pixel_size) {
155 format = CU_AD_FORMAT_UNSIGNED_INT8;
159 format = CU_AD_FORMAT_UNSIGNED_INT16;
166 "Deinterlacing plane %d: pixel_size: %d channels: %d\n",
176 (CUdeviceptr)dst->
data[
i],
194 if (
s->hwctx &&
s->cu_module) {
195 CudaFunctions *cu =
s->hwctx->internal->cuda_dl;
196 CHECK_CU(cu->cuCtxPushCurrent(
s->cu_ctx));
197 CHECK_CU(cu->cuModuleUnload(
s->cu_module));
208 s->input_frames =
NULL;
219 &
ctx->inputs[0]->out_formats)) < 0)
222 &
ctx->outputs[0]->in_formats)) < 0)
233 if (!
inlink->hw_frames_ctx) {
235 "required to associate the processing device.\n");
240 if (!
s->input_frames_ref) {
262 if (!
s->device_ref) {
268 s->cu_ctx =
s->hwctx->cuda_ctx;
269 s->stream =
s->hwctx->stream;
270 cu =
s->hwctx->internal->cuda_dl;
283 output_frames->
sw_format =
s->input_frames->sw_format;
284 output_frames->
width =
ctx->inputs[0]->w;
285 output_frames->
height =
ctx->inputs[0]->h;
296 "context for output: %d\n",
ret);
300 link->time_base.num =
ctx->inputs[0]->time_base.num;
301 link->time_base.den =
ctx->inputs[0]->time_base.den * 2;
326 ret =
CHECK_CU(cu->cuModuleGetFunction(&
s->cu_func_uchar,
s->cu_module,
"yadif_uchar"));
330 ret =
CHECK_CU(cu->cuModuleGetFunction(&
s->cu_func_uchar2,
s->cu_module,
"yadif_uchar2"));
334 ret =
CHECK_CU(cu->cuModuleGetFunction(&
s->cu_func_ushort,
s->cu_module,
"yadif_ushort"));
338 ret =
CHECK_CU(cu->cuModuleGetFunction(&
s->cu_func_ushort2,
s->cu_module,
"yadif_ushort2"));
377 .
name =
"yadif_cuda",
int(* func)(AVBPrint *dst, const char *in, const char *arg)
@ AV_PIX_FMT_CUDA
HW acceleration through CUDA.
AVPixelFormat
Pixel format.
AVHWFramesContext * input_frames
Filter: the word “frame” indicates either a video frame or a group of audio samples, as stored in an AVFrame structure. Format negotiation: for each input and each output, the list of supported formats. For video, that means pixel format. For audio, that means channel layout, sample format and sample rate; the lists are references to shared objects. When the negotiation mechanism computes the intersection of the formats supported at each end of a link, all references to both lists are replaced with a reference to the intersection. And when a single format is eventually chosen for a link amongst the remaining list, all references to the list are updated. That means that if a filter requires that its input and output have the same format amongst a supported list, all it has to do is use a reference to the same list of formats. query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
AVFilter ff_vf_yadif_cuda
#define FF_FILTER_FLAG_HWFRAME_AWARE
The filter is aware of hardware frames, and any hardware frame context should not be automatically pr...
static void comp(unsigned char *dst, ptrdiff_t dst_stride, unsigned char *src, ptrdiff_t src_stride, int add)
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
uint8_t * data
The data buffer.
enum AVPixelFormat format
The pixel format identifying the underlying HW surface type.
The exact code depends on how similar the blocks are and how related they are to the and needs to apply these operations to the correct inlink or outlink if there are several Macros are available to factor that when no extra processing is inlink
const AVPixFmtDescriptor * csp
void av_frame_free(AVFrame **frame)
Free the frame and any dynamically allocated objects in it, e.g.
int av_hwframe_ctx_init(AVBufferRef *ref)
Finalize the context before use.
This structure describes decoded (raw) audio or video data.
AVBufferRef * av_hwframe_ctx_alloc(AVBufferRef *device_ref_in)
Allocate an AVHWFramesContext tied to a given device context.
const char * name
Filter name.
int width
The allocated dimensions of the frames in this pool.
A link between two filters.
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
static int config_input(AVFilterLink *inlink)
CUfunction cu_func_uchar2
A filter pad used for either input or output.
This struct aggregates all the (hardware/vendor-specific) "high-level" state, i.e.
static void filter(AVFilterContext *ctx, AVFrame *dst, int parity, int tff)
#define AV_LOG_TRACE
Extremely verbose debugging, useful for libav* development.
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
static const AVFilterPad deint_cuda_outputs[]
CUfunction cu_func_ushort2
#define AV_CEIL_RSHIFT(a, b)
Filter: the word “frame” indicates either a video frame or a group of audio samples, as stored in an AVFrame structure. Format negotiation: for each input and each output, the list of supported formats. For video, that means pixel format. For audio, that means channel layout, sample format (the sample packing is implied by the sample format) and sample rate. The lists are not just lists
static const AVFilterPad deint_cuda_inputs[]
#define av_assert0(cond)
assert() equivalent, that is always enabled.
static const AVFilterPad outputs[]
static enum AVPixelFormat pix_fmts[]
uint8_t log2_chroma_w
Amount to shift the luma width right to find the chroma width.
Filter: the word “frame” indicates either a video frame or a group of audio samples, as stored in an AVFrame structure. Format negotiation: for each input and each output, the list of supported formats. For video, that means pixel format. For audio, that means channel layout, sample format and sample rate; the lists are references to shared objects. When the negotiation mechanism computes the intersection of the formats supported at each end of a link
#define LIBAVUTIL_VERSION_INT
static const AVClass yadif_cuda_class
Describe the class of an AVClass context structure.
enum AVPixelFormat sw_format
The pixel format identifying the actual data layout of the hardware frames.
void av_buffer_unref(AVBufferRef **buf)
Free a given reference and automatically free the buffer if there are no more references to it.
uint8_t nb_components
The number of components each pixel has, (1-4)
Rational number (pair of numerator and denominator).
const char * av_default_item_name(void *ptr)
Return the context name.
static av_cold void deint_cuda_uninit(AVFilterContext *ctx)
these buffered frames must be flushed immediately if a new input produces new output; the filter must not call request_frame to get more. It must just process the frame or queue it. The task of requesting more frames is left to the filter's request_frame method or the application. If a filter has several inputs
@ AV_CLASS_CATEGORY_FILTER
const AVOption ff_yadif_options[]
static int config_output(AVFilterLink *link)
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
void(* filter)(AVFilterContext *ctx, AVFrame *dstpic, int parity, int tff)
static int deint_cuda_query_formats(AVFilterContext *ctx)
AVBufferRef * input_frames_ref
BYTE int const BYTE int src_pitch
static CUresult call_kernel(AVFilterContext *ctx, CUfunction func, CUdeviceptr prev, CUdeviceptr cur, CUdeviceptr next, CUarray_format format, int channels, int src_width, int src_height, int src_pitch, CUdeviceptr dst, int dst_width, int dst_height, int dst_pitch, int parity, int tff)
#define i(width, name, range_min, range_max)
const char AVS_Value args
const char * name
Pad name.
AVCUDADeviceContext * hwctx
This struct describes a set or pool of "hardware" frames (i.e.
This struct is allocated as AVHWDeviceContext.hwctx.
const char * class_name
The name of the class; usually it is the same name as the context structure type to which the AVClass...
AVBufferRef * hw_frames_ctx
For hwaccel-format frames, this should be a reference to the AVHWFramesContext describing the frame.
int ff_yadif_request_frame(AVFilterLink *link)
AVComponentDescriptor comp[4]
Parameters that describe how pixels are packed.
AVRational av_mul_q(AVRational b, AVRational c)
Multiply two rationals.
AVBufferRef * av_buffer_ref(AVBufferRef *buf)
Create a new reference to an AVBuffer.
int initial_pool_size
Initial size of the frame pool.
A reference to a data buffer.
static int query_formats(AVFilterContext *ctx)
#define AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL
Same as AVFILTER_FLAG_SUPPORT_TIMELINE_GENERIC, except that the filter will have its filter_frame() c...
#define flags(name, subs,...)
int linesize[AV_NUM_DATA_POINTERS]
For video, size in bytes of each picture line.
CUfunction cu_func_ushort
static av_cold int uninit(AVCodecContext *avctx)
uint8_t log2_chroma_h
Amount to shift the luma height right to find the chroma height.
int ff_yadif_filter_frame(AVFilterLink *link, AVFrame *frame)
int ff_filter_init_hw_frames(AVFilterContext *avctx, AVFilterLink *link, int default_pool_size)
Perform any additional setup required for hardware frames.