FFmpeg
vf_scale_cuda.c
Go to the documentation of this file.
1 /*
2 * Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved.
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
13 *
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
18 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
19 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
20 * DEALINGS IN THE SOFTWARE.
21 */
22 
23 #include <float.h>
24 #include <stdio.h>
25 
26 #include "libavutil/common.h"
27 #include "libavutil/hwcontext.h"
29 #include "libavutil/cuda_check.h"
30 #include "libavutil/internal.h"
31 #include "libavutil/opt.h"
32 #include "libavutil/pixdesc.h"
33 
34 #include "avfilter.h"
35 #include "filters.h"
36 #include "scale_eval.h"
37 #include "video.h"
38 
39 #include "cuda/load_helper.h"
40 #include "vf_scale_cuda.h"
41 
42 static const enum AVPixelFormat supported_formats[] = {
53 };
54 
/* Integer division of a by b, rounded up. Used to derive the launch grid
 * dimensions from the destination size in call_resize_kernel(). */
55 #define DIV_UP(a, b) ( ((a) + (b) - 1) / (b) )
/* Thread-block dimensions passed to cuLaunchKernel() in call_resize_kernel(). */
56 #define BLOCKX 32
57 #define BLOCKY 16
58 
/* Wraps FF_CUDA_CHECK_DL for a CUDA driver call. The expansion refers to
 * `ctx` and `s` by name, so both must be in scope at every use site. */
59 #define CHECK_CU(x) FF_CUDA_CHECK_DL(ctx, s->hwctx->internal->cuda_dl, x)
60 
61 enum {
63 
68 
70 };
71 
72 typedef struct CUDAScaleContext {
73  const AVClass *class;
74 
76 
77  enum AVPixelFormat in_fmt, out_fmt;
82 
85 
88 
89  /**
90  * Output sw format. AV_PIX_FMT_NONE for no conversion.
91  */
93 
94  char *w_expr; ///< width expression string
95  char *h_expr; ///< height expression string
96 
99  int reset_sar;
100 
101  CUcontext cu_ctx;
102  CUmodule cu_module;
103  CUfunction cu_func;
104  CUfunction cu_func_uv;
105  CUstream cu_stream;
106 
110 
111  float param;
113 
115 {
116  CUDAScaleContext *s = ctx->priv;
117 
118  s->frame = av_frame_alloc();
119  if (!s->frame)
120  return AVERROR(ENOMEM);
121 
122  s->tmp_frame = av_frame_alloc();
123  if (!s->tmp_frame)
124  return AVERROR(ENOMEM);
125 
126  return 0;
127 }
128 
130 {
131  CUDAScaleContext *s = ctx->priv;
132 
133  if (s->hwctx && s->cu_module) {
134  CudaFunctions *cu = s->hwctx->internal->cuda_dl;
135  CUcontext dummy;
136 
137  CHECK_CU(cu->cuCtxPushCurrent(s->hwctx->cuda_ctx));
138  CHECK_CU(cu->cuModuleUnload(s->cu_module));
139  s->cu_module = NULL;
140  CHECK_CU(cu->cuCtxPopCurrent(&dummy));
141  }
142 
143  av_frame_free(&s->frame);
144  av_buffer_unref(&s->frames_ctx);
145  av_frame_free(&s->tmp_frame);
146 }
147 
148 static av_cold int init_hwframe_ctx(CUDAScaleContext *s, AVBufferRef *device_ctx, int width, int height)
149 {
150  AVBufferRef *out_ref = NULL;
151  AVHWFramesContext *out_ctx;
152  int ret;
153 
154  out_ref = av_hwframe_ctx_alloc(device_ctx);
155  if (!out_ref)
156  return AVERROR(ENOMEM);
157  out_ctx = (AVHWFramesContext*)out_ref->data;
158 
159  out_ctx->format = AV_PIX_FMT_CUDA;
160  out_ctx->sw_format = s->out_fmt;
161  out_ctx->width = FFALIGN(width, 32);
162  out_ctx->height = FFALIGN(height, 32);
163 
164  ret = av_hwframe_ctx_init(out_ref);
165  if (ret < 0)
166  goto fail;
167 
168  av_frame_unref(s->frame);
169  ret = av_hwframe_get_buffer(out_ref, s->frame, 0);
170  if (ret < 0)
171  goto fail;
172 
173  s->frame->width = width;
174  s->frame->height = height;
175 
176  av_buffer_unref(&s->frames_ctx);
177  s->frames_ctx = out_ref;
178 
179  return 0;
180 fail:
181  av_buffer_unref(&out_ref);
182  return ret;
183 }
184 
185 static int format_is_supported(enum AVPixelFormat fmt)
186 {
187  int i;
188 
189  for (i = 0; i < FF_ARRAY_ELEMS(supported_formats); i++)
190  if (supported_formats[i] == fmt)
191  return 1;
192  return 0;
193 }
194 
195 static av_cold void set_format_info(AVFilterContext *ctx, enum AVPixelFormat in_format, enum AVPixelFormat out_format)
196 {
197  CUDAScaleContext *s = ctx->priv;
198  int i, p, d;
199 
200  s->in_fmt = in_format;
201  s->out_fmt = out_format;
202 
203  s->in_desc = av_pix_fmt_desc_get(s->in_fmt);
204  s->out_desc = av_pix_fmt_desc_get(s->out_fmt);
205  s->in_planes = av_pix_fmt_count_planes(s->in_fmt);
206  s->out_planes = av_pix_fmt_count_planes(s->out_fmt);
207 
208  // find maximum step of each component of each plane
209  // For our subset of formats, this should accurately tell us how many channels CUDA needs
210  // i.e. 1 for Y plane, 2 for UV plane of NV12, 4 for single plane of RGB0 formats
211 
212  for (i = 0; i < s->in_desc->nb_components; i++) {
213  d = (s->in_desc->comp[i].depth + 7) / 8;
214  p = s->in_desc->comp[i].plane;
215  s->in_plane_channels[p] = FFMAX(s->in_plane_channels[p], s->in_desc->comp[i].step / d);
216 
217  s->in_plane_depths[p] = s->in_desc->comp[i].depth;
218  }
219 }
220 
221 static av_cold int init_processing_chain(AVFilterContext *ctx, int in_width, int in_height,
222  int out_width, int out_height)
223 {
224  CUDAScaleContext *s = ctx->priv;
225  FilterLink *inl = ff_filter_link(ctx->inputs[0]);
226  FilterLink *outl = ff_filter_link(ctx->outputs[0]);
227 
228  AVHWFramesContext *in_frames_ctx;
229 
230  enum AVPixelFormat in_format;
231  enum AVPixelFormat out_format;
232  int ret;
233 
234  /* check that we have a hw context */
235  if (!inl->hw_frames_ctx) {
236  av_log(ctx, AV_LOG_ERROR, "No hw context provided on input\n");
237  return AVERROR(EINVAL);
238  }
239  in_frames_ctx = (AVHWFramesContext*)inl->hw_frames_ctx->data;
240  in_format = in_frames_ctx->sw_format;
241  out_format = (s->format == AV_PIX_FMT_NONE) ? in_format : s->format;
242 
243  if (!format_is_supported(in_format)) {
244  av_log(ctx, AV_LOG_ERROR, "Unsupported input format: %s\n",
245  av_get_pix_fmt_name(in_format));
246  return AVERROR(ENOSYS);
247  }
248  if (!format_is_supported(out_format)) {
249  av_log(ctx, AV_LOG_ERROR, "Unsupported output format: %s\n",
250  av_get_pix_fmt_name(out_format));
251  return AVERROR(ENOSYS);
252  }
253 
254  set_format_info(ctx, in_format, out_format);
255 
256  if (s->passthrough && in_width == out_width && in_height == out_height && in_format == out_format) {
257  s->frames_ctx = av_buffer_ref(inl->hw_frames_ctx);
258  if (!s->frames_ctx)
259  return AVERROR(ENOMEM);
260  } else {
261  s->passthrough = 0;
262 
263  ret = init_hwframe_ctx(s, in_frames_ctx->device_ref, out_width, out_height);
264  if (ret < 0)
265  return ret;
266 
267  if (in_width == out_width && in_height == out_height &&
268  in_format == out_format && s->interp_algo == INTERP_ALGO_DEFAULT)
269  s->interp_algo = INTERP_ALGO_NEAREST;
270  }
271 
272  outl->hw_frames_ctx = av_buffer_ref(s->frames_ctx);
273  if (!outl->hw_frames_ctx)
274  return AVERROR(ENOMEM);
275 
276  return 0;
277 }
278 
280 {
281  CUDAScaleContext *s = ctx->priv;
282  CUcontext dummy, cuda_ctx = s->hwctx->cuda_ctx;
283  CudaFunctions *cu = s->hwctx->internal->cuda_dl;
284  char buf[128];
285  int ret;
286 
287  const char *in_fmt_name = av_get_pix_fmt_name(s->in_fmt);
288  const char *out_fmt_name = av_get_pix_fmt_name(s->out_fmt);
289 
290  const char *function_infix = "";
291 
292  extern const unsigned char ff_vf_scale_cuda_ptx_data[];
293  extern const unsigned int ff_vf_scale_cuda_ptx_len;
294 
295  switch(s->interp_algo) {
296  case INTERP_ALGO_NEAREST:
297  function_infix = "Nearest";
298  s->interp_use_linear = 0;
299  s->interp_as_integer = 1;
300  break;
302  function_infix = "Bilinear";
303  s->interp_use_linear = 1;
304  s->interp_as_integer = 1;
305  break;
306  case INTERP_ALGO_DEFAULT:
307  case INTERP_ALGO_BICUBIC:
308  function_infix = "Bicubic";
309  s->interp_use_linear = 0;
310  s->interp_as_integer = 0;
311  break;
312  case INTERP_ALGO_LANCZOS:
313  function_infix = "Lanczos";
314  s->interp_use_linear = 0;
315  s->interp_as_integer = 0;
316  break;
317  default:
318  av_log(ctx, AV_LOG_ERROR, "Unknown interpolation algorithm\n");
319  return AVERROR_BUG;
320  }
321 
322  ret = CHECK_CU(cu->cuCtxPushCurrent(cuda_ctx));
323  if (ret < 0)
324  return ret;
325 
326  ret = ff_cuda_load_module(ctx, s->hwctx, &s->cu_module,
327  ff_vf_scale_cuda_ptx_data, ff_vf_scale_cuda_ptx_len);
328  if (ret < 0)
329  goto fail;
330 
331  snprintf(buf, sizeof(buf), "Subsample_%s_%s_%s", function_infix, in_fmt_name, out_fmt_name);
332  ret = CHECK_CU(cu->cuModuleGetFunction(&s->cu_func, s->cu_module, buf));
333  if (ret < 0) {
334  av_log(ctx, AV_LOG_FATAL, "Unsupported conversion: %s -> %s\n", in_fmt_name, out_fmt_name);
335  ret = AVERROR(ENOSYS);
336  goto fail;
337  }
338 
339  snprintf(buf, sizeof(buf), "Subsample_%s_%s_%s_uv", function_infix, in_fmt_name, out_fmt_name);
340  ret = CHECK_CU(cu->cuModuleGetFunction(&s->cu_func_uv, s->cu_module, buf));
341  if (ret < 0)
342  goto fail;
343 
344 fail:
345  CHECK_CU(cu->cuCtxPopCurrent(&dummy));
346 
347  return ret;
348 }
349 
351 {
352  AVFilterContext *ctx = outlink->src;
353  AVFilterLink *inlink = outlink->src->inputs[0];
355  CUDAScaleContext *s = ctx->priv;
356  AVHWFramesContext *frames_ctx;
357  AVCUDADeviceContext *device_hwctx;
358  int w, h;
359  double w_adj = 1.0;
360  int ret;
361 
363  s->w_expr, s->h_expr,
364  inlink, outlink,
365  &w, &h)) < 0)
366  goto fail;
367 
368  if (s->reset_sar)
369  w_adj = inlink->sample_aspect_ratio.num ?
370  (double)inlink->sample_aspect_ratio.num / inlink->sample_aspect_ratio.den : 1;
371 
373  s->force_original_aspect_ratio, s->force_divisible_by, w_adj);
374 
375  if (((int64_t)h * inlink->w) > INT_MAX ||
376  ((int64_t)w * inlink->h) > INT_MAX)
377  av_log(ctx, AV_LOG_ERROR, "Rescaled value for width or height is too big.\n");
378 
379  outlink->w = w;
380  outlink->h = h;
381 
383  if (ret < 0)
384  return ret;
385 
386  frames_ctx = (AVHWFramesContext*)inl->hw_frames_ctx->data;
387  device_hwctx = frames_ctx->device_ctx->hwctx;
388 
389  s->hwctx = device_hwctx;
390  s->cu_stream = s->hwctx->stream;
391 
392  if (s->reset_sar)
393  outlink->sample_aspect_ratio = (AVRational){1, 1};
394  else if (inlink->sample_aspect_ratio.num) {
395  outlink->sample_aspect_ratio = av_mul_q((AVRational){outlink->h*inlink->w,
396  outlink->w*inlink->h},
397  inlink->sample_aspect_ratio);
398  } else {
399  outlink->sample_aspect_ratio = inlink->sample_aspect_ratio;
400  }
401 
402  av_log(ctx, AV_LOG_VERBOSE, "w:%d h:%d fmt:%s -> w:%d h:%d fmt:%s%s\n",
403  inlink->w, inlink->h, av_get_pix_fmt_name(s->in_fmt),
404  outlink->w, outlink->h, av_get_pix_fmt_name(s->out_fmt),
405  s->passthrough ? " (passthrough)" : "");
406 
408  if (ret < 0)
409  return ret;
410 
411  return 0;
412 
413 fail:
414  return ret;
415 }
416 
417 static int call_resize_kernel(AVFilterContext *ctx, CUfunction func,
418  CUtexObject src_tex[4], int src_left, int src_top, int src_width, int src_height,
419  AVFrame *out_frame, int dst_width, int dst_height, int dst_pitch)
420 {
421  CUDAScaleContext *s = ctx->priv;
422  CudaFunctions *cu = s->hwctx->internal->cuda_dl;
423 
424  CUdeviceptr dst_devptr[4] = {
425  (CUdeviceptr)out_frame->data[0], (CUdeviceptr)out_frame->data[1],
426  (CUdeviceptr)out_frame->data[2], (CUdeviceptr)out_frame->data[3]
427  };
428 
429  void *args_uchar[] = {
430  &src_tex[0], &src_tex[1], &src_tex[2], &src_tex[3],
431  &dst_devptr[0], &dst_devptr[1], &dst_devptr[2], &dst_devptr[3],
432  &dst_width, &dst_height, &dst_pitch,
433  &src_left, &src_top, &src_width, &src_height, &s->param
434  };
435 
436  return CHECK_CU(cu->cuLaunchKernel(func,
437  DIV_UP(dst_width, BLOCKX), DIV_UP(dst_height, BLOCKY), 1,
438  BLOCKX, BLOCKY, 1, 0, s->cu_stream, args_uchar, NULL));
439 }
440 
442  AVFrame *out, AVFrame *in)
443 {
444  CUDAScaleContext *s = ctx->priv;
445  CudaFunctions *cu = s->hwctx->internal->cuda_dl;
446  CUcontext dummy, cuda_ctx = s->hwctx->cuda_ctx;
447  int i, ret;
448 
449  CUtexObject tex[4] = { 0, 0, 0, 0 };
450 
451  int crop_width = (in->width - in->crop_right) - in->crop_left;
452  int crop_height = (in->height - in->crop_bottom) - in->crop_top;
453 
454  ret = CHECK_CU(cu->cuCtxPushCurrent(cuda_ctx));
455  if (ret < 0)
456  return ret;
457 
458  for (i = 0; i < s->in_planes; i++) {
459  CUDA_TEXTURE_DESC tex_desc = {
460  .filterMode = s->interp_use_linear ?
461  CU_TR_FILTER_MODE_LINEAR :
462  CU_TR_FILTER_MODE_POINT,
463  .flags = s->interp_as_integer ? CU_TRSF_READ_AS_INTEGER : 0,
464  };
465 
466  CUDA_RESOURCE_DESC res_desc = {
467  .resType = CU_RESOURCE_TYPE_PITCH2D,
468  .res.pitch2D.format = s->in_plane_depths[i] <= 8 ?
469  CU_AD_FORMAT_UNSIGNED_INT8 :
470  CU_AD_FORMAT_UNSIGNED_INT16,
471  .res.pitch2D.numChannels = s->in_plane_channels[i],
472  .res.pitch2D.pitchInBytes = in->linesize[i],
473  .res.pitch2D.devPtr = (CUdeviceptr)in->data[i],
474  };
475 
476  if (i == 1 || i == 2) {
477  res_desc.res.pitch2D.width = AV_CEIL_RSHIFT(in->width, s->in_desc->log2_chroma_w);
478  res_desc.res.pitch2D.height = AV_CEIL_RSHIFT(in->height, s->in_desc->log2_chroma_h);
479  } else {
480  res_desc.res.pitch2D.width = in->width;
481  res_desc.res.pitch2D.height = in->height;
482  }
483 
484  ret = CHECK_CU(cu->cuTexObjectCreate(&tex[i], &res_desc, &tex_desc, NULL));
485  if (ret < 0)
486  goto exit;
487  }
488 
489  // scale primary plane(s). Usually Y (and A), or single plane of RGB frames.
490  ret = call_resize_kernel(ctx, s->cu_func,
491  tex, in->crop_left, in->crop_top, crop_width, crop_height,
492  out, out->width, out->height, out->linesize[0]);
493  if (ret < 0)
494  goto exit;
495 
496  if (s->out_planes > 1) {
497  // scale UV plane. Scale function sets both U and V plane, or singular interleaved plane.
498  ret = call_resize_kernel(ctx, s->cu_func_uv, tex,
499  AV_CEIL_RSHIFT(in->crop_left, s->in_desc->log2_chroma_w),
500  AV_CEIL_RSHIFT(in->crop_top, s->in_desc->log2_chroma_h),
501  AV_CEIL_RSHIFT(crop_width, s->in_desc->log2_chroma_w),
502  AV_CEIL_RSHIFT(crop_height, s->in_desc->log2_chroma_h),
503  out,
504  AV_CEIL_RSHIFT(out->width, s->out_desc->log2_chroma_w),
505  AV_CEIL_RSHIFT(out->height, s->out_desc->log2_chroma_h),
506  out->linesize[1]);
507  if (ret < 0)
508  goto exit;
509  }
510 
511 exit:
512  for (i = 0; i < s->in_planes; i++)
513  if (tex[i])
514  CHECK_CU(cu->cuTexObjectDestroy(tex[i]));
515 
516  CHECK_CU(cu->cuCtxPopCurrent(&dummy));
517 
518  return ret;
519 }
520 
522 {
523  CUDAScaleContext *s = ctx->priv;
524  AVFilterLink *outlink = ctx->outputs[0];
525  AVFrame *src = in;
526  int ret;
527 
528  ret = scalecuda_resize(ctx, s->frame, src);
529  if (ret < 0)
530  return ret;
531 
532  src = s->frame;
533  ret = av_hwframe_get_buffer(src->hw_frames_ctx, s->tmp_frame, 0);
534  if (ret < 0)
535  return ret;
536 
537  av_frame_move_ref(out, s->frame);
538  av_frame_move_ref(s->frame, s->tmp_frame);
539 
540  s->frame->width = outlink->w;
541  s->frame->height = outlink->h;
542 
543  ret = av_frame_copy_props(out, in);
544  if (ret < 0)
545  return ret;
546 
547  if (out->width != in->width || out->height != in->height) {
548  av_frame_side_data_remove_by_props(&out->side_data, &out->nb_side_data,
550  }
551 
552  return 0;
553 }
554 
556 {
557  AVFilterContext *ctx = link->dst;
558  CUDAScaleContext *s = ctx->priv;
559  AVFilterLink *outlink = ctx->outputs[0];
560  CudaFunctions *cu = s->hwctx->internal->cuda_dl;
561 
562  AVFrame *out = NULL;
563  CUcontext dummy;
564  int ret = 0;
565 
566  if (s->passthrough)
567  return ff_filter_frame(outlink, in);
568 
569  out = av_frame_alloc();
570  if (!out) {
571  ret = AVERROR(ENOMEM);
572  goto fail;
573  }
574 
575  ret = CHECK_CU(cu->cuCtxPushCurrent(s->hwctx->cuda_ctx));
576  if (ret < 0)
577  goto fail;
578 
579  ret = cudascale_scale(ctx, out, in);
580 
581  CHECK_CU(cu->cuCtxPopCurrent(&dummy));
582  if (ret < 0)
583  goto fail;
584 
585  if (s->reset_sar) {
586  out->sample_aspect_ratio = (AVRational){1, 1};
587  } else {
588  av_reduce(&out->sample_aspect_ratio.num, &out->sample_aspect_ratio.den,
589  (int64_t)in->sample_aspect_ratio.num * outlink->h * link->w,
590  (int64_t)in->sample_aspect_ratio.den * outlink->w * link->h,
591  INT_MAX);
592  }
593 
594  av_frame_free(&in);
595  return ff_filter_frame(outlink, out);
596 fail:
597  av_frame_free(&in);
598  av_frame_free(&out);
599  return ret;
600 }
601 
603 {
604  CUDAScaleContext *s = inlink->dst->priv;
605 
606  return s->passthrough ?
609 }
610 
/* Byte offset of a field inside CUDAScaleContext, for the option table below. */
611 #define OFFSET(x) offsetof(CUDAScaleContext, x)
/* Flags shared by every option: video filtering parameter. */
612 #define FLAGS (AV_OPT_FLAG_FILTERING_PARAM|AV_OPT_FLAG_VIDEO_PARAM)
/* User-visible options of the filter, stored into CUDAScaleContext fields.
 * AV_OPT_TYPE_CONST entries are named values for the option sharing their
 * .unit string. The table is terminated by the { NULL } entry. */
613 static const AVOption options[] = {
 /* Output size, given as strings stored in w_expr/h_expr; defaults are "iw" and "ih". */
614  { "w", "Output video width", OFFSET(w_expr), AV_OPT_TYPE_STRING, { .str = "iw" }, .flags = FLAGS },
615  { "h", "Output video height", OFFSET(h_expr), AV_OPT_TYPE_STRING, { .str = "ih" }, .flags = FLAGS },
 /* Interpolation algorithm, one of the INTERP_ALGO_* values below. */
616  { "interp_algo", "Interpolation algorithm used for resizing", OFFSET(interp_algo), AV_OPT_TYPE_INT, { .i64 = INTERP_ALGO_DEFAULT }, 0, INTERP_ALGO_COUNT - 1, FLAGS, .unit = "interp_algo" },
617  { "nearest", "nearest neighbour", 0, AV_OPT_TYPE_CONST, { .i64 = INTERP_ALGO_NEAREST }, 0, 0, FLAGS, .unit = "interp_algo" },
618  { "bilinear", "bilinear", 0, AV_OPT_TYPE_CONST, { .i64 = INTERP_ALGO_BILINEAR }, 0, 0, FLAGS, .unit = "interp_algo" },
619  { "bicubic", "bicubic", 0, AV_OPT_TYPE_CONST, { .i64 = INTERP_ALGO_BICUBIC }, 0, 0, FLAGS, .unit = "interp_algo" },
620  { "lanczos", "lanczos", 0, AV_OPT_TYPE_CONST, { .i64 = INTERP_ALGO_LANCZOS }, 0, 0, FLAGS, .unit = "interp_algo" },
 /* Output software pixel format; AV_PIX_FMT_NONE (the default) keeps the input format. */
621  { "format", "Output video pixel format", OFFSET(format), AV_OPT_TYPE_PIXEL_FMT, { .i64 = AV_PIX_FMT_NONE }, INT_MIN, INT_MAX, .flags=FLAGS },
 /* Enabled by default; honoured only when size and format are unchanged (see init_processing_chain()). */
622  { "passthrough", "Do not process frames at all if parameters match", OFFSET(passthrough), AV_OPT_TYPE_BOOL, { .i64 = 1 }, 0, 1, FLAGS },
 /* Float handed to the resize kernels as their last argument (see call_resize_kernel()). */
623  { "param", "Algorithm-Specific parameter", OFFSET(param), AV_OPT_TYPE_FLOAT, { .dbl = SCALE_CUDA_PARAM_DEFAULT }, -FLT_MAX, FLT_MAX, FLAGS },
 /* Aspect-ratio handling: 0 = disable, 1 = decrease, 2 = increase. */
624  { "force_original_aspect_ratio", "decrease or increase w/h if necessary to keep the original AR", OFFSET(force_original_aspect_ratio), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 2, FLAGS, .unit = "force_oar" },
625  { "disable", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = 0 }, 0, 0, FLAGS, .unit = "force_oar" },
626  { "decrease", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = 1 }, 0, 0, FLAGS, .unit = "force_oar" },
627  { "increase", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = 2 }, 0, 0, FLAGS, .unit = "force_oar" },
628  { "force_divisible_by", "enforce that the output resolution is divisible by a defined integer when force_original_aspect_ratio is used", OFFSET(force_divisible_by), AV_OPT_TYPE_INT, { .i64 = 1 }, 1, 256, FLAGS },
 /* Off by default; when set, the output sample aspect ratio is forced to 1:1. */
629  { "reset_sar", "reset SAR to 1 and scale to square pixels if scaling proportionally", OFFSET(reset_sar), AV_OPT_TYPE_BOOL, { .i64 = 0}, 0, 1, FLAGS },
630  { NULL },
631 };
632 
/* AVClass for the filter's private context: named "cudascale" and bound to
 * the `options` table. Referenced from the filter definition as priv_class. */
633 static const AVClass cudascale_class = {
634  .class_name = "cudascale",
635  .item_name = av_default_item_name,
636  .option = options,
637  .version = LIBAVUTIL_VERSION_INT,
638 };
639 
/* The single video input pad. Incoming frames are handled by
 * cudascale_filter_frame(); video buffer requests go through
 * cudascale_get_video_buffer(). */
640 static const AVFilterPad cudascale_inputs[] = {
641  {
642  .name = "default",
643  .type = AVMEDIA_TYPE_VIDEO,
644  .filter_frame = cudascale_filter_frame,
645  .get_buffer.video = cudascale_get_video_buffer,
646  },
647 };
648 
/* The single video output pad. Its properties (size, sample aspect ratio,
 * hw frames context) are set up by cudascale_config_props(). */
649 static const AVFilterPad cudascale_outputs[] = {
650  {
651  .name = "default",
652  .type = AVMEDIA_TYPE_VIDEO,
653  .config_props = cudascale_config_props,
654  },
655 };
656 
658  .p.name = "scale_cuda",
659  .p.description = NULL_IF_CONFIG_SMALL("GPU accelerated video resizer"),
660 
661  .p.priv_class = &cudascale_class,
662 
663  .init = cudascale_init,
664  .uninit = cudascale_uninit,
665 
666  .priv_size = sizeof(CUDAScaleContext),
667 
670 
672 
673  .flags_internal = FF_FILTER_FLAG_HWFRAME_AWARE,
674 };
options
static const AVOption options[]
Definition: vf_scale_cuda.c:613
func
int(* func)(AVBPrint *dst, const char *in, const char *arg)
Definition: jacosubdec.c:68
AVHWDeviceContext::hwctx
void * hwctx
The format-specific data, allocated and freed by libavutil along with this context.
Definition: hwcontext.h:86
AV_PIX_FMT_CUDA
@ AV_PIX_FMT_CUDA
HW acceleration through CUDA.
Definition: pixfmt.h:260
AVPixelFormat
AVPixelFormat
Pixel format.
Definition: pixfmt.h:71
AVERROR
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism toagain later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
opt.h
CUDAScaleContext::frames_ctx
AVBufferRef * frames_ctx
Definition: vf_scale_cuda.c:83
hwcontext_cuda_internal.h
cudascale_init
static av_cold int cudascale_init(AVFilterContext *ctx)
Definition: vf_scale_cuda.c:114
out
FILE * out
Definition: movenc.c:55
AV_PIX_FMT_BGR32
#define AV_PIX_FMT_BGR32
Definition: pixfmt.h:490
ff_filter_frame
int ff_filter_frame(AVFilterLink *link, AVFrame *frame)
Send a frame of data to the next filter.
Definition: avfilter.c:1078
av_pix_fmt_desc_get
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
Definition: pixdesc.c:3248
AVBufferRef::data
uint8_t * data
The data buffer.
Definition: buffer.h:90
AVHWFramesContext::format
enum AVPixelFormat format
The pixel format identifying the underlying HW surface type.
Definition: hwcontext.h:198
ff_cuda_load_module
int ff_cuda_load_module(void *avctx, AVCUDADeviceContext *hwctx, CUmodule *cu_module, const unsigned char *data, const unsigned int length)
Loads a CUDA module and applies any decompression, if necessary.
Definition: load_helper.c:35
int64_t
long long int64_t
Definition: coverity.c:34
inlink
The exact code depends on how similar the blocks are and how related they are to the and needs to apply these operations to the correct inlink or outlink if there are several Macros are available to factor that when no extra processing is inlink
Definition: filter_design.txt:212
CUDAScaleContext::tmp_frame
AVFrame * tmp_frame
Definition: vf_scale_cuda.c:86
CUDAScaleContext::passthrough
int passthrough
Definition: vf_scale_cuda.c:87
cudascale_uninit
static av_cold void cudascale_uninit(AVFilterContext *ctx)
Definition: vf_scale_cuda.c:129
av_frame_free
void av_frame_free(AVFrame **frame)
Free the frame and any dynamically allocated objects in it, e.g.
Definition: frame.c:163
av_hwframe_ctx_init
int av_hwframe_ctx_init(AVBufferRef *ref)
Finalize the context before use.
Definition: hwcontext.c:326
FILTER_INPUTS
#define FILTER_INPUTS(array)
Definition: filters.h:262
CUDAScaleContext::w_expr
char * w_expr
width expression string
Definition: vf_scale_cuda.c:94
AVFrame
This structure describes decoded (raw) audio or video data.
Definition: frame.h:410
pixdesc.h
AVFrame::width
int width
Definition: frame.h:482
w
uint8_t w
Definition: llviddspenc.c:38
av_hwframe_ctx_alloc
AVBufferRef * av_hwframe_ctx_alloc(AVBufferRef *device_ref_in)
Allocate an AVHWFramesContext tied to a given device context.
Definition: hwcontext.c:252
AVOption
AVOption.
Definition: opt.h:429
init_hwframe_ctx
static av_cold int init_hwframe_ctx(CUDAScaleContext *s, AVBufferRef *device_ctx, int width, int height)
Definition: vf_scale_cuda.c:148
call_resize_kernel
static int call_resize_kernel(AVFilterContext *ctx, CUfunction func, CUtexObject src_tex[4], int src_left, int src_top, int src_width, int src_height, AVFrame *out_frame, int dst_width, int dst_height, int dst_pitch)
Definition: vf_scale_cuda.c:417
CUDAScaleContext::interp_use_linear
int interp_use_linear
Definition: vf_scale_cuda.c:108
FLAGS
#define FLAGS
Definition: vf_scale_cuda.c:612
AV_LOG_VERBOSE
#define AV_LOG_VERBOSE
Detailed information.
Definition: log.h:225
ff_scale_eval_dimensions
int ff_scale_eval_dimensions(void *log_ctx, const char *w_expr, const char *h_expr, AVFilterLink *inlink, AVFilterLink *outlink, int *ret_w, int *ret_h)
Parse and evaluate string expressions for width and height.
Definition: scale_eval.c:57
float.h
DIV_UP
#define DIV_UP(a, b)
Definition: vf_scale_cuda.c:55
FFMAX
#define FFMAX(a, b)
Definition: macros.h:47
av_buffer_ref
AVBufferRef * av_buffer_ref(const AVBufferRef *buf)
Create a new reference to an AVBuffer.
Definition: buffer.c:103
AVFilter::name
const char * name
Filter name.
Definition: avfilter.h:203
AVHWFramesContext::width
int width
The allocated dimensions of the frames in this pool.
Definition: hwcontext.h:218
INTERP_ALGO_COUNT
@ INTERP_ALGO_COUNT
Definition: vf_scale_cuda.c:69
video.h
AVFrame::data
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
Definition: frame.h:431
CUDAScaleContext::frame
AVFrame * frame
Definition: vf_scale_cuda.c:84
ff_default_get_video_buffer
AVFrame * ff_default_get_video_buffer(AVFilterLink *link, int w, int h)
Definition: video.c:111
av_pix_fmt_count_planes
int av_pix_fmt_count_planes(enum AVPixelFormat pix_fmt)
Definition: pixdesc.c:3288
CUDAScaleContext::cu_func_uv
CUfunction cu_func_uv
Definition: vf_scale_cuda.c:104
vf_scale_cuda.h
INTERP_ALGO_DEFAULT
@ INTERP_ALGO_DEFAULT
Definition: vf_scale_cuda.c:62
fail
#define fail()
Definition: checkasm.h:193
CHECK_CU
#define CHECK_CU(x)
Definition: vf_scale_cuda.c:59
CUDAScaleContext::in_planes
int in_planes
Definition: vf_scale_cuda.c:79
dummy
int dummy
Definition: motion.c:66
scalecuda_resize
static int scalecuda_resize(AVFilterContext *ctx, AVFrame *out, AVFrame *in)
Definition: vf_scale_cuda.c:441
CUDAScaleContext::in_plane_channels
int in_plane_channels[4]
Definition: vf_scale_cuda.c:81
CUDAScaleContext::reset_sar
int reset_sar
Definition: vf_scale_cuda.c:99
av_reduce
int av_reduce(int *dst_num, int *dst_den, int64_t num, int64_t den, int64_t max)
Reduce a fraction.
Definition: rational.c:35
AVRational::num
int num
Numerator.
Definition: rational.h:59
cudascale_load_functions
static av_cold int cudascale_load_functions(AVFilterContext *ctx)
Definition: vf_scale_cuda.c:279
AV_SIDE_DATA_PROP_SIZE_DEPENDENT
@ AV_SIDE_DATA_PROP_SIZE_DEPENDENT
Side data depends on the video dimensions.
Definition: frame.h:292
AVFilterPad
A filter pad used for either input or output.
Definition: filters.h:38
av_frame_alloc
AVFrame * av_frame_alloc(void)
Allocate an AVFrame and set its fields to default values.
Definition: frame.c:151
cudascale_class
static const AVClass cudascale_class
Definition: vf_scale_cuda.c:633
cudascale_config_props
static av_cold int cudascale_config_props(AVFilterLink *outlink)
Definition: vf_scale_cuda.c:350
CUDAScaleContext::hwctx
AVCUDADeviceContext * hwctx
Definition: vf_scale_cuda.c:75
AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:209
set_format_info
static av_cold void set_format_info(AVFilterContext *ctx, enum AVPixelFormat in_format, enum AVPixelFormat out_format)
Definition: vf_scale_cuda.c:195
FF_ARRAY_ELEMS
#define FF_ARRAY_ELEMS(a)
Definition: sinewin_tablegen.c:29
av_cold
#define av_cold
Definition: attributes.h:90
AVHWFramesContext::height
int height
Definition: hwcontext.h:218
FFFilter
Definition: filters.h:265
CUDAScaleContext::interp_as_integer
int interp_as_integer
Definition: vf_scale_cuda.c:109
s
#define s(width, name)
Definition: cbs_vp9.c:198
AV_PIX_FMT_YUV444P16
#define AV_PIX_FMT_YUV444P16
Definition: pixfmt.h:528
AV_CEIL_RSHIFT
#define AV_CEIL_RSHIFT(a, b)
Definition: common.h:60
INTERP_ALGO_LANCZOS
@ INTERP_ALGO_LANCZOS
Definition: vf_scale_cuda.c:67
format
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample format(the sample packing is implied by the sample format) and sample rate. The lists are not just lists
AV_PIX_FMT_0BGR32
#define AV_PIX_FMT_0BGR32
Definition: pixfmt.h:493
INTERP_ALGO_BICUBIC
@ INTERP_ALGO_BICUBIC
Definition: vf_scale_cuda.c:66
ff_vf_scale_cuda
const FFFilter ff_vf_scale_cuda
Definition: vf_scale_cuda.c:657
CUDAScaleContext::cu_stream
CUstream cu_stream
Definition: vf_scale_cuda.c:105
filters.h
ctx
AVFormatContext * ctx
Definition: movenc.c:49
load_helper.h
AVFrame::crop_right
size_t crop_right
Definition: frame.h:798
AV_PIX_FMT_YUV420P
@ AV_PIX_FMT_YUV420P
planar YUV 4:2:0, 12bpp, (1 Cr & Cb sample per 2x2 Y samples)
Definition: pixfmt.h:73
FILTER_OUTPUTS
#define FILTER_OUTPUTS(array)
Definition: filters.h:263
format_is_supported
static int format_is_supported(enum AVPixelFormat fmt)
Definition: vf_scale_cuda.c:185
link
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a link
Definition: filter_design.txt:23
CUDAScaleContext::param
float param
Definition: vf_scale_cuda.c:111
if
if(ret)
Definition: filter_design.txt:179
CUDAScaleContext::force_divisible_by
int force_divisible_by
Definition: vf_scale_cuda.c:98
LIBAVUTIL_VERSION_INT
#define LIBAVUTIL_VERSION_INT
Definition: version.h:85
CUDAScaleContext::interp_algo
int interp_algo
Definition: vf_scale_cuda.c:107
AVClass
Describe the class of an AVClass context structure.
Definition: log.h:75
OFFSET
#define OFFSET(x)
Definition: vf_scale_cuda.c:611
NULL
#define NULL
Definition: coverity.c:32
AVHWFramesContext::sw_format
enum AVPixelFormat sw_format
The pixel format identifying the actual data layout of the hardware frames.
Definition: hwcontext.h:211
av_frame_copy_props
int av_frame_copy_props(AVFrame *dst, const AVFrame *src)
Copy only "metadata" fields from src to dst.
Definition: frame.c:726
av_buffer_unref
void av_buffer_unref(AVBufferRef **buf)
Free a given reference and automatically free the buffer if there are no more references to it.
Definition: buffer.c:139
CUDAScaleContext::out_desc
const AVPixFmtDescriptor * out_desc
Definition: vf_scale_cuda.c:78
CUDAScaleContext::h_expr
char * h_expr
height expression string
Definition: vf_scale_cuda.c:95
BLOCKY
#define BLOCKY
Definition: vf_scale_cuda.c:57
AVRational
Rational number (pair of numerator and denominator).
Definition: rational.h:58
AVHWFramesContext::device_ref
AVBufferRef * device_ref
A reference to the parent AVHWDeviceContext.
Definition: hwcontext.h:127
AVFilterContext::inputs
AVFilterLink ** inputs
array of pointers to input links
Definition: avfilter.h:265
av_default_item_name
const char * av_default_item_name(void *ptr)
Return the context name.
Definition: log.c:239
options
Definition: swscale.c:42
double
double
Definition: af_crystalizer.c:132
ff_filter_link
static FilterLink * ff_filter_link(AVFilterLink *link)
Definition: filters.h:197
AVFrame::crop_bottom
size_t crop_bottom
Definition: frame.h:796
FF_FILTER_FLAG_HWFRAME_AWARE
#define FF_FILTER_FLAG_HWFRAME_AWARE
The filter is aware of hardware frames, and any hardware frame context should not be automatically propagated through it.
Definition: filters.h:206
cudascale_inputs
static const AVFilterPad cudascale_inputs[]
Definition: vf_scale_cuda.c:640
AVFrame::crop_left
size_t crop_left
Definition: frame.h:797
NULL_IF_CONFIG_SMALL
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
Definition: internal.h:94
height
#define height
Definition: dsp.h:85
CUDAScaleContext::cu_func
CUfunction cu_func
Definition: vf_scale_cuda.c:103
scale_eval.h
AV_PIX_FMT_RGB32
#define AV_PIX_FMT_RGB32
Definition: pixfmt.h:488
av_frame_side_data_remove_by_props
void av_frame_side_data_remove_by_props(AVFrameSideData ***sd, int *nb_sd, int props)
Remove and free all side data instances that match any of the given side data properties.
Definition: frame.c:967
CUDAScaleContext::cu_module
CUmodule cu_module
Definition: vf_scale_cuda.c:102
ff_null_get_video_buffer
AVFrame * ff_null_get_video_buffer(AVFilterLink *link, int w, int h)
Definition: video.c:44
CUDAScaleContext
Definition: vf_scale_cuda.c:72
AV_OPT_TYPE_FLOAT
@ AV_OPT_TYPE_FLOAT
Underlying C type is float.
Definition: opt.h:271
supported_formats
static enum AVPixelFormat supported_formats[]
Definition: vf_scale_cuda.c:42
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:256
internal.h
common.h
av_frame_move_ref
void av_frame_move_ref(AVFrame *dst, AVFrame *src)
Move everything contained in src to dst and reset src.
Definition: frame.c:650
av_frame_unref
void av_frame_unref(AVFrame *frame)
Unreference all the buffers referenced by frame and reset the frame fields.
Definition: frame.c:623
AVFilterPad::name
const char * name
Pad name.
Definition: filters.h:44
AV_PIX_FMT_P016
#define AV_PIX_FMT_P016
Definition: pixfmt.h:570
CUDAScaleContext::in_plane_depths
int in_plane_depths[4]
Definition: vf_scale_cuda.c:80
AVHWFramesContext
This struct describes a set or pool of "hardware" frames (i.e. those with data not located in normal system memory).
Definition: hwcontext.h:116
AVCUDADeviceContext
This struct is allocated as AVHWDeviceContext.hwctx.
Definition: hwcontext_cuda.h:42
BLOCKX
#define BLOCKX
Definition: vf_scale_cuda.c:56
CUDAScaleContext::out_fmt
enum AVPixelFormat out_fmt
Definition: vf_scale_cuda.c:77
ret
ret
Definition: filter_design.txt:187
AV_LOG_FATAL
#define AV_LOG_FATAL
Something went wrong and recovery is not possible.
Definition: log.h:203
AV_PIX_FMT_NV12
@ AV_PIX_FMT_NV12
planar YUV 4:2:0, 12bpp, 1 plane for Y and 1 plane for the UV components, which are interleaved (first byte U and the following byte V)
Definition: pixfmt.h:96
AVClass::class_name
const char * class_name
The name of the class; usually it is the same name as the context structure type to which the AVClass is associated.
Definition: log.h:80
AV_PIX_FMT_0RGB32
#define AV_PIX_FMT_0RGB32
Definition: pixfmt.h:492
AVHWFramesContext::device_ctx
AVHWDeviceContext * device_ctx
The parent AVHWDeviceContext.
Definition: hwcontext.h:135
cuda_check.h
AVFrame::sample_aspect_ratio
AVRational sample_aspect_ratio
Sample aspect ratio for the video frame, 0/1 if unknown/unspecified.
Definition: frame.h:517
AVFrame::height
int height
Definition: frame.h:482
cudascale_get_video_buffer
static AVFrame * cudascale_get_video_buffer(AVFilterLink *inlink, int w, int h)
Definition: vf_scale_cuda.c:602
AVRational::den
int den
Denominator.
Definition: rational.h:60
AV_PIX_FMT_NONE
@ AV_PIX_FMT_NONE
Definition: pixfmt.h:72
AV_OPT_TYPE_INT
@ AV_OPT_TYPE_INT
Underlying C type is int.
Definition: opt.h:259
avfilter.h
INTERP_ALGO_BILINEAR
@ INTERP_ALGO_BILINEAR
Definition: vf_scale_cuda.c:65
AV_OPT_TYPE_PIXEL_FMT
@ AV_OPT_TYPE_PIXEL_FMT
Underlying C type is enum AVPixelFormat.
Definition: opt.h:307
av_mul_q
AVRational av_mul_q(AVRational b, AVRational c)
Multiply two rationals.
Definition: rational.c:80
AV_PIX_FMT_YUV444P
@ AV_PIX_FMT_YUV444P
planar YUV 4:4:4, 24bpp, (1 Cr & Cb sample per 1x1 Y samples)
Definition: pixfmt.h:78
INTERP_ALGO_NEAREST
@ INTERP_ALGO_NEAREST
Definition: vf_scale_cuda.c:64
AVFilterContext
An instance of a filter.
Definition: avfilter.h:257
AV_PIX_FMT_P010
#define AV_PIX_FMT_P010
Definition: pixfmt.h:568
cudascale_outputs
static const AVFilterPad cudascale_outputs[]
Definition: vf_scale_cuda.c:649
AVMEDIA_TYPE_VIDEO
@ AVMEDIA_TYPE_VIDEO
Definition: avutil.h:201
FFFilter::p
AVFilter p
The public AVFilter.
Definition: filters.h:269
AVBufferRef
A reference to a data buffer.
Definition: buffer.h:82
cudascale_scale
static int cudascale_scale(AVFilterContext *ctx, AVFrame *out, AVFrame *in)
Definition: vf_scale_cuda.c:521
cudascale_filter_frame
static int cudascale_filter_frame(AVFilterLink *link, AVFrame *in)
Definition: vf_scale_cuda.c:555
AVPixFmtDescriptor
Descriptor that unambiguously describes how the bits of a pixel are stored in the up to 4 data planes of an image.
Definition: pixdesc.h:69
CUDAScaleContext::force_original_aspect_ratio
int force_original_aspect_ratio
Definition: vf_scale_cuda.c:97
CUDAScaleContext::format
enum AVPixelFormat format
Output sw format.
Definition: vf_scale_cuda.c:92
FFALIGN
#define FFALIGN(x, a)
Definition: macros.h:78
AV_OPT_TYPE_BOOL
@ AV_OPT_TYPE_BOOL
Underlying C type is int.
Definition: opt.h:327
AVFrame::crop_top
size_t crop_top
Definition: frame.h:795
SCALE_CUDA_PARAM_DEFAULT
#define SCALE_CUDA_PARAM_DEFAULT
Definition: vf_scale_cuda.h:26
CUDAScaleContext::in_desc
const AVPixFmtDescriptor * in_desc
Definition: vf_scale_cuda.c:78
init_processing_chain
static av_cold int init_processing_chain(AVFilterContext *ctx, int in_width, int in_height, int out_width, int out_height)
Definition: vf_scale_cuda.c:221
hwcontext.h
AVERROR_BUG
#define AVERROR_BUG
Internal bug, also see AVERROR_BUG2.
Definition: error.h:52
AVFrame::linesize
int linesize[AV_NUM_DATA_POINTERS]
For video, a positive or negative value, which is typically indicating the size in bytes of each picture line.
Definition: frame.h:455
av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:27
h
h
Definition: vp9dsp_template.c:2070
AV_OPT_TYPE_STRING
@ AV_OPT_TYPE_STRING
Underlying C type is a uint8_t* that is either NULL or points to a C string allocated with the av_malloc() family of functions.
Definition: opt.h:276
width
#define width
Definition: dsp.h:85
av_hwframe_get_buffer
int av_hwframe_get_buffer(AVBufferRef *hwframe_ref, AVFrame *frame, int flags)
Allocate a new frame attached to the given AVHWFramesContext.
Definition: hwcontext.c:495
AV_OPT_TYPE_CONST
@ AV_OPT_TYPE_CONST
Special option type for declaring named constants.
Definition: opt.h:299
FILTER_SINGLE_PIXFMT
#define FILTER_SINGLE_PIXFMT(pix_fmt_)
Definition: filters.h:252
snprintf
#define snprintf
Definition: snprintf.h:34
ff_scale_adjust_dimensions
int ff_scale_adjust_dimensions(AVFilterLink *inlink, int *ret_w, int *ret_h, int force_original_aspect_ratio, int force_divisible_by, double w_adj)
Transform evaluated width and height obtained from ff_scale_eval_dimensions into actual target width and height for scaling.
Definition: scale_eval.c:113
src
#define src
Definition: vp8dsp.c:248
av_get_pix_fmt_name
const char * av_get_pix_fmt_name(enum AVPixelFormat pix_fmt)
Return the short name for a pixel format, NULL in case pix_fmt is unknown.
Definition: pixdesc.c:3168
CUDAScaleContext::out_planes
int out_planes
Definition: vf_scale_cuda.c:79
CUDAScaleContext::cu_ctx
CUcontext cu_ctx
Definition: vf_scale_cuda.c:101