FFmpeg
Data Structures | Macros | Functions | Variables
vf_dnn_classify.c File Reference
#include "libavutil/file_open.h"
#include "libavutil/mem.h"
#include "libavutil/opt.h"
#include "filters.h"
#include "dnn_filter_common.h"
#include "video.h"
#include "libavutil/time.h"
#include "libavutil/avstring.h"
#include "libavutil/detection_bbox.h"

Go to the source code of this file.

Data Structures

struct  DnnClassifyContext
 

Macros

#define OFFSET(x)   offsetof(DnnClassifyContext, dnnctx.x)
 
#define OFFSET2(x)   offsetof(DnnClassifyContext, x)
 
#define FLAGS   AV_OPT_FLAG_FILTERING_PARAM | AV_OPT_FLAG_VIDEO_PARAM
 

Functions

 AVFILTER_DNN_DEFINE_CLASS (dnn_classify, DNN_OV)
 
static int dnn_classify_post_proc (AVFrame *frame, DNNData *output, uint32_t bbox_index, AVFilterContext *filter_ctx)
 
static void free_classify_labels (DnnClassifyContext *ctx)
 
static int read_classify_label_file (AVFilterContext *context)
 
static av_cold int dnn_classify_init (AVFilterContext *context)
 
static int dnn_classify_flush_frame (AVFilterLink *outlink, int64_t pts, int64_t *out_pts)
 
static int dnn_classify_activate (AVFilterContext *filter_ctx)
 
static av_cold void dnn_classify_uninit (AVFilterContext *context)
 

Variables

static const AVOption dnn_classify_options []
 
static enum AVPixelFormat pix_fmts []
 
const AVFilter ff_vf_dnn_classify
 

Detailed Description

implementing an classification filter using deep learning networks.

Definition in file vf_dnn_classify.c.

Macro Definition Documentation

◆ OFFSET

#define OFFSET (   x)    offsetof(DnnClassifyContext, dnnctx.x)

Definition at line 44 of file vf_dnn_classify.c.

◆ OFFSET2

#define OFFSET2 (   x)    offsetof(DnnClassifyContext, x)

Definition at line 45 of file vf_dnn_classify.c.

◆ FLAGS

Definition at line 46 of file vf_dnn_classify.c.

Function Documentation

◆ AVFILTER_DNN_DEFINE_CLASS()

AVFILTER_DNN_DEFINE_CLASS ( dnn_classify  ,
DNN_OV   
)

◆ dnn_classify_post_proc()

static int dnn_classify_post_proc ( AVFrame frame,
DNNData output,
uint32_t  bbox_index,
AVFilterContext filter_ctx 
)
static

Definition at line 60 of file vf_dnn_classify.c.

Referenced by dnn_classify_init().

◆ free_classify_labels()

static void free_classify_labels ( DnnClassifyContext ctx)
static

Definition at line 115 of file vf_dnn_classify.c.

Referenced by dnn_classify_uninit().

◆ read_classify_label_file()

static int read_classify_label_file ( AVFilterContext context)
static

Definition at line 124 of file vf_dnn_classify.c.

Referenced by dnn_classify_init().

◆ dnn_classify_init()

static av_cold int dnn_classify_init ( AVFilterContext context)
static

Definition at line 182 of file vf_dnn_classify.c.

◆ dnn_classify_flush_frame()

static int dnn_classify_flush_frame ( AVFilterLink outlink,
int64_t  pts,
int64_t out_pts 
)
static

Definition at line 205 of file vf_dnn_classify.c.

Referenced by dnn_classify_activate().

◆ dnn_classify_activate()

static int dnn_classify_activate ( AVFilterContext filter_ctx)
static

Definition at line 233 of file vf_dnn_classify.c.

◆ dnn_classify_uninit()

static av_cold void dnn_classify_uninit ( AVFilterContext context)
static

Definition at line 289 of file vf_dnn_classify.c.

Variable Documentation

◆ dnn_classify_options

const AVOption dnn_classify_options[]
static
Initial value:
= {
{ "dnn_backend", "DNN backend", OFFSET(backend_type), AV_OPT_TYPE_INT, { .i64 = DNN_OV }, INT_MIN, INT_MAX, FLAGS, .unit = "backend" },
{ "confidence", "threshold of confidence", OFFSET2(confidence), AV_OPT_TYPE_FLOAT, { .dbl = 0.5 }, 0, 1, FLAGS},
{ "labels", "path to labels file", OFFSET2(labels_filename), AV_OPT_TYPE_STRING, { .str = NULL }, 0, 0, FLAGS },
{ "target", "which one to be classified", OFFSET2(target), AV_OPT_TYPE_STRING, { .str = NULL }, 0, 0, FLAGS },
{ NULL }
}

Definition at line 47 of file vf_dnn_classify.c.

◆ pix_fmts

enum AVPixelFormat pix_fmts[]
static

◆ ff_vf_dnn_classify

const AVFilter ff_vf_dnn_classify
Initial value:
= {
.name = "dnn_classify",
.description = NULL_IF_CONFIG_SMALL("Apply DNN classify filter to the input."),
.priv_size = sizeof(DnnClassifyContext),
.priv_class = &dnn_classify_class,
.activate = dnn_classify_activate,
}

Definition at line 296 of file vf_dnn_classify.c.

FILTER_PIXFMTS_ARRAY
#define FILTER_PIXFMTS_ARRAY(array)
Definition: filters.h:242
FILTER_INPUTS
#define FILTER_INPUTS(array)
Definition: filters.h:262
AV_PIX_FMT_BGR24
@ AV_PIX_FMT_BGR24
packed RGB 8:8:8, 24bpp, BGRBGR...
Definition: pixfmt.h:76
preinit
static av_cold int preinit(AVFilterContext *ctx)
Definition: af_aresample.c:48
ff_dnn_filter_init_child_class
int ff_dnn_filter_init_child_class(AVFilterContext *filter)
Definition: dnn_filter_common.c:61
ff_video_default_filterpad
const AVFilterPad ff_video_default_filterpad[1]
An AVFilterPad array whose only entry has name "default" and is of type AVMEDIA_TYPE_VIDEO.
Definition: video.c:37
DnnClassifyContext
Definition: vf_dnn_classify.c:34
AV_PIX_FMT_YUV420P
@ AV_PIX_FMT_YUV420P
planar YUV 4:2:0, 12bpp, (1 Cr & Cb sample per 2x2 Y samples)
Definition: pixfmt.h:73
OFFSET2
#define OFFSET2(x)
Definition: vf_dnn_classify.c:45
FILTER_OUTPUTS
#define FILTER_OUTPUTS(array)
Definition: filters.h:263
AV_PIX_FMT_GRAYF32
#define AV_PIX_FMT_GRAYF32
Definition: pixfmt.h:511
DNN_OV
@ DNN_OV
Definition: dnn_interface.h:37
NULL
#define NULL
Definition: coverity.c:32
dnn_classify_init
static av_cold int dnn_classify_init(AVFilterContext *context)
Definition: vf_dnn_classify.c:182
AV_PIX_FMT_GRAY8
@ AV_PIX_FMT_GRAY8
Y , 8bpp.
Definition: pixfmt.h:81
init
int(* init)(AVBSFContext *ctx)
Definition: dts2pts.c:368
AV_PIX_FMT_RGB24
@ AV_PIX_FMT_RGB24
packed RGB 8:8:8, 24bpp, RGBRGB...
Definition: pixfmt.h:75
NULL_IF_CONFIG_SMALL
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
Definition: internal.h:94
AV_OPT_TYPE_FLOAT
@ AV_OPT_TYPE_FLOAT
Underlying C type is float.
Definition: opt.h:271
uninit
static void uninit(AVBSFContext *ctx)
Definition: pcm_rechunk.c:68
dnn_classify_uninit
static av_cold void dnn_classify_uninit(AVFilterContext *context)
Definition: vf_dnn_classify.c:289
AV_PIX_FMT_NV12
@ AV_PIX_FMT_NV12
planar YUV 4:2:0, 12bpp, 1 plane for Y and 1 plane for the UV components, which are interleaved (firs...
Definition: pixfmt.h:96
OFFSET
#define OFFSET(x)
Definition: vf_dnn_classify.c:44
AV_PIX_FMT_NONE
@ AV_PIX_FMT_NONE
Definition: pixfmt.h:72
AV_OPT_TYPE_INT
@ AV_OPT_TYPE_INT
Underlying C type is int.
Definition: opt.h:259
AV_PIX_FMT_YUV444P
@ AV_PIX_FMT_YUV444P
planar YUV 4:4:4, 24bpp, (1 Cr & Cb sample per 1x1 Y samples)
Definition: pixfmt.h:78
pix_fmts
static enum AVPixelFormat pix_fmts[]
Definition: vf_dnn_classify.c:196
AV_PIX_FMT_YUV422P
@ AV_PIX_FMT_YUV422P
planar YUV 4:2:2, 16bpp, (1 Cr & Cb sample per 2x1 Y samples)
Definition: pixfmt.h:77
FLAGS
#define FLAGS
Definition: vf_dnn_classify.c:46
AV_PIX_FMT_YUV411P
@ AV_PIX_FMT_YUV411P
planar YUV 4:1:1, 12bpp, (1 Cr & Cb sample per 4x1 Y samples)
Definition: pixfmt.h:80
dnn_classify_activate
static int dnn_classify_activate(AVFilterContext *filter_ctx)
Definition: vf_dnn_classify.c:233
AV_PIX_FMT_YUV410P
@ AV_PIX_FMT_YUV410P
planar YUV 4:1:0, 9bpp, (1 Cr & Cb sample per 4x4 Y samples)
Definition: pixfmt.h:79
AV_OPT_TYPE_STRING
@ AV_OPT_TYPE_STRING
Underlying C type is a uint8_t* that is either NULL or points to a C string allocated with the av_mal...
Definition: opt.h:276