Go to the documentation of this file.
37 #define NUM_DATA_BUFS 13
57 #define OFFSET(x) offsetof(VIFContext, x)
70 0.00745626912, 0.0142655009, 0.0250313189, 0.0402820669, 0.0594526194,
71 0.0804751068, 0.0999041125, 0.113746084, 0.118773937, 0.113746084,
72 0.0999041125, 0.0804751068, 0.0594526194, 0.0402820669, 0.0250313189,
73 0.0142655009, 0.00745626912
76 0.0189780835, 0.0558981746, 0.120920904, 0.192116052, 0.224173605,
77 0.192116052, 0.120920904, 0.0558981746, 0.0189780835
80 0.054488685, 0.244201347, 0.402619958, 0.244201347, 0.054488685
83 0.166378498, 0.667243004, 0.166378498
99 int src_stride,
int dst_stride)
101 const int dst_px_stride = dst_stride / 2;
103 for (
int i = 0;
i <
h / 2;
i++) {
104 for (
int j = 0; j <
w / 2; j++)
105 dst[
i * dst_px_stride + j] =
src[(
i * 2) * src_stride + (j * 2)];
110 const float *mu1_mu2,
const float *xx_filt,
111 const float *yy_filt,
const float *xy_filt,
112 float *num,
float *den,
int w,
int h)
114 static const float sigma_nsq = 2;
115 float mu1_sq_val, mu2_sq_val, mu1_mu2_val, xx_filt_val, yy_filt_val, xy_filt_val;
116 float sigma1_sq, sigma2_sq, sigma12,
g, sv_sq, eps = 1.0e-10
f;
117 float gain_limit = 100.f;
118 float num_val, den_val;
119 float accum_num = 0.0f;
120 float accum_den = 0.0f;
122 for (
int i = 0;
i <
h;
i++) {
123 float accum_inner_num = 0.f;
124 float accum_inner_den = 0.f;
126 for (
int j = 0; j <
w; j++) {
127 mu1_sq_val = mu1_sq[
i *
w + j];
128 mu2_sq_val = mu2_sq[
i *
w + j];
129 mu1_mu2_val = mu1_mu2[
i *
w + j];
130 xx_filt_val = xx_filt[
i *
w + j];
131 yy_filt_val = yy_filt[
i *
w + j];
132 xy_filt_val = xy_filt[
i *
w + j];
134 sigma1_sq = xx_filt_val - mu1_sq_val;
135 sigma2_sq = yy_filt_val - mu2_sq_val;
136 sigma12 = xy_filt_val - mu1_mu2_val;
138 sigma1_sq =
FFMAX(sigma1_sq, 0.0
f);
139 sigma2_sq =
FFMAX(sigma2_sq, 0.0
f);
140 sigma12 =
FFMAX(sigma12, 0.0
f);
142 g = sigma12 / (sigma1_sq + eps);
143 sv_sq = sigma2_sq -
g * sigma12;
145 if (sigma1_sq < eps) {
151 if (sigma2_sq < eps) {
160 sv_sq =
FFMAX(sv_sq, eps);
164 num_val =
log2f(1.0
f +
g *
g * sigma1_sq / (sv_sq + sigma_nsq));
165 den_val =
log2f(1.0
f + sigma1_sq / sigma_nsq);
168 num_val = den_val = 1.f;
170 accum_inner_num += num_val;
171 accum_inner_den += den_val;
174 accum_num += accum_inner_num;
175 accum_den += accum_inner_den;
182 static void vif_xx_yy_xy(
const float *x,
const float *y,
float *xx,
float *yy,
183 float *xy,
int w,
int h)
185 for (
int i = 0;
i <
h;
i++) {
186 for (
int j = 0; j <
w; j++) {
189 float xxval = xval * xval;
190 float yyval = yval * yval;
191 float xyval = xval * yval;
210 const float *
src = td->
src;
219 const int slice_end = (
h * (jobnr+1)) / nb_jobs;
223 for (
int j = 0; j <
w; j++) {
226 if (
i >= filt_w / 2 &&
i <
h - filt_w / 2 - 1) {
227 for (
int filt_i = 0; filt_i < filt_w; filt_i++) {
228 const float filt_coeff =
filter[filt_i];
230 int ii =
i - filt_w / 2 + filt_i;
232 img_coeff =
src[ii * src_stride + j];
233 sum += filt_coeff * img_coeff;
236 for (
int filt_i = 0; filt_i < filt_w; filt_i++) {
237 const float filt_coeff =
filter[filt_i];
238 int ii =
i - filt_w / 2 + filt_i;
241 ii = ii < 0 ? -ii : (ii >=
h ? 2 *
h - ii - 1 : ii);
243 img_coeff =
src[ii * src_stride + j];
244 sum += filt_coeff * img_coeff;
252 for (
int j = 0; j <
w; j++) {
255 if (j >= filt_w / 2 && j <
w - filt_w / 2 - 1) {
256 for (
int filt_j = 0; filt_j < filt_w; filt_j++) {
257 const float filt_coeff =
filter[filt_j];
258 int jj = j - filt_w / 2 + filt_j;
261 img_coeff =
temp[jj];
262 sum += filt_coeff * img_coeff;
265 for (
int filt_j = 0; filt_j < filt_w; filt_j++) {
266 const float filt_coeff =
filter[filt_j];
267 int jj = j - filt_w / 2 + filt_j;
270 jj = jj < 0 ? -jj : (jj >=
w ? 2 *
w - jj - 1 : jj);
272 img_coeff =
temp[jj];
273 sum += filt_coeff * img_coeff;
277 dst[
i * dst_stride + j] = sum;
285 const float *
ref,
const float *
main,
int w,
int h,
286 int ref_stride,
int main_stride,
float *score,
291 float *ref_scale = data_buf[0];
292 float *main_scale = data_buf[1];
293 float *ref_sq = data_buf[2];
294 float *main_sq = data_buf[3];
295 float *ref_main = data_buf[4];
296 float *mu1 = data_buf[5];
297 float *mu2 = data_buf[6];
298 float *mu1_sq = data_buf[7];
299 float *mu2_sq = data_buf[8];
300 float *mu1_mu2 = data_buf[9];
301 float *ref_sq_filt = data_buf[10];
302 float *main_sq_filt = data_buf[11];
303 float *ref_main_filt = data_buf[12];
305 const float *curr_ref_scale =
ref;
306 const float *curr_main_scale =
main;
307 int curr_ref_stride = ref_stride;
308 int curr_main_stride = main_stride;
316 const int nb_threads =
FFMIN(
h, gnb_threads);
324 td.
src = curr_ref_scale;
333 td.
src = curr_main_scale;
338 vif_dec2(mu1, ref_scale, buf_valid_w, buf_valid_h,
w,
w);
339 vif_dec2(mu2, main_scale, buf_valid_w, buf_valid_h,
w,
w);
347 curr_ref_scale = ref_scale;
348 curr_main_scale = main_scale;
351 curr_main_stride =
w;
354 td.
src = curr_ref_scale;
363 td.
src = curr_main_scale;
370 vif_xx_yy_xy(curr_ref_scale, curr_main_scale, ref_sq, main_sq, ref_main,
w,
h);
373 td.
dst = ref_sq_filt;
378 td.
dst = main_sq_filt;
383 td.
dst = ref_main_filt;
386 vif_statistic(mu1_sq, mu2_sq, mu1_mu2, ref_sq_filt, main_sq_filt,
387 ref_main_filt, &num, &den,
w,
h);
389 score[
scale] = den <= FLT_EPSILON ? 1.f : num / den;
395 #define offset_fn(type, bits) \
396 static void offset_##bits##bit(VIFContext *s, \
397 const AVFrame *ref, \
398 AVFrame *main, int stride)\
403 int ref_stride = ref->linesize[0]; \
404 int main_stride = main->linesize[0]; \
406 const type *ref_ptr = (const type *) ref->data[0]; \
407 const type *main_ptr = (const type *) main->data[0]; \
409 const float factor = s->factor; \
411 float *ref_ptr_data = s->ref_data; \
412 float *main_ptr_data = s->main_data; \
414 for (int i = 0; i < h; i++) { \
415 for (int j = 0; j < w; j++) { \
416 ref_ptr_data[j] = ref_ptr[j] * factor - 128.f; \
417 main_ptr_data[j] = main_ptr[j] * factor - 128.f; \
419 ref_ptr += ref_stride / sizeof(type); \
421 main_ptr += main_stride / sizeof(type); \
422 main_ptr_data += w; \
442 s->factor = 1.f / (1 << (
s->desc->comp[0].depth - 8));
443 if (
s->desc->comp[0].depth <= 8) {
450 s->width,
s->height,
s->width,
s->width,
451 score,
s->data_buf,
s->temp,
s->nb_threads);
453 set_meta(metadata,
"lavfi.vif.scale.0", score[0]);
454 set_meta(metadata,
"lavfi.vif.scale.1", score[1]);
455 set_meta(metadata,
"lavfi.vif.scale.2", score[2]);
456 set_meta(metadata,
"lavfi.vif.scale.3", score[3]);
458 for (
int i = 0;
i < 4;
i++) {
459 s->vif_min[
i] =
FFMIN(
s->vif_min[
i], score[
i]);
460 s->vif_max[
i] =
FFMAX(
s->vif_max[
i], score[
i]);
461 s->vif_sum[
i] += score[
i];
476 #define PF(suf) AV_PIX_FMT_YUV420##suf, AV_PIX_FMT_YUV422##suf, AV_PIX_FMT_YUV444##suf
486 if (
ctx->inputs[0]->w !=
ctx->inputs[1]->w ||
487 ctx->inputs[0]->h !=
ctx->inputs[1]->h) {
493 s->width =
ctx->inputs[0]->w;
494 s->height =
ctx->inputs[0]->h;
497 for (
int i = 0;
i < 4;
i++) {
498 s->vif_min[
i] = DBL_MAX;
499 s->vif_max[
i] = -DBL_MAX;
503 if (!(
s->data_buf[
i] =
av_calloc(
s->width,
s->height *
sizeof(
float))))
507 if (!(
s->ref_data =
av_calloc(
s->width,
s->height *
sizeof(
float))))
510 if (!(
s->main_data =
av_calloc(
s->width,
s->height *
sizeof(
float))))
513 if (!(
s->temp =
av_calloc(
s->nb_threads,
sizeof(
s->temp[0]))))
516 for (
int i = 0;
i <
s->nb_threads;
i++) {
537 out_frame = main_frame;
558 outlink->
w = mainlink->
w;
559 outlink->
h = mainlink->
h;
591 if (
s->nb_frames > 0) {
592 for (
int i = 0;
i < 4;
i++)
594 i,
s->vif_sum[
i] /
s->nb_frames,
s->vif_min[
i],
s->vif_max[
i]);
603 for (
int i = 0;
i <
s->nb_threads &&
s->temp;
i++)
633 .preinit = vif_framesync_preinit,
636 .priv_class = &vif_class,
static const AVFilterPad vif_outputs[]
AVRational time_base
Time base for the incoming frames.
int ff_framesync_configure(FFFrameSync *fs)
Configure a frame sync structure.
AVPixelFormat
Pixel format.
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
#define FILTER_PIXFMTS_ARRAY(array)
void ff_framesync_uninit(FFFrameSync *fs)
Free all memory currently allocated.
int ff_filter_frame(AVFilterLink *link, AVFrame *frame)
Send a frame of data to the next filter.
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
static int process_frame(FFFrameSync *fs)
The exact code depends on how similar the blocks are and how related they are to the and needs to apply these operations to the correct inlink or outlink if there are several Macros are available to factor that when no extra processing is inlink
#define offset_fn(type, bits)
static void vif_xx_yy_xy(const float *x, const float *y, float *xx, float *yy, float *xy, int w, int h)
#define FILTER_INPUTS(array)
This structure describes decoded (raw) audio or video data.
int64_t pts
Presentation timestamp in time_base units (time when frame should be shown to user).
static av_cold void uninit(AVFilterContext *ctx)
static const float vif_filter1d_table[4][17]
void(* filter)(uint8_t *src, int stride, int qscale)
@ AV_PIX_FMT_YUV440P
planar YUV 4:4:0 (1 Cr & Cb sample per 1x2 Y samples)
const char * name
Filter name.
static int vif_filter1d(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
static enum AVPixelFormat pix_fmts[]
static const uint8_t vif_filter1d_width1[4]
A link between two filters.
Link properties exposed to filter code, but not external callers.
const AVPixFmtDescriptor * desc
@ EXT_STOP
Completely stop all streams with this one.
static int slice_end(AVCodecContext *avctx, AVFrame *pict, int *got_output)
Handle slice ends.
static void vif_dec2(const float *src, float *dst, int w, int h, int src_stride, int dst_stride)
#define AV_PIX_FMT_GRAY16
unsigned sync
Synchronization level: frames on input at the highest sync level will generate output frame events.
A filter pad used for either input or output.
@ AV_PIX_FMT_YUVJ411P
planar YUV 4:1:1, 12bpp, (1 Cr & Cb sample per 4x1 Y samples) full scale (JPEG), deprecated in favor ...
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
@ AV_PIX_FMT_YUVJ422P
planar YUV 4:2:2, 16bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV422P and setting col...
AVRational sample_aspect_ratio
agreed upon sample aspect ratio
#define AV_PIX_FMT_GRAY14
int64_t av_rescale_q(int64_t a, AVRational bq, AVRational cq)
Rescale a 64-bit integer by 2 rational numbers.
static AVFrame * do_vif(AVFilterContext *ctx, AVFrame *main, const AVFrame *ref)
@ AV_PIX_FMT_YUV420P
planar YUV 4:2:0, 12bpp, (1 Cr & Cb sample per 2x2 Y samples)
#define FILTER_OUTPUTS(array)
@ AV_PIX_FMT_YUVJ444P
planar YUV 4:4:4, 24bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV444P and setting col...
#define AV_PIX_FMT_GRAY10
Describe the class of an AVClass context structure.
#define fs(width, name, subs,...)
@ AV_PIX_FMT_YUVJ420P
planar YUV 4:2:0, 12bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV420P and setting col...
@ AV_PIX_FMT_GRAY8
Y , 8bpp.
static FilterLink * ff_filter_link(AVFilterLink *link)
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
uint8_t ptrdiff_t const uint8_t ptrdiff_t int intptr_t intptr_t int int16_t * dst
static int ref_frame(VVCFrame *dst, const VVCFrame *src)
AVFilterContext * src
source filter
#define AV_LOG_INFO
Standard information.
static int compute_vif2(AVFilterContext *ctx, const float *ref, const float *main, int w, int h, int ref_stride, int main_stride, float *score, float *const data_buf[NUM_DATA_BUFS], float **temp, int gnb_threads)
#define i(width, name, range_min, range_max)
int w
agreed upon image width
int ff_filter_get_nb_threads(AVFilterContext *ctx)
Get number of threads for current filter instance.
Used for passing data between threads.
it's the only field you need to keep assuming you have a context There is some magic you don't need to care about around this just let it vf default value
@ AV_PIX_FMT_YUVJ440P
planar YUV 4:4:0 full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV440P and setting color_range
const char * name
Pad name.
static int config_output(AVFilterLink *outlink)
void * av_calloc(size_t nmemb, size_t size)
static void vif_statistic(const float *mu1_sq, const float *mu2_sq, const float *mu1_mu2, const float *xx_filt, const float *yy_filt, const float *xy_filt, float *num, float *den, int w, int h)
static int slice_start(SliceContext *sc, VVCContext *s, VVCFrameContext *fc, const CodedBitstreamUnit *unit, const int is_first_slice)
int ff_framesync_init(FFFrameSync *fs, AVFilterContext *parent, unsigned nb_in)
Initialize a frame sync structure.
static void set_meta(AVDictionary **metadata, int chan, const char *key, const char *fmt, float val)
enum FFFrameSyncExtMode before
Extrapolation mode for timestamps before the first frame.
int h
agreed upon image height
int ff_filter_execute(AVFilterContext *ctx, avfilter_action_func *func, void *arg, int *ret, int nb_jobs)
static const AVFilterPad vif_inputs[]
#define AVFILTER_FLAG_METADATA_ONLY
The filter is a "metadata" filter - it does not modify the frame data in any way.
static int ref[MAX_W *MAX_W]
AVRational time_base
Define the time base used by the PTS of the frames/samples which will pass through this link.
@ AV_PIX_FMT_YUV444P
planar YUV 4:4:4, 24bpp, (1 Cr & Cb sample per 1x1 Y samples)
float * data_buf[NUM_DATA_BUFS]
static int activate(AVFilterContext *ctx)
#define AVFILTER_FLAG_SLICE_THREADS
The filter supports multithreading by splitting frames into multiple parts and processing them concur...
@ AV_PIX_FMT_YUV422P
planar YUV 4:2:2, 16bpp, (1 Cr & Cb sample per 2x1 Y samples)
Descriptor that unambiguously describes how the bits of a pixel are stored in the up to 4 data planes...
static void scale(int *out, const int *in, const int w, const int h, const int shift)
int av_dict_set(AVDictionary **pm, const char *key, const char *value, int flags)
Set the given entry in *pm, overwriting an existing entry.
@ AV_PIX_FMT_YUV411P
planar YUV 4:1:1, 12bpp, (1 Cr & Cb sample per 4x1 Y samples)
#define AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL
Same as AVFILTER_FLAG_SUPPORT_TIMELINE_GENERIC, except that the filter will have its filter_frame() c...
@ AV_PIX_FMT_YUV410P
planar YUV 4:1:0, 9bpp, (1 Cr & Cb sample per 4x4 Y samples)
enum FFFrameSyncExtMode after
Extrapolation mode for timestamps after the last frame.
AVRational frame_rate
Frame rate of the stream on the link, or 1/0 if unknown or variable.
int ff_framesync_activate(FFFrameSync *fs)
Examine the frames in the filter's input and try to produce output.
int ff_framesync_dualinput_get(FFFrameSync *fs, AVFrame **f0, AVFrame **f1)
static const AVOption vif_options[]
#define AV_PIX_FMT_GRAY12
FRAMESYNC_DEFINE_CLASS(vif, VIFContext, fs)
static int config_input_ref(AVFilterLink *inlink)