66 #define OFFSET(x) offsetof(SSIMContext, x)
67 #define FLAGS AV_OPT_FLAG_FILTERING_PARAM|AV_OPT_FLAG_VIDEO_PARAM
80 snprintf(value,
sizeof(value),
"%0.2f", d);
83 snprintf(key2,
sizeof(key2),
"%s%c", key, comp);
91 const uint8_t *ref, ptrdiff_t ref_stride,
92 int (*sums)[4],
int width)
96 for (z = 0; z <
width; z++) {
97 uint32_t
s1 = 0,
s2 = 0, ss = 0, s12 = 0;
99 for (y = 0; y < 4; y++) {
100 for (x = 0; x < 4; x++) {
101 int a = main[x + y * main_stride];
102 int b = ref[x + y * ref_stride];
123 static const int ssim_c1 = (int)(.01*.01*255*255*64 + .5);
124 static const int ssim_c2 = (int)(.03*.03*255*255*64*63 + .5);
130 int vars = fss * 64 - fs1 * fs1 - fs2 * fs2;
131 int covar = fs12 * 64 - fs1 * fs2;
133 return (
float)(2 * fs1 * fs2 + ssim_c1) * (
float)(2 * covar + ssim_c2)
134 / ((
float)(fs1 * fs1 + fs2 * fs2 + ssim_c1) * (
float)(vars + ssim_c2));
142 for (i = 0; i <
width; i++)
143 ssim +=
ssim_end1(sum0[i][0] + sum0[i + 1][0] + sum1[i][0] + sum1[i + 1][0],
144 sum0[i][1] + sum0[i + 1][1] + sum1[i][1] + sum1[i + 1][1],
145 sum0[i][2] + sum0[i + 1][2] + sum1[i][2] + sum1[i + 1][2],
146 sum0[i][3] + sum0[i + 1][3] + sum1[i][3] + sum1[i + 1][3]);
151 uint8_t *main,
int main_stride,
157 int (*sum0)[4] =
temp;
158 int (*sum1)[4] = sum0 + (width >> 2) + 3;
163 for (y = 1; y <
height; y++) {
164 for (; z <= y; z++) {
165 FFSWAP(
void*, sum0, sum1);
167 &ref[4 * z * ref_stride], ref_stride,
171 ssim += dsp->
ssim_end_line((
const int (*)[4])sum0, (
const int (*)[4])sum1, width - 1);
174 return ssim / ((height - 1) * (width - 1));
179 return 10 * log10(weight / (weight - ssim));
187 float c[4], ssimv = 0.0;
196 ssimv += s->
coefs[i] * c[i];
205 set_meta(metadata,
"lavfi.ssim.All", 0, ssimv);
319 outlink->
w = mainlink->
w;
320 outlink->
h = mainlink->
h;
399 .priv_class = &ssim_class,
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
This structure describes decoded (raw) audio or video data.
FFDualInputContext dinput
static av_cold void uninit(AVFilterContext *ctx)
planar YUV 4:4:4, 24bpp, (1 Cr & Cb sample per 1x1 Y samples)
Main libavfilter public API header.
int h
agreed upon image height
uint8_t log2_chroma_w
Amount to shift the luma width right to find the chroma width.
const char * name
Pad name.
AVFilterLink ** inputs
array of pointers to input links
static av_cold int init(AVFilterContext *ctx)
static const AVFilterPad ssim_inputs[]
int shortest
terminate stream when the second input terminates
planar YUV 4:4:0 full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV440P and setting color_range...
static void ssim_4x4xn(const uint8_t *main, ptrdiff_t main_stride, const uint8_t *ref, ptrdiff_t ref_stride, int(*sums)[4], int width)
planar YUV 4:2:2, 16bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV422P and setting col...
static float ssim_end1(int s1, int s2, int ss, int s12)
static AVFrame * do_ssim(AVFilterContext *ctx, AVFrame *main, const AVFrame *ref)
A filter pad used for either input or output.
A link between two filters.
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
uint8_t log2_chroma_h
Amount to shift the luma height right to find the chroma height.
AVRational frame_rate
Frame rate of the stream on the link, or 1/0 if unknown or variable; if left to 0/0, will be automatically copied from the first input of the source filter if it exists.
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification. ...
void ff_ssim_init_x86(SSIMDSPContext *dsp)
void * priv
private data for use by the filter
AVRational time_base
Define the time base used by the PTS of the frames/samples which will pass through this link...
planar YUV 4:2:2, 16bpp, (1 Cr & Cb sample per 2x1 Y samples)
int w
agreed upon image width
uint8_t nb_components
The number of components each pixel has, (1-4)
planar YUV 4:2:0, 12bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV420P and setting col...
GLsizei GLboolean const GLfloat * value
static int request_frame(AVFilterLink *outlink)
AVFilterContext * src
source filter
AVFrame *(* process)(AVFilterContext *ctx, AVFrame *main, const AVFrame *second)
static const AVFilterPad outputs[]
int format
agreed upon media format
int ff_fill_rgba_map(uint8_t *rgba_map, enum AVPixelFormat pix_fmt)
static const AVOption ssim_options[]
static const uint8_t vars[2][12]
#define AV_LOG_INFO
Standard information.
static const AVFilterPad inputs[]
AVDictionary ** avpriv_frame_get_metadatap(AVFrame *frame)
int linesize[AV_NUM_DATA_POINTERS]
For video, size in bytes of each picture line.
Descriptor that unambiguously describes how the bits of a pixel are stored in the up to 4 data planes...
int repeatlast
repeat last second frame
static int filter_frame(AVFilterLink *inlink, AVFrame *buf)
int av_dict_set(AVDictionary **pm, const char *key, const char *value, int flags)
Set the given entry in *pm, overwriting an existing entry.
BYTE int const BYTE int int int height
planar YUV 4:1:0, 9bpp, (1 Cr & Cb sample per 4x4 Y samples)
static int config_input_ref(AVFilterLink *inlink)
AVFILTER_DEFINE_CLASS(ssim)
Describe the class of an AVClass context structure.
void(* ssim_4x4_line)(const uint8_t *buf, ptrdiff_t buf_stride, const uint8_t *ref, ptrdiff_t ref_stride, int(*sums)[4], int w)
size_t av_strlcatf(char *dst, size_t size, const char *fmt,...)
const char * name
Filter name.
AVRational sample_aspect_ratio
agreed upon sample aspect ratio
static float ssim_plane(SSIMDSPContext *dsp, uint8_t *main, int main_stride, uint8_t *ref, int ref_stride, int width, int height, void *temp)
static int weight(int i, int blen, int offset)
static enum AVPixelFormat pix_fmts[]
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
int av_strerror(int errnum, char *errbuf, size_t errbuf_size)
Put a description of the AVERROR code errnum in errbuf.
static double ssim_db(double ssim, double weight)
planar YUV 4:2:0, 12bpp, (1 Cr & Cb sample per 2x2 Y samples)
planar YUV 4:4:4, 24bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV444P and setting col...
static int config_output(AVFilterLink *outlink)
planar YUV 4:1:1, 12bpp, (1 Cr & Cb sample per 4x1 Y samples)
static const AVFilterPad ssim_outputs[]
AVFilterContext * dst
dest filter
planar YUV 4:1:1, 12bpp, (1 Cr & Cb sample per 4x1 Y samples) full scale (JPEG), deprecated in favor ...
float(* ssim_end_line)(const int(*sum0)[4], const int(*sum1)[4], int w)
static int query_formats(AVFilterContext *ctx)
static void comp(unsigned char *dst, int dst_stride, unsigned char *src, int src_stride, int add)
planar YUV 4:4:0 (1 Cr & Cb sample per 1x2 Y samples)
#define FFSWAP(type, a, b)
int main(int argc, char **argv)
static void set_meta(AVDictionary **metadata, const char *key, char comp, float d)
AVPixelFormat
Pixel format.
static float ssim_endn(const int(*sum0)[4], const int(*sum1)[4], int width)
#define AV_CEIL_RSHIFT(a, b)