Go to the documentation of this file.
65 #define OFFSET(x) offsetof(DeshakeContext, x)
66 #define FLAGS AV_OPT_FLAG_VIDEO_PARAM|AV_OPT_FLAG_FILTERING_PARAM
92 static int cmp(
const void *
a,
const void *
b)
94 return FFDIFFSIGN(*(
const double *)
a, *(
const double *)
b);
108 for (x = cut; x < count - cut; x++) {
112 return mean / (count - cut * 2);
127 int smallest = INT_MAX;
130 #define CMP(i, j) deshake->sad(src1 + cy * stride + cx, stride,\
131 src2 + (j) * stride + (i), stride)
135 for (y = -deshake->
ry; y <= deshake->ry; y++) {
136 for (x = -deshake->
rx; x <= deshake->rx; x++) {
138 if (
diff < smallest) {
147 for (y = -deshake->
ry + 1; y < deshake->ry; y += 2) {
148 for (x = -deshake->
rx + 1; x < deshake->rx; x += 2) {
150 if (
diff < smallest) {
162 for (y = tmp2 - 1; y <= tmp2 + 1; y++) {
163 for (x =
tmp - 1; x <=
tmp + 1; x++) {
164 if (x ==
tmp && y == tmp2)
168 if (
diff < smallest) {
177 if (smallest > 512) {
197 for (
i = 0;
i <= blocksize * 2;
i++) {
199 for (j = 0; j <= 15; j++) {
203 else if (
src[
pos] > highest) {
209 return highest - lowest;
219 a1 = atan2(y - cy, x - cx);
241 int count_max_value = 0;
245 int center_x = 0, center_y = 0;
251 for (x = 0; x < deshake->
rx * 2 + 1; x++) {
252 for (y = 0; y < deshake->
ry * 2 + 1; y++) {
253 deshake->
counts[x][y] = 0;
259 for (y = deshake->
ry; y < height - deshake->ry - (deshake->
blocksize * 2); y += deshake->
blocksize * 2) {
261 for (x = deshake->
rx; x < width - deshake->rx - 16; x += 16) {
268 if (
mv.x != -1 &&
mv.y != -1) {
270 if (x > deshake->
rx && y > deshake->
ry)
284 if (t->
angle < 0.001)
291 for (y = deshake->
ry * 2; y >= 0; y--) {
292 for (x = 0; x < deshake->
rx * 2 + 1; x++) {
294 if (deshake->
counts[x][y] > count_max_value) {
295 t->
vec.
x = x - deshake->
rx;
296 t->
vec.
y = y - deshake->
ry;
297 count_max_value = deshake->
counts[x][y];
303 p_x = (center_x -
width / 2.0);
304 p_y = (center_y -
height / 2.0);
318 const float *matrix_y,
const float *matrix_uv,
323 const float *matrixs[3];
324 int plane_w[3], plane_h[3];
325 matrixs[0] = matrix_y;
326 matrixs[1] = matrixs[2] = matrix_uv;
328 plane_w[1] = plane_w[2] = cw;
330 plane_h[1] = plane_h[2] = ch;
332 for (
i = 0;
i < 3;
i++) {
335 out->linesize[
i], plane_w[
i], plane_h[
i],
351 if (deshake->
rx % 16) {
359 fwrite(
"Ori x, Avg x, Fin x, Ori y, Avg y, Fin y, Ori angle, Avg angle, Fin angle, Ori zoom, Avg zoom, Fin zoom\n", 1, 104, deshake->
fp);
363 if (deshake->
cx > 0) {
364 deshake->
cw += deshake->
cx - (deshake->
cx & ~15);
369 av_log(
ctx,
AV_LOG_VERBOSE,
"cx: %d, cy: %d, cw: %d, ch: %d, rx: %d, ry: %d, edge: %d blocksize: %d contrast: %d search: %d\n",
370 deshake->
cx, deshake->
cy, deshake->
cw, deshake->
ch,
411 float matrix_y[9], matrix_uv[9];
419 float transform_zoom;
433 if (deshake->
cx < 0 || deshake->
cy < 0 || deshake->
cw < 0 || deshake->
ch < 0) {
443 if ((
unsigned)deshake->
cx + (
unsigned)deshake->
cw >
link->w) deshake->
cw =
link->w - deshake->
cx;
444 if ((
unsigned)deshake->
cy + (
unsigned)deshake->
ch >
link->h) deshake->
ch =
link->h - deshake->
cy;
457 orig.vec.x = t.
vec.
x;
458 orig.vec.y = t.
vec.
y;
459 orig.angle = t.
angle;
482 snprintf(
tmp, 256,
"%f, %f, %f, %f, %f, %f, %f, %f, %f, %f, %f, %f\n", orig.vec.x, deshake->
avg.
vec.
x, t.
vec.
x, orig.vec.y, deshake->
avg.
vec.
y, t.
vec.
y, orig.angle, deshake->
avg.
angle, t.
angle, orig.zoom, deshake->
avg.
zoom, t.
zoom);
483 fwrite(
tmp, 1, strlen(
tmp), deshake->
fp);
504 transform_zoom = 1.0 + t.
zoom / 100.0;
548 .priv_class = &deshake_class,
AVFrame * ff_get_video_buffer(AVFilterLink *link, int w, int h)
Request a picture buffer with a specific set of permissions.
AVPixelFormat
Pixel format.
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
@ SMART_EXHAUSTIVE
Search most possible positions (faster)
int ry
Maximum vertical shift.
int ff_filter_frame(AVFilterLink *link, AVFrame *frame)
Send a frame of data to the next filter.
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
#define FILTER_PIXFMTS_ARRAY(array)
static const int8_t mv[256][2]
void av_frame_free(AVFrame **frame)
Free the frame and any dynamically allocated objects in it, e.g.
This structure describes decoded (raw) audio or video data.
static const AVOption deshake_options[]
int(* transform)(AVFilterContext *ctx, int width, int height, int cw, int ch, const float *matrix_y, const float *matrix_uv, enum InterpolateMethod interpolate, enum FillMethod fill, AVFrame *in, AVFrame *out)
#define AV_LOG_VERBOSE
Detailed information.
@ AV_PIX_FMT_YUV440P
planar YUV 4:4:0 (1 Cr & Cb sample per 1x2 Y samples)
static const AVFilterPad deshake_inputs[]
const char * name
Filter name.
A link between two filters.
static int block_contrast(uint8_t *src, int x, int y, int stride, int blocksize)
Find the contrast of a given block.
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
int blocksize
Size of blocks to compare.
AVFILTER_DEFINE_CLASS(deshake)
Transform last
Transform from last frame.
const AVFilter ff_vf_deshake
static av_cold int init(AVFilterContext *ctx)
static int cmp(const void *a, const void *b)
A filter pad used for either input or output.
#define FFDIFFSIGN(x, y)
Comparator.
static int aligned(int val)
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
const AVFilterPad ff_video_default_filterpad[1]
An AVFilterPad array whose only entry has name "default" and is of type AVMEDIA_TYPE_VIDEO.
@ AV_PIX_FMT_YUVJ422P
planar YUV 4:2:2, 16bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV422P and setting col...
int refcount
Number of reference frames (defines averaging window)
#define AV_CEIL_RSHIFT(a, b)
AVFrame * ref
Previous frame.
@ AV_PIX_FMT_YUV420P
planar YUV 4:2:0, 12bpp, (1 Cr & Cb sample per 2x2 Y samples)
#define FILTER_INPUTS(array)
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a link
@ AV_PIX_FMT_YUVJ444P
planar YUV 4:4:4, 24bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV444P and setting col...
char * filename
Motion search detailed log filename.
#define AVERROR_PATCHWELCOME
Not yet implemented in FFmpeg, patches welcome.
int av_frame_copy_props(AVFrame *dst, const AVFrame *src)
Copy only "metadata" fields from src to dst.
@ AV_PIX_FMT_YUVJ420P
planar YUV 4:2:0, 12bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV420P and setting col...
static double block_angle(int x, int y, int cx, int cy, IntMotionVector *shift)
Find the rotation for a given block.
int cw
Crop motion search to this box.
static void find_motion(DeshakeContext *deshake, uint8_t *src1, uint8_t *src2, int width, int height, int stride, Transform *t)
Find the estimated global motion for a scene given the most likely shift for each block in the frame.
static double clean_mean(double *values, int count)
Cleaned mean (cuts off 20% of values to remove outliers and then averages)
static void find_block_motion(DeshakeContext *deshake, uint8_t *src1, uint8_t *src2, int cx, int cy, int stride, IntMotionVector *mv)
Find the most likely shift in motion between two frames for a given macroblock.
static enum AVPixelFormat pix_fmts[]
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
static int shift(int a, int b)
int counts[2 *MAX_R+1][2 *MAX_R+1]
int format
format of the frame, -1 if unknown or unset Values correspond to enum AVPixelFormat for video frames,...
static av_always_inline int diff(const struct color_info *a, const struct color_info *b, const int trans_thresh)
double * angles
Scratch buffer for motion search
The reader does not expect b to be semantically here and if the code is changed by maybe adding a a division or other the signedness will almost certainly be mistaken To avoid this confusion a new type was SUINT is the C unsigned type but it holds a signed int to use the same example SUINT a
static void interpolate(float *out, float v1, float v2, int size)
static int filter_frame(AVFilterLink *link, AVFrame *in)
static int config_props(AVFilterLink *link)
#define i(width, name, range_min, range_max)
#define AV_QSORT(p, num, type, cmp)
Quicksort This sort is fast, and fully inplace but not stable and it is possible to construct input t...
int w
agreed upon image width
int contrast
Contrast threshold.
@ AV_PIX_FMT_YUVJ440P
planar YUV 4:4:0 full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV440P and setting color_range
int search
Motion search method.
const char * name
Pad name.
FILE * avpriv_fopen_utf8(const char *path, const char *mode)
Open a file using a UTF-8 filename.
static float search(FOCContext *foc, int pass, int maxpass, int xmin, int xmax, int ymin, int ymax, int *best_x, int *best_y, float best_score)
@ EXHAUSTIVE
Search all possible positions.
static int deshake_transform_c(AVFilterContext *ctx, int width, int height, int cw, int ch, const float *matrix_y, const float *matrix_uv, enum InterpolateMethod interpolate, enum FillMethod fill, AVFrame *in, AVFrame *out)
static av_cold void uninit(AVFilterContext *ctx)
int h
agreed upon image height
int edge
Edge fill method.
av_pixelutils_sad_fn av_pixelutils_get_sad_fn(int w_bits, int h_bits, int aligned, void *log_ctx)
Get a potentially optimized pointer to a Sum-of-absolute-differences function (see the av_pixelutils_...
these buffered frames must be flushed immediately if a new input produces new the filter must not call request_frame to get more It must just process the frame or queue it The task of requesting more frames is left to the filter s request_frame method or the application If a filter has several the filter must be ready for frames arriving randomly on any input any filter with several inputs will most likely require some kind of queuing mechanism It is perfectly acceptable to have a limited queue and to drop frames when the inputs are too unbalanced request_frame For filters that do not use the this method is called when a frame is wanted on an output For a it should directly call filter_frame on the corresponding output For a if there are queued frames already one of these frames should be pushed If the filter should request a frame on one of its repeatedly until at least one frame has been pushed Return values
static float mean(const float *input, int size)
@ AV_PIX_FMT_YUV444P
planar YUV 4:4:4, 24bpp, (1 Cr & Cb sample per 1x1 Y samples)
@ AV_PIX_FMT_YUV422P
planar YUV 4:2:2, 16bpp, (1 Cr & Cb sample per 2x1 Y samples)
Descriptor that unambiguously describes how the bits of a pixel are stored in the up to 4 data planes...
static const int16_t alpha[]
int rx
Maximum horizontal shift.
#define FILTER_OUTPUTS(array)
void av_fast_malloc(void *ptr, unsigned int *size, size_t min_size)
Allocate a buffer, reusing the given one if large enough.
@ AV_PIX_FMT_YUV411P
planar YUV 4:1:1, 12bpp, (1 Cr & Cb sample per 4x1 Y samples)
int linesize[AV_NUM_DATA_POINTERS]
For video, a positive or negative value, which is typically indicating the size in bytes of each pict...
@ AV_PIX_FMT_YUV410P
planar YUV 4:1:0, 9bpp, (1 Cr & Cb sample per 4x4 Y samples)
av_pixelutils_sad_fn sad
Sum of the absolute difference function.