Go to the documentation of this file.
21 #define DEFAULT_INPUT_NAME "transforms.trf"
23 #include <vid.stab/libvidstab.h>
45 #define OFFSET(x) offsetof(TransformContext, x)
46 #define OFFSETC(x) (offsetof(TransformContext, conf)+offsetof(VSTransformConfig, x))
47 #define FLAGS AV_OPT_FLAG_FILTERING_PARAM|AV_OPT_FLAG_VIDEO_PARAM
50 {
"input",
"set path to the file storing the transforms",
OFFSET(
input),
52 {
"smoothing",
"set number of frames*2 + 1 used for lowpass filtering",
OFFSETC(smoothing),
55 {
"optalgo",
"set camera path optimization algo",
OFFSETC(camPathAlgo),
57 {
"opt",
"global optimization", 0,
59 {
"gauss",
"gaussian kernel", 0,
61 {
"avg",
"simple averaging on motion", 0,
64 {
"maxshift",
"set maximal number of pixels to translate image",
OFFSETC(maxShift),
66 {
"maxangle",
"set maximal angle in rad to rotate image",
OFFSETC(maxAngle),
69 {
"crop",
"set cropping mode",
OFFSETC(crop),
71 {
"keep",
"keep border", 0,
73 {
"black",
"black border", 0,
78 {
"relative",
"consider transforms as relative",
OFFSETC(relative),
80 {
"zoom",
"set percentage to zoom (>0: zoom in, <0: zoom out)",
OFFSETC(zoom),
82 {
"optzoom",
"set optimal zoom (0: nothing, 1: optimal static zoom, 2: optimal dynamic zoom)",
OFFSETC(optZoom),
84 {
"zoomspeed",
"for adaptive zoom: percent to zoom maximally each frame",
OFFSETC(zoomSpeed),
87 {
"interpol",
"set type of interpolation",
OFFSETC(interpolType),
89 {
"no",
"no interpolation", 0,
91 {
"linear",
"linear (horizontal)", 0,
93 {
"bilinear",
"bi-linear", 0,
95 {
"bicubic",
"bi-cubic", 0,
98 {
"tripod",
"enable virtual tripod mode (same as relative=0:smoothing=0)",
OFFSET(tripod),
100 {
"debug",
"enable debug mode and write global motions information to file",
OFFSET(debug),
111 tc->class = &vidstabtransform_class;
120 vsTransformDataCleanup(&
tc->td);
121 vsTransformationsCleanup(&
tc->trans);
151 VSTransformData *
td = &(
tc->td);
166 fi_src.log2ChromaW !=
desc->log2_chroma_w ||
167 fi_src.log2ChromaH !=
desc->log2_chroma_h) {
171 fi_src.log2ChromaW,
desc->log2_chroma_w,
172 fi_src.log2ChromaH,
desc->log2_chroma_h);
177 tc->conf.modName =
"vidstabtransform";
178 tc->conf.verbose = 1 +
tc->debug;
181 tc->conf.relative = 0;
182 tc->conf.smoothing = 0;
184 tc->conf.simpleMotionCalculation = 0;
185 tc->conf.storeTransforms =
tc->debug;
186 tc->conf.smoothZoom = 0;
188 if (vsTransformDataInit(
td, &
tc->conf, &fi_src, &fi_dest) != VS_OK) {
193 vsTransformGetConfig(&
tc->conf,
td);
198 tc->conf.camPathAlgo == VSOptimalL1 ?
"opt" :
199 (
tc->conf.camPathAlgo == VSGaussian ?
"gauss" :
"avg"));
207 tc->conf.optZoom == 1 ?
"Static (1)" : (
tc->conf.optZoom == 2 ?
"Dynamic (2)" :
"Off (0)"));
208 if (
tc->conf.optZoom == 2)
212 f = fopen(
tc->input,
"r");
218 VSManyLocalMotions mlms;
219 if (vsReadLocalMotionsFile(
f, &mlms) == VS_OK) {
221 if (vsLocalmotions2Transforms(
td, &mlms, &
tc->trans) != VS_OK) {
226 if (!vsReadOldTransforms(
td,
f, &
tc->trans)) {
234 if (vsPreprocessTransforms(
td, &
tc->trans) != VS_OK) {
248 VSTransformData*
td = &(
tc->td);
268 for (plane = 0; plane < vsTransformGetSrcFrameInfo(
td)->planes; plane++) {
269 inframe.data[plane] =
in->data[plane];
270 inframe.linesize[plane] =
in->linesize[plane];
273 vsTransformPrepare(
td, &inframe, &inframe);
276 for (plane = 0; plane < vsTransformGetDestFrameInfo(
td)->planes; plane++) {
277 outframe.data[plane] =
out->data[plane];
278 outframe.linesize[plane] =
out->linesize[plane];
280 vsTransformPrepare(
td, &inframe, &outframe);
283 vsDoTransform(
td, vsGetNextTransform(
td, &
tc->trans));
285 vsTransformFinish(
td);
312 .
name =
"vidstabtransform",
314 "pass 2 of 2 for stabilization "
315 "(see vidstabdetect for pass 1)."),
322 .priv_class = &vidstabtransform_class,
AVFrame * ff_get_video_buffer(AVFilterLink *link, int w, int h)
Request a picture buffer with a specific set of permissions.
static void direct(const float *in, const FFTComplex *ir, int len, float *out)
AVPixelFormat
Pixel format.
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
int ff_filter_frame(AVFilterLink *link, AVFrame *frame)
Send a frame of data to the next filter.
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
The exact code depends on how similar the blocks are and how related they are to the and needs to apply these operations to the correct inlink or outlink if there are several Macros are available to factor that when no extra processing is inlink
void av_frame_free(AVFrame **frame)
Free the frame and any dynamically allocated objects in it, e.g. extended_data.
This structure describes decoded (raw) audio or video data.
#define AV_LOG_VERBOSE
Detailed information.
@ AV_PIX_FMT_BGR24
packed RGB 8:8:8, 24bpp, BGRBGR...
int av_get_bits_per_pixel(const AVPixFmtDescriptor *pixdesc)
Return the number of bits per pixel used by the pixel format described by pixdesc.
@ AV_PIX_FMT_YUV440P
planar YUV 4:4:0 (1 Cr & Cb sample per 1x2 Y samples)
const char * name
Filter name.
A link between two filters.
A filter pad used for either input or output.
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
@ AV_PIX_FMT_YUVA420P
planar YUV 4:2:0, 20bpp, (1 Cr & Cb sample per 2x2 Y & A samples)
VSPixelFormat ff_av2vs_pixfmt(AVFilterContext *ctx, enum AVPixelFormat pf)
convert AV's pixelformat to vid.stab pixelformat
static const AVFilterPad outputs[]
static enum AVPixelFormat pix_fmts[]
@ AV_PIX_FMT_YUV420P
planar YUV 4:2:0, 12bpp, (1 Cr & Cb sample per 2x2 Y samples)
@ AV_PIX_FMT_RGBA
packed RGBA 8:8:8:8, 32bpp, RGBARGBA...
Describe the class of an AVClass context structure.
int av_frame_copy_props(AVFrame *dst, const AVFrame *src)
Copy only "metadata" fields from src to dst.
these buffered frames must be flushed immediately if a new input produces new output. The filter must not call request_frame to get more. It must just process the frame or queue it. The task of requesting more frames is left to the filter's request_frame method or the application. If a filter has several inputs
@ AV_PIX_FMT_GRAY8
Y, 8bpp.
@ AV_PIX_FMT_RGB24
packed RGB 8:8:8, 24bpp, RGBRGB...
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
int av_frame_is_writable(AVFrame *frame)
Check if the frame data is writable.
and forward the test the status of outputs and forward it to the corresponding return FFERROR_NOT_READY If the filters stores internally one or a few frame for some input
#define AV_LOG_INFO
Standard information.
uint8_t pi<< 24) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_U8, uint8_t,(*(const uint8_t *) pi - 0x80) *(1.0f/(1<< 7))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_U8, uint8_t,(*(const uint8_t *) pi - 0x80) *(1.0/(1<< 7))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S16, int16_t,(*(const int16_t *) pi >> 8)+0x80) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S16, int16_t, *(const int16_t *) pi *(1.0f/(1<< 15))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S16, int16_t, *(const int16_t *) pi *(1.0/(1<< 15))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S32, int32_t,(*(const int32_t *) pi >> 24)+0x80) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S32, int32_t, *(const int32_t *) pi *(1.0f/(1U<< 31))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S32, int32_t, *(const int32_t *) pi *(1.0/(1U<< 31))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_FLT, float, av_clip_uint8(lrintf(*(const float *) pi *(1<< 7))+0x80)) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_FLT, float, av_clip_int16(lrintf(*(const float *) pi *(1<< 15)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_FLT, float, av_clipl_int32(llrintf(*(const float *) pi *(1U<< 31)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_DBL, double, av_clip_uint8(lrint(*(const double *) pi *(1<< 7))+0x80)) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_DBL, double, av_clip_int16(lrint(*(const double *) pi *(1<< 15)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_DBL, double, av_clipl_int32(llrint(*(const double *) pi *(1U<< 31)))) #define SET_CONV_FUNC_GROUP(ofmt, ifmt) static void set_generic_function(AudioConvert *ac) { } void ff_audio_convert_free(AudioConvert **ac) { if(! 
*ac) return;ff_dither_free(&(*ac) ->dc);av_freep(ac);} AudioConvert *ff_audio_convert_alloc(AVAudioResampleContext *avr, enum AVSampleFormat out_fmt, enum AVSampleFormat in_fmt, int channels, int sample_rate, int apply_map) { AudioConvert *ac;int in_planar, out_planar;ac=av_mallocz(sizeof(*ac));if(!ac) return NULL;ac->avr=avr;ac->out_fmt=out_fmt;ac->in_fmt=in_fmt;ac->channels=channels;ac->apply_map=apply_map;if(avr->dither_method !=AV_RESAMPLE_DITHER_NONE &&av_get_packed_sample_fmt(out_fmt)==AV_SAMPLE_FMT_S16 &&av_get_bytes_per_sample(in_fmt) > 2) { ac->dc=ff_dither_alloc(avr, out_fmt, in_fmt, channels, sample_rate, apply_map);if(!ac->dc) { av_free(ac);return NULL;} return ac;} in_planar=ff_sample_fmt_is_planar(in_fmt, channels);out_planar=ff_sample_fmt_is_planar(out_fmt, channels);if(in_planar==out_planar) { ac->func_type=CONV_FUNC_TYPE_FLAT;ac->planes=in_planar ? ac->channels :1;} else if(in_planar) ac->func_type=CONV_FUNC_TYPE_INTERLEAVE;else ac->func_type=CONV_FUNC_TYPE_DEINTERLEAVE;set_generic_function(ac);if(ARCH_AARCH64) ff_audio_convert_init_aarch64(ac);if(ARCH_ARM) ff_audio_convert_init_arm(ac);if(ARCH_X86) ff_audio_convert_init_x86(ac);return ac;} int ff_audio_convert(AudioConvert *ac, AudioData *out, AudioData *in) { int use_generic=1;int len=in->nb_samples;int p;if(ac->dc) { av_log(ac->avr, AV_LOG_TRACE, "%d samples - audio_convert: %s to %s (dithered)\n", len, av_get_sample_fmt_name(ac->in_fmt), av_get_sample_fmt_name(ac->out_fmt));return ff_convert_dither(ac-> in
int w
agreed upon image width
static void invert(float *h, int n)
const char * name
Pad name.
void ff_vs_init(void)
sets the memory allocation function and logging constants to av versions
int h
agreed upon image height
#define AV_PIX_FMT_FLAG_PLANAR
At least one pixel component is not in the first data plane.
@ AV_PIX_FMT_YUV444P
planar YUV 4:4:4, 24bpp, (1 Cr & Cb sample per 1x1 Y samples)
@ AV_PIX_FMT_YUV422P
planar YUV 4:2:2, 16bpp, (1 Cr & Cb sample per 2x1 Y samples)
Descriptor that unambiguously describes how the bits of a pixel are stored in the up to 4 data planes...
@ AV_PIX_FMT_YUV411P
planar YUV 4:1:1, 12bpp, (1 Cr & Cb sample per 4x1 Y samples)
@ AV_PIX_FMT_YUV410P
planar YUV 4:1:0, 9bpp, (1 Cr & Cb sample per 4x4 Y samples)