Go to the documentation of this file.
21 #define DEFAULT_INPUT_NAME "transforms.trf"
23 #include <vid.stab/libvidstab.h>
45 #define OFFSET(x) offsetof(TransformContext, x)
46 #define OFFSETC(x) (offsetof(TransformContext, conf)+offsetof(VSTransformConfig, x))
47 #define FLAGS AV_OPT_FLAG_FILTERING_PARAM|AV_OPT_FLAG_VIDEO_PARAM
50 {
"input",
"set path to the file storing the transforms",
OFFSET(
input),
52 {
"smoothing",
"set number of frames*2 + 1 used for lowpass filtering",
OFFSETC(smoothing),
55 {
"optalgo",
"set camera path optimization algo",
OFFSETC(camPathAlgo),
57 {
"opt",
"global optimization", 0,
59 {
"gauss",
"gaussian kernel", 0,
61 {
"avg",
"simple averaging on motion", 0,
64 {
"maxshift",
"set maximal number of pixels to translate image",
OFFSETC(maxShift),
66 {
"maxangle",
"set maximal angle in rad to rotate image",
OFFSETC(maxAngle),
69 {
"crop",
"set cropping mode",
OFFSETC(crop),
71 {
"keep",
"keep border", 0,
73 {
"black",
"black border", 0,
78 {
"relative",
"consider transforms as relative",
OFFSETC(relative),
80 {
"zoom",
"set percentage to zoom (>0: zoom in, <0: zoom out",
OFFSETC(
zoom),
82 {
"optzoom",
"set optimal zoom (0: nothing, 1: optimal static zoom, 2: optimal dynamic zoom)",
OFFSETC(optZoom),
84 {
"zoomspeed",
"for adative zoom: percent to zoom maximally each frame",
OFFSETC(zoomSpeed),
87 {
"interpol",
"set type of interpolation",
OFFSETC(interpolType),
89 {
"no",
"no interpolation", 0,
91 {
"linear",
"linear (horizontal)", 0,
93 {
"bilinear",
"bi-linear", 0,
95 {
"bicubic",
"bi-cubic", 0,
98 {
"tripod",
"enable virtual tripod mode (same as relative=0:smoothing=0)",
OFFSET(tripod),
100 {
"debug",
"enable debug mode and writer global motions information to file",
OFFSET(debug),
111 tc->class = &vidstabtransform_class;
120 vsTransformDataCleanup(&
tc->td);
121 vsTransformationsCleanup(&
tc->trans);
133 VSTransformData *
td = &(
tc->td);
148 fi_src.log2ChromaW !=
desc->log2_chroma_w ||
149 fi_src.log2ChromaH !=
desc->log2_chroma_h) {
153 fi_src.log2ChromaW,
desc->log2_chroma_w,
154 fi_src.log2ChromaH,
desc->log2_chroma_h);
159 tc->conf.modName =
"vidstabtransform";
160 tc->conf.verbose = 1 +
tc->debug;
163 tc->conf.relative = 0;
164 tc->conf.smoothing = 0;
166 tc->conf.simpleMotionCalculation = 0;
167 tc->conf.storeTransforms =
tc->debug;
168 tc->conf.smoothZoom = 0;
170 if (vsTransformDataInit(
td, &
tc->conf, &fi_src, &fi_dest) != VS_OK) {
175 vsTransformGetConfig(&
tc->conf,
td);
180 tc->conf.camPathAlgo == VSOptimalL1 ?
"opt" :
181 (
tc->conf.camPathAlgo == VSGaussian ?
"gauss" :
"avg"));
189 tc->conf.optZoom == 1 ?
"Static (1)" : (
tc->conf.optZoom == 2 ?
"Dynamic (2)" :
"Off (0)"));
190 if (
tc->conf.optZoom == 2)
194 f = fopen(
tc->input,
"r");
200 VSManyLocalMotions mlms;
201 if (vsReadLocalMotionsFile(
f, &mlms) == VS_OK) {
203 if (vsLocalmotions2Transforms(
td, &mlms, &
tc->trans) != VS_OK) {
208 if (!vsReadOldTransforms(
td,
f, &
tc->trans)) {
216 if (vsPreprocessTransforms(
td, &
tc->trans) != VS_OK) {
230 VSTransformData*
td = &(
tc->td);
250 for (plane = 0; plane < vsTransformGetSrcFrameInfo(
td)->planes; plane++) {
251 inframe.data[plane] = in->
data[plane];
252 inframe.linesize[plane] = in->
linesize[plane];
255 vsTransformPrepare(
td, &inframe, &inframe);
258 for (plane = 0; plane < vsTransformGetDestFrameInfo(
td)->planes; plane++) {
259 outframe.data[plane] =
out->data[plane];
260 outframe.linesize[plane] =
out->linesize[plane];
262 vsTransformPrepare(
td, &inframe, &outframe);
265 vsDoTransform(
td, vsGetNextTransform(
td, &
tc->trans));
267 vsTransformFinish(
td);
292 .
name =
"vidstabtransform",
294 "pass 2 of 2 for stabilization "
295 "(see vidstabdetect for pass 1)."),
302 .priv_class = &vidstabtransform_class,
AVFrame * ff_get_video_buffer(AVFilterLink *link, int w, int h)
Request a picture buffer with a specific set of permissions.
static void direct(const float *in, const FFTComplex *ir, int len, float *out)
Filter design: the word “frame” indicates either a video frame or a group of audio samples, as stored in an AVFrame structure. Format negotiation: query_formats should set, for each input and each output, the list of supported formats. For video that means pixel format. For audio that means channel layout, sample format and sample rate. The lists are not just lists, they are references to shared objects. When the negotiation mechanism computes the intersection of the formats supported at each end of a link, all references to both lists are replaced with a reference to the intersection. And when a single format is eventually chosen for a link amongst the remaining list, all references to the list are updated. That means that if a filter requires that its input and output have the same format amongst a supported list, all it has to do is use a reference to the same list of formats. query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
int ff_filter_frame(AVFilterLink *link, AVFrame *frame)
Send a frame of data to the next filter.
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
#define FILTER_PIXFMTS_ARRAY(array)
The exact code depends on how similar the input-specific blocks are and how related they are to the common block, and needs to apply these operations to the correct inlink or outlink if there are several. Macros are available to factor that when no extra processing is needed: inlink
static void zoom(float *u, float *v, float amount)
void av_frame_free(AVFrame **frame)
Free the frame and any dynamically allocated objects in it, e.g. extended_data.
This structure describes decoded (raw) audio or video data.
#define AV_LOG_VERBOSE
Detailed information.
int av_get_bits_per_pixel(const AVPixFmtDescriptor *pixdesc)
Return the number of bits per pixel used by the pixel format described by pixdesc.
const char * name
Filter name.
A link between two filters.
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
A filter pad used for either input or output.
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
VSPixelFormat ff_av2vs_pixfmt(AVFilterContext *ctx, enum AVPixelFormat pf)
convert AV's pixelformat to vid.stab pixelformat
enum AVPixelFormat ff_vidstab_pix_fmts[]
#define FILTER_INPUTS(array)
Describe the class of an AVClass context structure.
int av_frame_copy_props(AVFrame *dst, const AVFrame *src)
Copy only "metadata" fields from src to dst.
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
int av_frame_is_writable(AVFrame *frame)
Check if the frame data is writable.
and forward the test the status of outputs and forward it to the corresponding return FFERROR_NOT_READY If the filters stores internally one or a few frame for some input
#define AV_LOG_INFO
Standard information.
int w
agreed upon image width
static void invert(float *h, int n)
const char * name
Pad name.
void ff_vs_init(void)
sets the memory allocation function and logging constants to av versions
int h
agreed upon image height
#define AV_PIX_FMT_FLAG_PLANAR
At least one pixel component is not in the first data plane.
Descriptor that unambiguously describes how the bits of a pixel are stored in the up to 4 data planes of an image.
#define FILTER_OUTPUTS(array)
int linesize[AV_NUM_DATA_POINTERS]
For video, a positive or negative value, which is typically indicating the size in bytes of each picture line.