Go to the documentation of this file.
   21 #define DEFAULT_INPUT_NAME     "transforms.trf" 
   23 #include <vid.stab/libvidstab.h> 
   45 #define OFFSET(x) offsetof(TransformContext, x) 
   46 #define OFFSETC(x) (offsetof(TransformContext, conf)+offsetof(VSTransformConfig, x)) 
   47 #define FLAGS AV_OPT_FLAG_FILTERING_PARAM|AV_OPT_FLAG_VIDEO_PARAM 
   50     {
"input",     
"set path to the file storing the transforms", 
OFFSET(
input),
 
   52     {
"smoothing", 
"set number of frames*2 + 1 used for lowpass filtering", 
OFFSETC(smoothing),
 
   55     {
"optalgo",   
"set camera path optimization algo", 
OFFSETC(camPathAlgo),
 
   57     {  
"opt",     
"global optimization",                                            0, 
 
   59     {  
"gauss",   
"gaussian kernel",                                                0,
 
   61     {  
"avg",     
"simple averaging on motion",                                     0,
 
   64     {
"maxshift",  
"set maximal number of pixels to translate image", 
OFFSETC(maxShift),
 
   66     {
"maxangle",  
"set maximal angle in rad to rotate image", 
OFFSETC(maxAngle),
 
   69     {
"crop",      
"set cropping mode", 
OFFSETC(crop),
 
   71     {  
"keep",    
"keep border",                                                    0,
 
   73     {  
"black",   
"black border",                                                   0,
 
   78     {
"relative",  
"consider transforms as relative", 
OFFSETC(relative),
 
   80     {
"zoom",      
"set percentage to zoom (>0: zoom in, <0: zoom out", 
OFFSETC(zoom),
 
   82     {
"optzoom",   
"set optimal zoom (0: nothing, 1: optimal static zoom, 2: optimal dynamic zoom)", 
OFFSETC(optZoom),
 
   84     {
"zoomspeed", 
"for adative zoom: percent to zoom maximally each frame",         
OFFSETC(zoomSpeed),
 
   87     {
"interpol",  
"set type of interpolation", 
OFFSETC(interpolType),
 
   89     {  
"no",      
"no interpolation",                                               0,
 
   91     {  
"linear",  
"linear (horizontal)",                                            0,
 
   93     {  
"bilinear",
"bi-linear",                                                      0,
 
   95     {  
"bicubic", 
"bi-cubic",                                                       0,
 
   98     {
"tripod",    
"enable virtual tripod mode (same as relative=0:smoothing=0)", 
OFFSET(tripod),
 
  100     {
"debug",     
"enable debug mode and writer global motions information to file", 
OFFSET(debug),
 
  111     tc->class = &vidstabtransform_class;
 
  120     vsTransformDataCleanup(&
tc->td);
 
  121     vsTransformationsCleanup(&
tc->trans);
 
  151     VSTransformData *
td = &(
tc->td);
 
  166         fi_src.log2ChromaW != 
desc->log2_chroma_w ||
 
  167         fi_src.log2ChromaH != 
desc->log2_chroma_h) {
 
  171                fi_src.log2ChromaW, 
desc->log2_chroma_w,
 
  172                fi_src.log2ChromaH, 
desc->log2_chroma_h);
 
  177     tc->conf.modName = 
"vidstabtransform";
 
  178     tc->conf.verbose = 1 + 
tc->debug;
 
  181         tc->conf.relative  = 0;
 
  182         tc->conf.smoothing = 0;
 
  184     tc->conf.simpleMotionCalculation = 0;
 
  185     tc->conf.storeTransforms         = 
tc->debug;
 
  186     tc->conf.smoothZoom              = 0;
 
  188     if (vsTransformDataInit(
td, &
tc->conf, &fi_src, &fi_dest) != VS_OK) {
 
  193     vsTransformGetConfig(&
tc->conf, 
td);
 
  198            tc->conf.camPathAlgo == VSOptimalL1 ? 
"opt" :
 
  199            (
tc->conf.camPathAlgo == VSGaussian ? 
"gauss" : 
"avg"));
 
  207            tc->conf.optZoom == 1 ? 
"Static (1)" : (
tc->conf.optZoom == 2 ? 
"Dynamic (2)" : 
"Off (0)"));
 
  208     if (
tc->conf.optZoom == 2)
 
  212     f = fopen(
tc->input, 
"r");
 
  218         VSManyLocalMotions mlms;
 
  219         if (vsReadLocalMotionsFile(
f, &mlms) == VS_OK) {
 
  221             if (vsLocalmotions2Transforms(
td, &mlms, &
tc->trans) != VS_OK) {
 
  226             if (!vsReadOldTransforms(
td, 
f, &
tc->trans)) { 
 
  234     if (vsPreprocessTransforms(
td, &
tc->trans) != VS_OK) {
 
  248     VSTransformData* 
td = &(
tc->td);
 
  268     for (plane = 0; plane < vsTransformGetSrcFrameInfo(
td)->planes; plane++) {
 
  269         inframe.data[plane] = 
in->data[plane];
 
  270         inframe.linesize[plane] = 
in->linesize[plane];
 
  273         vsTransformPrepare(
td, &inframe, &inframe);
 
  276         for (plane = 0; plane < vsTransformGetDestFrameInfo(
td)->planes; plane++) {
 
  277             outframe.data[plane] = 
out->data[plane];
 
  278             outframe.linesize[plane] = 
out->linesize[plane];
 
  280         vsTransformPrepare(
td, &inframe, &outframe);
 
  283     vsDoTransform(
td, vsGetNextTransform(
td, &
tc->trans));
 
  285     vsTransformFinish(
td);
 
  312     .
name          = 
"vidstabtransform",
 
  314                                           "pass 2 of 2 for stabilization " 
  315                                           "(see vidstabdetect for pass 1)."),
 
  322     .priv_class    = &vidstabtransform_class,
 
  
AVFrame * ff_get_video_buffer(AVFilterLink *link, int w, int h)
Request a picture buffer with a specific set of permissions.
static void direct(const float *in, const FFTComplex *ir, int len, float *out)
AVPixelFormat
Pixel format.
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
int ff_filter_frame(AVFilterLink *link, AVFrame *frame)
Send a frame of data to the next filter.
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
The exact code depends on how similar the blocks are and how related they are to the and needs to apply these operations to the correct inlink or outlink if there are several Macros are available to factor that when no extra processing is inlink
void av_frame_free(AVFrame **frame)
Free the frame and any dynamically allocated objects in it, e.g. extended_data.
This structure describes decoded (raw) audio or video data.
#define AV_LOG_VERBOSE
Detailed information.
@ AV_PIX_FMT_BGR24
packed RGB 8:8:8, 24bpp, BGRBGR...
int av_get_bits_per_pixel(const AVPixFmtDescriptor *pixdesc)
Return the number of bits per pixel used by the pixel format described by pixdesc.
@ AV_PIX_FMT_YUV440P
planar YUV 4:4:0 (1 Cr & Cb sample per 1x2 Y samples)
const char * name
Filter name.
A link between two filters.
A filter pad used for either input or output.
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
@ AV_PIX_FMT_YUVA420P
planar YUV 4:2:0, 20bpp, (1 Cr & Cb sample per 2x2 Y & A samples)
VSPixelFormat ff_av2vs_pixfmt(AVFilterContext *ctx, enum AVPixelFormat pf)
convert AV's pixelformat to vid.stab pixelformat
static const AVFilterPad outputs[]
static enum AVPixelFormat pix_fmts[]
@ AV_PIX_FMT_YUV420P
planar YUV 4:2:0, 12bpp, (1 Cr & Cb sample per 2x2 Y samples)
@ AV_PIX_FMT_RGBA
packed RGBA 8:8:8:8, 32bpp, RGBARGBA...
Describe the class of an AVClass context structure.
int av_frame_copy_props(AVFrame *dst, const AVFrame *src)
Copy only "metadata" fields from src to dst.
these buffered frames must be flushed immediately if a new input produces new the filter must not call request_frame to get more It must just process the frame or queue it The task of requesting more frames is left to the filter s request_frame method or the application If a filter has several inputs
@ AV_PIX_FMT_GRAY8
Y , 8bpp.
@ AV_PIX_FMT_RGB24
packed RGB 8:8:8, 24bpp, RGBRGB...
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
int av_frame_is_writable(AVFrame *frame)
Check if the frame data is writable.
and forward the test the status of outputs and forward it to the corresponding return FFERROR_NOT_READY If the filter stores internally one or a few frames for some input
#define AV_LOG_INFO
Standard information.
uint8_t pi<< 24) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_U8, uint8_t,(*(const uint8_t *) pi - 0x80) *(1.0f/(1<< 7))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_U8, uint8_t,(*(const uint8_t *) pi - 0x80) *(1.0/(1<< 7))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S16, int16_t,(*(const int16_t *) pi >> 8)+0x80) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S16, int16_t, *(const int16_t *) pi *(1.0f/(1<< 15))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S16, int16_t, *(const int16_t *) pi *(1.0/(1<< 15))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S32, int32_t,(*(const int32_t *) pi >> 24)+0x80) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S32, int32_t, *(const int32_t *) pi *(1.0f/(1U<< 31))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S32, int32_t, *(const int32_t *) pi *(1.0/(1U<< 31))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_FLT, float, av_clip_uint8(lrintf(*(const float *) pi *(1<< 7))+0x80)) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_FLT, float, av_clip_int16(lrintf(*(const float *) pi *(1<< 15)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_FLT, float, av_clipl_int32(llrintf(*(const float *) pi *(1U<< 31)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_DBL, double, av_clip_uint8(lrint(*(const double *) pi *(1<< 7))+0x80)) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_DBL, double, av_clip_int16(lrint(*(const double *) pi *(1<< 15)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_DBL, double, av_clipl_int32(llrint(*(const double *) pi *(1U<< 31)))) #define SET_CONV_FUNC_GROUP(ofmt, ifmt) static void set_generic_function(AudioConvert *ac) { } void ff_audio_convert_free(AudioConvert **ac) { if(! 
*ac) return;ff_dither_free(&(*ac) ->dc);av_freep(ac);} AudioConvert *ff_audio_convert_alloc(AVAudioResampleContext *avr, enum AVSampleFormat out_fmt, enum AVSampleFormat in_fmt, int channels, int sample_rate, int apply_map) { AudioConvert *ac;int in_planar, out_planar;ac=av_mallocz(sizeof(*ac));if(!ac) return NULL;ac->avr=avr;ac->out_fmt=out_fmt;ac->in_fmt=in_fmt;ac->channels=channels;ac->apply_map=apply_map;if(avr->dither_method !=AV_RESAMPLE_DITHER_NONE &&av_get_packed_sample_fmt(out_fmt)==AV_SAMPLE_FMT_S16 &&av_get_bytes_per_sample(in_fmt) > 2) { ac->dc=ff_dither_alloc(avr, out_fmt, in_fmt, channels, sample_rate, apply_map);if(!ac->dc) { av_free(ac);return NULL;} return ac;} in_planar=ff_sample_fmt_is_planar(in_fmt, channels);out_planar=ff_sample_fmt_is_planar(out_fmt, channels);if(in_planar==out_planar) { ac->func_type=CONV_FUNC_TYPE_FLAT;ac->planes=in_planar ? ac->channels :1;} else if(in_planar) ac->func_type=CONV_FUNC_TYPE_INTERLEAVE;else ac->func_type=CONV_FUNC_TYPE_DEINTERLEAVE;set_generic_function(ac);if(ARCH_AARCH64) ff_audio_convert_init_aarch64(ac);if(ARCH_ARM) ff_audio_convert_init_arm(ac);if(ARCH_X86) ff_audio_convert_init_x86(ac);return ac;} int ff_audio_convert(AudioConvert *ac, AudioData *out, AudioData *in) { int use_generic=1;int len=in->nb_samples;int p;if(ac->dc) { av_log(ac->avr, AV_LOG_TRACE, "%d samples - audio_convert: %s to %s (dithered)\n", len, av_get_sample_fmt_name(ac->in_fmt), av_get_sample_fmt_name(ac->out_fmt));return ff_convert_dither(ac-> in
int w
agreed upon image width
static void invert(float *h, int n)
const char * name
Pad name.
void ff_vs_init(void)
sets the memory allocation function and logging constants to av versions
int h
agreed upon image height
#define AV_PIX_FMT_FLAG_PLANAR
At least one pixel component is not in the first data plane.
@ AV_PIX_FMT_YUV444P
planar YUV 4:4:4, 24bpp, (1 Cr & Cb sample per 1x1 Y samples)
@ AV_PIX_FMT_YUV422P
planar YUV 4:2:2, 16bpp, (1 Cr & Cb sample per 2x1 Y samples)
Descriptor that unambiguously describes how the bits of a pixel are stored in the up to 4 data planes...
@ AV_PIX_FMT_YUV411P
planar YUV 4:1:1, 12bpp, (1 Cr & Cb sample per 4x1 Y samples)
@ AV_PIX_FMT_YUV410P
planar YUV 4:1:0, 9bpp, (1 Cr & Cb sample per 4x4 Y samples)