avfilter/af_afftfilt: make selecting window size simpler

[ffmpeg] / doc / filters.texi
diff --git a/doc/filters.texi b/doc/filters.texi

index 0d062786651128fbf282c9c37687868cf688d711..60b9204245840077180fad6650fa3216efc5d5e2 100644 (file)
--- a/doc/filters.texi
+++ b/doc/filters.texi
@@ -1124,25 +1124,8 @@ Return the value of imaginary part of frequency bin at location (@var{bin},@var{
  @end table
  
  @item win_size
-Set window size.
-
-It accepts the following values:
-@table @samp
-@item w16
-@item w32
-@item w64
-@item w128
-@item w256
-@item w512
-@item w1024
-@item w2048
-@item w4096
-@item w8192
-@item w16384
-@item w32768
-@item w65536
-@end table
-Default is @code{w4096}
+Set window size. Allowed range is from 16 to 131072.
+Default is @code{4096}
  
  @item win_func
  Set window function. Default is @code{hann}.
@@ -1409,6 +1392,10 @@ single-precision floating-point
  16-bit integers
  @end table
  
+@item mix
+How much to use filtered signal in output. Default is 1.
+Range is between 0 and 1.
+
  @item response
  Show IR frequency response, magnitude and phase in additional video stream.
  By default it is disabled.
@@ -1523,6 +1510,10 @@ kHz
  @item width, w
  Specify the band-width of a filter in width_type units.
  
+@item mix, m
+How much to use filtered signal in output. Default is 1.
+Range is between 0 and 1.
+
  @item channels, c
  Specify which channels to filter, by default all available are filtered.
  @end table
@@ -1542,6 +1533,10 @@ Syntax for the command is : "@var{width_type}"
  @item width, w
  Change allpass width.
  Syntax for the command is : "@var{width}"
+
+@item mix, m
+Change allpass mix.
+Syntax for the command is : "@var{mix}"
  @end table
  
  @section aloop
@@ -1801,6 +1796,22 @@ Pass only noise.
  
  Default value is @var{o}.
  @end table
+
+@item m
+Set smooth factor. Default value is @var{11}. Allowed range is from @var{1} to @var{15}.
+@end table
+
+@subsection Commands
+
+This filter supports the following commands:
+@table @option
+@item s
+Change denoise strength. Argument is single float number.
+Syntax for the command is : "@var{s}"
+
+@item o
+Change output mode.
+Syntax for the command is : "i", "o" or "n" string.
  @end table
  
  @section anull
@@ -2444,6 +2455,10 @@ kHz
  @item width, w
  Specify the band-width of a filter in width_type units.
  
+@item mix, m
+How much to use filtered signal in output. Default is 1.
+Range is between 0 and 1.
+
  @item channels, c
  Specify which channels to filter, by default all available are filtered.
  @end table
@@ -2463,6 +2478,10 @@ Syntax for the command is : "@var{width_type}"
  @item width, w
  Change bandpass width.
  Syntax for the command is : "@var{width}"
+
+@item mix, m
+Change bandpass mix.
+Syntax for the command is : "@var{mix}"
  @end table
  
  @section bandreject
@@ -2495,6 +2514,10 @@ kHz
  @item width, w
  Specify the band-width of a filter in width_type units.
  
+@item mix, m
+How much to use filtered signal in output. Default is 1.
+Range is between 0 and 1.
+
  @item channels, c
  Specify which channels to filter, by default all available are filtered.
  @end table
@@ -2514,6 +2537,10 @@ Syntax for the command is : "@var{width_type}"
  @item width, w
  Change bandreject width.
  Syntax for the command is : "@var{width}"
+
+@item mix, m
+Change bandreject mix.
+Syntax for the command is : "@var{mix}"
  @end table
  
  @section bass, lowshelf
@@ -2553,6 +2580,10 @@ kHz
  @item width, w
  Determine how steep is the filter's shelf transition.
  
+@item mix, m
+How much to use filtered signal in output. Default is 1.
+Range is between 0 and 1.
+
  @item channels, c
  Specify which channels to filter, by default all available are filtered.
  @end table
@@ -2576,6 +2607,10 @@ Syntax for the command is : "@var{width}"
  @item gain, g
  Change bass gain.
  Syntax for the command is : "@var{gain}"
+
+@item mix, m
+Change bass mix.
+Syntax for the command is : "@var{mix}"
  @end table
  
  @section biquad
@@ -2598,6 +2633,10 @@ This filter supports the following commands:
  @item b2
  Change biquad parameter.
  Syntax for the command is : "@var{value}"
+
+@item mix, m
+How much to use filtered signal in output. Default is 1.
+Range is between 0 and 1.
  @end table
  
  @section bs2b
@@ -3029,6 +3068,42 @@ Optional. It should have a value much less than 1 (e.g. 0.05 or 0.02) and is
  used to prevent clipping.
  @end table
  
+@section deesser
+
+Apply de-essing to the audio samples.
+
+@table @option
+@item i
+Set intensity for triggering de-essing. Allowed range is from 0 to 1.
+Default is 0.
+
+@item m
+Set amount of ducking on treble part of sound. Allowed range is from 0 to 1.
+Default is 0.5.
+
+@item f
+How much of original frequency content to keep when de-essing. Allowed range is from 0 to 1.
+Default is 0.5.
+
+@item s
+Set the output mode.
+
+It accepts the following values:
+@table @option
+@item i
+Pass input unchanged.
+
+@item o
+Pass ess filtered out.
+
+@item e
+Pass only ess.
+
+Default value is @var{o}.
+@end table
+
+@end table
+
  @section drmeter
  Measure audio dynamic range.
  
@@ -3251,6 +3326,10 @@ Specify the band-width of a filter in width_type units.
  Set the required gain or attenuation in dB.
  Beware of clipping when using a positive gain.
  
+@item mix, m
+How much to use filtered signal in output. Default is 1.
+Range is between 0 and 1.
+
  @item channels, c
  Specify which channels to filter, by default all available are filtered.
  @end table
@@ -3289,6 +3368,10 @@ Syntax for the command is : "@var{width}"
  @item gain, g
  Change equalizer gain.
  Syntax for the command is : "@var{gain}"
+
+@item mix, m
+Change equalizer mix.
+Syntax for the command is : "@var{mix}"
  @end table
  
  @section extrastereo
@@ -3712,6 +3795,10 @@ Specify the band-width of a filter in width_type units.
  Applies only to double-pole filter.
  The default is 0.707q and gives a Butterworth response.
  
+@item mix, m
+How much to use filtered signal in output. Default is 1.
+Range is between 0 and 1.
+
  @item channels, c
  Specify which channels to filter, by default all available are filtered.
  @end table
@@ -3731,6 +3818,10 @@ Syntax for the command is : "@var{width_type}"
  @item width, w
  Change highpass width.
  Syntax for the command is : "@var{width}"
+
+@item mix, m
+Change highpass mix.
+Syntax for the command is : "@var{mix}"
  @end table
  
  @section join
@@ -4020,6 +4111,10 @@ Specify the band-width of a filter in width_type units.
  Applies only to double-pole filter.
  The default is 0.707q and gives a Butterworth response.
  
+@item mix, m
+How much to use filtered signal in output. Default is 1.
+Range is between 0 and 1.
+
  @item channels, c
  Specify which channels to filter, by default all available are filtered.
  @end table
@@ -4048,6 +4143,10 @@ Syntax for the command is : "@var{width_type}"
  @item width, w
  Change lowpass width.
  Syntax for the command is : "@var{width}"
+
+@item mix, m
+Change lowpass mix.
+Syntax for the command is : "@var{mix}"
  @end table
  
  @section lv2
@@ -5088,6 +5187,10 @@ kHz
  @item width, w
  Determine how steep is the filter's shelf transition.
  
+@item mix, m
+How much to use filtered signal in output. Default is 1.
+Range is between 0 and 1.
+
  @item channels, c
  Specify which channels to filter, by default all available are filtered.
  @end table
@@ -5111,6 +5214,10 @@ Syntax for the command is : "@var{width}"
  @item gain, g
  Change treble gain.
  Syntax for the command is : "@var{gain}"
+
+@item mix, m
+Change treble mix.
+Syntax for the command is : "@var{mix}"
  @end table
  
  @section tremolo
@@ -8248,6 +8355,40 @@ delogo=x=0:y=0:w=100:h=77:band=10
  
  @end itemize
  
+@section derain
+
+Remove the rain in the input image/video by applying the derain methods based on
+convolutional neural networks. Supported models:
+
+@itemize
+@item
+Recurrent Squeeze-and-Excitation Context Aggregation Net (RESCAN).
+See @url{http://openaccess.thecvf.com/content_ECCV_2018/papers/Xia_Li_Recurrent_Squeeze-and-Excitation_Context_ECCV_2018_paper.pdf}.
+@end itemize
+
+Training scripts as well as scripts for model generation are provided in
+the repository at @url{https://github.com/XueweiMeng/derain_filter.git}.
+
+The filter accepts the following options:
+
+@table @option
+@item dnn_backend
+Specify which DNN backend to use for model loading and execution. This option accepts
+the following values:
+
+@table @samp
+@item native
+Native implementation of DNN loading and execution.
+@end table
+Default value is @samp{native}.
+
+@item model
+Set path to model file specifying network architecture and its parameters.
+Note that different backends use different file formats. TensorFlow backend
+can load files for both formats, while native backend can load files for only
+its format.
+@end table
+
  @section deshake
  
  Attempt to fix small changes in horizontal and/or vertical shift. This
@@ -8912,7 +9053,21 @@ the width of the rendered text
  the x and y offset coordinates where the text is drawn.
  
  These parameters allow the @var{x} and @var{y} expressions to refer
-each other, so you can for example specify @code{y=x/dar}.
+to each other, so you can for example specify @code{y=x/dar}.
+
+@item pict_type
+A one character description of the current frame's picture type.
+
+@item pkt_pos
+The current packet's position in the input file or stream
+(in bytes, from the start of the input). A value of -1 indicates
+this info is not available.
+
+@item pkt_duration
+The current packet's duration, in seconds.
+
+@item pkt_size
+The current packet's size (in bytes).
  @end table
  
  @anchor{drawtext_expansion}
@@ -8982,11 +9137,18 @@ The first argument is mandatory and specifies the metadata key.
  The second argument is optional and specifies a default value, used when the
  metadata key is not found or empty.
  
+Available metadata can be identified by inspecting entries
+starting with TAG included within each frame section
+printed by running @code{ffprobe -show_frames}.
+
+String metadata generated in filters leading to
+the drawtext filter are also available.
+
  @item n, frame_num
  The frame number, starting from 0.
  
  @item pict_type
-A 1 character description of the current picture type.
+A one character description of the current picture type.
  
  @item pts
  The timestamp of the current frame.
@@ -10116,7 +10278,7 @@ Specifies the rectangle in which to search.
  
  @itemize
  @item
-Generate a representative palette of a given video using @command{ffmpeg}:
+Cover a rectangular object by the supplied image of a given video using @command{ffmpeg}:
  @example
  ffmpeg -i file.ts -vf find_rect=newref.pgm,cover_rect=cover.jpg:mode=cover new.mkv
  @end example
@@ -10150,7 +10312,7 @@ Default value is @var{blur}.
  
  @itemize
  @item
-Generate a representative palette of a given video using @command{ffmpeg}:
+Cover a rectangular object by the supplied image of a given video using @command{ffmpeg}:
  @example
  ffmpeg -i file.ts -vf find_rect=newref.pgm,cover_rect=cover.jpg:mode=cover new.mkv
  @end example
@@ -10844,6 +11006,8 @@ Default is @code{1}.
  @code{haldclut} also has the same interpolation options as @ref{lut3d} (both
  filters share the same internals).
  
+This filter also supports the @ref{framesync} options.
+
  More information about the Hald CLUT can be found on Eskil Steenberg's website
  (Hald CLUT author) at @url{http://www.quelsolaar.com/technology/clut.html}.
  
@@ -11929,8 +12093,6 @@ Interpolate values using a tetrahedron.
  @end table
  @end table
  
-This filter also supports the @ref{framesync} options.
-
  @section lumakey
  
  Turn certain luma values into transparency.
@@ -12910,6 +13072,7 @@ Set character blacklist.
  @end table
  
  The filter exports recognized text as the frame metadata @code{lavfi.ocr.text}.
+The filter exports confidence of recognized words as the frame metadata @code{lavfi.ocr.confidence}.
  
  @section ocv
  
@@ -14509,6 +14672,9 @@ Set the black color threshold. Default is @code{0.15}. Allowed range is @code{[0
  @item chp
  Enable checking the parity bit. In the event of a parity error, the filter will output
  @code{0x00} for that character. Default is false.
+
+@item lp
+Lowpass lines prior further proccessing. Default is disabled.
  @end table
  
  @subsection Examples
@@ -15054,6 +15220,8 @@ Set color space conforming to the United States Federal Communications
  Commission (FCC) Code of Federal Regulations (CFR) Title 47 (2003) 73.682 (a).
  
  @item bt601
+@item bt470
+@item smpte170m
  Set color space conforming to:
  
  @itemize
@@ -15070,6 +15238,9 @@ Society of Motion Picture and Television Engineers (SMPTE) ST 170:2004
  
  @item smpte240m
  Set color space conforming to SMPTE ST 240:1999.
+
+@item bt2020
+Set color space conforming to ITU-R BT.2020 non-constant luminance system.
  @end table
  
  @item in_range
@@ -16537,10 +16708,13 @@ Efficient Sub-Pixel Convolutional Neural Network model (ESPCN).
  See @url{https://arxiv.org/abs/1609.05158}.
  @end itemize
  
-Training scripts as well as scripts for model generation can be found at
+Training scripts as well as scripts for model file (.pb) saving can be found at
  @url{https://github.com/XueweiMeng/sr/tree/sr_dnn_native}. Original repository
  is at @url{https://github.com/HighVoltageRocknRoll/sr.git}.
  
+Native model files (.model) can be generated from TensorFlow model
+files (.pb) by using tools/python/convert.py
+
  The filter accepts the following options:
  
  @table @option
@@ -17115,14 +17289,14 @@ Specify flags influencing the filter process.
  Available value for @var{flags} is:
  
  @table @option
-@item low_pass_filter, vlfp
+@item low_pass_filter, vlpf
  Enable linear vertical low-pass filtering in the filter.
  Vertical low-pass filtering is required when creating an interlaced
  destination from a progressive source which contains high-frequency
  vertical detail. Filtering will reduce interlace 'twitter' and Moire
  patterning.
  
-@item complex_filter, cvlfp
+@item complex_filter, cvlpf
  Enable complex vertical low-pass filtering.
  This will slightly less reduce interlace 'twitter' and Moire
  patterning but better retain detail and subjective sharpness impression.
@@ -18464,9 +18638,10 @@ Pick median pixels from several input videos.
  The filter accept the following options:
  
  @table @option
-@item nb_inputs
-Set number of inputs. This must be odd number.
+@item inputs
+Set number of inputs.
  Default is 3. Allowed range is from 3 to 255.
+If number of inputs is even number, than result will be mean value between two median values.
  
  @item planes
  Set which planes to filter. Default value is @code{15}, by which all planes are processed.
@@ -19349,6 +19524,10 @@ Make every semi-green pixel in the input transparent with some slight blending:
  @end example
  @end itemize
  
+@section nlmeans_opencl
+
+Non-local Means denoise filter through OpenCL, this filter accepts same options as @ref{nlmeans}.
+
  @section overlay_opencl
  
  Overlay one video on top of another.
@@ -22243,6 +22422,58 @@ Set minimum amplitude used in @code{log} amplitude scaler.
  
  @end table
  
+@section showspatial
+
+Convert stereo input audio to a video output, representing the spatial relationship
+between two channels.
+
+The filter accepts the following options:
+
+@table @option
+@item size, s
+Specify the video size for the output. For the syntax of this option, check the
+@ref{video size syntax,,"Video size" section in the ffmpeg-utils manual,ffmpeg-utils}.
+Default value is @code{512x512}.
+
+@item win_size
+Set window size. Allowed range is from @var{1024} to @var{65536}. Default size is @var{4096}.
+
+@item win_func
+Set window function.
+
+It accepts the following values:
+@table @samp
+@item rect
+@item bartlett
+@item hann
+@item hanning
+@item hamming
+@item blackman
+@item welch
+@item flattop
+@item bharris
+@item bnuttall
+@item bhann
+@item sine
+@item nuttall
+@item lanczos
+@item gauss
+@item tukey
+@item dolph
+@item cauchy
+@item parzen
+@item poisson
+@item bohman
+@end table
+
+Default value is @code{hann}.
+
+@item overlap
+Set ratio of overlap window. Default value is @code{0.5}.
+When value is @code{1} overlap is set to recommended size for specific
+window function currently used.
+@end table
+
  @anchor{showspectrum}
  @section showspectrum