// types/CodecContext.d.ts

import { HWDeviceContext, HWFramesContext } from "./HWContext"

/**
 * Names of the comparison functions accepted by the motion-estimation related
 * fields of CodecContext (me_cmp, me_sub_cmp, mb_cmp, ildct_cmp and me_pre_cmp).
 */
export type MotionEstimationString =
  | 'sad'
  | 'sse'
  | 'satd'
  | 'dct'
  | 'psnr'
  | 'bit'
  | 'rd'
  | 'zero'
  | 'vsad'
  | 'vsse'
  | 'nsse'
  | 'w53'
  | 'w97'
  | 'dctmax'
  | 'dct264'
  | 'median_sad'
  | 'chroma'
/**
 * Names of the frame selections accepted by the skip_loop_filter, skip_idct
 * and skip_frame fields of CodecContext.
 */
export type FrameSkipString =
  | 'none'
  | 'default'
  | 'nonref'
  | 'bidir'
  | 'nonintra'
  | 'nonkey'
  | 'all'

/**
 * The CodecContext object.
 *
 * Describes the state and tunable settings of a codec. Members marked
 * `readonly` can only be read; all other members may also be assigned.
 */
export interface CodecContext {
  /** Object name. */
  readonly type: string
  /** see AV_CODEC_ID_xxx */
  readonly codec_id: number
  /**
   * Name of the codec implementation.
   * The name is globally unique among encoders and among decoders (but an
   * encoder and a decoder can share the same name).
   * This is the primary way to find a codec from the user perspective.
   */
  readonly name: string
  /** Descriptive name for the codec, meant to be more human readable than name. */
  readonly long_name: string
  /**
   * A fourcc string by default, will be a number if not recognised
   *  - LSB first, so "ABCD" -> ('D'<<24) + ('C'<<16) + ('B'<<8) + 'A').
   */
  readonly codec_tag: string | number
  /** Codec private data. */
  priv_data: { [key: string]: any } | null
  /** The average bitrate */
  bit_rate: number
  /**
   * Number of bits the bitstream is allowed to diverge from the reference.
   * The reference can be CBR (for CBR pass1) or VBR (for pass2)
   */
  bit_rate_tolerance: number
  /** Global quality for codecs which cannot change it per frame. This should be proportional to MPEG-1/2/4 qscale. */
  global_quality: number
  /**
   * Compression level.
   * NOTE(review): the valid range is presumably codec-specific - confirm.
   */
  compression_level: number
  /** AV_CODEC_FLAG_*. */
  flags: { [key: string]: boolean }
  /** AV_CODEC_FLAG2_*. */
  flags2: { [key: string]: boolean }
  /**
   * some codecs need / can use extradata like Huffman tables.
   * MJPEG: Huffman tables
   * rv10: additional flags
   * MPEG-4: global headers (they can be in the bitstream or here)
   * The allocated memory should be AV_INPUT_BUFFER_PADDING_SIZE bytes larger
   * than extradata_size to avoid problems if it is read with the bitstream reader.
   * The bytewise contents of extradata must not depend on the architecture or CPU endianness.
   */
  extradata: Buffer | null
  /**
   * This is the fundamental unit of time (in seconds) in terms
   * of which frame timestamps are represented. For fixed-fps content,
   * timebase should be 1/framerate and timestamp increments should be
   * identically 1.
   * This often, but not always is the inverse of the frame rate or field rate
   * for video. 1/time_base is not the average frame rate if the frame rate is not
   * constant.
   *
   * Like containers, elementary streams also can store timestamps, 1/time_base
   * is the unit in which these timestamps are specified.
   * As example of such codec time base see ISO/IEC 14496-2:2001(E)
   * vop_time_increment_resolution and fixed_vop_rate
   * (fixed_vop_rate == 0 implies that it is different from the framerate)
   */
  time_base: Array<number>
  /**
   * For some codecs, the time base is closer to the field rate than the frame rate.
   * Most notably, H.264 and MPEG-2 specify time_base as half of frame duration
   * if no telecine is used ...
   *
   * Set to time_base ticks per frame. Default 1, e.g., H.264/MPEG-2 set it to 2.
   */
  ticks_per_frame: number
  /**
   * Number of frames delay in addition to what a standard decoder
   * as specified in the spec would produce.
   *
   * Video:
   *   Number of frames the decoded output will be delayed relative to the
   *   encoded input.
   *
   * Audio:
   *   Number of samples the decoder needs to output before the decoder's output is valid.
   *   When seeking, you should start decoding this many samples prior to your desired seek point.
   */
  readonly delay: number
  /**
   * picture width / height.
   *
   * @note Those fields may not match the values of the last
   * Frame output due to frame reordering.
   *
   * May be set by the user before opening the decoder if known e.g.
   * from the container. Some decoders will require the dimensions
   * to be set by the caller. During decoding, the decoder may
   * overwrite those values as required while parsing the data.
   */
  width: number
  /** Picture height; the notes on `width` apply here as well. */
  height: number
  /**
   * Bitstream width / height, may be different from width/height e.g. when
   * the decoded frame is cropped before being output or lowres is enabled.
   *
   * @note Those fields may not match the values of the last
   * Frame output due to frame reordering.
   *
   * May be set by the user before opening the decoder if known
   * e.g. from the container. During decoding, the decoder may
   * overwrite those values as required while parsing the data.
   */
  coded_width: number
  /** Bitstream height; the notes on `coded_width` apply here as well. */
  coded_height: number
  /**
   * Pixel format, see AV_PIX_FMT_xxx.
   * May be set by the demuxer if known from headers.
   * May be overridden by the decoder if it knows better.
   *
   * @note This field may not match the value of the last
   * Frame output due to frame reordering.
   */
  pix_fmt: string | null
  /**
   * Maximum number of B-frames between non-B-frames
   * Note: The output will be delayed by max_b_frames+1 relative to the input.
   */
  max_b_frames: number
  /**
   * qscale factor between IP and B-frames
   * If > 0 then the last P-frame quantizer will be used (q= lastp_q*factor+offset).
   * If < 0 then normal ratecontrol will be done (q= -normal_q*factor+offset).
   */
  b_quant_factor: number
  /** qscale offset between IP and B-frames */
  b_quant_offset: number
  /**
   * Size of the frame reordering buffer in the decoder.
   * For MPEG-2 it is 1 IPB or 0 low delay IP.
   */
  readonly has_b_frames: number
  /**
   * qscale factor between P- and I-frames
   * If > 0 then the last P-frame quantizer will be used (q = lastp_q * factor + offset).
   * If < 0 then normal ratecontrol will be done (q= -normal_q*factor+offset).
   */
  i_quant_factor: number
  /** qscale offset between P and I-frames */
  i_quant_offset: number
  /** luminance masking (0-> disabled) */
  lumi_masking: number
  /** temporal complexity masking (0-> disabled) */
  temporal_cplx_masking: number
  /** spatial complexity masking (0-> disabled) */
  spatial_cplx_masking: number
  /** p block masking (0-> disabled) */
  p_masking: number
  /** darkness masking (0-> disabled) */
  dark_masking: number
  /** slice count */
  slice_count: number
  /** slice offsets in the frame in bytes */
  slice_offset: Array<number> | null
  /**
   * sample aspect ratio (0/1 if unknown)
   * That is the width of a pixel divided by the height of the pixel.
   * Numerator and denominator must be relatively prime and smaller than 256 for some video standards.
   */
  sample_aspect_ratio: Array<number>
  /** motion estimation comparison function */
  me_cmp: MotionEstimationString
  /** subpixel motion estimation comparison function */
  me_sub_cmp: MotionEstimationString
  /** macroblock comparison function (not supported yet) */
  mb_cmp: MotionEstimationString
  /** interlaced DCT comparison function */
  ildct_cmp: MotionEstimationString
  /** ME diamond size & shape */
  dia_size: number
  /** amount of previous MV predictors (2a+1 x 2a+1 square) */
  last_predictor_count: number
  /** motion estimation prepass comparison function */
  me_pre_cmp: MotionEstimationString
  /** ME prepass diamond size & shape */
  pre_dia_size: number
  /** subpel ME quality */
  me_subpel_quality: number
  /** maximum motion estimation search range in subpel units. If 0 then no limit. */
  me_range: number
  /** Flags controlling how draw_horiz_band() is called for slices. */
  slice_flags: {
    /** draw_horiz_band() is called in coded order instead of display */
    CODED_ORDER: boolean
    /** allow draw_horiz_band() with field slices (MPEG-2 field pics)  */
    ALLOW_FIELD: boolean
    /** allow draw_horiz_band() with 1 component at a time (SVQ1) */
    ALLOW_PLANE: boolean
  }
  /**
   * macroblock decision mode
   * simple: uses mb_cmp
   * bits: chooses the one which needs the fewest bits
   * rd: rate distortion
   */
  mb_decision: 'simple' | 'bits' | 'rd'
  /** custom intra quantization matrix */
  intra_matrix: Array<number> | null
  /** custom inter quantization matrix */
  inter_matrix: Array<number> | null
  /** precision of the intra DC coefficient - 8 */
  intra_dc_precision: number
  /** Number of macroblock rows at the top which are skipped. */
  skip_top: number
  /** Number of macroblock rows at the bottom which are skipped. */
  skip_bottom: number
  /** minimum MB Lagrange multiplier */
  mb_lmin: number
  /** maximum MB Lagrange multiplier */
  mb_lmax: number
  /**
   * Bidirectional refinement setting.
   * NOTE(review): semantics are not described in this file - confirm against
   * the FFmpeg AVCodecContext documentation.
   */
  bidir_refine: number
  /** minimum GOP size */
  keyint_min: number
  /** number of reference frames */
  refs: number
  /** Value depends upon the compare function used for fullpel ME. */
  mv0_threshold: number
  /** Chromaticity coordinates of the source primaries. */
  color_primaries?: string
  /** Color Transfer Characteristic. */
  color_trc: string
  /** YUV colorspace type. */
  colorspace: string
  /** MPEG vs JPEG YUV range. */
  color_range: string
  /**
   * Location of chroma samples.
   *
   * Illustration showing the location of the first (top left) chroma sample of the
   * image, the left shows only luma, the right
   * shows the location of the chroma sample, the 2 could be imagined to overlay
   * each other but are drawn separately due to limitations of ASCII
   * ```
   *                 1st 2nd       1st 2nd horizontal luma sample positions
   *                  v   v         v   v
   *                  ______        ______
   * 1st luma line > |X   X ...    |3 4 X ...     X are luma samples,
   *                 |             |1 2           1-6 are possible chroma positions
   * 2nd luma line > |X   X ...    |5 6 X ...     0 is undefined/unknown position
   * ```
   */
  chroma_sample_location: 'unspecified' | 'left' | 'center' | 'topleft' | 'top' | 'bottomleft' | 'bottom'
  /** Number of slices. Indicates number of picture subdivisions. Used for parallelized decoding. */
  slices: number
  /** Field order, described as which field is coded first and which is displayed first. */
  field_order:
    | 'progressive'
    | 'top coded first, top displayed first'
    | 'bottom coded first, bottom displayed first'
    | 'top coded first, bottom displayed first'
    | 'bottom coded first, top displayed first'
    | 'unknown'
  /** Audio only - samples per second */
  sample_rate: number
  /** Audio only - number of audio channels */
  channels: number
  /** audio sample format */
  sample_fmt: string | null
  /**
   * Number of samples per channel in an audio frame.
   * May be set by some decoders to indicate constant frame size
   */
  readonly frame_size: number
  /**
   * Frame counter - total number of frames returned from the decoder so far.
   * @note the counter is not incremented if encoding/decoding resulted in an error.
   */
  readonly frame_number: number
  /** number of bytes per packet if constant and known or 0. Used by some WAV based audio codecs. */
  block_align: number
  /** Audio cutoff bandwidth (0 means "automatic") */
  cutoff: number
  /** Audio channel layout. */
  channel_layout: string
  /** Request decoder to use this channel layout if it can (0 for default) */
  request_channel_layout: string
  /** Type of service that the audio stream conveys. */
  audio_service_type:
    | 'main'
    | 'effects'
    | 'visually-impaired'
    | 'hearing-impaired'
    | 'dialogue'
    | 'commentary'
    | 'emergency'
    | 'voice-over'
    | 'karaoke'
    | 'nb'
  /** Desired sample format - decoder will decode to this format if it can. */
  request_sample_fmt: string | null
  /** amount of qscale change between easy & hard scenes (0.0-1.0) */
  qcompress: number
  /** amount of qscale smoothing over time (0.0-1.0) */
  qblur: number
  /** minimum quantizer */
  qmin: number
  /** maximum quantizer */
  qmax: number
  /** maximum quantizer difference between frames */
  max_qdiff: number
  /** decoder bitstream buffer size */
  rc_buffer_size: number
  /** ratecontrol override */
  rc_override: Array<{
    type: 'RcOverride'
    start_frame: number
    end_frame: number
    /** If this is 0 then quality_factor will be used instead. */
    qscale: number
    quality_factor: number
  }>
  /** maximum bitrate */
  rc_max_rate: number
  /** minimum bitrate */
  rc_min_rate: number
  /** Ratecontrol attempt to use, at maximum, <value> of what can be used without an underflow. */
  rc_max_available_vbv_use: number
  /** Ratecontrol attempt to use, at least, <value> times the amount needed to prevent a vbv overflow. */
  rc_min_vbv_overflow_use: number
  /** Number of bits which should be loaded into the rc buffer before decoding starts. */
  rc_initial_buffer_occupancy: number
  /** trellis RD quantization */
  trellis: number
  /** pass1 encoding statistics output buffer */
  readonly stats_out: string | null
  /** pass2 encoding statistics input buffer. Concatenated stuff from stats_out of pass1 should be placed here. */
  stats_in: string | null
  /** Work around bugs in codecs which sometimes cannot be detected automatically. */
  workaround_bugs: { [key: string]: boolean }
  /**
   * strictly follow the standard (MPEG-4, ...).
   * Setting this to STRICT or higher means the encoder and decoder will
   * generally do stupid things, whereas setting it to unofficial or lower
   * will mean the encoder might produce output that is not supported by all
   * spec-compliant decoders. Decoders don't differentiate between normal,
   * unofficial and experimental (that is, they always try to decode things
   * when they can) unless they are explicitly asked to behave stupidly
   * (=strictly conform to the specs)
   */
  strict_std_compliance: 'very-strict' | 'strict' | 'normal' | 'unofficial' | 'experimental'
  /** Error concealment flags */
  error_concealment: {
    GUESS_MVS?: boolean
    DEBLOCK?: boolean
    FAVOR_INTER?: boolean
  }
  /** Debug flags, keyed by flag name. */
  debug: { [key: string]: boolean }
  /** Error recognition - may misdetect some more or less valid parts as errors. */
  err_recognition: { [key: string]: boolean }
  /** Opaque 64-bit number (generally a PTS) that will be reordered and output in Frame.reordered_opaque */
  reordered_opaque: number
  /**
   * Error values reported by the codec, or null.
   * NOTE(review): presumably the per-plane error sums of FFmpeg's
   * AVCodecContext.error - confirm.
   */
  readonly error: ReadonlyArray<number> | null
  /** DCT algorithm */
  dct_algo: 'auto' | 'fastint' | 'int' | 'mmx' | 'altivec' | 'faan'
  /** IDCT algorithm */
  idct_algo:
    | 'auto'
    | 'int'
    | 'simple'
    | 'simplemmx'
    | 'arm'
    | 'altivec'
    | 'simplearm'
    | 'xvid'
    | 'simplearmv5te'
    | 'simplearmv6'
    | 'faan'
    | 'simpleneon'
    | 'none'
    | 'simpleauto'
  /** Bits per sample/pixel from the demuxer (needed for huffyuv). */
  bits_per_coded_sample: number
  /** Bits per sample/pixel of internal libavcodec pixel/sample format. */
  bits_per_raw_sample: number
  /** Thread count is used to decide how many independent tasks should be passed to execute() */
  thread_count: number
  /**
   * Which multithreading methods to use.
   * Use of FRAME will increase decoding delay by one frame per thread,
   * so clients which cannot provide future frames should not use it.
   */
  thread_type: { FRAME?: boolean, SLICE?: boolean }
  /** Which multithreading methods are in use by the codec. */
  readonly active_thread_type: { FRAME?: boolean, SLICE?: boolean }
  /**
   * Set by the client if its custom get_buffer() callback can be called
   * synchronously from another thread, which allows faster multithreaded decoding.
   * draw_horiz_band() will be called from other threads regardless of this setting.
   * Ignored if the default get_buffer() is used.
   */
  thread_safe_callbacks: number
  /** nsse_weight */
  nsse_weight: number

  /**
   * Codec profile.
   * NOTE(review): presumably a profile name when recognised and the raw
   * numeric value otherwise - confirm.
   */
  profile: string | number
  /** Codec level. */
  level: number
  /** Skip loop filtering for selected frames. */
  skip_loop_filter: FrameSkipString
  /** Skip IDCT/dequantization for selected frames. */
  skip_idct: FrameSkipString
  /** Skip decoding for selected frames. */
  skip_frame: FrameSkipString
  /**
   * Header containing style information for text subtitles.
   * For SUBTITLE_ASS subtitle type, it should contain the whole ASS
   * [Script Info] and [V4+ Styles] section, plus the [Events] line and
   * the Format line following. It shouldn't include any Dialogue line.
   */
  subtitle_header: Buffer | null
  /**
   * Audio only. The number of "priming" samples (padding) inserted by the
   * encoder at the beginning of the audio. I.e. this number of leading
   * decoded samples must be discarded by the caller to get the original audio
   * without leading padding.
   *
   * The timestamps on the output packets are adjusted by the encoder so that
   * they always refer to the first sample of the data actually contained in the packet,
   * including any added padding.  E.g. if the timebase is 1/samplerate and
   * the timestamp of the first input sample is 0, the timestamp of the
   * first output packet will be -initial_padding.
   *
   * NOTE(review): the property name is spelled `inital_padding` (sic). It is
   * kept as-is because renaming would change the public interface - confirm
   * the spelling against the native binding before correcting it.
   */
  readonly inital_padding: number
  /**
   * For codecs that store a framerate value in the compressed
   * bitstream, the decoder may export it here. [ 0, 1 ] when unknown.
   */
  framerate: Array<number>
  /** Nominal unaccelerated pixel format, see AV_PIX_FMT_xxx. */
  readonly sw_pix_fmt: string | null
  /** Timebase in which pkt_dts/pts and Packet dts/pts are. */
  pkt_timebase: Array<number>

  /**
   * Property flags of the codec descriptor.
   * NOTE(review): presumably null when no descriptor is available - confirm.
   */
  readonly codec_descriptor: {
    INTRA_ONLY: boolean
    LOSSY: boolean
    LOSSLESS: boolean
    REORDER: boolean
    BITMAP_SUB: boolean
    TEXT_SUB: boolean
  } | null
  /** Character encoding of the input subtitles file. */
  sub_charenc: string | null
  /**
   * Subtitles character encoding mode. Formats or codecs might be adjusting
   * this setting (if they are doing the conversion themselves for instance).
   */
  readonly sub_charenc_mode: 'do-nothing' | 'automatic' | 'pre-decoder' | 'ignore'
  /**
   * Skip processing alpha if supported by codec.
   * Note that if the format uses pre-multiplied alpha (common with VP6,
   * and recommended due to better video quality/compression)
   * the image will look as if alpha-blended onto a black background.
   * However for formats that do not use pre-multiplied alpha
   * there might be serious artefacts (though e.g. libswscale currently
   * assumes pre-multiplied alpha anyway).
   */
  skip_alpha: number
  /** Number of samples to skip after a discontinuity */
  readonly seek_preroll: number
  /**
   * custom intra quantization matrix
   * NOTE(review): going by the property name this is presumably the chroma
   * counterpart of `intra_matrix` - confirm.
   */
  chroma_intra_matrix: Array<number>
  /** Dump format separator - can be ", " or "\n      " or anything else */
  dump_separator: string | null
  /** ',' separated list of allowed decoders - if null then all are allowed */
  codec_whitelist: string | null
  /** Properties of the stream that gets decoded */
  readonly properties: { LOSSLESS: boolean, CLOSED_CAPTIONS: boolean }
  /** Additional data associated with the entire coded stream. */
  readonly coded_side_data: {
    type: 'PacketSideData'
    [key: string]: Buffer | string
  }
  /**
   * A reference to the AVHWFramesContext describing the input (for encoding)
   * or output (decoding) frames. The reference is set by the caller and
   * afterwards owned (and freed) by libavcodec - it should never be read by
   * the caller after being set.
   *
   * - decoding: This field should be set by the caller from the get_format()
   *             callback. The previous reference (if any) will always be
   *             unreffed by libavcodec before the get_format() call.
   *
   *             If the default get_buffer2() is used with a hwaccel pixel
   *             format, then this AVHWFramesContext will be used for
   *             allocating the frame buffers.
   *
   * - encoding: For hardware encoders configured to use a hwaccel pixel
   *             format, this field should be set by the caller to a reference
   *             to the AVHWFramesContext describing input frames.
   *             AVHWFramesContext.format must be equal to
   *             AVCodecContext.pix_fmt.
   *
   *             This field should be set before avcodec_open2() is called.
   */
  hw_frames_ctx: HWFramesContext
  /** Control the form of AVSubtitle.rects[N]->ass */
  sub_text_format: number
  /**
   * Audio only. The amount of padding (in samples) appended by the encoder to
   * the end of the audio. I.e. this number of decoded samples must be
   * discarded by the caller from the end of the stream to get the original
   * audio without any trailing padding.
   */
  trailing_padding: number
  /** The number of pixels per image to maximally accept. */
  max_pixels: number
  /**
   * A reference to the HWDeviceContext describing the device which will
   * be used by a hardware encoder/decoder.  The reference is set by the
   * caller and afterwards owned (and freed) by libavcodec.
   *
   * This should be used if either the codec device does not require
   * hardware frames or any that are used are to be allocated internally by
   * libavcodec.  If the user wishes to supply any of the frames used as
   * encoder input or decoder output then hw_frames_ctx should be used
   * instead.  When hw_frames_ctx is set in get_format() for a decoder, this
   * field will be ignored while decoding the associated stream segment, but
   * may again be used on a following one after another get_format() call.
   *
   * For both encoders and decoders this field should be set before
   * avcodec_open2() is called and must not be written to thereafter.
   *
   * Note that some decoders may require this field to be set initially in
   * order to support hw_frames_ctx at all - in that case, all frames
   * contexts used must be created on the same device.
   */
  hw_device_ctx: HWDeviceContext
  /**
   * Bit set of AV_HWACCEL_FLAG_* flags, which affect hardware accelerated
   * decoding (if active).
   */
  hwaccel_flags: { IGNORE_LEVEL?: boolean, ALLOW_HIGH_DEPTH?: boolean, ALLOW_PROFILE_MISMATCH?: boolean }
  /**
   * Video decoding only. Certain video codecs support cropping, meaning that
   * only a sub-rectangle of the decoded frame is intended for display.  This
   * option controls how cropping is handled by libavcodec.
   *
   * When set to 1 (the default), libavcodec will apply cropping internally.
   * I.e. it will modify the output frame width/height fields and offset the
   * data pointers (only by as much as possible while preserving alignment, or
   * by the full amount if the AV_CODEC_FLAG_UNALIGNED flag is set) so that
   * the frames output by the decoder refer only to the cropped area. The
   * crop_* fields of the output frames will be zero.
   *
   * When set to 0, the width/height fields of the output frames will be set
   * to the coded dimensions and the crop_* fields will describe the cropping
   * rectangle. Applying the cropping is left to the caller.
   *
   * @warning When hardware acceleration with opaque output frames is used,
   * libavcodec is unable to apply cropping from the top/left border.
   *
   * @note when this option is set to zero, the width/height fields of the
   * AVCodecContext and output AVFrames have different meanings. The codec
   * context fields store display dimensions (with the coded dimensions in
   * coded_width/height), while the frame fields store the coded dimensions
   * (with the display dimensions being determined by the crop_* fields).
   */
  apply_cropping: number
  /**
   * Video decoding only.  Sets the number of extra hardware frames which
   * the decoder will allocate for use by the caller.  This must be set
   * before avcodec_open2() is called.
   *
   * Some hardware decoders require all frames that they will use for
   * output to be defined in advance before decoding starts.  For such
   * decoders, the hardware frame pool must therefore be of a fixed size.
   * The extra frames set here are on top of any number that the decoder
   * needs internally in order to operate normally (for example, frames
   * used as reference pictures).
   */
  extra_hw_frames: number
}