WebM Codec SDK
vpx_encoder.h
Go to the documentation of this file.
1/*
2 * Copyright (c) 2010 The WebM project authors. All Rights Reserved.
3 *
4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
9 */
10#ifndef VPX_VPX_VPX_ENCODER_H_
11#define VPX_VPX_VPX_ENCODER_H_
12
28#ifdef __cplusplus
29extern "C" {
30#endif
31
32#include "./vpx_codec.h"
33#include "./vpx_ext_ratectrl.h"
34
38#define VPX_TS_MAX_PERIODICITY 16
39
41#define VPX_TS_MAX_LAYERS 5
42
44#define VPX_MAX_LAYERS 12 // 3 temporal + 4 spatial layers are allowed.
45
47#define VPX_SS_MAX_LAYERS 5
48
50#define VPX_SS_DEFAULT_LAYERS 1
51
60#define VPX_ENCODER_ABI_VERSION \
61 (15 + VPX_CODEC_ABI_VERSION + \
62 VPX_EXT_RATECTRL_ABI_VERSION)
73#define VPX_CODEC_CAP_PSNR 0x10000
80#define VPX_CODEC_CAP_OUTPUT_PARTITION 0x20000
81
89#define VPX_CODEC_USE_PSNR 0x10000
91#define VPX_CODEC_USE_OUTPUT_PARTITION 0x20000
92#define VPX_CODEC_USE_HIGHBITDEPTH 0x40000
98typedef struct vpx_fixed_buf {
99 void *buf;
100 size_t sz;
108typedef int64_t vpx_codec_pts_t;
109
117typedef uint32_t vpx_codec_frame_flags_t;
118#define VPX_FRAME_IS_KEY 0x1
121#define VPX_FRAME_IS_DROPPABLE 0x2
123#define VPX_FRAME_IS_INVISIBLE 0x4
125#define VPX_FRAME_IS_FRAGMENT 0x8
126
133typedef uint32_t vpx_codec_er_flags_t;
135#define VPX_ERROR_RESILIENT_DEFAULT 0x1
140#define VPX_ERROR_RESILIENT_PARTITIONS 0x2
141
155
161typedef struct vpx_codec_cx_pkt {
163 union {
164 struct {
165 void *buf;
166 size_t sz;
170 unsigned long duration;
178 unsigned int width[VPX_SS_MAX_LAYERS];
179 unsigned int height[VPX_SS_MAX_LAYERS];
186 struct vpx_psnr_pkt {
187 unsigned int samples[4];
188 uint64_t sse[4];
189 double psnr[4];
193 /* This packet size is fixed to allow codecs to extend this
194 * interface without having to manage storage for raw packets,
195 * i.e., if it's smaller than 128 bytes, you can store in the
196 * packet list directly.
197 */
198 char pad[128 - sizeof(enum vpx_codec_cx_pkt_kind)];
208 void *user_data);
209
213 void *user_priv;
215
220typedef struct vpx_rational {
221 int num;
222 int den;
226typedef enum vpx_enc_pass {
231
238};
239
251 VPX_KF_DISABLED = 0
253
262#define VPX_EFLAG_FORCE_KF (1 << 0)
270typedef struct vpx_codec_enc_cfg {
271 /*
272 * generic settings (g)
273 */
274
279 unsigned int g_usage;
280
287 unsigned int g_threads;
288
297 unsigned int g_profile;
306 unsigned int g_w;
307
315 unsigned int g_h;
316
324
331 unsigned int g_input_bit_depth;
332
346
354
361
374 unsigned int g_lag_in_frames;
375
376 /*
377 * rate control settings (rc)
378 */
379
394
402 unsigned int rc_resize_allowed;
403
409 unsigned int rc_scaled_width;
410
416 unsigned int rc_scaled_height;
417
425
433
443
450
457
462 unsigned int rc_target_bitrate;
463
464 /*
465 * quantizer settings
466 */
467
475 unsigned int rc_min_quantizer;
476
484 unsigned int rc_max_quantizer;
485
486 /*
487 * bitrate tolerance
488 */
489
503 unsigned int rc_undershoot_pct;
504
518 unsigned int rc_overshoot_pct;
519
520 /*
521 * decoder buffer model parameters
522 */
523
533 unsigned int rc_buf_sz;
534
542 unsigned int rc_buf_initial_sz;
543
551 unsigned int rc_buf_optimal_sz;
552
553 /*
554 * 2 pass rate control parameters
555 */
556
566
573
580
587
588 /*
589 * keyframing settings (kf)
590 */
591
599
607 unsigned int kf_min_dist;
608
616 unsigned int kf_max_dist;
617
618 /*
619 * Spatial scalability settings (ss)
620 */
621
626 unsigned int ss_number_layers;
627
634
641
646 unsigned int ts_number_layers;
647
654
661
669 unsigned int ts_periodicity;
670
679
687
696
702
711
720
729
738
747
756
766
775
784
793
802
811
821
831
848typedef struct vpx_svc_parameters {
857
881 vpx_codec_iface_t *iface,
882 const vpx_codec_enc_cfg_t *cfg,
883 vpx_codec_flags_t flags, int ver);
884
889#define vpx_codec_enc_init(ctx, iface, cfg, flags) \
890 vpx_codec_enc_init_ver(ctx, iface, cfg, flags, VPX_ENCODER_ABI_VERSION)
891
914 int num_enc, vpx_codec_flags_t flags, vpx_rational_t *dsf, int ver);
915
920#define vpx_codec_enc_init_multi(ctx, iface, cfg, num_enc, flags, dsf) \
921 vpx_codec_enc_init_multi_ver(ctx, iface, cfg, num_enc, flags, dsf, \
922 VPX_ENCODER_ABI_VERSION)
923
945 unsigned int usage);
946
962 const vpx_codec_enc_cfg_t *cfg);
963
976
978#define VPX_DL_REALTIME (1)
980#define VPX_DL_GOOD_QUALITY (1000000)
982#define VPX_DL_BEST_QUALITY (0)
1020 vpx_codec_pts_t pts, unsigned long duration,
1022 unsigned long deadline);
1023
1068 const vpx_fixed_buf_t *buf,
1069 unsigned int pad_before,
1070 unsigned int pad_after);
1071
1096 vpx_codec_iter_t *iter);
1097
1111
1113#ifdef __cplusplus
1114}
1115#endif
1116#endif // VPX_VPX_VPX_ENCODER_H_
long vpx_codec_flags_t
Initialization-time Feature Enabling.
Definition: vpx_codec.h:170
const void * vpx_codec_iter_t
Iterator.
Definition: vpx_codec.h:190
enum vpx_bit_depth vpx_bit_depth_t
Bit depth for codecThis enumeration determines the bit depth of the codec.
vpx_codec_err_t
Algorithm return codes.
Definition: vpx_codec.h:93
const struct vpx_codec_iface vpx_codec_iface_t
Codec interface structure.
Definition: vpx_codec.h:177
vpx_codec_err_t vpx_codec_enc_init_ver(vpx_codec_ctx_t *ctx, vpx_codec_iface_t *iface, const vpx_codec_enc_cfg_t *cfg, vpx_codec_flags_t flags, int ver)
Initialize an encoder instance.
vpx_codec_err_t vpx_codec_enc_init_multi_ver(vpx_codec_ctx_t *ctx, vpx_codec_iface_t *iface, vpx_codec_enc_cfg_t *cfg, int num_enc, vpx_codec_flags_t flags, vpx_rational_t *dsf, int ver)
Initialize multi-encoder instance.
struct vpx_codec_enc_cfg vpx_codec_enc_cfg_t
Encoder configuration structure.
#define VPX_TS_MAX_LAYERS
Definition: vpx_encoder.h:41
vpx_codec_cx_pkt_kind
Encoder output packet variants.
Definition: vpx_encoder.h:148
void(* vpx_codec_enc_output_cx_pkt_cb_fn_t)(vpx_codec_cx_pkt_t *pkt, void *user_data)
Encoder return output buffer callback.
Definition: vpx_encoder.h:207
vpx_enc_pass
Multi-pass Encoding Pass.
Definition: vpx_encoder.h:226
const vpx_image_t * vpx_codec_get_preview_frame(vpx_codec_ctx_t *ctx)
Get Preview Frame.
struct vpx_svc_parameters vpx_svc_extra_cfg_t
vp9 svc extra configure parameters
struct vpx_fixed_buf vpx_fixed_buf_t
Generic fixed size buffer structure.
const vpx_codec_cx_pkt_t * vpx_codec_get_cx_data(vpx_codec_ctx_t *ctx, vpx_codec_iter_t *iter)
Encoded data iterator.
#define VPX_TS_MAX_PERIODICITY
Definition: vpx_encoder.h:38
struct vpx_codec_enc_output_cx_cb_pair vpx_codec_priv_output_cx_pkt_cb_pair_t
Callback function pointer / user data pair storage.
#define VPX_MAX_LAYERS
Definition: vpx_encoder.h:44
uint32_t vpx_codec_er_flags_t
Error Resilient flags.
Definition: vpx_encoder.h:133
int64_t vpx_codec_pts_t
Time Stamp Type.
Definition: vpx_encoder.h:108
#define VPX_SS_MAX_LAYERS
Definition: vpx_encoder.h:47
long vpx_enc_frame_flags_t
Encoded Frame Flags.
Definition: vpx_encoder.h:261
vpx_codec_err_t vpx_codec_enc_config_default(vpx_codec_iface_t *iface, vpx_codec_enc_cfg_t *cfg, unsigned int usage)
Get a default configuration.
vpx_kf_mode
Keyframe placement mode.
Definition: vpx_encoder.h:248
struct vpx_codec_cx_pkt vpx_codec_cx_pkt_t
Encoder output packet.
uint32_t vpx_codec_frame_flags_t
Compressed Frame Flags.
Definition: vpx_encoder.h:117
vpx_codec_err_t vpx_codec_enc_config_set(vpx_codec_ctx_t *ctx, const vpx_codec_enc_cfg_t *cfg)
Set or change configuration.
vpx_fixed_buf_t * vpx_codec_get_global_headers(vpx_codec_ctx_t *ctx)
Get global stream headers.
struct vpx_rational vpx_rational_t
Rational Number.
vpx_codec_err_t vpx_codec_set_cx_data_buf(vpx_codec_ctx_t *ctx, const vpx_fixed_buf_t *buf, unsigned int pad_before, unsigned int pad_after)
Set compressed data output buffer.
vpx_rc_mode
Rate control mode.
Definition: vpx_encoder.h:233
vpx_codec_err_t vpx_codec_encode(vpx_codec_ctx_t *ctx, const vpx_image_t *img, vpx_codec_pts_t pts, unsigned long duration, vpx_enc_frame_flags_t flags, unsigned long deadline)
Encode a frame.
@ VPX_CODEC_PSNR_PKT
Definition: vpx_encoder.h:152
@ VPX_CODEC_CX_FRAME_PKT
Definition: vpx_encoder.h:149
@ VPX_CODEC_STATS_PKT
Definition: vpx_encoder.h:150
@ VPX_CODEC_CUSTOM_PKT
Definition: vpx_encoder.h:153
@ VPX_CODEC_FPMB_STATS_PKT
Definition: vpx_encoder.h:151
@ VPX_RC_LAST_PASS
Definition: vpx_encoder.h:229
@ VPX_RC_ONE_PASS
Definition: vpx_encoder.h:227
@ VPX_RC_FIRST_PASS
Definition: vpx_encoder.h:228
@ VPX_KF_DISABLED
Definition: vpx_encoder.h:251
@ VPX_KF_FIXED
Definition: vpx_encoder.h:249
@ VPX_KF_AUTO
Definition: vpx_encoder.h:250
@ VPX_Q
Definition: vpx_encoder.h:237
@ VPX_CQ
Definition: vpx_encoder.h:236
@ VPX_CBR
Definition: vpx_encoder.h:235
@ VPX_VBR
Definition: vpx_encoder.h:234
Codec context structure.
Definition: vpx_codec.h:200
Encoder output packet.
Definition: vpx_encoder.h:161
char pad[128 - sizeof(enum vpx_codec_cx_pkt_kind)]
Definition: vpx_encoder.h:198
vpx_codec_frame_flags_t flags
Definition: vpx_encoder.h:171
vpx_fixed_buf_t twopass_stats
Definition: vpx_encoder.h:184
enum vpx_codec_cx_pkt_kind kind
Definition: vpx_encoder.h:162
double psnr[4]
Definition: vpx_encoder.h:189
unsigned int width[5]
Width and height of frames in this packet. VP8 will only use the first one.
Definition: vpx_encoder.h:178
struct vpx_codec_cx_pkt::@1::@2 frame
uint8_t spatial_layer_encoded[5]
Flag to indicate if spatial layer frame in this packet is encoded or dropped. VP8 will always be set ...
Definition: vpx_encoder.h:182
vpx_fixed_buf_t firstpass_mb_stats
Definition: vpx_encoder.h:185
size_t sz
Definition: vpx_encoder.h:166
void * buf
Definition: vpx_encoder.h:165
vpx_codec_pts_t pts
time stamp to show frame (in timebase units)
Definition: vpx_encoder.h:168
vpx_fixed_buf_t raw
Definition: vpx_encoder.h:191
unsigned int height[5]
Definition: vpx_encoder.h:179
int partition_id
the partition id defines the decoding order of the partitions. Only applicable when "output partition...
Definition: vpx_encoder.h:175
unsigned long duration
duration to show frame (in timebase units)
Definition: vpx_encoder.h:170
union vpx_codec_cx_pkt::@1 data
Encoder configuration structure.
Definition: vpx_encoder.h:270
vpx_rational_t rd_mult_arf_qp_fac
Rate-distortion multiplier for alt-ref frames. The multiplier is a crucial parameter in the calculati...
Definition: vpx_encoder.h:830
unsigned int rc_resize_allowed
Enable/disable spatial resampling, if supported by the codec.
Definition: vpx_encoder.h:402
int temporal_layering_mode
Temporal layering mode indicating which temporal layering scheme to use.
Definition: vpx_encoder.h:695
unsigned int kf_min_dist
Keyframe minimum interval.
Definition: vpx_encoder.h:607
vpx_rational_t sr_default_decay_limit
Second reference default decay limit.
Definition: vpx_encoder.h:728
unsigned int rc_min_quantizer
Minimum (Best Quality) Quantizer.
Definition: vpx_encoder.h:475
unsigned int ts_number_layers
Number of temporal coding layers.
Definition: vpx_encoder.h:646
vpx_rational_t kf_max_total_boost_factor
Keyframe maximum total boost adjustment factor.
Definition: vpx_encoder.h:783
vpx_fixed_buf_t rc_twopass_stats_in
Two-pass stats buffer.
Definition: vpx_encoder.h:449
unsigned int rc_resize_down_thresh
Spatial resampling down watermark.
Definition: vpx_encoder.h:432
unsigned int ss_number_layers
Number of spatial coding layers.
Definition: vpx_encoder.h:626
unsigned int rc_2pass_vbr_bias_pct
Two-pass mode CBR/VBR bias.
Definition: vpx_encoder.h:565
unsigned int rc_2pass_vbr_minsection_pct
Two-pass mode per-GOP minimum bitrate.
Definition: vpx_encoder.h:572
int ss_enable_auto_alt_ref[5]
Enable auto alt reference flags for each spatial layer.
Definition: vpx_encoder.h:633
unsigned int rc_scaled_width
Internal coded frame width.
Definition: vpx_encoder.h:409
vpx_rational_t rd_mult_key_qp_fac
Rate-distortion multiplier for key frames. The multiplier is a crucial parameter in the calculation o...
Definition: vpx_encoder.h:840
unsigned int g_profile
Bitstream profile to use.
Definition: vpx_encoder.h:297
unsigned int layer_target_bitrate[12]
Target bitrate for each spatial/temporal layer.
Definition: vpx_encoder.h:686
unsigned int g_h
Height of the frame.
Definition: vpx_encoder.h:315
enum vpx_kf_mode kf_mode
Keyframe placement mode.
Definition: vpx_encoder.h:598
unsigned int ts_layer_id[16]
Template defining the membership of frames to temporal layers.
Definition: vpx_encoder.h:678
vpx_codec_er_flags_t g_error_resilient
Enable error resilient modes.
Definition: vpx_encoder.h:353
unsigned int ts_periodicity
Length of the sequence defining frame temporal layer membership.
Definition: vpx_encoder.h:669
unsigned int rc_overshoot_pct
Rate control adaptation overshoot control.
Definition: vpx_encoder.h:518
vpx_fixed_buf_t rc_firstpass_mb_stats_in
first pass mb stats buffer.
Definition: vpx_encoder.h:456
unsigned int rc_scaled_height
Internal coded frame height.
Definition: vpx_encoder.h:416
unsigned int g_usage
Deprecated: Algorithm specific "usage" value.
Definition: vpx_encoder.h:279
unsigned int g_w
Width of the frame.
Definition: vpx_encoder.h:306
unsigned int ss_target_bitrate[5]
Target bitrate for each spatial layer.
Definition: vpx_encoder.h:640
unsigned int rc_buf_sz
Decoder Buffer Size.
Definition: vpx_encoder.h:533
unsigned int rc_dropframe_thresh
Temporal resampling configuration, if supported by the codec.
Definition: vpx_encoder.h:393
struct vpx_rational g_timebase
Stream timebase units.
Definition: vpx_encoder.h:345
enum vpx_enc_pass g_pass
Multi-pass Encoding Mode.
Definition: vpx_encoder.h:360
vpx_rational_t kf_frame_max_boost_first_factor
Keyframe maximum boost adjustment factor, for the first keyframe in a chunk.
Definition: vpx_encoder.h:765
unsigned int rc_resize_up_thresh
Spatial resampling up watermark.
Definition: vpx_encoder.h:424
unsigned int rc_max_quantizer
Maximum (Worst Quality) Quantizer.
Definition: vpx_encoder.h:484
unsigned int rc_2pass_vbr_corpus_complexity
Two-pass corpus vbr mode complexity control Used only in VP9: A value representing the corpus midpoin...
Definition: vpx_encoder.h:586
vpx_rational_t zm_factor
Zero motion power factor.
Definition: vpx_encoder.h:810
unsigned int g_lag_in_frames
Allow lagged encoding.
Definition: vpx_encoder.h:374
enum vpx_rc_mode rc_end_usage
Rate control algorithm to use.
Definition: vpx_encoder.h:442
vpx_rational_t active_wq_factor
Active worst quality factor.
Definition: vpx_encoder.h:710
vpx_rational_t gf_max_total_boost_factor
Golden frame maximum total boost adjustment factor.
Definition: vpx_encoder.h:792
unsigned int rc_buf_initial_sz
Decoder Buffer Initial Size.
Definition: vpx_encoder.h:542
vpx_bit_depth_t g_bit_depth
Bit-depth of the codec.
Definition: vpx_encoder.h:323
vpx_rational_t gf_frame_max_boost_factor
Golden frame maximum boost adjustment factor.
Definition: vpx_encoder.h:801
unsigned int rc_buf_optimal_sz
Decoder Buffer Optimal Size.
Definition: vpx_encoder.h:551
int use_vizier_rc_params
A flag indicating whether to use external rate control parameters. By default is 0....
Definition: vpx_encoder.h:701
unsigned int rc_2pass_vbr_maxsection_pct
Two-pass mode per-GOP maximum bitrate.
Definition: vpx_encoder.h:579
unsigned int rc_target_bitrate
Target data rate.
Definition: vpx_encoder.h:462
unsigned int ts_target_bitrate[5]
Target bitrate for each temporal layer.
Definition: vpx_encoder.h:653
vpx_rational_t err_per_mb_factor
Error per macroblock adjustment factor.
Definition: vpx_encoder.h:719
unsigned int g_input_bit_depth
Bit-depth of the input frames.
Definition: vpx_encoder.h:331
vpx_rational_t kf_frame_min_boost_factor
Keyframe minimum boost adjustment factor.
Definition: vpx_encoder.h:755
vpx_rational_t sr_diff_factor
Second reference difference factor.
Definition: vpx_encoder.h:737
vpx_rational_t kf_err_per_mb_factor
Keyframe error per macroblock adjustment factor.
Definition: vpx_encoder.h:746
unsigned int rc_undershoot_pct
Rate control adaptation undershoot control.
Definition: vpx_encoder.h:503
unsigned int ts_rate_decimator[5]
Frame rate decimation factor for each temporal layer.
Definition: vpx_encoder.h:660
unsigned int kf_max_dist
Keyframe maximum interval.
Definition: vpx_encoder.h:616
vpx_rational_t rd_mult_inter_qp_fac
Rate-distortion multiplier for inter frames. The multiplier is a crucial parameter in the calculation...
Definition: vpx_encoder.h:820
vpx_rational_t kf_frame_max_boost_subs_factor
Keyframe maximum boost adjustment factor, for subsequent keyframes.
Definition: vpx_encoder.h:774
unsigned int g_threads
Maximum number of threads to use.
Definition: vpx_encoder.h:287
Callback function pointer / user data pair storage.
Definition: vpx_encoder.h:211
void * user_priv
Definition: vpx_encoder.h:213
vpx_codec_enc_output_cx_pkt_cb_fn_t output_cx_pkt
Definition: vpx_encoder.h:212
Generic fixed size buffer structure.
Definition: vpx_encoder.h:98
size_t sz
Definition: vpx_encoder.h:100
void * buf
Definition: vpx_encoder.h:99
Image Descriptor.
Definition: vpx_image.h:72
Rational Number.
Definition: vpx_encoder.h:220
int den
Definition: vpx_encoder.h:222
int num
Definition: vpx_encoder.h:221
vp9 svc extra configure parameters
Definition: vpx_encoder.h:848
int min_quantizers[12]
Definition: vpx_encoder.h:850
int scaling_factor_num[12]
Definition: vpx_encoder.h:851
int speed_per_layer[12]
Definition: vpx_encoder.h:853
int max_quantizers[12]
Definition: vpx_encoder.h:849
int scaling_factor_den[12]
Definition: vpx_encoder.h:852
int loopfilter_ctrl[12]
Definition: vpx_encoder.h:855
int temporal_layering_mode
Definition: vpx_encoder.h:854
Describes the codec algorithm interface to applications.