AOMedia Codec SDK
aom_encoder.h
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2016, Alliance for Open Media. All rights reserved
3  *
4  * This source code is subject to the terms of the BSD 2 Clause License and
5  * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6  * was not distributed with this source code in the LICENSE file, you can
7  * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8  * Media Patent License 1.0 was not distributed with this source code in the
9  * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
10  */
11 #ifndef AOM_AOM_AOM_ENCODER_H_
12 #define AOM_AOM_AOM_ENCODER_H_
13 
29 #ifdef __cplusplus
30 extern "C" {
31 #endif
32 
33 #include "aom/aom_codec.h"
34 
43 #define AOM_ENCODER_ABI_VERSION \
44  (5 + AOM_CODEC_ABI_VERSION)
55 #define AOM_CODEC_CAP_PSNR 0x10000
59 #define AOM_CODEC_CAP_HIGHBITDEPTH 0x40000
60 
68 #define AOM_CODEC_USE_PSNR 0x10000
70 #define AOM_CODEC_USE_HIGHBITDEPTH 0x40000
76 typedef struct aom_fixed_buf {
77  void *buf;
78  size_t sz;
86 typedef int64_t aom_codec_pts_t;
87 
95 typedef uint32_t aom_codec_frame_flags_t;
96 #define AOM_FRAME_IS_KEY 0x1
99 #define AOM_FRAME_IS_DROPPABLE 0x2
100 
101 #define AOM_FRAME_IS_INVISIBLE 0x4
102 
103 #define AOM_FRAME_IS_FRAGMENT 0x8
104 
105 #define AOM_FRAME_IS_INTRAONLY 0x10
106 
107 #define AOM_FRAME_IS_SWITCH 0x20
108 
109 #define AOM_FRAME_IS_ERROR_RESILIENT 0x40
110 
117 typedef uint32_t aom_codec_er_flags_t;
119 #define AOM_ERROR_RESILIENT_DEFAULT 0x1
120 
132  AOM_CODEC_CUSTOM_PKT = 256
133 };
134 
140 typedef struct aom_codec_cx_pkt {
142  union {
143  struct {
144  void *buf;
145  size_t sz;
149  unsigned long duration;
157  } frame;
160  struct aom_psnr_pkt {
161  unsigned int samples[4];
162  uint64_t sse[4];
163  double psnr[4];
164  } psnr;
167  /* This packet size is fixed to allow codecs to extend this
168  * interface without having to manage storage for raw packets,
169  * i.e., if it's smaller than 128 bytes, you can store in the
170  * packet list directly.
171  */
172  char pad[128 - sizeof(enum aom_codec_cx_pkt_kind)];
173  } data;
180 typedef struct aom_rational {
181  int num;
182  int den;
190 };
191 
198 };
199 
211  AOM_KF_DISABLED = 0
212 };
213 
222 #define AOM_EFLAG_FORCE_KF (1 << 0)
230 typedef struct aom_codec_enc_cfg {
231  /*
232  * generic settings (g)
233  */
234 
242  unsigned int g_usage;
243 
250  unsigned int g_threads;
251 
260  unsigned int g_profile;
269  unsigned int g_w;
270 
278  unsigned int g_h;
279 
283  unsigned int g_limit;
284 
291 
298 
306 
313  unsigned int g_input_bit_depth;
314 
327  struct aom_rational g_timebase;
328 
335  aom_codec_er_flags_t g_error_resilient;
336 
342  enum aom_enc_pass g_pass;
343 
356  unsigned int g_lag_in_frames;
357 
358  /*
359  * rate control settings (rc)
360  */
361 
378  unsigned int rc_dropframe_thresh;
379 
387  unsigned int rc_resize_mode;
388 
395  unsigned int rc_resize_denominator;
396 
404 
414  unsigned int rc_superres_mode;
415 
427 
437 
445  unsigned int rc_superres_qthresh;
446 
455 
464  enum aom_rc_mode rc_end_usage;
465 
472 
479 
484  unsigned int rc_target_bitrate;
485 
486  /*
487  * quantizer settings
488  */
489 
498  unsigned int rc_min_quantizer;
499 
508  unsigned int rc_max_quantizer;
509 
510  /*
511  * bitrate tolerance
512  */
513 
524  unsigned int rc_undershoot_pct;
525 
536  unsigned int rc_overshoot_pct;
537 
538  /*
539  * decoder buffer model parameters
540  */
541 
551  unsigned int rc_buf_sz;
552 
560  unsigned int rc_buf_initial_sz;
561 
569  unsigned int rc_buf_optimal_sz;
570 
571  /*
572  * 2 pass rate control parameters
573  */
574 
583  unsigned int rc_2pass_vbr_bias_pct;
584 
591 
598 
599  /*
600  * keyframing settings (kf)
601  */
602 
606  int fwd_kf_enabled;
607 
614  enum aom_kf_mode kf_mode;
615 
623  unsigned int kf_min_dist;
624 
632  unsigned int kf_max_dist;
633 
639  unsigned int sframe_dist;
640 
654  unsigned int sframe_mode;
655 
662  unsigned int large_scale_tile;
663 
669  unsigned int monochrome;
670 
679 
686  unsigned int save_as_annexb;
687 
695 
703 
708 #define MAX_TILE_WIDTHS 64 // maximum tile width array length
709 
715  int tile_widths[MAX_TILE_WIDTHS];
716 
721 #define MAX_TILE_HEIGHTS 64 // maximum tile height array length
722 
728  int tile_heights[MAX_TILE_HEIGHTS];
729 
759  aom_codec_iface_t *iface,
760  const aom_codec_enc_cfg_t *cfg,
761  aom_codec_flags_t flags, int ver);
762 
767 #define aom_codec_enc_init(ctx, iface, cfg, flags) \
768  aom_codec_enc_init_ver(ctx, iface, cfg, flags, AOM_ENCODER_ABI_VERSION)
769 
792  int num_enc, aom_codec_flags_t flags, aom_rational_t *dsf, int ver);
793 
798 #define aom_codec_enc_init_multi(ctx, iface, cfg, num_enc, flags, dsf) \
799  aom_codec_enc_init_multi_ver(ctx, iface, cfg, num_enc, flags, dsf, \
800  AOM_ENCODER_ABI_VERSION)
801 
822  aom_codec_enc_cfg_t *cfg,
823  unsigned int reserved);
824 
840  const aom_codec_enc_cfg_t *cfg);
841 
866 
892  aom_codec_pts_t pts, unsigned long duration,
893  aom_enc_frame_flags_t flags);
894 
939  const aom_fixed_buf_t *buf,
940  unsigned int pad_before,
941  unsigned int pad_after);
942 
967  aom_codec_iter_t *iter);
968 
982 
984 #ifdef __cplusplus
985 }
986 #endif
987 #endif // AOM_AOM_AOM_ENCODER_H_
aom_codec_enc_cfg::rc_superres_kf_qthresh
unsigned int rc_superres_kf_qthresh
Keyframe super-resolution q threshold.
Definition: aom_encoder.h:454
aom_codec_cx_pkt::duration
unsigned long duration
duration to show frame (in timebase units)
Definition: aom_encoder.h:149
aom_codec_enc_cfg::g_profile
unsigned int g_profile
Bitstream profile to use.
Definition: aom_encoder.h:260
aom_codec_enc_cfg::rc_dropframe_thresh
unsigned int rc_dropframe_thresh
Temporal resampling configuration, if supported by the codec.
Definition: aom_encoder.h:378
aom_codec_cx_pkt::samples
unsigned int samples[4]
Definition: aom_encoder.h:161
aom_codec_enc_cfg
Encoder configuration structure.
Definition: aom_encoder.h:230
MAX_TILE_WIDTHS
#define MAX_TILE_WIDTHS
Maximum number of tile widths in tile widths array.
Definition: aom_encoder.h:708
AOM_KF_FIXED
@ AOM_KF_FIXED
Definition: aom_encoder.h:209
aom_codec_enc_cfg::rc_superres_kf_denominator
unsigned int rc_superres_kf_denominator
Keyframe super-resolution denominator.
Definition: aom_encoder.h:436
aom_fixed_buf
Generic fixed size buffer structure.
Definition: aom_encoder.h:76
aom_codec_enc_cfg::rc_resize_kf_denominator
unsigned int rc_resize_kf_denominator
Keyframe resize denominator.
Definition: aom_encoder.h:403
aom_codec_enc_cfg::rc_2pass_vbr_bias_pct
unsigned int rc_2pass_vbr_bias_pct
Two-pass mode CBR/VBR bias.
Definition: aom_encoder.h:583
aom_codec_enc_cfg::rc_resize_mode
unsigned int rc_resize_mode
Mode for spatial resampling, if supported by the codec.
Definition: aom_encoder.h:387
aom_codec_enc_cfg::g_lag_in_frames
unsigned int g_lag_in_frames
Allow lagged encoding.
Definition: aom_encoder.h:356
MAX_TILE_HEIGHTS
#define MAX_TILE_HEIGHTS
Maximum number of tile heights in tile heights array.
Definition: aom_encoder.h:721
aom_codec_cx_pkt::pad
char pad[128 - sizeof(enum aom_codec_cx_pkt_kind)]
Definition: aom_encoder.h:172
aom_codec_ctx
Codec context structure.
Definition: aom_codec.h:204
aom_codec_enc_cfg::rc_buf_sz
unsigned int rc_buf_sz
Decoder Buffer Size.
Definition: aom_encoder.h:551
aom_codec_iface_t
const struct aom_codec_iface aom_codec_iface_t
Codec interface structure.
Definition: aom_codec.h:181
aom_rational
Rational Number.
Definition: aom_encoder.h:180
AOM_CODEC_FPMB_STATS_PKT
@ AOM_CODEC_FPMB_STATS_PKT
Definition: aom_encoder.h:130
AOM_CQ
@ AOM_CQ
Definition: aom_encoder.h:196
aom_codec_enc_cfg::sframe_mode
unsigned int sframe_mode
sframe insertion mode
Definition: aom_encoder.h:654
aom_codec_get_global_headers
aom_fixed_buf_t * aom_codec_get_global_headers(aom_codec_ctx_t *ctx)
Get global stream headers.
aom_codec.h
Describes the codec algorithm interface to applications.
aom_codec_enc_cfg::rc_target_bitrate
unsigned int rc_target_bitrate
Target data rate.
Definition: aom_encoder.h:484
AOM_RC_FIRST_PASS
@ AOM_RC_FIRST_PASS
Definition: aom_encoder.h:188
AOM_CODEC_PSNR_PKT
@ AOM_CODEC_PSNR_PKT
Definition: aom_encoder.h:131
aom_codec_enc_cfg::rc_min_quantizer
unsigned int rc_min_quantizer
Minimum (Best Quality) Quantizer.
Definition: aom_encoder.h:498
aom_codec_enc_cfg::full_still_picture_hdr
unsigned int full_still_picture_hdr
full_still_picture_hdr
Definition: aom_encoder.h:678
AOM_CBR
@ AOM_CBR
Definition: aom_encoder.h:195
aom_codec_enc_config_set
aom_codec_err_t aom_codec_enc_config_set(aom_codec_ctx_t *ctx, const aom_codec_enc_cfg_t *cfg)
Set or change configuration.
aom_codec_cx_pkt::flags
aom_codec_frame_flags_t flags
Definition: aom_encoder.h:150
aom_rational::den
int den
Definition: aom_encoder.h:182
aom_codec_enc_cfg::rc_undershoot_pct
unsigned int rc_undershoot_pct
Rate control adaptation undershoot control.
Definition: aom_encoder.h:524
AOM_RC_LAST_PASS
@ AOM_RC_LAST_PASS
Definition: aom_encoder.h:189
aom_codec_cx_pkt::twopass_stats
aom_fixed_buf_t twopass_stats
Definition: aom_encoder.h:158
aom_codec_enc_cfg::rc_overshoot_pct
unsigned int rc_overshoot_pct
Rate control adaptation overshoot control.
Definition: aom_encoder.h:536
aom_codec_enc_cfg::tile_height_count
int tile_height_count
Number of explicit tile heights specified.
Definition: aom_encoder.h:702
aom_codec_cx_pkt::buf
void * buf
Definition: aom_encoder.h:144
aom_codec_frame_flags_t
uint32_t aom_codec_frame_flags_t
Compressed Frame Flags.
Definition: aom_encoder.h:95
aom_codec_cx_pkt_t
struct aom_codec_cx_pkt aom_codec_cx_pkt_t
Encoder output packet.
aom_codec_cx_pkt::sse
uint64_t sse[4]
Definition: aom_encoder.h:162
aom_codec_enc_cfg::g_usage
unsigned int g_usage
Algorithm specific "usage" value.
Definition: aom_encoder.h:242
aom_codec_enc_cfg::tile_width_count
int tile_width_count
Number of explicit tile widths specified.
Definition: aom_encoder.h:694
aom_codec_pts_t
int64_t aom_codec_pts_t
Time Stamp Type.
Definition: aom_encoder.h:86
aom_kf_mode
aom_kf_mode
Keyframe placement mode.
Definition: aom_encoder.h:208
aom_codec_enc_cfg::g_forced_max_frame_height
unsigned int g_forced_max_frame_height
Forced maximum height of the frame.
Definition: aom_encoder.h:297
aom_codec_cx_pkt::firstpass_mb_stats
aom_fixed_buf_t firstpass_mb_stats
Definition: aom_encoder.h:159
aom_enc_frame_flags_t
long aom_enc_frame_flags_t
Encoded Frame Flags.
Definition: aom_encoder.h:221
aom_codec_enc_cfg::g_w
unsigned int g_w
Width of the frame.
Definition: aom_encoder.h:269
aom_codec_set_cx_data_buf
aom_codec_err_t aom_codec_set_cx_data_buf(aom_codec_ctx_t *ctx, const aom_fixed_buf_t *buf, unsigned int pad_before, unsigned int pad_after)
Set compressed data output buffer.
aom_codec_enc_cfg::rc_firstpass_mb_stats_in
aom_fixed_buf_t rc_firstpass_mb_stats_in
first pass mb stats buffer.
Definition: aom_encoder.h:478
AOM_VBR
@ AOM_VBR
Definition: aom_encoder.h:194
aom_codec_cx_pkt::raw
aom_fixed_buf_t raw
Definition: aom_encoder.h:165
aom_fixed_buf_t
struct aom_fixed_buf aom_fixed_buf_t
Generic fixed size buffer structure.
aom_codec_enc_cfg::rc_twopass_stats_in
aom_fixed_buf_t rc_twopass_stats_in
Two-pass stats buffer.
Definition: aom_encoder.h:471
aom_codec_err_t
aom_codec_err_t
Algorithm return codes.
Definition: aom_codec.h:101
AOM_RC_ONE_PASS
@ AOM_RC_ONE_PASS
Definition: aom_encoder.h:187
aom_codec_get_cx_data
const aom_codec_cx_pkt_t * aom_codec_get_cx_data(aom_codec_ctx_t *ctx, aom_codec_iter_t *iter)
Encoded data iterator.
aom_codec_encode
aom_codec_err_t aom_codec_encode(aom_codec_ctx_t *ctx, const aom_image_t *img, aom_codec_pts_t pts, unsigned long duration, aom_enc_frame_flags_t flags)
Encode a frame.
aom_codec_enc_init_ver
aom_codec_err_t aom_codec_enc_init_ver(aom_codec_ctx_t *ctx, aom_codec_iface_t *iface, const aom_codec_enc_cfg_t *cfg, aom_codec_flags_t flags, int ver)
Initialize an encoder instance.
aom_codec_enc_cfg::rc_resize_denominator
unsigned int rc_resize_denominator
Frame resize denominator.
Definition: aom_encoder.h:395
aom_codec_enc_cfg::g_limit
unsigned int g_limit
Max number of frames to encode.
Definition: aom_encoder.h:283
aom_codec_enc_cfg::rc_buf_initial_sz
unsigned int rc_buf_initial_sz
Decoder Buffer Initial Size.
Definition: aom_encoder.h:560
aom_codec_enc_cfg::cfg
cfg_options_t cfg
Options defined per config file.
Definition: aom_encoder.h:733
aom_codec_cx_pkt::pts
aom_codec_pts_t pts
time stamp to show frame (in timebase units)
Definition: aom_encoder.h:147
aom_codec_enc_cfg::rc_superres_denominator
unsigned int rc_superres_denominator
Frame super-resolution denominator.
Definition: aom_encoder.h:426
aom_codec_er_flags_t
uint32_t aom_codec_er_flags_t
Error Resilient flags.
Definition: aom_encoder.h:117
AOM_Q
@ AOM_Q
Definition: aom_encoder.h:197
aom_codec_enc_cfg::rc_max_quantizer
unsigned int rc_max_quantizer
Maximum (Worst Quality) Quantizer.
Definition: aom_encoder.h:508
aom_codec_cx_pkt::data
union aom_codec_cx_pkt::@1 data
aom_codec_enc_cfg::monochrome
unsigned int monochrome
Monochrome mode.
Definition: aom_encoder.h:669
AOM_KF_DISABLED
@ AOM_KF_DISABLED
Definition: aom_encoder.h:211
aom_codec_cx_pkt::frame
struct aom_codec_cx_pkt::@1::@2 frame
aom_codec_cx_pkt
Encoder output packet.
Definition: aom_encoder.h:140
aom_codec_enc_cfg::g_forced_max_frame_width
unsigned int g_forced_max_frame_width
Forced maximum width of the frame.
Definition: aom_encoder.h:290
aom_rc_mode
aom_rc_mode
Rate control mode.
Definition: aom_encoder.h:193
AOM_CODEC_CUSTOM_PKT
@ AOM_CODEC_CUSTOM_PKT
Definition: aom_encoder.h:132
AOM_KF_AUTO
@ AOM_KF_AUTO
Definition: aom_encoder.h:210
aom_codec_iter_t
const void * aom_codec_iter_t
Iterator.
Definition: aom_codec.h:194
aom_codec_enc_cfg::rc_superres_mode
unsigned int rc_superres_mode
Frame super-resolution scaling mode.
Definition: aom_encoder.h:414
AOM_CODEC_STATS_PKT
@ AOM_CODEC_STATS_PKT
Definition: aom_encoder.h:129
aom_codec_enc_cfg::rc_superres_qthresh
unsigned int rc_superres_qthresh
Frame super-resolution q threshold.
Definition: aom_encoder.h:445
aom_codec_enc_cfg::g_h
unsigned int g_h
Height of the frame.
Definition: aom_encoder.h:278
aom_enc_pass
aom_enc_pass
Multi-pass Encoding Pass.
Definition: aom_encoder.h:186
AOM_CODEC_CX_FRAME_PKT
@ AOM_CODEC_CX_FRAME_PKT
Definition: aom_encoder.h:128
aom_codec_enc_cfg::save_as_annexb
unsigned int save_as_annexb
Bitstream syntax mode.
Definition: aom_encoder.h:686
aom_codec_flags_t
long aom_codec_flags_t
Initialization-time Feature Enabling.
Definition: aom_codec.h:174
aom_codec_cx_pkt::psnr
double psnr[4]
Definition: aom_encoder.h:163
aom_image
Image Descriptor.
Definition: aom_image.h:141
aom_fixed_buf::sz
size_t sz
Definition: aom_encoder.h:78
aom_codec_cx_pkt::kind
enum aom_codec_cx_pkt_kind kind
Definition: aom_encoder.h:141
aom_codec_enc_cfg::g_threads
unsigned int g_threads
Maximum number of threads to use.
Definition: aom_encoder.h:250
aom_codec_get_preview_frame
const aom_image_t * aom_codec_get_preview_frame(aom_codec_ctx_t *ctx)
Get Preview Frame.
aom_codec_enc_init_multi_ver
aom_codec_err_t aom_codec_enc_init_multi_ver(aom_codec_ctx_t *ctx, aom_codec_iface_t *iface, aom_codec_enc_cfg_t *cfg, int num_enc, aom_codec_flags_t flags, aom_rational_t *dsf, int ver)
Initialize multi-encoder instance.
cfg_options
Config Options.
Definition: aom_codec.h:533
aom_bit_depth_t
enum aom_bit_depth aom_bit_depth_t
Bit depth for codecThis enumeration determines the bit depth of the codec.
aom_codec_enc_cfg_t
struct aom_codec_enc_cfg aom_codec_enc_cfg_t
Encoder configuration structure.
aom_codec_enc_cfg::g_bit_depth
aom_bit_depth_t g_bit_depth
Bit-depth of the codec.
Definition: aom_encoder.h:305
aom_codec_enc_cfg::rc_buf_optimal_sz
unsigned int rc_buf_optimal_sz
Decoder Buffer Optimal Size.
Definition: aom_encoder.h:569
aom_codec_enc_cfg::kf_max_dist
unsigned int kf_max_dist
Keyframe maximum interval.
Definition: aom_encoder.h:632
aom_codec_enc_cfg::large_scale_tile
unsigned int large_scale_tile
Tile coding mode.
Definition: aom_encoder.h:662
aom_codec_enc_cfg::sframe_dist
unsigned int sframe_dist
sframe interval
Definition: aom_encoder.h:639
aom_codec_enc_cfg::rc_2pass_vbr_maxsection_pct
unsigned int rc_2pass_vbr_maxsection_pct
Two-pass mode per-GOP maximum bitrate.
Definition: aom_encoder.h:597
aom_fixed_buf::buf
void * buf
Definition: aom_encoder.h:77
aom_codec_cx_pkt::sz
size_t sz
Definition: aom_encoder.h:145
aom_rational_t
struct aom_rational aom_rational_t
Rational Number.
aom_codec_enc_config_default
aom_codec_err_t aom_codec_enc_config_default(aom_codec_iface_t *iface, aom_codec_enc_cfg_t *cfg, unsigned int reserved)
Get a default configuration.
aom_codec_enc_cfg::kf_min_dist
unsigned int kf_min_dist
Keyframe minimum interval.
Definition: aom_encoder.h:623
aom_codec_cx_pkt::vis_frame_size
size_t vis_frame_size
size of the visible frame in this packet
Definition: aom_encoder.h:156
aom_rational::num
int num
Definition: aom_encoder.h:181
aom_codec_cx_pkt_kind
aom_codec_cx_pkt_kind
Encoder output packet variants.
Definition: aom_encoder.h:127
aom_codec_cx_pkt::partition_id
int partition_id
the partition id defines the decoding order of the partitions. Only applicable when "output partition...
Definition: aom_encoder.h:154
aom_codec_enc_cfg::rc_2pass_vbr_minsection_pct
unsigned int rc_2pass_vbr_minsection_pct
Two-pass mode per-GOP minimum bitrate.
Definition: aom_encoder.h:590