1 files changed, 1846 insertions, 0 deletions
diff --git a/include/gst/codecparsers/gstav1parser.h b/include/gst/codecparsers/gstav1parser.h
new file mode 100644
index 0000000000..31f5945498
--- /dev/null
+++ b/include/gst/codecparsers/gstav1parser.h
@@ -0,0 +1,1846 @@
+/*
+ * gstav1parser.h
+ *
+ *  Copyright (C) 2018 Georg Ottinger
+ *  Copyright (C) 2019-2020 Intel Corporation
+ *    Author: Georg Ottinger<g.ottinger@gmx.at>
+ *    Author: Junyan He<junyan.he@hotmail.com>
+ *    Author: Victor Jaquez <vjaquez@igalia.com>
+ *
+ * This library is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Lesser General Public
+ * License as published by the Free Software Foundation; either
+ * version 2.1 of the License, or (at your option) any later version.
+ *
+ * This library is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+ * Lesser General Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public
+ * License along with this library; if not, write to the
+ * Free Software Foundation, Inc., 51 Franklin St, Fifth Floor,
+ * Boston, MA 02110-1301, USA.
+ */
+
+#ifndef __GST_AV1_PARSER_H__
+#define __GST_AV1_PARSER_H__
+
+#ifndef GST_USE_UNSTABLE_API
+#warning "The AV1 parsing library is unstable API and may change in future."
+#warning "You can define GST_USE_UNSTABLE_API to avoid this warning."
+#endif
+
+#include <gst/gst.h>
+#include <gst/codecparsers/codecparsers-prelude.h>
+
+G_BEGIN_DECLS
+
+#define GST_AV1_MAX_NUM_TEMPORAL_LAYERS        8
+#define GST_AV1_MAX_NUM_SPATIAL_LAYERS         4
+#define GST_AV1_MAX_TILE_WIDTH                 4096
+#define GST_AV1_MAX_TILE_AREA                  (4096 * 2304)
+#define GST_AV1_TOTAL_REFS_PER_FRAME           8
+#define GST_AV1_MAX_SEGMENTS                   8
+#define GST_AV1_SEG_LVL_MAX                    8
+#define GST_AV1_MAX_TILE_COLS                  64
+#define GST_AV1_MAX_TILE_ROWS                  64
+
+#define GST_AV1_REFS_PER_FRAME                 7
+#define GST_AV1_PRIMARY_REF_NONE               7
+#define GST_AV1_SUPERRES_NUM                   8
+#define GST_AV1_SUPERRES_DENOM_MIN             9
+#define GST_AV1_SUPERRES_DENOM_BITS            3
+#define GST_AV1_MAX_LOOP_FILTER                63
+#define GST_AV1_GM_ABS_TRANS_BITS              12
+#define GST_AV1_GM_ABS_TRANS_ONLY_BITS         9
+#define GST_AV1_GM_ABS_ALPHA_BITS              12
+#define GST_AV1_GM_ALPHA_PREC_BITS             15
+#define GST_AV1_GM_TRANS_PREC_BITS             6
+#define GST_AV1_GM_TRANS_ONLY_PREC_BITS        3
+#define GST_AV1_WARPEDMODEL_PREC_BITS          16
+#define GST_AV1_WARP_PARAM_REDUCE_BITS         6
+#define GST_AV1_SELECT_SCREEN_CONTENT_TOOLS    2
+#define GST_AV1_SELECT_INTEGER_MV              2
+#define GST_AV1_RESTORATION_TILESIZE_MAX       256
+#define GST_AV1_SEG_LVL_ALT_Q                  0
+#define GST_AV1_SEG_LVL_REF_FRAME              5
+/* The following defines are derived from the spec, but do not appear
+ * under these particular names in the spec */
+#define GST_AV1_CDEF_MAX                       (1 << 3)
+#define GST_AV1_MAX_TILE_COUNT                 512
+#define GST_AV1_MAX_OPERATING_POINTS    \
+  (GST_AV1_MAX_NUM_TEMPORAL_LAYERS * GST_AV1_MAX_NUM_SPATIAL_LAYERS)
+#define GST_AV1_MAX_SPATIAL_LAYERS             2  /* NOTE(review): unverified; differs from GST_AV1_MAX_NUM_SPATIAL_LAYERS (4) */
+#define GST_AV1_MAX_TEMPORAL_GROUP_SIZE        8  /* NOTE(review): value not yet verified against the spec */
+#define GST_AV1_MAX_TEMPORAL_GROUP_REFERENCES  8  /* NOTE(review): value not yet verified against the spec */
+#define GST_AV1_MAX_NUM_Y_POINTS               16
+#define GST_AV1_MAX_NUM_CB_POINTS              16
+#define GST_AV1_MAX_NUM_CR_POINTS              16
+#define GST_AV1_MAX_NUM_POS_LUMA               25
+#define GST_AV1_MAX_NUM_PLANES                 3
+
+#define GST_AV1_DIV_LUT_PREC_BITS              14
+#define GST_AV1_DIV_LUT_BITS                   8
+#define GST_AV1_DIV_LUT_NUM                    (1 << GST_AV1_DIV_LUT_BITS)
+
+/* Forward declarations of the parser, OBU and parameter structures */
+typedef struct _GstAV1Parser GstAV1Parser;
+
+typedef struct _GstAV1OBUHeader GstAV1OBUHeader;
+typedef struct _GstAV1OBU GstAV1OBU;
+
+typedef struct _GstAV1SequenceHeaderOBU GstAV1SequenceHeaderOBU;
+typedef struct _GstAV1MetadataOBU GstAV1MetadataOBU;
+typedef struct _GstAV1FrameHeaderOBU GstAV1FrameHeaderOBU;
+typedef struct _GstAV1TileListOBU GstAV1TileListOBU;
+typedef struct _GstAV1TileGroupOBU GstAV1TileGroupOBU;
+typedef struct _GstAV1FrameOBU GstAV1FrameOBU;
+
+typedef struct _GstAV1OperatingPoint GstAV1OperatingPoint;
+typedef struct _GstAV1DecoderModelInfo GstAV1DecoderModelInfo;
+typedef struct _GstAV1TimingInfo GstAV1TimingInfo;
+typedef struct _GstAV1ColorConfig GstAV1ColorConfig;
+typedef struct _GstAV1MetadataITUT_T35 GstAV1MetadataITUT_T35;
+typedef struct _GstAV1MetadataHdrCll GstAV1MetadataHdrCll;
+typedef struct _GstAV1MetadataHdrMdcv GstAV1MetadataHdrMdcv;
+typedef struct _GstAV1MetadataScalability GstAV1MetadataScalability;
+typedef struct _GstAV1MetadataTimecode GstAV1MetadataTimecode;
+typedef struct _GstAV1LoopFilterParams GstAV1LoopFilterParams;
+typedef struct _GstAV1QuantizationParams GstAV1QuantizationParams;
+typedef struct _GstAV1SegmenationParams GstAV1SegmenationParams; /* NOTE(review): "Segmenation" (sic); renaming would change the API */
+typedef struct _GstAV1TileInfo GstAV1TileInfo;
+typedef struct _GstAV1CDEFParams GstAV1CDEFParams;
+typedef struct _GstAV1LoopRestorationParams GstAV1LoopRestorationParams;
+typedef struct _GstAV1GlobalMotionParams GstAV1GlobalMotionParams;
+typedef struct _GstAV1FilmGrainParams GstAV1FilmGrainParams;
+
+typedef struct _GstAV1ReferenceFrameInfo GstAV1ReferenceFrameInfo;
+
+/**
+ * GstAV1ParserResult:
+ * @GST_AV1_PARSER_OK: successful return
+ * @GST_AV1_PARSER_NO_MORE_DATA: the parser needs more data for one OBU
+ * @GST_AV1_PARSER_DROP: no need to handle this OBU, skip it
+ * @GST_AV1_PARSER_BITSTREAM_ERROR: stream error, for example, the stream includes invalid bits
+ * @GST_AV1_PARSER_MISSING_OBU_REFERENCE: no reference, for example, no sequence found
+ * @GST_AV1_PARSER_INVALID_OPERATION: invalid operation, for example, invalid parameters
+ *
+ * Defines the possible results of a parser operation
+ */
+typedef enum {
+  GST_AV1_PARSER_OK = 0,
+  GST_AV1_PARSER_NO_MORE_DATA = 1,
+  GST_AV1_PARSER_DROP = 2,
+  GST_AV1_PARSER_BITSTREAM_ERROR = 3,
+  GST_AV1_PARSER_MISSING_OBU_REFERENCE = 4,
+  GST_AV1_PARSER_INVALID_OPERATION = 5,
+} GstAV1ParserResult;
+
+/**
+ * GstAV1Profile:
+ * @GST_AV1_PROFILE_0: 8-bit and 10-bit 4:2:0 and 4:0:0 only.
+ * @GST_AV1_PROFILE_1: 8-bit and 10-bit 4:4:4.
+ * @GST_AV1_PROFILE_2: 8-bit and 10-bit 4:2:2, 12-bit 4:0:0 4:2:2 and 4:4:4
+ * @GST_AV1_PROFILE_UNDEFINED: unknown AV1 profile (Since: 1.20)
+ *
+ * Defines the AV1 profiles
+ */
+/**
+ * GST_AV1_PROFILE_UNDEFINED:
+ *
+ * unknown AV1 profile
+ *
+ * Since: 1.20
+ */
+typedef enum {
+  GST_AV1_PROFILE_0 = 0,
+  GST_AV1_PROFILE_1 = 1,
+  GST_AV1_PROFILE_2 = 2,
+  GST_AV1_PROFILE_UNDEFINED,
+} GstAV1Profile;
+
+/**
+ * GstAV1OBUType:
+ * @GST_AV1_OBU_RESERVED_0: Reserved 0
+ * @GST_AV1_OBU_SEQUENCE_HEADER: Sequence Header OBU
+ * @GST_AV1_OBU_TEMPORAL_DELIMITER: Temporal Delimiter OBU
+ * @GST_AV1_OBU_FRAME_HEADER: Frame Header OBU
+ * @GST_AV1_OBU_TILE_GROUP: Tile Group OBU
+ * @GST_AV1_OBU_METADATA: Metadata OBU
+ * @GST_AV1_OBU_FRAME: Frame OBU (includes Frame Header and one Tile Group)
+ * @GST_AV1_OBU_REDUNDANT_FRAME_HEADER: Redundant Frame Header OBU
+ * @GST_AV1_OBU_TILE_LIST: Tile List OBU
+ * @GST_AV1_OBU_RESERVED_9: Reserved 9
+ * @GST_AV1_OBU_RESERVED_10: Reserved 10
+ * @GST_AV1_OBU_RESERVED_11: Reserved 11
+ * @GST_AV1_OBU_RESERVED_12: Reserved 12
+ * @GST_AV1_OBU_RESERVED_13: Reserved 13
+ * @GST_AV1_OBU_RESERVED_14: Reserved 14
+ * @GST_AV1_OBU_PADDING: Padding
+ *
+ * Defines all the possible OBU types
+ */
+typedef enum {
+  GST_AV1_OBU_RESERVED_0 = 0,
+  GST_AV1_OBU_SEQUENCE_HEADER = 1,
+  GST_AV1_OBU_TEMPORAL_DELIMITER = 2,
+  GST_AV1_OBU_FRAME_HEADER = 3,
+  GST_AV1_OBU_TILE_GROUP = 4,
+  GST_AV1_OBU_METADATA = 5,
+  GST_AV1_OBU_FRAME = 6,
+  GST_AV1_OBU_REDUNDANT_FRAME_HEADER = 7,
+  GST_AV1_OBU_TILE_LIST = 8,
+  GST_AV1_OBU_RESERVED_9 = 9,
+  GST_AV1_OBU_RESERVED_10 = 10,
+  GST_AV1_OBU_RESERVED_11 = 11,
+  GST_AV1_OBU_RESERVED_12 = 12,
+  GST_AV1_OBU_RESERVED_13 = 13,
+  GST_AV1_OBU_RESERVED_14 = 14,
+  GST_AV1_OBU_PADDING = 15,
+} GstAV1OBUType;
+
+/**
+ * GstAV1SeqLevels:
+ * @GST_AV1_SEQ_LEVEL_2_0: Level 2.0
+ * @GST_AV1_SEQ_LEVEL_2_1: Level 2.1
+ * @GST_AV1_SEQ_LEVEL_2_2: Level 2.2
+ * @GST_AV1_SEQ_LEVEL_2_3: Level 2.3
+ * @GST_AV1_SEQ_LEVEL_3_0: Level 3.0
+ * @GST_AV1_SEQ_LEVEL_3_1: Level 3.1
+ * @GST_AV1_SEQ_LEVEL_3_2: Level 3.2
+ * @GST_AV1_SEQ_LEVEL_3_3: Level 3.3
+ * @GST_AV1_SEQ_LEVEL_4_0: Level 4.0
+ * @GST_AV1_SEQ_LEVEL_4_1: Level 4.1
+ * @GST_AV1_SEQ_LEVEL_4_2: Level 4.2
+ * @GST_AV1_SEQ_LEVEL_4_3: Level 4.3
+ * @GST_AV1_SEQ_LEVEL_5_0: Level 5.0
+ * @GST_AV1_SEQ_LEVEL_5_1: Level 5.1
+ * @GST_AV1_SEQ_LEVEL_5_2: Level 5.2
+ * @GST_AV1_SEQ_LEVEL_5_3: Level 5.3
+ * @GST_AV1_SEQ_LEVEL_6_0: Level 6.0
+ * @GST_AV1_SEQ_LEVEL_6_1: Level 6.1
+ * @GST_AV1_SEQ_LEVEL_6_2: Level 6.2
+ * @GST_AV1_SEQ_LEVEL_6_3: Level 6.3
+ * @GST_AV1_SEQ_LEVEL_7_0: Level 7.0
+ * @GST_AV1_SEQ_LEVEL_7_1: Level 7.1
+ * @GST_AV1_SEQ_LEVEL_7_2: Level 7.2
+ * @GST_AV1_SEQ_LEVEL_7_3: Level 7.3
+ * @GST_AV1_SEQ_LEVELS: number of valid levels (one past @GST_AV1_SEQ_LEVEL_7_3)
+ * @GST_AV1_SEQ_LEVEL_MAX: Maximum parameters
+ *
+ * Defines all the possible sequence levels
+ */
+typedef enum {
+  GST_AV1_SEQ_LEVEL_2_0 = 0,
+  GST_AV1_SEQ_LEVEL_2_1 = 1,
+  GST_AV1_SEQ_LEVEL_2_2 = 2,
+  GST_AV1_SEQ_LEVEL_2_3 = 3,
+  GST_AV1_SEQ_LEVEL_3_0 = 4,
+  GST_AV1_SEQ_LEVEL_3_1 = 5,
+  GST_AV1_SEQ_LEVEL_3_2 = 6,
+  GST_AV1_SEQ_LEVEL_3_3 = 7,
+  GST_AV1_SEQ_LEVEL_4_0 = 8,
+  GST_AV1_SEQ_LEVEL_4_1 = 9,
+  GST_AV1_SEQ_LEVEL_4_2 = 10,
+  GST_AV1_SEQ_LEVEL_4_3 = 11,
+  GST_AV1_SEQ_LEVEL_5_0 = 12,
+  GST_AV1_SEQ_LEVEL_5_1 = 13,
+  GST_AV1_SEQ_LEVEL_5_2 = 14,
+  GST_AV1_SEQ_LEVEL_5_3 = 15,
+  GST_AV1_SEQ_LEVEL_6_0 = 16,
+  GST_AV1_SEQ_LEVEL_6_1 = 17,
+  GST_AV1_SEQ_LEVEL_6_2 = 18,
+  GST_AV1_SEQ_LEVEL_6_3 = 19,
+  GST_AV1_SEQ_LEVEL_7_0 = 20,
+  GST_AV1_SEQ_LEVEL_7_1 = 21,
+  GST_AV1_SEQ_LEVEL_7_2 = 22,
+  GST_AV1_SEQ_LEVEL_7_3 = 23,
+  GST_AV1_SEQ_LEVELS,
+  GST_AV1_SEQ_LEVEL_MAX = 31
+} GstAV1SeqLevels;
+
+/**
+ * GstAV1MetadataType:
+ * @GST_AV1_METADATA_TYPE_RESERVED_0: Reserved 0
+ * @GST_AV1_METADATA_TYPE_HDR_CLL: Metadata high dynamic range content
+ *   light level semantics
+ * @GST_AV1_METADATA_TYPE_HDR_MDCV: Metadata high dynamic range mastering
+ *   display color volume semantics
+ * @GST_AV1_METADATA_TYPE_SCALABILITY: Metadata scalability semantics
+ * @GST_AV1_METADATA_TYPE_ITUT_T35: Metadata ITU-T T.35 semantics
+ * @GST_AV1_METADATA_TYPE_TIMECODE: Metadata timecode semantics
+ */
+typedef enum {
+  GST_AV1_METADATA_TYPE_RESERVED_0 = 0,
+  GST_AV1_METADATA_TYPE_HDR_CLL = 1,
+  GST_AV1_METADATA_TYPE_HDR_MDCV = 2,
+  GST_AV1_METADATA_TYPE_SCALABILITY = 3,
+  GST_AV1_METADATA_TYPE_ITUT_T35 = 4,
+  GST_AV1_METADATA_TYPE_TIMECODE = 5,
+} GstAV1MetadataType;
+
+/**
+ * GstAV1ScalabilityModes:
+ * @GST_AV1_SCALABILITY_L1T2: 1 spatial layer, 2 temporal layers
+ * @GST_AV1_SCALABILITY_L1T3: 1 spatial layer, 3 temporal layers
+ * @GST_AV1_SCALABILITY_L2T1: 2 spatial layers (ratio 2:1), 1 temporal layer,
+ *  inter-layer dependency
+ * @GST_AV1_SCALABILITY_L2T2: 2 spatial layers (ratio 2:1), 2 temporal layers,
+ *  inter-layer dependency
+ * @GST_AV1_SCALABILITY_L2T3: 2 spatial layers (ratio 2:1), 3 temporal layers,
+ *  inter-layer dependency
+ * @GST_AV1_SCALABILITY_S2T1: 2 spatial layers (ratio 2:1), 1 temporal layer
+ * @GST_AV1_SCALABILITY_S2T2: 2 spatial layers (ratio 2:1), 2 temporal layers
+ * @GST_AV1_SCALABILITY_S2T3: 2 spatial layers (ratio 2:1), 3 temporal layers
+ * @GST_AV1_SCALABILITY_L2T1h: 2 spatial layers (ratio 1.5:1), 1 temporal layer,
+ *  inter-layer dependency
+ * @GST_AV1_SCALABILITY_L2T2h: 2 spatial layers (ratio 1.5:1), 2 temporal layers,
+ *  inter-layer dependency
+ * @GST_AV1_SCALABILITY_L2T3h: 2 spatial layers (ratio 1.5:1), 3 temporal layers,
+ *  inter-layer dependency
+ * @GST_AV1_SCALABILITY_S2T1h: 2 spatial layers (ratio 1.5:1), 1 temporal layer
+ * @GST_AV1_SCALABILITY_S2T2h: 2 spatial layers (ratio 1.5:1), 2 temporal layers
+ * @GST_AV1_SCALABILITY_S2T3h: 2 spatial layers (ratio 1.5:1), 3 temporal layers
+ * @GST_AV1_SCALABILITY_SS: Use scalability structure #GstAV1MetadataScalability
+ */
+typedef enum {
+  GST_AV1_SCALABILITY_L1T2 = 0,
+  GST_AV1_SCALABILITY_L1T3 = 1,
+  GST_AV1_SCALABILITY_L2T1 = 2,
+  GST_AV1_SCALABILITY_L2T2 = 3,
+  GST_AV1_SCALABILITY_L2T3 = 4,
+  GST_AV1_SCALABILITY_S2T1 = 5,
+  GST_AV1_SCALABILITY_S2T2 = 6,
+  GST_AV1_SCALABILITY_S2T3 = 7,
+  GST_AV1_SCALABILITY_L2T1h = 8,
+  GST_AV1_SCALABILITY_L2T2h = 9,
+  GST_AV1_SCALABILITY_L2T3h = 10,
+  GST_AV1_SCALABILITY_S2T1h = 11,
+  GST_AV1_SCALABILITY_S2T2h = 12,
+  GST_AV1_SCALABILITY_S2T3h = 13,
+  GST_AV1_SCALABILITY_SS = 14,
+} GstAV1ScalabilityModes;
+
+/**
+ * GstAV1ColorPrimaries:
+ * @GST_AV1_CP_BT_709: BT.709
+ * @GST_AV1_CP_UNSPECIFIED: Unspecified
+ * @GST_AV1_CP_BT_470_M: BT.470 System M (historical)
+ * @GST_AV1_CP_BT_470_B_G: BT.470 System B, G (historical)
+ * @GST_AV1_CP_BT_601: BT.601
+ * @GST_AV1_CP_SMPTE_240: SMPTE 240
+ * @GST_AV1_CP_GENERIC_FILM: Generic film (color filters using illuminant C)
+ * @GST_AV1_CP_BT_2020: BT.2020, BT.2100
+ * @GST_AV1_CP_XYZ: SMPTE 428 (CIE 1931 XYZ)
+ * @GST_AV1_CP_SMPTE_431: SMPTE RP 431-2
+ * @GST_AV1_CP_SMPTE_432: SMPTE EG 432-1
+ * @GST_AV1_CP_EBU_3213: EBU Tech. 3213-E
+ */
+typedef enum {
+  GST_AV1_CP_BT_709 = 1,
+  GST_AV1_CP_UNSPECIFIED = 2,
+  GST_AV1_CP_BT_470_M = 4,
+  GST_AV1_CP_BT_470_B_G = 5,
+  GST_AV1_CP_BT_601 = 6,
+  GST_AV1_CP_SMPTE_240 = 7,
+  GST_AV1_CP_GENERIC_FILM = 8,
+  GST_AV1_CP_BT_2020 = 9,
+  GST_AV1_CP_XYZ = 10,
+  GST_AV1_CP_SMPTE_431 = 11,
+  GST_AV1_CP_SMPTE_432 = 12,
+  GST_AV1_CP_EBU_3213 = 22,
+} GstAV1ColorPrimaries;
+
+/**
+ * GstAV1TransferCharacteristics:
+ * @GST_AV1_TC_RESERVED_0: Reserved for future use
+ * @GST_AV1_TC_BT_709: BT.709
+ * @GST_AV1_TC_UNSPECIFIED: Unspecified
+ * @GST_AV1_TC_RESERVED_3: Reserved for future use
+ * @GST_AV1_TC_BT_470_M: BT.470 System M (historical)
+ * @GST_AV1_TC_BT_470_B_G: BT.470 System B, G (historical)
+ * @GST_AV1_TC_BT_601: BT.601
+ * @GST_AV1_TC_SMPTE_240: SMPTE 240 M
+ * @GST_AV1_TC_LINEAR: Linear
+ * @GST_AV1_TC_LOG_100: Logarithmic (100 : 1 range)
+ * @GST_AV1_TC_LOG_100_SQRT10: Logarithmic (100 * Sqrt(10) : 1 range)
+ * @GST_AV1_TC_IEC_61966: IEC 61966-2-4
+ * @GST_AV1_TC_BT_1361: BT.1361
+ * @GST_AV1_TC_SRGB: sRGB or sYCC
+ * @GST_AV1_TC_BT_2020_10_BIT: BT.2020 10-bit systems
+ * @GST_AV1_TC_BT_2020_12_BIT: BT.2020 12-bit systems
+ * @GST_AV1_TC_SMPTE_2084: SMPTE ST 2084, ITU BT.2100 PQ
+ * @GST_AV1_TC_SMPTE_428: SMPTE ST 428
+ * @GST_AV1_TC_HLG: BT.2100 HLG, ARIB STD-B67
+ */
+typedef enum {
+  GST_AV1_TC_RESERVED_0 = 0,
+  GST_AV1_TC_BT_709 = 1,
+  GST_AV1_TC_UNSPECIFIED = 2,
+  GST_AV1_TC_RESERVED_3 = 3,
+  GST_AV1_TC_BT_470_M = 4,
+  GST_AV1_TC_BT_470_B_G = 5,
+  GST_AV1_TC_BT_601 = 6,
+  GST_AV1_TC_SMPTE_240 = 7,
+  GST_AV1_TC_LINEAR = 8,
+  GST_AV1_TC_LOG_100 = 9,
+  GST_AV1_TC_LOG_100_SQRT10 = 10,
+  GST_AV1_TC_IEC_61966 = 11,
+  GST_AV1_TC_BT_1361 = 12,
+  GST_AV1_TC_SRGB = 13,
+  GST_AV1_TC_BT_2020_10_BIT = 14,
+  GST_AV1_TC_BT_2020_12_BIT = 15,
+  GST_AV1_TC_SMPTE_2084 = 16,
+  GST_AV1_TC_SMPTE_428 = 17,
+  GST_AV1_TC_HLG = 18,
+} GstAV1TransferCharacteristics;
+
+/**
+ * GstAV1MatrixCoefficients:
+ * @GST_AV1_MC_IDENTITY: Identity matrix
+ * @GST_AV1_MC_BT_709: BT.709
+ * @GST_AV1_MC_UNSPECIFIED: Unspecified
+ * @GST_AV1_MC_RESERVED_3: Reserved for future use
+ * @GST_AV1_MC_FCC: US FCC 73.628
+ * @GST_AV1_MC_BT_470_B_G: BT.470 System B, G (historical)
+ * @GST_AV1_MC_BT_601: BT.601
+ * @GST_AV1_MC_SMPTE_240: SMPTE 240 M
+ * @GST_AV1_MC_SMPTE_YCGCO: YCgCo
+ * @GST_AV1_MC_BT_2020_NCL: BT.2020 non-constant luminance, BT.2100 YCbCr
+ * @GST_AV1_MC_BT_2020_CL: BT.2020 constant luminance
+ * @GST_AV1_MC_SMPTE_2085: SMPTE ST 2085 YDzDx
+ * @GST_AV1_MC_CHROMAT_NCL: Chromaticity-derived non-constant luminance
+ * @GST_AV1_MC_CHROMAT_CL: Chromaticity-derived constant luminance
+ * @GST_AV1_MC_ICTCP: BT.2100 ICtCp
+ */
+typedef enum {
+  GST_AV1_MC_IDENTITY = 0,
+  GST_AV1_MC_BT_709 = 1,
+  GST_AV1_MC_UNSPECIFIED = 2,
+  GST_AV1_MC_RESERVED_3 = 3,
+  GST_AV1_MC_FCC = 4,
+  GST_AV1_MC_BT_470_B_G = 5,
+  GST_AV1_MC_BT_601 = 6,
+  GST_AV1_MC_SMPTE_240 = 7,
+  GST_AV1_MC_SMPTE_YCGCO = 8,
+  GST_AV1_MC_BT_2020_NCL = 9,
+  GST_AV1_MC_BT_2020_CL = 10,
+  GST_AV1_MC_SMPTE_2085 = 11,
+  GST_AV1_MC_CHROMAT_NCL = 12,
+  GST_AV1_MC_CHROMAT_CL = 13,
+  GST_AV1_MC_ICTCP = 14,
+} GstAV1MatrixCoefficients;
+
+/**
+ * GstAV1ChromaSamplePositions:
+ * @GST_AV1_CSP_UNKNOWN: Unknown (in this case the source video transfer
+ *  function must be signaled outside the AV1 bitstream).
+ * @GST_AV1_CSP_VERTICAL: Horizontally co-located with (0, 0) luma sample,
+ *  vertical position in the middle between two luma samples.
+ * @GST_AV1_CSP_COLOCATED: Co-located with (0, 0) luma sample.
+ * @GST_AV1_CSP_RESERVED: Reserved for future use.
+ */
+typedef enum {
+  GST_AV1_CSP_UNKNOWN = 0,
+  GST_AV1_CSP_VERTICAL = 1,
+  GST_AV1_CSP_COLOCATED = 2,
+  GST_AV1_CSP_RESERVED = 3,
+} GstAV1ChromaSamplePositions;
+
+/**
+ * GstAV1FrameType:
+ * @GST_AV1_KEY_FRAME: Key Frame
+ * @GST_AV1_INTER_FRAME: Inter Frame
+ * @GST_AV1_INTRA_ONLY_FRAME: Intra-Only Frame
+ * @GST_AV1_SWITCH_FRAME: Switch Frame
+ */
+typedef enum {
+  GST_AV1_KEY_FRAME = 0,
+  GST_AV1_INTER_FRAME = 1,
+  GST_AV1_INTRA_ONLY_FRAME = 2,
+  GST_AV1_SWITCH_FRAME = 3,
+} GstAV1FrameType;
+
+/**
+ * GstAV1InterpolationFilter:
+ * @GST_AV1_INTERPOLATION_FILTER_EIGHTTAP: Eight-tap
+ * @GST_AV1_INTERPOLATION_FILTER_EIGHTTAP_SMOOTH: Eight-tap Smooth
+ * @GST_AV1_INTERPOLATION_FILTER_EIGHTTAP_SHARP: Eight-tap Sharp
+ * @GST_AV1_INTERPOLATION_FILTER_BILINEAR: Bilinear
+ * @GST_AV1_INTERPOLATION_FILTER_SWITCHABLE: Filter is switchable
+ */
+typedef enum {
+  GST_AV1_INTERPOLATION_FILTER_EIGHTTAP = 0,
+  GST_AV1_INTERPOLATION_FILTER_EIGHTTAP_SMOOTH = 1,
+  GST_AV1_INTERPOLATION_FILTER_EIGHTTAP_SHARP = 2,
+  GST_AV1_INTERPOLATION_FILTER_BILINEAR = 3,
+  GST_AV1_INTERPOLATION_FILTER_SWITCHABLE = 4,
+} GstAV1InterpolationFilter;
+
+/**
+ * GstAV1TXModes:
+ * @GST_AV1_TX_MODE_ONLY_4x4: the inverse transform uses only 4x4 transforms.
+ * @GST_AV1_TX_MODE_LARGEST: the inverse transform uses the largest transform
+ *   size that fits inside the block.
+ * @GST_AV1_TX_MODE_SELECT: the choice of transform size is specified explicitly
+ *   for each block.
+ */
+typedef enum {
+  GST_AV1_TX_MODE_ONLY_4x4 = 0,
+  GST_AV1_TX_MODE_LARGEST = 1,
+  GST_AV1_TX_MODE_SELECT = 2,
+} GstAV1TXModes;
+
+/**
+ * GstAV1FrameRestorationType:
+ * @GST_AV1_FRAME_RESTORE_NONE: no filtering is applied
+ * @GST_AV1_FRAME_RESTORE_WIENER: Wiener filter process is invoked
+ * @GST_AV1_FRAME_RESTORE_SGRPROJ: self guided filter process is invoked
+ * @GST_AV1_FRAME_RESTORE_SWITCHABLE: restoration filter is switchable
+ */
+typedef enum {
+  GST_AV1_FRAME_RESTORE_NONE = 0,
+  GST_AV1_FRAME_RESTORE_WIENER = 1,
+  GST_AV1_FRAME_RESTORE_SGRPROJ = 2,
+  GST_AV1_FRAME_RESTORE_SWITCHABLE = 3,
+} GstAV1FrameRestorationType;
+
+/**
+ * GstAV1ReferenceFrame:
+ * @GST_AV1_REF_INTRA_FRAME: Intra Frame Reference
+ * @GST_AV1_REF_LAST_FRAME: Last Reference Frame
+ * @GST_AV1_REF_LAST2_FRAME: Last2 Reference Frame
+ * @GST_AV1_REF_LAST3_FRAME: Last3 Reference Frame
+ * @GST_AV1_REF_GOLDEN_FRAME: Golden Reference Frame
+ * @GST_AV1_REF_BWDREF_FRAME: BWD Reference Frame
+ * @GST_AV1_REF_ALTREF2_FRAME: Alternative2 Reference Frame
+ * @GST_AV1_REF_ALTREF_FRAME: Alternative Reference Frame
+ * @GST_AV1_NUM_REF_FRAMES: Total number of reference frame types listed above
+ */
+typedef enum {
+  GST_AV1_REF_INTRA_FRAME = 0,
+  GST_AV1_REF_LAST_FRAME = 1,
+  GST_AV1_REF_LAST2_FRAME = 2,
+  GST_AV1_REF_LAST3_FRAME = 3,
+  GST_AV1_REF_GOLDEN_FRAME = 4,
+  GST_AV1_REF_BWDREF_FRAME = 5,
+  GST_AV1_REF_ALTREF2_FRAME = 6,
+  GST_AV1_REF_ALTREF_FRAME = 7,
+  GST_AV1_NUM_REF_FRAMES
+} GstAV1ReferenceFrame;
+
+/**
+ * GstAV1WarpModelType:
+ * @GST_AV1_WARP_MODEL_IDENTITY: Warp model is the identity transform
+ * @GST_AV1_WARP_MODEL_TRANSLATION: Warp model is a pure translation
+ * @GST_AV1_WARP_MODEL_ROTZOOM: Warp model is a rotation + symmetric zoom
+ *     + translation
+ * @GST_AV1_WARP_MODEL_AFFINE: Warp model is a general affine transform
+ */
+typedef enum {
+  GST_AV1_WARP_MODEL_IDENTITY = 0,
+  GST_AV1_WARP_MODEL_TRANSLATION = 1,
+  GST_AV1_WARP_MODEL_ROTZOOM = 2,
+  GST_AV1_WARP_MODEL_AFFINE = 3,
+} GstAV1WarpModelType;
+
+/**
+ * GstAV1OBUHeader:
+ * @obu_type: the type of data structure contained in the OBU payload.
+ * @obu_extention_flag: indicates if the OBU header extension is present.
+ * @obu_has_size_field: equal to 1 indicates that the obu_size syntax element will be
+ *   present. @obu_has_size_field equal to 0 indicates that the obu_size syntax element
+ *   will not be present.
+ * @obu_temporal_id: specifies the temporal level of the data contained in the OBU.
+ * @obu_spatial_id: specifies the spatial level of the data contained in the OBU.
+ *
+ * Collects info for the OBU header and the OBU extension header if
+ * @obu_extention_flag == 1.
+ */
+struct _GstAV1OBUHeader {
+  GstAV1OBUType obu_type;
+  gboolean obu_extention_flag;
+  gboolean obu_has_size_field;
+  guint8 obu_temporal_id;
+  guint8 obu_spatial_id;
+};
+
+/**
+ * GstAV1OBU:
+ * @header: a #GstAV1OBUHeader OBU Header
+ * @obu_type: the type of data structure contained in the OBU payload.
+ * @data: references the current data chunk that holds the OBU
+ * @obu_size: size of the OBU, not including the header size
+ *
+ * The general representation of an AV1 OBU (Open Bitstream
+ * Unit). One OBU includes its header and payload.
+ */
+struct _GstAV1OBU {
+  GstAV1OBUHeader header;
+  GstAV1OBUType obu_type;
+  guint8 *data;
+  guint32 obu_size;
+};
+
+/**
+ * GstAV1OperatingPoint:
+ * @seq_level_idx: specifies the level that the coded video sequence conforms to.
+ * @seq_tier: specifies the tier that the coded video sequence conforms to.
+ * @idc: contains a bitmask that indicates which spatial and temporal layers should be
+ *   decoded. Bit k is equal to 1 if temporal layer k should be decoded (for k between
+ *   0 and 7). Bit j+8 is equal to 1 if spatial layer j should be decoded (for j between
+ *   0 and 3).
+ * @decoder_model_present_for_this_op: equal to one indicates that there is a decoder model
+ *   associated with this operating point. @decoder_model_present_for_this_op equal to zero
+ *   indicates that there is not a decoder model associated.
+ * @decoder_buffer_delay: specifies the time interval between the arrival of the first bit
+ *   in the smoothing buffer and the subsequent removal of the data that belongs to the
+ *   first coded frame for operating point op, measured in units of 1/90000 seconds. The
+ *   length of @decoder_buffer_delay is specified by buffer_delay_length_minus_1 + 1, in bits.
+ * @encoder_buffer_delay: specifies, in combination with @decoder_buffer_delay syntax element,
+ *   the first bit arrival time of frames to be decoded to the smoothing buffer.
+ *   @encoder_buffer_delay is measured in units of 1/90000 seconds. For a video sequence that
+ *   includes one or more random access points the sum of @decoder_buffer_delay and
+ *   @encoder_buffer_delay shall be kept constant.
+ * @low_delay_mode_flag: equal to 1 indicates that the smoothing buffer operates in low-delay
+ *   mode for operating point op. In low-delay mode late decode times and buffer underflow
+ *   are both permitted. @low_delay_mode_flag equal to 0 indicates that the smoothing buffer
+ *   operates in strict mode, where buffer underflow is not allowed.
+ * @initial_display_delay_present_for_this_op: equal to 1 indicates that
+ *   @initial_display_delay_minus_1 is specified for this operating point. 0 indicates that
+ *   @initial_display_delay_minus_1 is not specified for this operating point.
+ * @initial_display_delay_minus_1: plus 1 specifies, for operating point i, the number of
+ *   decoded frames that should be present in the buffer pool before the first presentable
+ *   frame is displayed. This will ensure that all presentable frames in the sequence can
+ *   be decoded at or before the time that they are scheduled for display.
+ */
+struct _GstAV1OperatingPoint {
+  guint8 seq_level_idx;
+  guint8 seq_tier;
+  guint16 idc;
+  gboolean decoder_model_present_for_this_op;
+  guint8 decoder_buffer_delay; /* NOTE(review): element is buffer_delay_length_minus_1 + 1 bits; confirm guint8 cannot truncate */
+  guint8 encoder_buffer_delay; /* NOTE(review): same width concern as decoder_buffer_delay */
+  gboolean low_delay_mode_flag;
+  gboolean initial_display_delay_present_for_this_op;
+  guint8 initial_display_delay_minus_1;
+};
+
+/**
+ * GstAV1DecoderModelInfo:
+ * @buffer_delay_length_minus_1: plus 1 specifies the length of the
+ *   decoder_buffer_delay and the encoder_buffer_delay syntax elements
+ *   (see #GstAV1OperatingPoint), in bits.
+ * @num_units_in_decoding_tick: is the number of time units of a decoding clock
+ *   operating at the frequency time_scale Hz (see #GstAV1TimingInfo) that
+ *   corresponds to one increment of a clock tick counter.
+ * @buffer_removal_time_length_minus_1: plus 1 specifies the length of the
+ *   buffer_removal_time syntax element, in bits.
+ * @frame_presentation_time_length_minus_1: plus 1 specifies the length of the
+ *   frame_presentation_time syntax element, in bits.
+ */
+struct _GstAV1DecoderModelInfo {
+  guint8 buffer_delay_length_minus_1;
+  guint32 num_units_in_decoding_tick;
+  guint8 buffer_removal_time_length_minus_1;
+  guint8 frame_presentation_time_length_minus_1;
+};
+
+/**
+ * GstAV1TimingInfo:
+ * @num_units_in_display_tick: is the number of time units of a clock operating at the
+ *   frequency @time_scale Hz that corresponds to one increment of a clock tick counter.
+ *   A clock tick, in seconds, is equal to @num_units_in_display_tick divided by @time_scale.
+ *   It is a requirement of bitstream conformance that @num_units_in_display_tick is greater
+ *   than 0.
+ * @time_scale: is the number of time units that pass in one second. It is a requirement of
+ *   bitstream conformance that @time_scale is greater than 0.
+ * @equal_picture_interval: equal to 1 indicates that pictures should be displayed according
+ *   to their output order with the number of ticks between two consecutive pictures (without
+ *   dropping frames) specified by @num_ticks_per_picture_minus_1 + 1. @equal_picture_interval
+ *   equal to 0 indicates that the interval between two consecutive pictures is not specified.
+ * @num_ticks_per_picture_minus_1: plus 1 specifies the number of clock ticks corresponding
+ *   to output time between two consecutive pictures in the output order. It is a requirement
+ *   of bitstream conformance that the value of @num_ticks_per_picture_minus_1 shall be in the
+ *   range of 0 to (1 << 32) - 2, inclusive.
+ */
+struct _GstAV1TimingInfo {
+  guint32 num_units_in_display_tick;
+  guint32 time_scale;
+  gboolean equal_picture_interval;
+  guint32 num_ticks_per_picture_minus_1;
+};
+
+/**
+ * GstAV1ColorConfig:
+ * @high_bitdepth: syntax element which, together with seq_profile, determines the bit depth.
+ * @twelve_bit: syntax element which, together with seq_profile and @high_bitdepth,
+ *   determines the bit depth.
+ * @mono_chrome: equal to 1 indicates that the video does not contain U and V color planes.
+ *   @mono_chrome equal to 0 indicates that the video contains Y, U, and V color planes.
+ * @color_description_present_flag: equal to 1 specifies that @color_primaries,
+ *   @transfer_characteristics, and @matrix_coefficients are present.
+ *   @color_description_present_flag equal to 0 specifies that @color_primaries,
+ *   @transfer_characteristics and @matrix_coefficients are not present.
+ * @color_primaries: is an integer that is defined by the "Color primaries" section of
+ *   ISO/IEC 23091-4/ITU-T H.273.
+ * @transfer_characteristics: is an integer that is defined by the "Transfer characteristics"
+ *   section of ISO/IEC 23091-4/ITU-T H.273.
+ * @matrix_coefficients: is an integer that is defined by the "Matrix coefficients" section
+ *   of ISO/IEC 23091-4/ITU-T H.273.
+ * @color_range: is a binary value that is associated with the VideoFullRangeFlag variable
+ *   specified in ISO/IEC 23091-4/ITU-T H.273. @color_range equal to 0 shall be referred to
+ *   as the studio swing representation and @color_range equal to 1 shall be referred to as
+ *   the full swing representation for all intents relating to this specification.
+ * @subsampling_x, @subsampling_y: specify the chroma subsampling format. If
+ *   @matrix_coefficients is equal to GST_AV1_MC_IDENTITY, it is a requirement of bitstream
+ *   conformance that @subsampling_x is equal to 0 and @subsampling_y is equal to 0.
+ * @chroma_sample_position: specifies the sample position for subsampled streams.
+ * @separate_uv_delta_q: equal to 1 indicates that the U and V planes may have separate
+ *  delta quantizer values. @separate_uv_delta_q equal to 0 indicates that the U and V
+ *  planes will share the same delta quantizer value.
+ */
+struct _GstAV1ColorConfig {
+  gboolean high_bitdepth;
+  gboolean twelve_bit;
+  gboolean mono_chrome;
+  gboolean color_description_present_flag;
+  GstAV1ColorPrimaries color_primaries;
+  GstAV1TransferCharacteristics transfer_characteristics;
+  GstAV1MatrixCoefficients matrix_coefficients;
+  gboolean color_range;
+  guint8 subsampling_x;
+  guint8 subsampling_y;
+  GstAV1ChromaSamplePositions chroma_sample_position;
+  gboolean separate_uv_delta_q;
+};
+
+/**
+ * GstAV1SequenceHeaderOBU:
+ * @seq_profile: specifies the features that can be used in the coded video sequence
+ * @still_picture: equal to 1 specifies that the bitstream contains only one coded frame.
+ * @reduced_still_picture_header: specifies that the syntax elements not needed by a still
+ *   picture are omitted.
+ * @frame_width_bits_minus_1: specifies the number of bits minus 1 used for transmitting
+ *   the frame width syntax elements.
+ * @frame_height_bits_minus_1: specifies the number of bits minus 1 used for transmitting
+ *   the frame height syntax elements.
+ * @max_frame_width_minus_1: specifies the maximum frame width minus 1 for the frames
+ *   represented by this sequenceheader.
+ * @max_frame_height_minus_1: specifies the maximum frame height minus 1 for the frames
+ *   represented by this sequenceheader.
+ * @frame_id_numbers_present_flag: specifies whether frame id numbers are present in the bitstream.
+ * @delta_frame_id_length_minus_2: specifies the number of bits minus 2 used to encode
+ *   delta_frame_id syntax elements.
+ * @additional_frame_id_length_minus_1: is used to calculate the number of bits used to
+ *   encode the frame_id syntax element.
+ * @use_128x128_superblock: when equal to 1, indicates that superblocks contain 128x128 luma
+ *   samples. When equal to 0, it indicates that superblocks contain 64x64 luma samples.
+ *   (The number of contained chroma samples depends on @subsampling_x and @subsampling_y).
+ * @enable_filter_intra: equal to 1 specifies that the @use_filter_intra syntax element may
+ *   be present. @enable_filter_intra equal to 0 specifies that the @use_filter_intra syntax
+ *   element will not be present.
+ * @enable_intra_edge_filter: specifies whether the intra edge filtering process should be enabled.
+ * @enable_interintra_compound: equal to 1 specifies that the mode info for inter blocks may
+ *   contain the syntax element interintra. @enable_interintra_compound equal to 0 specifies
+ *   that the syntax element interintra will not be present.
+ * @enable_masked_compound: equal to 1 specifies that the mode info for inter blocks may
+ *   contain the syntax element @compound_type. @enable_masked_compound equal to 0 specifies
+ *   that the syntax element @compound_type will not be present.
+ * @enable_warped_motion: equal to 1 indicates that the allow_warped_motion syntax element
+ *   may be present. @enable_warped_motion equal to 0 indicates that the @allow_warped_motion
+ *   syntax element will not be present.
+ * @enable_order_hint: equal to 1 indicates that tools based on the values of order hints
+ *   may be used. @enable_order_hint equal to 0 indicates that tools based on order hints
+ *   are disabled.
+ * @enable_dual_filter: equal to 1 indicates that the inter prediction filter type may be
+ *   specified independently in the horizontal and vertical directions. If the flag is equal
+ *   to 0, only one filter type may be specified, which is then used in both directions.
+ * @enable_jnt_comp: equal to 1 indicates that the distance weights process may be used
+ *   for inter prediction.
+ * @enable_ref_frame_mvs: equal to 1 indicates that the @use_ref_frame_mvs syntax element
+ *   may be present. @enable_ref_frame_mvs equal to 0 indicates that the @use_ref_frame_mvs
+ *   syntax element will not be present.
+ * @seq_choose_screen_content_tools: equal to 0 indicates that the @seq_force_screen_content_tools
+ *   syntax element will be present. @seq_choose_screen_content_tools equal to 1 indicates
+ *   that @seq_force_screen_content_tools should be set equal to SELECT_SCREEN_CONTENT_TOOLS.
+ * @seq_force_screen_content_tools: equal to SELECT_SCREEN_CONTENT_TOOLS indicates that the
+ *   @allow_screen_content_tools syntax element will be present in the frame header. Otherwise,
+ *   @seq_force_screen_content_tools contains the value for @allow_screen_content_tools.
+ * @seq_choose_integer_mv: equal to 0 indicates that the seq_force_integer_mv syntax element
+ *   will be present. @seq_choose_integer_mv equal to 1 indicates that @seq_force_integer_mv
+ *   should be set equal to SELECT_INTEGER_MV.
+ * @seq_force_integer_mv: equal to SELECT_INTEGER_MV indicates that the @force_integer_mv
+ *   syntax element will be present in the frame header (providing allow_screen_content_tools
+ *   is equal to 1). Otherwise, @seq_force_integer_mv contains the value for @force_integer_mv.
+ * @order_hint_bits_minus_1: is used to compute OrderHintBits.
+ * @enable_superres: equal to 1 specifies that the use_superres syntax element will be present
+ *   in the uncompressed header. enable_superres equal to 0 specifies that the use_superres
+ *   syntax element will not be present (instead use_superres will be set to 0 in the
+ *   uncompressed header without being read).
+ * @enable_cdef: equal to 1 specifies that cdef filtering may be enabled. enable_cdef equal
+ *   to 0 specifies that cdef filtering is disabled.
+ * @enable_restoration: equal to 1 specifies that loop restoration filtering may be enabled.
+ *   enable_restoration equal to 0 specifies that loop restoration filtering is disabled.
+ * @film_grain_params_present: specifies whether film grain parameters are present in the bitstream.
+ * @operating_points_cnt_minus_1: indicates the number of operating points minus 1 present
+ *   in this bitstream.
+ * @operating_points: specifies the corresponding operating point for a set of operating
+ *   parameters.
+ * @decoder_model_info_present_flag: specifies whether the decoder model info is present in
+ *   the bitstream.
+ * @decoder_model_info: holds information about the decoder model.
+ * @initial_display_delay_present_flag: specifies whether initial display delay information
+ *   is present in the bitstream or not.
+ * @timing_info_present_flag: specifies whether timing info is present in the bitstream.
+ * @timing_info: holds the timing information.
+ * @color_config: holds the color configuration.
+ * @order_hint_bits: specifies the number of bits used for the order_hint syntax element.
+ * @bit_depth: the bit depth of the stream.
+ * @num_planes: the number of YUV planes.
+ */
+struct _GstAV1SequenceHeaderOBU {
+  GstAV1Profile seq_profile;
+  gboolean still_picture;
+  guint8 reduced_still_picture_header;
+
+  guint8 frame_width_bits_minus_1;
+  guint8 frame_height_bits_minus_1;
+  guint16 max_frame_width_minus_1;
+  guint16 max_frame_height_minus_1;
+
+  gboolean frame_id_numbers_present_flag;
+  guint8 delta_frame_id_length_minus_2;
+  guint8 additional_frame_id_length_minus_1;
+
+  gboolean use_128x128_superblock;
+  gboolean enable_filter_intra;
+  gboolean enable_intra_edge_filter;
+  gboolean enable_interintra_compound;
+  gboolean enable_masked_compound;
+  gboolean enable_warped_motion;
+  gboolean enable_order_hint;
+  gboolean enable_dual_filter;
+  gboolean enable_jnt_comp;
+  gboolean enable_ref_frame_mvs;
+  gboolean seq_choose_screen_content_tools;
+  guint8 seq_force_screen_content_tools;
+  gboolean seq_choose_integer_mv;
+  guint8 seq_force_integer_mv;
+  gint8 order_hint_bits_minus_1; /* NOTE(review): signed, unlike its neighbours - presumably so a negative value can mark "absent"; confirm in the parser */
+
+  gboolean enable_superres;
+  gboolean enable_cdef;
+  gboolean enable_restoration;
+
+  guint8 film_grain_params_present;
+
+  guint8 operating_points_cnt_minus_1;
+  GstAV1OperatingPoint operating_points[GST_AV1_MAX_OPERATING_POINTS]; /* presumably only the first operating_points_cnt_minus_1 + 1 entries are filled - TODO confirm */
+
+  gboolean decoder_model_info_present_flag;
+  GstAV1DecoderModelInfo decoder_model_info;
+  guint8 initial_display_delay_present_flag;
+
+  gboolean timing_info_present_flag;
+  GstAV1TimingInfo timing_info;
+
+  GstAV1ColorConfig color_config;
+
+  /* Variables calculated from the sequence header; trailing comments give the spec-style variable name */
+  guint8 order_hint_bits; /* OrderHintBits */
+  guint8 bit_depth; /* BitDepth */
+  guint8 num_planes; /* NumPlanes */
+};
+
+/**
+ * GstAV1MetadataITUT_T35:
+ * @itu_t_t35_country_code: shall be a byte having a value specified as a country code by
+ *   Annex A of Recommendation ITU-T T.35.
+ * @itu_t_t35_country_code_extention_byte: shall be a byte having a value specified as a
+ *   country code by Annex B of Recommendation ITU-T T.35.
+ * @itu_t_t35_payload_bytes: shall be bytes containing data registered as specified in
+ *   Recommendation ITU-T T.35.
+ */
+struct _GstAV1MetadataITUT_T35 {
+  guint8 itu_t_t35_country_code;
+  guint8 itu_t_t35_country_code_extention_byte; /* sic: "extention" is the actual (public) field name */
+  /* itu_t_t35_payload_bytes - content not specified by this spec; NOTE(review): no length field accompanies the pointer - confirm size/ownership with the parser */
+  guint8 *itu_t_t35_payload_bytes;
+};
+
+/**
+ * GstAV1MetadataHdrCll:
+ * @max_cll: specifies the maximum content light level as specified in CEA-861.3, Appendix A.
+ * @max_fall: specifies the maximum frame-average light level as specified in CEA-861.3, Appendix A.
+ *
+ * High Dynamic Range content light level (HDR CLL) metadata.
+ */
+struct _GstAV1MetadataHdrCll {
+  guint16 max_cll;  /* maximum content light level */
+  guint16 max_fall; /* maximum frame-average light level */
+};
+
+/**
+ * GstAV1MetadataHdrMdcv:
+ * @primary_chromaticity_x: specifies a 0.16 fixed-point X chromaticity coordinate as
+ *   defined by CIE 1931, where array index i = 0,1,2 selects Red, Green, Blue respectively.
+ * @primary_chromaticity_y: specifies a 0.16 fixed-point Y chromaticity coordinate as
+ *   defined by CIE 1931, where array index i = 0,1,2 selects Red, Green, Blue respectively.
+ * @white_point_chromaticity_x: specifies a 0.16 fixed-point white X chromaticity coordinate
+ *   as defined by CIE 1931.
+ * @white_point_chromaticity_y: specifies a 0.16 fixed-point white Y chromaticity coordinate
+ *   as defined by CIE 1931.
+ * @luminance_max: is a 24.8 fixed-point maximum luminance, represented in candelas per
+ *   square meter.
+ * @luminance_min: is a 18.14 fixed-point minimum luminance, represented in candelas per
+ *   square meter.
+ *
+ * High Dynamic Range mastering display color volume (HDR MDCV) metadata.
+ */
+struct _GstAV1MetadataHdrMdcv {
+  guint16 primary_chromaticity_x[3]; /* 0 = Red, 1 = Green, 2 = Blue */
+  guint16 primary_chromaticity_y[3]; /* 0 = Red, 1 = Green, 2 = Blue */
+  guint16 white_point_chromaticity_x;
+  guint16 white_point_chromaticity_y;
+  guint32 luminance_max; /* 24.8 fixed point, cd/m^2 */
+  guint32 luminance_min; /* 18.14 fixed point, cd/m^2 */
+};
+
+/**
+ * GstAV1MetadataScalability:
+ * @scalability_mode_idc: indicates the picture prediction structure of the bitstream.
+ * @spatial_layers_cnt_minus_1: indicates the number of spatial layers present in the video
+ *   sequence minus one.
+ * @spatial_layer_description_present_flag: indicates when set to 1 that the
+ *   @spatial_layer_ref_id is present for each of the (@spatial_layers_cnt_minus_1 + 1) layers,
+ *   or that it is not present when set to 0.
+ * @spatial_layer_dimensions_present_flag: indicates when set to 1 that the
+ *   @spatial_layer_max_width and @spatial_layer_max_height parameters are present for each of
+ *   the (@spatial_layers_cnt_minus_1 + 1) layers, or that they are not present when set to 0.
+ * @temporal_group_description_present_flag: indicates when set to 1 that the temporal
+ *   dependency information is present, or that it is not when set to 0.
+ * @spatial_layer_max_width: specifies the maximum frame width for the frames with
+ *   @spatial_id equal to i. This number must not be larger than @max_frame_width_minus_1 + 1.
+ * @spatial_layer_max_height: specifies the maximum frame height for the frames with
+ *   @spatial_id equal to i. This number must not be larger than @max_frame_height_minus_1 + 1.
+ * @spatial_layer_ref_id: specifies the @spatial_id value of the frame within the current
+ *   temporal unit that the frame of layer i uses for reference. If no frame within the
+ *   current temporal unit is used for reference the value must be equal to 255.
+ * @temporal_group_size: indicates the number of pictures in a temporal picture group. If the
+ *   @temporal_group_size is greater than 0, then the scalability structure data allows the
+ *   inter-picture temporal dependency structure of the video sequence to be specified. If the
+ *   @temporal_group_size is greater than 0, then for @temporal_group_size pictures in the
+ *   temporal group, each picture's temporal layer id (@temporal_id), switch up points
+ *   (@temporal_group_temporal_switching_up_point_flag and
+ *   @temporal_group_spatial_switching_up_point_flag), and the reference picture indices
+ *   (@temporal_group_ref_pic_diff) are specified. The first picture specified in a temporal
+ *   group must have @temporal_id equal to 0. If the parameter @temporal_group_size is not
+ *   present or set to 0, then either there is only one temporal layer or there is no fixed
+ *   inter-picture temporal dependency present going forward in the video sequence. Note that
+ *   for a given picture, all frames follow the same inter-picture temporal dependency
+ *   structure. However, the frame rate of each layer can be different from each other. The
+ *   specified dependency structure in the scalability structure data must be for the highest
+ *   frame rate layer.
+ * @temporal_group_temporal_id: specifies the temporal_id value for the i-th picture in
+ *   the temporal group.
+ * @temporal_group_temporal_switching_up_point_flag: is set to 1 if subsequent (in decoding
+ *   order) pictures with a @temporal_id higher than @temporal_group_temporal_id[ i ] do not
+ *   depend on any picture preceding the current picture (in coding order) with @temporal_id
+ *   higher than @temporal_group_temporal_id[ i ].
+ * @temporal_group_spatial_switching_up_point_flag: is set to 1 if spatial layers of the
+ *   current picture in the temporal group (i.e., pictures with a spatial_id higher than zero)
+ *   do not depend on any picture preceding the current picture in the temporal group.
+ * @temporal_group_ref_cnt: indicates the number of reference pictures used by the i-th
+ *   picture in the temporal group.
+ * @temporal_group_ref_pic_diff: indicates, for the i-th picture in the temporal group,
+ *   the temporal distance between the i-th picture and the j-th reference picture used by
+ *   the i-th picture. The temporal distance is measured in frames, counting only frames of
+ *   identical @spatial_id values.
+ *
+ * The scalability metadata OBU is intended for use by intermediate
+ * processing entities that may perform selective layer elimination.
+ */
+struct _GstAV1MetadataScalability {
+  GstAV1ScalabilityModes scalability_mode_idc;
+  guint8 spatial_layers_cnt_minus_1;
+  gboolean spatial_layer_dimensions_present_flag;
+  gboolean spatial_layer_description_present_flag;
+  gboolean temporal_group_description_present_flag;
+  guint16 spatial_layer_max_width[GST_AV1_MAX_SPATIAL_LAYERS];  /* indexed by spatial layer i */
+  guint16 spatial_layer_max_height[GST_AV1_MAX_SPATIAL_LAYERS]; /* indexed by spatial layer i */
+  guint8 spatial_layer_ref_id[GST_AV1_MAX_SPATIAL_LAYERS];      /* 255 = no reference in the current temporal unit */
+  guint8 temporal_group_size;
+
+  guint8 temporal_group_temporal_id[GST_AV1_MAX_TEMPORAL_GROUP_SIZE];
+  guint8 temporal_group_temporal_switching_up_point_flag[GST_AV1_MAX_TEMPORAL_GROUP_SIZE];
+  guint8 temporal_group_spatial_switching_up_point_flag[GST_AV1_MAX_TEMPORAL_GROUP_SIZE];
+  guint8 temporal_group_ref_cnt[GST_AV1_MAX_TEMPORAL_GROUP_SIZE];
+  guint8 temporal_group_ref_pic_diff[GST_AV1_MAX_TEMPORAL_GROUP_SIZE]
+                                    [GST_AV1_MAX_TEMPORAL_GROUP_REFERENCES]; /* [picture i][reference j] */
+};
+
+/**
+ * GstAV1MetadataTimecode:
+ * @counting_type: specifies the method of dropping values of the n_frames syntax element as
+ *   specified in AV1 Spec 6.1.1. @counting_type should be the same for all pictures in the
+ *   coded video sequence.
+ * @full_timestamp_flag: equal to 1 indicates that the @seconds_value, @minutes_value,
+ *   @hours_value syntax elements will be present. @full_timestamp_flag equal to 0 indicates
+ *   that there are flags to control the presence of these syntax elements.
+ * @discontinuity_flag: equal to 0 indicates that the difference between the current value
+ *   of clockTimestamp and the value of clockTimestamp computed from the previous set of
+ *   timestamp syntax elements in output order can be interpreted as the time difference
+ *   between the times of origin or capture of the associated frames or fields.
+ *   @discontinuity_flag equal to 1 indicates that the difference between the current value of
+ *   clockTimestamp and the value of clockTimestamp computed from the previous set of clock
+ *   timestamp syntax elements in output order should not be interpreted as the time difference
+ *   between the times of origin or capture of the associated frames or fields.
+ * @cnt_dropped_flag: specifies the skipping of one or more values of @n_frames using the
+ *   counting method specified by @counting_type.
+ * @n_frames: is used to compute clockTimestamp. When @timing_info_present_flag is equal to 1,
+ *   @n_frames shall be less than maxFps, where maxFps is specified by
+ *   maxFps = ceil( time_scale / ( 2 * @num_units_in_display_tick ) ).
+ * @seconds_flag: equal to 1 specifies that @seconds_value and @minutes_flag are present when
+ *   @full_timestamp_flag is equal to 0. @seconds_flag equal to 0 specifies that @seconds_value
+ *   and @minutes_flag are not present.
+ * @seconds_value: is used to compute clockTimestamp and shall be in the range of 0 to 59.
+ *   When @seconds_value is not present, its value is inferred to be equal to the value of
+ *   @seconds_value for the previous set of clock timestamp syntax elements in decoding order,
+ *   and it is required that such a previous @seconds_value shall have been present.
+ * @minutes_flag: equal to 1 specifies that @minutes_value and @hours_flag are present when
+ *   @full_timestamp_flag is equal to 0 and @seconds_flag is equal to 1. @minutes_flag equal to 0
+ *   specifies that @minutes_value and @hours_flag are not present.
+ * @minutes_value: specifies the value of mm used to compute clockTimestamp and shall be in
+ *   the range of 0 to 59, inclusive. When @minutes_value is not present, its value is inferred
+ *   to be equal to the value of @minutes_value for the previous set of clock timestamp syntax
+ *   elements in decoding order, and it is required that such a previous @minutes_value shall
+ *   have been present.
+ * @hours_flag: equal to 1 specifies that @hours_value is present when @full_timestamp_flag is
+ *   equal to 0 and @seconds_flag is equal to 1 and @minutes_flag is equal to 1.
+ * @hours_value: is used to compute clockTimestamp and shall be in the range of 0 to 23,
+ *   inclusive. When @hours_value is not present, its value is inferred to be equal to the
+ *   value of @hours_value for the previous set of clock timestamp syntax elements in decoding
+ *   order, and it is required that such a previous @hours_value shall have been present.
+ * @time_offset_length: greater than 0 specifies the length in bits of the @time_offset_value
+ *   syntax element. @time_offset_length equal to 0 specifies that the @time_offset_value syntax
+ *   element is not present. @time_offset_length should be the same for all pictures in the
+ *   coded video sequence.
+ * @time_offset_value: is used to compute clockTimestamp. The number of bits used to represent
+ *   @time_offset_value is equal to @time_offset_length. When @time_offset_value is not present,
+ *   its value is inferred to be equal to 0.
+ */
+struct _GstAV1MetadataTimecode {
+  guint8 counting_type;       /* candidate for a separate type GstAV1TimecodeCountingType */
+  gboolean full_timestamp_flag;
+  gboolean discontinuity_flag;
+  gboolean cnt_dropped_flag;
+  guint8 n_frames;
+  gboolean seconds_flag;
+  guint8 seconds_value;       /* 0..59 */
+  gboolean minutes_flag;
+  guint8 minutes_value;       /* 0..59 */
+  gboolean hours_flag;
+  guint8 hours_value;         /* 0..23 */
+  guint8 time_offset_length;  /* bit length of time_offset_value; 0 = not present */
+  guint32 time_offset_value;
+};
+
+/**
+ * GstAV1MetadataOBU:
+ * @metadata_type: type of metadata
+ * @itut_t35: ITUT T35 metadata
+ * @hdr_cll: high dynamic range content light level metadata
+ * @hdr_mdcv: high dynamic range mastering display color volume metadata
+ * @scalability: Scalability metadata
+ * @timecode: Timecode metadata
+ */
+struct _GstAV1MetadataOBU {
+  GstAV1MetadataType metadata_type;
+  union { /* NOTE(review): presumably metadata_type tells which member is valid - confirm in the parser */
+    GstAV1MetadataITUT_T35 itut_t35;
+    GstAV1MetadataHdrCll hdr_cll;
+    GstAV1MetadataHdrMdcv hdr_mdcv;
+    GstAV1MetadataScalability scalability;
+    GstAV1MetadataTimecode timecode;
+  };
+};
+
+/**
+ * GstAV1LoopFilterParams:
+ * @loop_filter_level: is an array containing loop filter strength values. Different loop
+ *   filter strength values from the array are used depending on the image plane being
+ *   filtered, and the edge direction (vertical or horizontal) being filtered.
+ * @loop_filter_sharpness: indicates the sharpness level. The @loop_filter_level and
+ *   @loop_filter_sharpness together determine when a block edge is filtered, and by how much
+ *   the filtering can change the sample values. The loop filter process is described in AV1
+ *   Bitstream Spec. section 7.14.
+ * @loop_filter_delta_enabled: equal to 1 means that the filter level depends on the mode and
+ *   reference frame used to predict a block. @loop_filter_delta_enabled equal to 0 means that
+ *   the filter level does not depend on the mode and reference frame.
+ * @loop_filter_delta_update: equal to 1 means that the bitstream contains additional syntax
+ *   elements that specify which mode and reference frame deltas are to be updated.
+ *   @loop_filter_delta_update equal to 0 means that these syntax elements are not present.
+ * @loop_filter_ref_deltas: contains the adjustment needed for the filter level based on
+ *   the chosen reference frame. If this syntax element is not present in the bitstream,
+ *   it maintains its previous value.
+ * @loop_filter_mode_deltas: contains the adjustment needed for the filter level based on
+ *   the chosen mode. If this syntax element is not present in the bitstream, it maintains
+ *   its previous value.
+ * @delta_lf_present: specifies whether loop filter delta values are present in the bitstream.
+ * @delta_lf_res: specifies the left shift which should be applied to decoded loop filter
+ *   delta values.
+ * @delta_lf_multi: equal to 1 specifies that separate loop filter deltas are sent for
+ *   horizontal luma edges, vertical luma edges, the U edges, and the V edges. @delta_lf_multi
+ *   equal to 0 specifies that the same loop filter delta is used for all edges.
+ */
+struct _GstAV1LoopFilterParams {
+  guint8 loop_filter_level[4]; /* strength values, selected by plane and edge direction */
+  guint8 loop_filter_sharpness;
+  gboolean loop_filter_delta_enabled;
+  gboolean loop_filter_delta_update;
+
+  gint8 loop_filter_ref_deltas[GST_AV1_TOTAL_REFS_PER_FRAME]; /* signed adjustment per reference frame */
+  gint8 loop_filter_mode_deltas[2]; /* signed adjustment per mode */
+
+  gboolean delta_lf_present;
+  guint8 delta_lf_res; /* left shift applied to decoded deltas */
+  guint8 delta_lf_multi; /* 1 = separate deltas per edge type, 0 = one delta for all edges */
+};
+
+/**
+ * GstAV1QuantizationParams:
+ * @base_q_idx: indicates the base frame qindex. This is used for Y AC coefficients and as
+ *   the base value for the other quantizers.
+ * @diff_uv_delta: equal to 1 indicates that the U and V delta quantizer values are coded
+ *   separately. @diff_uv_delta equal to 0 indicates that the U and V delta quantizer values
+ *   share a common value.
+ * @using_qmatrix: specifies that the quantizer matrix will be used to compute quantizers.
+ * @qm_y: specifies the level in the quantizer matrix that should be used for luma plane decoding.
+ * @qm_u: specifies the level in the quantizer matrix that should be used for chroma U plane decoding.
+ * @qm_v: specifies the level in the quantizer matrix that should be used for chroma V plane decoding.
+ * @delta_q_present: specifies whether quantizer index delta values are present in the bitstream.
+ * @delta_q_res: specifies the left shift which should be applied to decoded quantizer index
+ *   delta values.
+ * @delta_q_y_dc: indicates the Y DC quantizer relative to @base_q_idx.
+ * @delta_q_u_dc: indicates the U DC quantizer relative to @base_q_idx.
+ * @delta_q_u_ac: indicates the U AC quantizer relative to @base_q_idx.
+ * @delta_q_v_dc: indicates the V DC quantizer relative to @base_q_idx.
+ * @delta_q_v_ac: indicates the V AC quantizer relative to @base_q_idx.
+ */
+struct _GstAV1QuantizationParams {
+  guint8 base_q_idx;
+  gboolean diff_uv_delta;
+  gboolean using_qmatrix;
+  guint8 qm_y;
+  guint8 qm_u;
+  guint8 qm_v;
+
+  gboolean delta_q_present;
+  guint8 delta_q_res; /* left shift applied to decoded quantizer index deltas */
+
+  gint8 delta_q_y_dc; /* DeltaQYDc, signed offset from base_q_idx */
+  gint8 delta_q_u_dc; /* DeltaQUDc, signed offset from base_q_idx */
+  gint8 delta_q_u_ac; /* DeltaQUAc, signed offset from base_q_idx */
+  gint8 delta_q_v_dc; /* DeltaQVDc, signed offset from base_q_idx */
+  gint8 delta_q_v_ac; /* DeltaQVAc, signed offset from base_q_idx */
+};
+
+/**
+ * GstAV1SegmenationParams:
+ * @segmentation_enabled: equal to 1 indicates that this frame makes use of the segmentation
+ *   tool; @segmentation_enabled equal to 0 indicates that the frame does not use segmentation.
+ * @segmentation_update_map: equal to 1 indicates that the segmentation map is updated during
+ *   the decoding of this frame. @segmentation_update_map equal to 0 means that the segmentation
+ *   map from the previous frame is used.
+ * @segmentation_temporal_update: equal to 1 indicates that the updates to the segmentation map
+ *   are coded relative to the existing segmentation map. @segmentation_temporal_update equal to
+ *   0 indicates that the new segmentation map is coded without reference to the existing
+ *   segmentation map.
+ * @segmentation_update_data: equal to 1 indicates that new parameters are about to be
+ *   specified for each segment. @segmentation_update_data equal to 0 indicates that the
+ *   segmentation parameters should keep their existing values.
+ * @feature_enabled: set to 1 when the given segmentation feature is enabled for a segment.
+ * @feature_data: the value of the corresponding segmentation feature.
+ * @seg_id_pre_skip: equal to 1 indicates that the segment id will be read before the skip
+ *   syntax element. @seg_id_pre_skip equal to 0 indicates that the skip syntax element will be
+ *   read first.
+ * @last_active_seg_id: indicates the highest numbered segment id that has some enabled feature.
+ *   This is used when decoding the segment id to only decode choices corresponding to used
+ *   segments.
+ */
+struct _GstAV1SegmenationParams { /* sic: "Segmenation" is the public type name */
+  gboolean segmentation_enabled;
+  guint8 segmentation_update_map;
+  guint8 segmentation_temporal_update;
+  guint8 segmentation_update_data;
+
+  gint8 feature_enabled[GST_AV1_MAX_SEGMENTS][GST_AV1_SEG_LVL_MAX]; /* FeatureEnabled[segment][feature] */
+  gint16 feature_data[GST_AV1_MAX_SEGMENTS][GST_AV1_SEG_LVL_MAX]; /* FeatureData[segment][feature] */
+  guint8 seg_id_pre_skip; /* SegIdPreSkip */
+  guint8 last_active_seg_id; /* LastActiveSegId */
+};
+
+/**
+ * GstAV1TileInfo:
+ * @uniform_tile_spacing_flag: equal to 1 means that the tiles are uniformly spaced across the
+ *   frame. (In other words, all tiles are the same size except for the ones at the right and
+ *   bottom edge which can be smaller.) @uniform_tile_spacing_flag equal to 0 means that the
+ *   tile sizes are coded.
+ * @increment_tile_rows_log2: is used to compute @tile_rows_log2.
+ * @width_in_sbs_minus_1: specifies the width of a tile minus 1 in units of superblocks.
+ * @height_in_sbs_minus_1: specifies the height of a tile minus 1 in units of superblocks.
+ * @tile_size_bytes_minus_1: is used to compute @tile_size_bytes.
+ * @context_update_tile_id: specifies which tile to use for the CDF update.
+ * @mi_col_starts: is an array specifying the start column (in units of 4x4 luma samples) for
+ *   each tile across the image.
+ * @mi_row_starts: is an array specifying the start row (in units of 4x4 luma samples) for
+ *   each tile down the image.
+ * @tile_cols_log2: specifies the base 2 logarithm of the desired number of tiles across the frame.
+ * @tile_cols: specifies the number of tiles across the frame. It is a requirement of bitstream
+ *   conformance that @tile_cols is less than or equal to GST_AV1_MAX_TILE_COLS.
+ * @tile_rows_log2: specifies the base 2 logarithm of the desired number of tiles down the frame.
+ * @tile_rows: specifies the number of tiles down the frame. It is a requirement of bitstream
+ *   conformance that @tile_rows is less than or equal to GST_AV1_MAX_TILE_ROWS.
+ * @tile_size_bytes: specifies the number of bytes needed to code each tile size.
+ */
+struct _GstAV1TileInfo {
+  guint8 uniform_tile_spacing_flag;
+  gint increment_tile_rows_log2;
+  gint width_in_sbs_minus_1[GST_AV1_MAX_TILE_COLS]; /* presumably one entry per tile column - TODO confirm */
+  gint height_in_sbs_minus_1[GST_AV1_MAX_TILE_ROWS]; /* presumably one entry per tile row - TODO confirm */
+  gint tile_size_bytes_minus_1;
+  guint8 context_update_tile_id;
+
+  guint32 mi_col_starts[GST_AV1_MAX_TILE_COLS + 1]; /* MiColStarts; one slot more than the max tile columns */
+  guint32 mi_row_starts[GST_AV1_MAX_TILE_ROWS + 1]; /* MiRowStarts; one slot more than the max tile rows */
+  guint8 tile_cols_log2; /* TileColsLog2 */
+  guint8 tile_cols; /* TileCols */
+  guint8 tile_rows_log2; /* TileRowsLog2 */
+  guint8 tile_rows; /* TileRows */
+  guint8 tile_size_bytes; /* TileSizeBytes */
+};
+
+/**
+ * GstAV1CDEFParams:
+ * @cdef_damping: controls the amount of damping in the deringing filter.
+ * @cdef_bits: specifies the number of bits needed to specify which CDEF filter to apply.
+ * @cdef_y_pri_strength: specifies the strength of the primary filter (Y component).
+ * @cdef_uv_pri_strength: specifies the strength of the primary filter (UV components).
+ * @cdef_y_sec_strength: specifies the strength of the secondary filter (Y component).
+ * @cdef_uv_sec_strength: specifies the strength of the secondary filter (UV components).
+ *
+ * Parameters of the Constrained Directional Enhancement Filter (CDEF).
+ */
+struct _GstAV1CDEFParams {
+  guint8 cdef_damping;
+  guint8 cdef_bits;
+  guint8 cdef_y_pri_strength[GST_AV1_CDEF_MAX];  /* primary filter strength, Y */
+  guint8 cdef_y_sec_strength[GST_AV1_CDEF_MAX];  /* secondary filter strength, Y */
+  guint8 cdef_uv_pri_strength[GST_AV1_CDEF_MAX]; /* primary filter strength, UV */
+  guint8 cdef_uv_sec_strength[GST_AV1_CDEF_MAX]; /* secondary filter strength, UV */
+};
+
+/**
+ * GstAV1LoopRestorationParams:
+ * @lr_unit_shift: specifies if the luma restoration size should be halved.
+ * @lr_uv_shift: is only present for 4:2:0 formats and specifies if the chroma size should be
+ *   half the luma size.
+ * @frame_restoration_type: specifies the type of restoration used for each plane.
+ * @loop_restoration_size: specifies the size of loop restoration units, in units of samples
+ *   in the current plane.
+ * @uses_lr: indicates if any plane uses loop restoration.
+ */
+struct _GstAV1LoopRestorationParams {
+  guint8 lr_unit_shift;
+  gboolean lr_uv_shift;
+
+  GstAV1FrameRestorationType frame_restoration_type[GST_AV1_MAX_NUM_PLANES]; /* FrameRestorationType, one entry per plane */
+  guint32 loop_restoration_size[GST_AV1_MAX_NUM_PLANES]; /* LoopRestorationSize, one entry per plane */
+  guint8 uses_lr; /* UsesLr */
+};
+
+/**
+ * GstAV1GlobalMotionParams:
+ * @is_global: specifies whether global motion parameters are present for a particular
+ *   reference frame.
+ * @is_rot_zoom: specifies whether a particular reference frame uses rotation and zoom
+ *   global motion.
+ * @is_translation: specifies whether a particular reference frame uses translation
+ *   global motion.
+ * @gm_params: is set equal to SavedGmParams[ frame_to_show_map_idx ][ ref ][ j ] for
+ *   ref = LAST_FRAME..ALTREF_FRAME, for j = 0..5.
+ * @gm_type: specifies the type of global motion.
+ * @invalid: whether these global motion parameters are invalid. (Since: 1.20)
+ */
+/**
+ * _GstAV1GlobalMotionParams.invalid:
+ *
+ * whether these global motion parameters are invalid.
+ *
+ * Since: 1.20
+ */
+struct _GstAV1GlobalMotionParams {
+  gboolean is_global[GST_AV1_NUM_REF_FRAMES];
+  gboolean is_rot_zoom[GST_AV1_NUM_REF_FRAMES];
+  gboolean is_translation[GST_AV1_NUM_REF_FRAMES];
+  gint32 gm_params[GST_AV1_NUM_REF_FRAMES][6]; /* [reference frame][parameter j = 0..5] */
+
+  GstAV1WarpModelType gm_type[GST_AV1_NUM_REF_FRAMES]; /* GmType */
+  gboolean invalid[GST_AV1_NUM_REF_FRAMES]; /* per reference frame; Since: 1.20 */
+};
+
+/**
+ * GstAV1FilmGrainParams:
+ * @apply_grain: equal to 1 specifies that film grain should be added to this frame.
+ *   apply_grain equal to 0 specifies that film grain should not be added.
+ * @grain_seed: specifies the starting value for the pseudo-random numbers used during film
+ *   grain synthesis.
+ * @update_grain: equal to 1 means that a new set of parameters should be sent. @update_grain
+ *   equal to 0 means that the previous set of parameters should be used.
+ * @film_grain_params_ref_idx: indicates which reference frame contains the film grain
+ *   parameters to be used for this frame.
+ * @num_y_points: specifies the number of points for the piece-wise linear scaling function
+ *   of the luma component. It is a requirement of bitstream conformance that @num_y_points is
+ *   less than or equal to 14.
+ * @point_y_value: represents the x (luma value) coordinate for the i-th point of the
+ *   piecewise linear scaling function for luma component. The values are signaled on the
+ *   scale of 0..255. (In case of 10 bit video, these values correspond to luma values divided
+ *   by 4. In case of 12 bit video, these values correspond to luma values divided by 16.)
+ *   If i is greater than 0, it is a requirement of bitstream conformance that
+ *   @point_y_value[ i ] is greater than @point_y_value[ i - 1 ] (this ensures the x coordinates
+ *   are specified in increasing order).
+ * @point_y_scaling: represents the scaling (output) value for the i-th point of the
+ *   piecewise linear scaling function for luma component.
+ * @chroma_scaling_from_luma: specifies that the chroma scaling is inferred from the luma scaling.
+ * @num_cb_points: specifies the number of points for the piece-wise linear scaling function
+ *   of the cb component. It is a requirement of bitstream conformance that @num_cb_points is
+ *   less than or equal to 10.
+ * @point_cb_value: represents the x coordinate for the i-th point of the piece-wise linear
+ *   scaling function for cb component. The values are signaled on the scale of 0..255. If i
+ *   is greater than 0, it is a requirement of bitstream conformance that point_cb_value[ i ]
+ *   is greater than point_cb_value[ i - 1 ].
+ * @point_cb_scaling: represents the scaling (output) value for the i-th point of the
+ *   piecewise linear scaling function for cb component.
+ * @num_cr_points: specifies the number of points for the piece-wise linear scaling
+ *   function of the cr component. It is a requirement of bitstream conformance that
+ *   @num_cr_points is less than or equal to 10. If @subsampling_x is equal to 1 and
+ *   @subsampling_y is equal to 1 and @num_cb_points is equal to 0, it is a requirement of
+ *   bitstream conformance that @num_cr_points is equal to 0. If @subsampling_x is equal to 1
+ *   and @subsampling_y is equal to 1 and @num_cb_points is not equal to 0, it is a requirement
+ *   of bitstream conformance that @num_cr_points is not equal to 0.
+ * @point_cr_value: represents the x coordinate for the i-th point of the piece-wise linear
+ *   scaling function for cr component. The values are signaled on the scale of 0..255. If i
+ *   is greater than 0, it is a requirement of bitstream conformance that @point_cr_value[ i ]
+ *   is greater than @point_cr_value[ i - 1 ].
+ * @point_cr_scaling: represents the scaling (output) value for the i-th point of the
+ *   piecewise linear scaling function for cr component.
+ * @grain_scaling_minus_8: represents the shift - 8 applied to the values of the chroma
+ *   component. The @grain_scaling_minus_8 can take values of 0..3 and determines the range and
+ *   quantization step of the standard deviation of film grain.
+ * @ar_coeff_lag: specifies the number of auto-regressive coefficients for luma and chroma.
+ * @ar_coeffs_y_plus_128: specifies auto-regressive coefficients used for the Y plane.
+ * @ar_coeffs_cb_plus_128: specifies auto-regressive coefficients used for the U plane.
+ * @ar_coeffs_cr_plus_128: specifies auto-regressive coefficients used for the V plane.
+ * @ar_coeff_shift_minus_6: specifies the range of the auto-regressive coefficients. Values
+ *   of 0, 1, 2, and 3 correspond to the ranges for auto-regressive coefficients of [-2, 2),
+ *   [-1, 1), [-0.5, 0.5) and [-0.25, 0.25) respectively.
+ * @grain_scale_shift: specifies how much the Gaussian random numbers should be scaled down
+ *   during the grain synthesis process.
+ * @cb_mult: represents a multiplier for the cb component used in derivation of the input
+ *   index to the cb component scaling function.
+ * @cb_luma_mult: represents a multiplier for the average luma component used in derivation
+ *   of the input index to the cb component scaling function.
+ * @cb_offset: represents an offset used in derivation of the input index to the cb component
+ *   scaling function.
+ * @cr_mult: represents a multiplier for the cr component used in derivation of the input
+ *   index to the cr component scaling function.
+ * @cr_luma_mult: represents a multiplier for the average luma component used in derivation
+ *   of the input index to the cr component scaling function.
+ * @cr_offset: represents an offset used in derivation of the input index to the cr component
+ *   scaling function.
+ * @overlap_flag: equal to 1 indicates that the overlap between film grain blocks shall be
+ *   applied. overlap_flag equal to 0 indicates that the overlap between film grain blocks
+ *   shall not be applied.
+ * @clip_to_restricted_range: equal to 1 indicates that clipping to the restricted (studio)
+ *   range shall be applied to the sample values after adding the film grain (see the
+ *   semantics for color_range for an explanation of studio swing). clip_to_restricted_range
+ *   equal to 0 indicates that clipping to the full range shall be applied to the sample
+ *   values after adding the film grain.
+ */
+struct _GstAV1FilmGrainParams {
+  gboolean apply_grain;
+  guint16 grain_seed;
+  gboolean update_grain;
+  guint8 film_grain_params_ref_idx;
+  guint8 num_y_points;
+  guint8 point_y_value[GST_AV1_MAX_NUM_Y_POINTS]; /* x coordinates, luma */
+  guint8 point_y_scaling[GST_AV1_MAX_NUM_Y_POINTS]; /* output values, luma */
+  guint8 chroma_scaling_from_luma;
+  guint8 num_cb_points; /* <= 10 per bitstream conformance */
+  guint8 point_cb_value[GST_AV1_MAX_NUM_CB_POINTS]; /* x coordinates, scale 0..255 */
+  guint8 point_cb_scaling[GST_AV1_MAX_NUM_CB_POINTS]; /* output values, cb */
+  guint8 num_cr_points; /* <= 10 per bitstream conformance */
+  guint8 point_cr_value[GST_AV1_MAX_NUM_CR_POINTS]; /* x coordinates, scale 0..255 */
+  guint8 point_cr_scaling[GST_AV1_MAX_NUM_CR_POINTS]; /* output values, cr */
+  guint8 grain_scaling_minus_8; /* takes values 0..3 */
+  guint8 ar_coeff_lag;
+  guint8 ar_coeffs_y_plus_128[GST_AV1_MAX_NUM_POS_LUMA];
+  guint8 ar_coeffs_cb_plus_128[GST_AV1_MAX_NUM_POS_LUMA]; /* NOTE(review): sized with the luma bound; confirm it covers chroma */
+  guint8 ar_coeffs_cr_plus_128[GST_AV1_MAX_NUM_POS_LUMA]; /* NOTE(review): sized with the luma bound; confirm it covers chroma */
+  guint8 ar_coeff_shift_minus_6; /* 0..3, selects the range of the AR coefficients */
+  guint8 grain_scale_shift;
+  guint8 cb_mult;
+  guint8 cb_luma_mult;
+  guint16 cb_offset;
+  guint8 cr_mult;
+  guint8 cr_luma_mult;
+  guint16 cr_offset;
+  gboolean overlap_flag; /* 1: apply overlap between film grain blocks */
+  gboolean clip_to_restricted_range; /* 1: clip to restricted (studio) range, 0: full range */
+};
+
+/**
+ * GstAV1FrameHeaderOBU:
+ * @show_existing_frame: equal to 1, indicates the frame indexed by @frame_to_show_map_idx is
+ *   to be output; @show_existing_frame equal to 0 indicates that further processing is required.
+ *   If @obu_type is equal to #GST_AV1_OBU_FRAME, it is a requirement of bitstream conformance that
+ *   @show_existing_frame is equal to 0.
+ * @frame_to_show_map_idx: specifies the frame to be output. It is only available if
+ *   @show_existing_frame is 1.
+ * @frame_presentation_time: specifies the presentation time of the frame in clock ticks
+ *   DispCT counted from the removal time of the last frame with frame_type equal to KEY_FRAME
+ *   for the operating point that is being decoded. The syntax element is signaled as a fixed
+ *   length unsigned integer with a length in bits given by
+ *   @frame_presentation_time_length_minus_1 + 1. The @frame_presentation_time is the remainder
+ *   of a modulo 1 << (@frame_presentation_time_length_minus_1 + 1) counter.
+ * @tu_presentation_delay: is a syntax element used by the decoder model. It does not affect
+ *   the decoding process.
+ * @display_frame_id: provides the frame id number for the frame to output. It is a requirement
+ *   of bitstream conformance that whenever @display_frame_id is read, the value matches
+ *   @ref_frame_id[ @frame_to_show_map_idx ] (the value of @current_frame_id at the time that the
+ *   frame indexed by @frame_to_show_map_idx was stored), and that
+ *   @ref_valid[ @frame_to_show_map_idx ] is equal to 1. It is a requirement of bitstream
+ *   conformance that the number of bits needed to read @display_frame_id does not exceed 16.
+ *   This is equivalent to the constraint that idLen <= 16.
+ * @frame_type: specifies the type of the frame.
+ * @show_frame: equal to 1 specifies that this frame should be immediately output once decoded.
+ *   show_frame equal to 0 specifies that this frame should not be immediately output. (It may
+ *   be output later if a later uncompressed header uses @show_existing_frame equal to 1).
+ * @showable_frame: equal to 1 specifies that the frame may be output using the
+ *   @show_existing_frame mechanism. showable_frame equal to 0 specifies that this frame will
+ *   not be output using the @show_existing_frame mechanism. It is a requirement of bitstream
+ *   conformance that when @show_existing_frame is used to show a previous frame, that the
+ *   value of @showable_frame for the previous frame was equal to 1. It is a requirement of
+ *   bitstream conformance that a particular showable frame is output via the
+ *   @show_existing_frame mechanism at most once.
+ * @error_resilient_mode: equal to 1 indicates that error resilient mode is enabled;
+ *   @error_resilient_mode equal to 0 indicates that error resilient mode is disabled.
+ * @disable_cdf_update: specifies whether the CDF update in the symbol decoding process should
+ *   be disabled.
+ * @allow_screen_content_tools: equal to 1 indicates that intra blocks may use palette encoding;
+ *   @allow_screen_content_tools equal to 0 indicates that palette encoding is never used.
+ * @force_integer_mv: equal to 1 specifies that motion vectors will always be integers.
+ *   @force_integer_mv equal to 0 specifies that motion vectors can contain fractional bits.
+ * @current_frame_id: specifies the frame id number for the current frame. Frame id numbers
+ *   are additional information that do not affect the decoding process, but provide decoders
+ *   with a way of detecting missing reference frames so that appropriate action can be taken.
+ * @frame_size_override_flag: equal to 0 specifies that the frame size is equal to the size in
+ *   the sequence header. @frame_size_override_flag equal to 1 specifies that the frame size
+ *   will either be specified as the size of one of the reference frames, or computed from the
+ *   @frame_width_minus_1 and @frame_height_minus_1 syntax elements.
+ * @order_hint: is used to compute OrderHint.
+ * @primary_ref_frame: specifies which reference frame contains the CDF values and other state
+ *   that should be loaded at the start of the frame.
+ * @buffer_removal_time_present_flag: equal to 1 specifies that @buffer_removal_time is present
+ *   in the bitstream. @buffer_removal_time_present_flag equal to 0 specifies that
+ *   @buffer_removal_time is not present in the bitstream.
+ * @buffer_removal_time: specifies the frame removal time in units of DecCT clock ticks
+ *   counted from the removal time of the last frame with frame_type equal to KEY_FRAME for
+ *   operating point opNum. @buffer_removal_time is signaled as a fixed length unsigned integer
+ *   with a length in bits given by @buffer_removal_time_length_minus_1 + 1. @buffer_removal_time
+ *   is the remainder of a modulo 1 << ( @buffer_removal_time_length_minus_1 + 1 ) counter.
+ * @refresh_frame_flags: contains a bitmask that specifies which reference frame slots will be
+ *   updated with the current frame after it is decoded. If @frame_type is equal to
+ *   #GST_AV1_INTRA_ONLY_FRAME, it is a requirement of bitstream conformance that
+ *   @refresh_frame_flags is not equal to 0xff.
+ * @ref_order_hint: specifies the expected output order hint for each reference buffer.
+ * @allow_intrabc: equal to 1 indicates that intra block copy may be used in this frame.
+ *   allow_intrabc equal to 0 indicates that intra block copy is not allowed in this frame.
+ * @frame_refs_short_signaling: equal to 1 indicates that only two reference frames are
+ *   explicitly signaled. frame_refs_short_signaling equal to 0 indicates that all reference
+ *   frames are explicitly signaled.
+ * @last_frame_idx: specifies the reference frame to use for LAST_FRAME.
+ * @gold_frame_idx: specifies the reference frame to use for GOLDEN_FRAME.
+ * @ref_frame_idx: ref_frame_idx[i] specifies which reference frames are used by inter frames.
+ * @delta_frame_id_minus_1 is used to calculate @delta_frame_id.
+ * @allow_high_precision_mv: equal to 0 specifies that motion vectors are specified to quarter
+ *   pel precision; @allow_high_precision_mv equal to 1 specifies that motion vectors are
+ *   specified to eighth pel precision.
+ * @is_motion_mode_switchable: equal to 0 specifies that only the SIMPLE motion mode will be used.
+ * @use_ref_frame_mvs: equal to 1 specifies that motion vector information from a previous
+ *   frame can be used when decoding the current frame. @use_ref_frame_mvs equal to 0 specifies
+ *   that this information will not be used.
+ * @disable_frame_end_update_cdf: equal to 1 indicates that the end of frame CDF update is
+ *   disabled; @disable_frame_end_update_cdf equal to 0 indicates that the end of frame CDF
+ *   update is enabled.
+ * @allow_warped_motion: equal to 1 indicates that the syntax element @motion_mode may be
+ *   present. @allow_warped_motion equal to 0 indicates that the syntax element motion_mode
+ *   will not be present (this means that LOCALWARP cannot be signaled if @allow_warped_motion
+ *   is equal to 0).
+ * @reduced_tx_set: equal to 1 specifies that the frame is restricted to a reduced subset of
+ *   the full set of transform types.
+ * @render_and_frame_size_different: equal to 0 means that the render width and height are
+ *   inferred from the frame width and height. @render_and_frame_size_different equal to 1
+ *   means that the render width and height are explicitly coded in the bitstream.
+ * @use_superres: equal to 0 indicates that no upscaling is needed. @use_superres equal to 1
+ *   indicates that upscaling is needed.
+ * @is_filter_switchable: equal to 1 indicates that the filter selection is signaled at the
+ *   block level; @is_filter_switchable equal to 0 indicates that the filter selection is
+ *   signaled at the frame level.
+ * @interpolation_filter: a #GstAV1InterpolationFilter that specifies the filter selection used
+ *   for performing inter prediction.
+ * @loop_filter_params: a #GstAV1LoopFilterParams holding the loop filter parameters.
+ * @quantization_params: a #GstAV1QuantizationParams holding the quantization parameters.
+ * @segmentation_params: a #GstAV1SegmenationParams holding the segmentation parameters.
+ * @tile_info: a #GstAV1TileInfo holding the tile info.
+ * @cdef_params: a #GstAV1CDEFParams holding the CDEF parameters.
+ * @loop_restoration_params: a #GstAV1LoopRestorationParams holding the loop restoration parameters.
+ * @tx_mode_select: is used to compute TxMode.
+ * @skip_mode_present: equal to 1 specifies that the syntax element @skip_mode will be coded
+ *   in the bitstream. @skip_mode_present equal to 0 specifies that @skip_mode will not be used
+ *   for this frame.
+ * @reference_select: equal to 1 specifies that the mode info for inter blocks contains the
+ *   syntax element comp_mode that indicates whether to use single or compound reference
+ *   prediction. @reference_select equal to 0 specifies that all inter blocks will use single
+ *   prediction.
+ * @global_motion_params: a #GstAV1GlobalMotionParams holding the global motion parameters.
+ * @film_grain_params: a #GstAV1FilmGrainParams holding the Film Grain parameters.
+ * @superres_denom: is the denominator of a fraction that specifies the ratio between the
+ *   superblock width before and after upscaling.
+ * @frame_is_intra: equal to 0 indicates that this frame may use inter prediction.
+ * @order_hints: specifies the expected output order for each reference frame.
+ * @ref_frame_sign_bias: specifies the intended direction of the motion vector in time for
+ *   each reference frame.
+ * @coded_lossless: is a variable that is equal to 1 when all segments use lossless encoding.
+ * @all_lossless: is a variable that is equal to 1 when @coded_lossless is equal to 1 and
+ *   @frame_width is equal to @upscaled_width. This indicates that the frame is fully lossless
+ *   at the upscaled resolution.
+ * @lossless_array: whether the segmentation is lossless.
+ * @seg_qm_Level: the segmentation's qm level.
+ * @upscaled_width: the upscaled width.
+ * @frame_width: the frame width.
+ * @frame_height: the frame height.
+ * @render_width: the frame width to be rendered.
+ * @render_height: the frame height to be rendered.
+ * @tx_mode: specifies how the transform size is determined.
+ * @skip_mode_frame: specifies the frames to use for compound prediction when @skip_mode is 1.
+ */
+struct _GstAV1FrameHeaderOBU {
+  gboolean show_existing_frame;
+  gint8 frame_to_show_map_idx; /* only available if show_existing_frame is 1 */
+  guint32 frame_presentation_time;
+  guint32 tu_presentation_delay; /* decoder model only, no effect on decoding */
+  guint32 display_frame_id;
+  GstAV1FrameType frame_type;
+  gboolean show_frame;
+  gboolean showable_frame;
+  gboolean error_resilient_mode;
+  gboolean disable_cdf_update;
+  guint8 allow_screen_content_tools;
+  gboolean force_integer_mv;
+  guint32 current_frame_id;
+  gboolean frame_size_override_flag;
+  guint32 order_hint;
+  guint8 primary_ref_frame;
+  gboolean buffer_removal_time_present_flag;
+  guint32 buffer_removal_time[GST_AV1_MAX_OPERATING_POINTS];
+  guint8 refresh_frame_flags; /* bitmask of reference frame slots to update */
+  guint32 ref_order_hint[GST_AV1_NUM_REF_FRAMES];
+  gboolean allow_intrabc;
+  gboolean frame_refs_short_signaling;
+  gint8 last_frame_idx; /* reference frame to use for LAST_FRAME */
+  gint8 gold_frame_idx; /* reference frame to use for GOLDEN_FRAME */
+  gint8 ref_frame_idx[GST_AV1_REFS_PER_FRAME];
+  gboolean allow_high_precision_mv;
+  gboolean is_motion_mode_switchable;
+  gboolean use_ref_frame_mvs;
+  gboolean disable_frame_end_update_cdf;
+  gboolean allow_warped_motion;
+  gboolean reduced_tx_set;
+  gboolean render_and_frame_size_different;
+  gboolean use_superres;
+  gboolean is_filter_switchable;
+  GstAV1InterpolationFilter interpolation_filter;
+  GstAV1LoopFilterParams loop_filter_params;
+  GstAV1QuantizationParams quantization_params;
+  GstAV1SegmenationParams segmentation_params;
+  GstAV1TileInfo tile_info;
+  GstAV1CDEFParams cdef_params;
+  GstAV1LoopRestorationParams loop_restoration_params;
+  gboolean tx_mode_select; /* used to compute tx_mode below */
+  gboolean skip_mode_present;
+  gboolean reference_select;
+  GstAV1GlobalMotionParams global_motion_params;
+  GstAV1FilmGrainParams film_grain_params;
+
+  /* Global variables set by the frame header (original variable names in the trailing comments) */
+  guint32 superres_denom; /* SuperresDenom */
+  guint8 frame_is_intra; /* FrameIsIntra */
+  guint32 order_hints[GST_AV1_NUM_REF_FRAMES]; /* OrderHints */
+  guint32 ref_frame_sign_bias[GST_AV1_NUM_REF_FRAMES]; /* RefFrameSignBias */
+
+  guint8 coded_lossless; /* CodedLossless */
+  guint8 all_lossless; /* AllLossless */
+  guint8 lossless_array[GST_AV1_MAX_SEGMENTS]; /* LosslessArray */
+  guint8 seg_qm_Level[3][GST_AV1_MAX_SEGMENTS]; /* SegQMLevel; first index presumably the plane - TODO confirm */
+
+  guint32 upscaled_width; /* UpscaledWidth */
+  guint32 frame_width; /* FrameWidth */
+  guint32 frame_height; /* FrameHeight */
+  guint32 render_width;  /* RenderWidth */
+  guint32 render_height; /* RenderHeight */
+
+  GstAV1TXModes tx_mode; /* TxMode */
+
+  guint8 skip_mode_frame[2]; /* SkipModeFrame */
+};
+
+/**
+ * GstAV1ReferenceFrameInfo:
+ *
+ * All the info related to the reference frames, kept in the @entry array.
+ */
+struct _GstAV1ReferenceFrameInfo {
+  struct {
+    gboolean ref_valid; /* RefValid */
+    guint32 ref_frame_id; /* RefFrameId */
+    guint32 ref_upscaled_width; /* RefUpscaledWidth */
+    guint32 ref_frame_width; /* RefFrameWidth */
+    guint32 ref_frame_height; /* RefFrameHeight */
+    guint32 ref_render_width; /* RefRenderWidth */
+    guint32 ref_render_height; /* RefRenderHeight */
+    guint32 ref_mi_cols; /* RefMiCols */
+    guint32 ref_mi_rows; /* RefMiRows */
+    GstAV1FrameType ref_frame_type; /* RefFrameType */
+    guint8 ref_subsampling_x; /* RefSubsamplingX */
+    guint8 ref_subsampling_y; /* RefSubsamplingY */
+    guint8 ref_bit_depth; /* RefBitDepth */
+    guint32 ref_order_hint; /* RefOrderHint */
+    GstAV1SegmenationParams ref_segmentation_params;
+    GstAV1GlobalMotionParams ref_global_motion_params;
+    GstAV1LoopFilterParams ref_lf_params;
+    GstAV1FilmGrainParams ref_film_grain_params;
+    GstAV1TileInfo ref_tile_info;
+  } entry[GST_AV1_NUM_REF_FRAMES]; /* GST_AV1_NUM_REF_FRAMES elements */
+};
+
+/**
+ * GstAV1TileListOBU:
+ * @output_frame_width_in_tiles_minus_1: plus one is the width of the output frame, in tile units.
+ * @output_frame_height_in_tiles_minus_1: plus one is the height of the output frame, in tile units.
+ * @tile_count_minus_1: plus one is the number of @tile_list_entry in the list. It is a requirement
+ *   of bitstream conformance that @tile_count_minus_1 is less than or equal to 511.
+ * @anchor_frame_idx: is the index into an array AnchorFrames of the frames that the tile uses
+ *   for prediction. The AnchorFrames array is provided by external means and may change for
+ *   each tile list OBU. The process for creating the AnchorFrames array is outside of the
+ *   scope of this specification. It is a requirement of bitstream conformance that
+ *   @anchor_frame_idx is less than or equal to 127.
+ * @anchor_tile_row: is the row coordinate of the tile in the frame that it belongs to, in tile
+ *   units. It is a requirement of bitstream conformance that @anchor_tile_row is less than @tile_rows.
+ * @anchor_tile_col: is the column coordinate of the tile in the frame that it belongs to, in tile
+ *   units. It is a requirement of bitstream conformance that @anchor_tile_col is less than @tile_cols.
+ * @tile_data_size_minus_1: plus one is the size of the coded tile data, @coded_tile_data, in bytes.
+ * @coded_tile_data: are the @tile_data_size_minus_1 + 1 bytes of the coded tile.
+ */
+struct _GstAV1TileListOBU {
+  guint8 output_frame_width_in_tiles_minus_1;
+  guint8 output_frame_height_in_tiles_minus_1;
+  guint16 tile_count_minus_1;
+  struct {
+    gint8 anchor_frame_idx;
+    guint8 anchor_tile_row;
+    guint8 anchor_tile_col;
+    guint16 tile_data_size_minus_1;
+    /* Only refers to the OBU's data; invalid once the OBU data is released */
+    guint8 *coded_tile_data;
+  } entry[GST_AV1_MAX_TILE_COUNT]; /* the anchor_* / tile data members above live in each entry */
+};
+
+/**
+ * GstAV1TileGroupOBU:
+ * @tile_start_and_end_present_flag: specifies whether @tg_start and @tg_end are present
+ *   in the bitstream. If @tg_start and @tg_end are not present in the bitstream, this
+ *   tile group covers the entire frame. If @obu_type is equal to #GST_AV1_OBU_FRAME, it is a
+ *   requirement of bitstream conformance that the value of @tile_start_and_end_present_flag
+ *   is equal to 0.
+ * @tg_start: specifies the zero-based index of the first tile in the current tile group.
+ *   It is a requirement of bitstream conformance that the value of @tg_start is equal to
+ *   the value of TileNum at the point that tile_group_obu is invoked.
+ * @tg_end: specifies the zero-based index of the last tile in the current tile group.
+ *   It is a requirement of bitstream conformance that the value of @tg_end is greater
+ *   than or equal to @tg_start. It is a requirement of bitstream conformance that the
+ *   value of @tg_end for the last tile group in each frame is equal to @num_tiles - 1.
+ * @tile_offset: Offset from the OBU data, the real data start of this tile.
+ * @tile_size: Data size of this tile.
+ * @tile_row: Tile index in row.
+ * @tile_col: Tile index in column.
+ * @mi_row_start: start position in mi rows
+ * @mi_row_end: end position in mi rows
+ * @mi_col_start: start position in mi cols
+ * @mi_col_end: end position in mi cols
+ * @num_tiles: specifies the total number of tiles in the frame.
+ */
+struct _GstAV1TileGroupOBU {
+  gboolean tile_start_and_end_present_flag;
+  guint8 tg_start; /* NOTE(review): 8-bit tile index; confirm tile indices cannot exceed 255 */
+  guint8 tg_end; /* NOTE(review): 8-bit tile index; confirm tile indices cannot exceed 255 */
+  struct {
+    guint32 tile_offset; /* Tile data offset from the OBU data. */
+    guint32 tile_size; /* Data size of this tile */
+    guint32 tile_row; /* tileRow */
+    guint32 tile_col; /* tileCol */
+    /* global variables */
+    guint32 mi_row_start; /* MiRowStart */
+    guint32 mi_row_end; /* MiRowEnd */
+    guint32 mi_col_start; /* MiColStart */
+    guint32 mi_col_end; /* MiColEnd */
+  } entry[GST_AV1_MAX_TILE_COUNT];
+
+  guint32 num_tiles; /* NumTiles */
+};
+
+/**
+ * GstAV1FrameOBU:
+ * @tile_group: a #GstAV1TileGroupOBU holding the tile_group data.
+ * @frame_header: a #GstAV1FrameHeaderOBU holding the frame_header data.
+ */
+struct _GstAV1FrameOBU {
+  GstAV1TileGroupOBU tile_group;
+  GstAV1FrameHeaderOBU frame_header;
+};
+
+/**
+ * GstAV1Parser:
+ *
+ * #GstAV1Parser opaque structure.
+ *
+ * Instantiate it with gst_av1_parser_new() and destroy it with
+ * gst_av1_parser_free().
+ */
+struct _GstAV1Parser
+{
+  /*< private >*/
+  struct
+  {
+    guint32 operating_point;    /* Set by choose_operating_point() */
+    guint8 seen_frame_header;   /* SeenFrameHeader */
+    guint32 operating_point_idc;        /* OperatingPointIdc */
+    gboolean sequence_changed;  /* A new sequence has been received */
+    gboolean begin_first_frame; /* The first frame has already been found */
+
+    /* frame */
+    guint32 upscaled_width;     /* UpscaledWidth */
+    guint32 frame_width;        /* FrameWidth */
+    guint32 frame_height;       /* FrameHeight */
+    guint32 mi_cols;            /* MiCols */
+    guint32 mi_rows;            /* MiRows */
+    guint32 render_width;       /* RenderWidth */
+    guint32 render_height;      /* RenderHeight */
+    guint32 prev_frame_id;      /* PrevFrameID */
+    guint32 current_frame_id;   /* the current frame ID */
+    GstAV1ReferenceFrameInfo ref_info;  /* RefInfo */
+
+    guint32 mi_col_starts[GST_AV1_MAX_TILE_COLS + 1];   /* MiColStarts */
+    guint32 mi_row_starts[GST_AV1_MAX_TILE_ROWS + 1];   /* MiRowStarts */
+    guint8 tile_cols_log2;      /* TileColsLog2 */
+    guint8 tile_cols;           /* TileCols */
+    guint8 tile_rows_log2;      /* TileRowsLog2 */
+    guint8 tile_rows;           /* TileRows */
+    guint8 tile_size_bytes;     /* TileSizeBytes */
+  } state;
+
+  gboolean annex_b;
+  guint32 temporal_unit_size;
+  /* amount of this temporal unit consumed so far */
+  guint32 temporal_unit_consumed;
+  guint32 frame_unit_size;
+  /* amount of this frame unit consumed so far */
+  guint32 frame_unit_consumed;
+
+  GstAV1SequenceHeaderOBU *seq_header;
+};
+
+GST_CODEC_PARSERS_API
+void
+gst_av1_parser_reset (GstAV1Parser * parser, gboolean annex_b);
+
+GST_CODEC_PARSERS_API
+void
+gst_av1_parser_reset_annex_b (GstAV1Parser * parser);
+
+GST_CODEC_PARSERS_API
+GstAV1ParserResult
+gst_av1_parser_identify_one_obu (GstAV1Parser * parser, const guint8 * data,
+    guint32 size, GstAV1OBU * obu, guint32 * consumed);
+
+GST_CODEC_PARSERS_API
+GstAV1ParserResult
+gst_av1_parser_parse_sequence_header_obu (GstAV1Parser * parser,
+    GstAV1OBU * obu, GstAV1SequenceHeaderOBU * seq_header);
+
+GST_CODEC_PARSERS_API
+GstAV1ParserResult
+gst_av1_parser_parse_temporal_delimiter_obu (GstAV1Parser * parser,
+    GstAV1OBU * obu);
+
+GST_CODEC_PARSERS_API
+GstAV1ParserResult
+gst_av1_parser_parse_metadata_obu (GstAV1Parser * parser, GstAV1OBU * obu,
+    GstAV1MetadataOBU * metadata);
+
+GST_CODEC_PARSERS_API
+GstAV1ParserResult
+gst_av1_parser_parse_tile_list_obu (GstAV1Parser * parser, GstAV1OBU * obu,
+    GstAV1TileListOBU * tile_list);
+
+GST_CODEC_PARSERS_API
+GstAV1ParserResult
+gst_av1_parser_parse_tile_group_obu (GstAV1Parser * parser, GstAV1OBU * obu,
+    GstAV1TileGroupOBU * tile_group);
+
+GST_CODEC_PARSERS_API
+GstAV1ParserResult
+gst_av1_parser_parse_frame_header_obu (GstAV1Parser * parser, GstAV1OBU * obu,
+    GstAV1FrameHeaderOBU * frame_header);
+
+GST_CODEC_PARSERS_API
+GstAV1ParserResult
+gst_av1_parser_parse_frame_obu (GstAV1Parser * parser, GstAV1OBU * obu,
+    GstAV1FrameOBU * frame);
+
+GST_CODEC_PARSERS_API
+GstAV1ParserResult
+gst_av1_parser_reference_frame_loading (GstAV1Parser * parser,
+    GstAV1FrameHeaderOBU * frame_header);
+
+GST_CODEC_PARSERS_API
+GstAV1ParserResult
+gst_av1_parser_reference_frame_update (GstAV1Parser * parser,
+    GstAV1FrameHeaderOBU * frame_header);
+
+GST_CODEC_PARSERS_API
+GstAV1ParserResult
+gst_av1_parser_set_operating_point (GstAV1Parser * parser,
+    gint32 operating_point);
+
+GST_CODEC_PARSERS_API
+GstAV1Parser * gst_av1_parser_new (void);
+
+GST_CODEC_PARSERS_API
+void gst_av1_parser_free (GstAV1Parser * parser);
+
+G_END_DECLS
+
+#endif /* __GST_AV1_PARSER_H__ */