/* * gstav1parser.h * * Copyright (C) 2018 Georg Ottinger * Copyright (C) 2019-2020 Intel Corporation * Author: Georg Ottinger * Author: Junyan He * Author: Victor Jaquez * * This library is free software; you can redistribute it and/or * modify it under the terms of the GNU Lesser General Public * License as published by the Free Software Foundation; either * version 2.1 of the License, or (at your option) any later version. * * This library is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU * Lesser General Public License for more details. * * You should have received a copy of the GNU Lesser General Public * License along with this library; if not, write to the * Free Software Foundation, Inc., 51 Franklin St, Fifth Floor, * Boston, MA 02110-1301, USA. */ #ifndef __GST_AV1_PARSER_H__ #define __GST_AV1_PARSER_H__ #ifndef GST_USE_UNSTABLE_API #warning "The AV1 parsing library is unstable API and may change in future." #warning "You can define GST_USE_UNSTABLE_API to avoid this warning." 
#endif #include #include G_BEGIN_DECLS #define GST_AV1_MAX_NUM_TEMPORAL_LAYERS 8 #define GST_AV1_MAX_NUM_SPATIAL_LAYERS 4 #define GST_AV1_MAX_TILE_WIDTH 4096 #define GST_AV1_MAX_TILE_AREA (4096 * 2304) #define GST_AV1_TOTAL_REFS_PER_FRAME 8 #define GST_AV1_MAX_SEGMENTS 8 #define GST_AV1_SEG_LVL_MAX 8 #define GST_AV1_MAX_TILE_COLS 64 #define GST_AV1_MAX_TILE_ROWS 64 #define GST_AV1_REFS_PER_FRAME 7 #define GST_AV1_PRIMARY_REF_NONE 7 #define GST_AV1_SUPERRES_NUM 8 #define GST_AV1_SUPERRES_DENOM_MIN 9 #define GST_AV1_SUPERRES_DENOM_BITS 3 #define GST_AV1_MAX_LOOP_FILTER 63 #define GST_AV1_GM_ABS_TRANS_BITS 12 #define GST_AV1_GM_ABS_TRANS_ONLY_BITS 9 #define GST_AV1_GM_ABS_ALPHA_BITS 12 #define GST_AV1_GM_ALPHA_PREC_BITS 15 #define GST_AV1_GM_TRANS_PREC_BITS 6 #define GST_AV1_GM_TRANS_ONLY_PREC_BITS 3 #define GST_AV1_WARPEDMODEL_PREC_BITS 16 #define GST_AV1_WARP_PARAM_REDUCE_BITS 6 #define GST_AV1_SELECT_SCREEN_CONTENT_TOOLS 2 #define GST_AV1_SELECT_INTEGER_MV 2 #define GST_AV1_RESTORATION_TILESIZE_MAX 256 #define GST_AV1_SEG_LVL_ALT_Q 0 #define GST_AV1_SEG_LVL_REF_FRAME 5 /* Following defines are derived from the spec, but not mentioned by * this particular name in the spec */ #define GST_AV1_CDEF_MAX (1 << 3) #define GST_AV1_MAX_TILE_COUNT 512 #define GST_AV1_MAX_OPERATING_POINTS \ (GST_AV1_MAX_NUM_TEMPORAL_LAYERS * GST_AV1_MAX_NUM_SPATIAL_LAYERS) #define GST_AV1_MAX_SPATIAL_LAYERS 2 /* correct? */ #define GST_AV1_MAX_TEMPORAL_GROUP_SIZE 8 /* correct? */ #define GST_AV1_MAX_TEMPORAL_GROUP_REFERENCES 8 /* correct? 
*/ #define GST_AV1_MAX_NUM_Y_POINTS 16 #define GST_AV1_MAX_NUM_CB_POINTS 16 #define GST_AV1_MAX_NUM_CR_POINTS 16 #define GST_AV1_MAX_NUM_POS_LUMA 25 #define GST_AV1_MAX_NUM_PLANES 3 #define GST_AV1_DIV_LUT_PREC_BITS 14 #define GST_AV1_DIV_LUT_BITS 8 #define GST_AV1_DIV_LUT_NUM (1 << GST_AV1_DIV_LUT_BITS) typedef struct _GstAV1Parser GstAV1Parser; typedef struct _GstAV1OBUHeader GstAV1OBUHeader; typedef struct _GstAV1OBU GstAV1OBU; typedef struct _GstAV1SequenceHeaderOBU GstAV1SequenceHeaderOBU; typedef struct _GstAV1MetadataOBU GstAV1MetadataOBU; typedef struct _GstAV1FrameHeaderOBU GstAV1FrameHeaderOBU; typedef struct _GstAV1TileListOBU GstAV1TileListOBU; typedef struct _GstAV1TileGroupOBU GstAV1TileGroupOBU; typedef struct _GstAV1FrameOBU GstAV1FrameOBU; typedef struct _GstAV1OperatingPoint GstAV1OperatingPoint; typedef struct _GstAV1DecoderModelInfo GstAV1DecoderModelInfo; typedef struct _GstAV1TimingInfo GstAV1TimingInfo; typedef struct _GstAV1ColorConfig GstAV1ColorConfig; typedef struct _GstAV1MetadataITUT_T35 GstAV1MetadataITUT_T35; typedef struct _GstAV1MetadataHdrCll GstAV1MetadataHdrCll; typedef struct _GstAV1MetadataHdrMdcv GstAV1MetadataHdrMdcv; typedef struct _GstAV1MetadataScalability GstAV1MetadataScalability; typedef struct _GstAV1MetadataTimecode GstAV1MetadataTimecode; typedef struct _GstAV1LoopFilterParams GstAV1LoopFilterParams; typedef struct _GstAV1QuantizationParams GstAV1QuantizationParams; typedef struct _GstAV1SegmenationParams GstAV1SegmenationParams; typedef struct _GstAV1TileInfo GstAV1TileInfo; typedef struct _GstAV1CDEFParams GstAV1CDEFParams; typedef struct _GstAV1LoopRestorationParams GstAV1LoopRestorationParams; typedef struct _GstAV1GlobalMotionParams GstAV1GlobalMotionParams; typedef struct _GstAV1FilmGrainParams GstAV1FilmGrainParams; typedef struct _GstAV1ReferenceFrameInfo GstAV1ReferenceFrameInfo; /** * GstAV1ParserResult: * @GST_AV1_PARSER_OK: successful return * @GST_AV1_PARSER_NO_MORE_DATA: the parser needs more data for 
*   one OBU
 * @GST_AV1_PARSER_DROP: no need to handle this OBU, skip it
 * @GST_AV1_PARSER_BITSTREAM_ERROR: stream error, for example, the stream
 *   includes invalid bits
 * @GST_AV1_PARSER_MISSING_OBU_REFERENCE: no reference, for example, no
 *   sequence found
 * @GST_AV1_PARSER_INVALID_OPERATION: something like invalid parameters
 *
 * Defines the result of the parsing process.
 */
typedef enum {
  GST_AV1_PARSER_OK = 0,
  GST_AV1_PARSER_NO_MORE_DATA = 1,
  GST_AV1_PARSER_DROP = 2,
  GST_AV1_PARSER_BITSTREAM_ERROR = 3,
  GST_AV1_PARSER_MISSING_OBU_REFERENCE = 4,
  GST_AV1_PARSER_INVALID_OPERATION = 5,
} GstAV1ParserResult;

/**
 * GstAV1Profile:
 * @GST_AV1_PROFILE_0: 8-bit and 10-bit 4:2:0 and 4:0:0 only.
 * @GST_AV1_PROFILE_1: 8-bit and 10-bit 4:4:4.
 * @GST_AV1_PROFILE_2: 8-bit and 10-bit 4:2:2, 12-bit 4:0:0 4:2:2 and 4:4:4
 *
 * Defines the AV1 profiles.
 */
typedef enum {
  GST_AV1_PROFILE_0 = 0,
  GST_AV1_PROFILE_1 = 1,
  GST_AV1_PROFILE_2 = 2,
} GstAV1Profile;

/**
 * GstAV1OBUType:
 * @GST_AV1_OBU_RESERVED_0: Reserved 0
 * @GST_AV1_OBU_SEQUENCE_HEADER: Sequence Header OBU
 * @GST_AV1_OBU_TEMPORAL_DELIMITER: Temporal Delimiter OBU
 * @GST_AV1_OBU_FRAME_HEADER: Frame Header OBU
 * @GST_AV1_OBU_TILE_GROUP: Tile Group OBU
 * @GST_AV1_OBU_METADATA: Metadata OBU
 * @GST_AV1_OBU_FRAME: Frame OBU (includes Frame Header and one Tile Group)
 * @GST_AV1_OBU_REDUNDANT_FRAME_HEADER: Redundant Frame Header OBU
 * @GST_AV1_OBU_TILE_LIST: Tile List OBU
 * @GST_AV1_OBU_RESERVED_9: Reserved 9
 * @GST_AV1_OBU_RESERVED_10: Reserved 10
 * @GST_AV1_OBU_RESERVED_11: Reserved 11
 * @GST_AV1_OBU_RESERVED_12: Reserved 12
 * @GST_AV1_OBU_RESERVED_13: Reserved 13
 * @GST_AV1_OBU_RESERVED_14: Reserved 14
 * @GST_AV1_OBU_PADDING: Padding
 *
 * Defines all the possible OBU types.
 */
typedef enum {
  GST_AV1_OBU_RESERVED_0 = 0,
  GST_AV1_OBU_SEQUENCE_HEADER = 1,
  GST_AV1_OBU_TEMPORAL_DELIMITER = 2,
  GST_AV1_OBU_FRAME_HEADER = 3,
  GST_AV1_OBU_TILE_GROUP = 4,
  GST_AV1_OBU_METADATA = 5,
  GST_AV1_OBU_FRAME = 6,
  GST_AV1_OBU_REDUNDANT_FRAME_HEADER = 7,
  GST_AV1_OBU_TILE_LIST = 8,
  GST_AV1_OBU_RESERVED_9 = 9,
  GST_AV1_OBU_RESERVED_10 = 10,
  GST_AV1_OBU_RESERVED_11 = 11,
  GST_AV1_OBU_RESERVED_12 = 12,
  GST_AV1_OBU_RESERVED_13 = 13,
  GST_AV1_OBU_RESERVED_14 = 14,
  GST_AV1_OBU_PADDING = 15,
} GstAV1OBUType;

/**
 * GstAV1SeqLevels:
 * @GST_AV1_SEQ_LEVEL_2_0: Level 2.0
 * @GST_AV1_SEQ_LEVEL_2_1: Level 2.1
 * @GST_AV1_SEQ_LEVEL_2_2: Level 2.2
 * @GST_AV1_SEQ_LEVEL_2_3: Level 2.3
 * @GST_AV1_SEQ_LEVEL_3_0: Level 3.0
 * @GST_AV1_SEQ_LEVEL_3_1: Level 3.1
 * @GST_AV1_SEQ_LEVEL_3_2: Level 3.2
 * @GST_AV1_SEQ_LEVEL_3_3: Level 3.3
 * @GST_AV1_SEQ_LEVEL_4_0: Level 4.0
 * @GST_AV1_SEQ_LEVEL_4_1: Level 4.1
 * @GST_AV1_SEQ_LEVEL_4_2: Level 4.2
 * @GST_AV1_SEQ_LEVEL_4_3: Level 4.3
 * @GST_AV1_SEQ_LEVEL_5_0: Level 5.0
 * @GST_AV1_SEQ_LEVEL_5_1: Level 5.1
 * @GST_AV1_SEQ_LEVEL_5_2: Level 5.2
 * @GST_AV1_SEQ_LEVEL_5_3: Level 5.3
 * @GST_AV1_SEQ_LEVEL_6_0: Level 6.0
 * @GST_AV1_SEQ_LEVEL_6_1: Level 6.1
 * @GST_AV1_SEQ_LEVEL_6_2: Level 6.2
 * @GST_AV1_SEQ_LEVEL_6_3: Level 6.3
 * @GST_AV1_SEQ_LEVEL_7_0: Level 7.0
 * @GST_AV1_SEQ_LEVEL_7_1: Level 7.1
 * @GST_AV1_SEQ_LEVEL_7_2: Level 7.2
 * @GST_AV1_SEQ_LEVEL_7_3: Level 7.3
 * @GST_AV1_SEQ_LEVELS: all valid levels (one past the last level above,
 *   i.e. the number of levels listed)
 * @GST_AV1_SEQ_LEVEL_MAX: Maximum parameters
 *
 * Defines all the possible sequence levels.
 */
typedef enum {
  GST_AV1_SEQ_LEVEL_2_0 = 0,
  GST_AV1_SEQ_LEVEL_2_1 = 1,
  GST_AV1_SEQ_LEVEL_2_2 = 2,
  GST_AV1_SEQ_LEVEL_2_3 = 3,
  GST_AV1_SEQ_LEVEL_3_0 = 4,
  GST_AV1_SEQ_LEVEL_3_1 = 5,
  GST_AV1_SEQ_LEVEL_3_2 = 6,
  GST_AV1_SEQ_LEVEL_3_3 = 7,
  GST_AV1_SEQ_LEVEL_4_0 = 8,
  GST_AV1_SEQ_LEVEL_4_1 = 9,
  GST_AV1_SEQ_LEVEL_4_2 = 10,
  GST_AV1_SEQ_LEVEL_4_3 = 11,
  GST_AV1_SEQ_LEVEL_5_0 = 12,
  GST_AV1_SEQ_LEVEL_5_1 = 13,
  GST_AV1_SEQ_LEVEL_5_2 = 14,
  GST_AV1_SEQ_LEVEL_5_3 = 15,
  GST_AV1_SEQ_LEVEL_6_0 = 16,
  GST_AV1_SEQ_LEVEL_6_1 = 17,
  GST_AV1_SEQ_LEVEL_6_2 = 18,
  GST_AV1_SEQ_LEVEL_6_3 = 19,
  GST_AV1_SEQ_LEVEL_7_0 = 20,
  GST_AV1_SEQ_LEVEL_7_1 = 21,
  GST_AV1_SEQ_LEVEL_7_2 = 22,
  GST_AV1_SEQ_LEVEL_7_3 = 23,
  GST_AV1_SEQ_LEVELS,
  GST_AV1_SEQ_LEVEL_MAX = 31
} GstAV1SeqLevels;

/**
* GstAV1MetadataType:
 * @GST_AV1_METADATA_TYPE_RESERVED_0: Reserved 0
 * @GST_AV1_METADATA_TYPE_HDR_CLL: Metadata high dynamic range content
 *   light level semantics
 * @GST_AV1_METADATA_TYPE_HDR_MDCV: Metadata high dynamic range mastering
 *   display color volume semantics
 * @GST_AV1_METADATA_TYPE_SCALABILITY: Metadata scalability semantics
 * @GST_AV1_METADATA_TYPE_ITUT_T35: Metadata ITUT T35 semantics
 * @GST_AV1_METADATA_TYPE_TIMECODE: Timecode semantics
 */
typedef enum {
  GST_AV1_METADATA_TYPE_RESERVED_0 = 0,
  GST_AV1_METADATA_TYPE_HDR_CLL = 1,
  GST_AV1_METADATA_TYPE_HDR_MDCV = 2,
  GST_AV1_METADATA_TYPE_SCALABILITY = 3,
  GST_AV1_METADATA_TYPE_ITUT_T35 = 4,
  GST_AV1_METADATA_TYPE_TIMECODE = 5,
} GstAV1MetadataType;

/**
 * GstAV1ScalabilityModes:
 * @GST_AV1_SCALABILITY_L1T2: 1 spatial layer, 2 temporal layers
 * @GST_AV1_SCALABILITY_L1T3: 1 spatial layer, 3 temporal layers
 * @GST_AV1_SCALABILITY_L2T1: 2 spatial layers (ratio 2:1), 1 temporal layer,
 *   inter-layer dependency
 * @GST_AV1_SCALABILITY_L2T2: 2 spatial layers (ratio 2:1), 2 temporal layers,
 *   inter-layer dependency
 * @GST_AV1_SCALABILITY_L2T3: 2 spatial layers (ratio 2:1), 3 temporal layers,
 *   inter-layer dependency
 * @GST_AV1_SCALABILITY_S2T1: 2 spatial layers (ratio 2:1), 1 temporal layer
 * @GST_AV1_SCALABILITY_S2T2: 2 spatial layers (ratio 2:1), 2 temporal layers
 * @GST_AV1_SCALABILITY_S2T3: 2 spatial layers (ratio 2:1), 3 temporal layers
 * @GST_AV1_SCALABILITY_L2T1h: 2 spatial layers (ratio 1.5:1), 1 temporal layer,
 *   inter-layer dependency
 * @GST_AV1_SCALABILITY_L2T2h: 2 spatial layers (ratio 1.5:1), 2 temporal layers,
 *   inter-layer dependency
 * @GST_AV1_SCALABILITY_L2T3h: 2 spatial layers (ratio 1.5:1), 3 temporal layers,
 *   inter-layer dependency
 * @GST_AV1_SCALABILITY_S2T1h: 2 spatial layers (ratio 1.5:1), 1 temporal layer
 * @GST_AV1_SCALABILITY_S2T2h: 2 spatial layers (ratio 1.5:1), 2 temporal layers
 * @GST_AV1_SCALABILITY_S2T3h: 2 spatial layers (ratio 1.5:1), 3 temporal layers
 * @GST_AV1_SCALABILITY_SS: Use scalability structure
*   #GstAV1MetadataScalability
 */
typedef enum {
  GST_AV1_SCALABILITY_L1T2 = 0,
  GST_AV1_SCALABILITY_L1T3 = 1,
  GST_AV1_SCALABILITY_L2T1 = 2,
  GST_AV1_SCALABILITY_L2T2 = 3,
  GST_AV1_SCALABILITY_L2T3 = 4,
  GST_AV1_SCALABILITY_S2T1 = 5,
  GST_AV1_SCALABILITY_S2T2 = 6,
  GST_AV1_SCALABILITY_S2T3 = 7,
  GST_AV1_SCALABILITY_L2T1h = 8,
  GST_AV1_SCALABILITY_L2T2h = 9,
  GST_AV1_SCALABILITY_L2T3h = 10,
  GST_AV1_SCALABILITY_S2T1h = 11,
  GST_AV1_SCALABILITY_S2T2h = 12,
  GST_AV1_SCALABILITY_S2T3h = 13,
  GST_AV1_SCALABILITY_SS = 14,
} GstAV1ScalabilityModes;

/**
 * GstAV1ColorPrimaries:
 * @GST_AV1_CP_BT_709: BT.709
 * @GST_AV1_CP_UNSPECIFIED: Unspecified
 * @GST_AV1_CP_BT_470_M: BT.470 System M (historical)
 * @GST_AV1_CP_BT_470_B_G: BT.470 System B, G (historical)
 * @GST_AV1_CP_BT_601: BT.601
 * @GST_AV1_CP_SMPTE_240: SMPTE 240
 * @GST_AV1_CP_GENERIC_FILM: Generic film (color filters using illuminant C)
 * @GST_AV1_CP_BT_2020: BT.2020, BT.2100
 * @GST_AV1_CP_XYZ: SMPTE 428 (CIE 1931 XYZ)
 * @GST_AV1_CP_SMPTE_431: SMPTE RP 431-2
 * @GST_AV1_CP_SMPTE_432: SMPTE EG 432-1
 * @GST_AV1_CP_EBU_3213: EBU Tech.
*   3213-E
 */
typedef enum {
  GST_AV1_CP_BT_709 = 1,
  GST_AV1_CP_UNSPECIFIED = 2,
  GST_AV1_CP_BT_470_M = 4,
  GST_AV1_CP_BT_470_B_G = 5,
  GST_AV1_CP_BT_601 = 6,
  GST_AV1_CP_SMPTE_240 = 7,
  GST_AV1_CP_GENERIC_FILM = 8,
  GST_AV1_CP_BT_2020 = 9,
  GST_AV1_CP_XYZ = 10,
  GST_AV1_CP_SMPTE_431 = 11,
  GST_AV1_CP_SMPTE_432 = 12,
  GST_AV1_CP_EBU_3213 = 22,
} GstAV1ColorPrimaries;

/**
 * GstAV1TransferCharacteristics:
 * @GST_AV1_TC_RESERVED_0: For future use
 * @GST_AV1_TC_BT_709: BT.709
 * @GST_AV1_TC_UNSPECIFIED: Unspecified
 * @GST_AV1_TC_RESERVED_3: For future use
 * @GST_AV1_TC_BT_470_M: BT.470 System M (historical)
 * @GST_AV1_TC_BT_470_B_G: BT.470 System B, G (historical)
 * @GST_AV1_TC_BT_601: BT.601
 * @GST_AV1_TC_SMPTE_240: SMPTE 240 M
 * @GST_AV1_TC_LINEAR: Linear
 * @GST_AV1_TC_LOG_100: Logarithmic (100 : 1 range)
 * @GST_AV1_TC_LOG_100_SQRT10: Logarithmic (100 * Sqrt(10) : 1 range)
 * @GST_AV1_TC_IEC_61966: IEC 61966-2-4
 * @GST_AV1_TC_BT_1361: BT.1361
 * @GST_AV1_TC_SRGB: sRGB or sYCC
 * @GST_AV1_TC_BT_2020_10_BIT: BT.2020 10-bit systems
 * @GST_AV1_TC_BT_2020_12_BIT: BT.2020 12-bit systems
 * @GST_AV1_TC_SMPTE_2084: SMPTE ST 2084, ITU BT.2100 PQ
 * @GST_AV1_TC_SMPTE_428: SMPTE ST 428
 * @GST_AV1_TC_HLG: BT.2100 HLG, ARIB STD-B67
 */
typedef enum {
  GST_AV1_TC_RESERVED_0 = 0,
  GST_AV1_TC_BT_709 = 1,
  GST_AV1_TC_UNSPECIFIED = 2,
  GST_AV1_TC_RESERVED_3 = 3,
  GST_AV1_TC_BT_470_M = 4,
  GST_AV1_TC_BT_470_B_G = 5,
  GST_AV1_TC_BT_601 = 6,
  GST_AV1_TC_SMPTE_240 = 7,
  GST_AV1_TC_LINEAR = 8,
  GST_AV1_TC_LOG_100 = 9,
  GST_AV1_TC_LOG_100_SQRT10 = 10,
  GST_AV1_TC_IEC_61966 = 11,
  GST_AV1_TC_BT_1361 = 12,
  GST_AV1_TC_SRGB = 13,
  GST_AV1_TC_BT_2020_10_BIT = 14,
  GST_AV1_TC_BT_2020_12_BIT = 15,
  GST_AV1_TC_SMPTE_2084 = 16,
  GST_AV1_TC_SMPTE_428 = 17,
  GST_AV1_TC_HLG = 18,
} GstAV1TransferCharacteristics;

/**
 * GstAV1MatrixCoefficients:
 * @GST_AV1_MC_IDENTITY: Identity matrix
 * @GST_AV1_MC_BT_709: BT.709
 * @GST_AV1_MC_UNSPECIFIED: Unspecified
 * @GST_AV1_MC_RESERVED_3: For future use
 * @GST_AV1_MC_FCC: US FCC 73.628
* @GST_AV1_MC_BT_470_B_G: BT.470 System B, G (historical)
 * @GST_AV1_MC_BT_601: BT.601
 * @GST_AV1_MC_SMPTE_240: SMPTE 240 M
 * @GST_AV1_MC_SMPTE_YCGCO: YCgCo
 * @GST_AV1_MC_BT_2020_NCL: BT.2020 non-constant luminance, BT.2100 YCbCr
 * @GST_AV1_MC_BT_2020_CL: BT.2020 constant luminance
 * @GST_AV1_MC_SMPTE_2085: SMPTE ST 2085 YDzDx
 * @GST_AV1_MC_CHROMAT_NCL: Chromaticity-derived non-constant luminance
 * @GST_AV1_MC_CHROMAT_CL: Chromaticity-derived constant luminance
 * @GST_AV1_MC_ICTCP: BT.2100 ICtCp
 */
typedef enum {
  GST_AV1_MC_IDENTITY = 0,
  GST_AV1_MC_BT_709 = 1,
  GST_AV1_MC_UNSPECIFIED = 2,
  GST_AV1_MC_RESERVED_3 = 3,
  GST_AV1_MC_FCC = 4,
  GST_AV1_MC_BT_470_B_G = 5,
  GST_AV1_MC_BT_601 = 6,
  GST_AV1_MC_SMPTE_240 = 7,
  GST_AV1_MC_SMPTE_YCGCO = 8,
  GST_AV1_MC_BT_2020_NCL = 9,
  GST_AV1_MC_BT_2020_CL = 10,
  GST_AV1_MC_SMPTE_2085 = 11,
  GST_AV1_MC_CHROMAT_NCL = 12,
  GST_AV1_MC_CHROMAT_CL = 13,
  GST_AV1_MC_ICTCP = 14,
} GstAV1MatrixCoefficients;

/**
 * GstAV1ChromaSamplePositions:
 * @GST_AV1_CSP_UNKNOWN: Unknown (in this case the source video transfer
 *   function must be signaled outside the AV1 bitstream).
 * @GST_AV1_CSP_VERTICAL: Horizontally co-located with (0, 0) luma sample,
 *   vertical position in the middle between two luma samples.
 * @GST_AV1_CSP_COLOCATED: co-located with (0, 0) luma sample.
 * @GST_AV1_CSP_RESERVED: For future use.
*/
typedef enum {
  GST_AV1_CSP_UNKNOWN = 0,
  GST_AV1_CSP_VERTICAL = 1,
  GST_AV1_CSP_COLOCATED = 2,
  GST_AV1_CSP_RESERVED = 3,
} GstAV1ChromaSamplePositions;

/**
 * GstAV1FrameType:
 * @GST_AV1_KEY_FRAME: Key Frame
 * @GST_AV1_INTER_FRAME: Inter Frame
 * @GST_AV1_INTRA_ONLY_FRAME: Intra-Only Frame
 * @GST_AV1_SWITCH_FRAME: Switch Frame
 */
typedef enum {
  GST_AV1_KEY_FRAME = 0,
  GST_AV1_INTER_FRAME = 1,
  GST_AV1_INTRA_ONLY_FRAME = 2,
  GST_AV1_SWITCH_FRAME = 3,
} GstAV1FrameType;

/**
 * GstAV1InterpolationFilter:
 * @GST_AV1_INTERPOLATION_FILTER_EIGHTTAP: Eighttap
 * @GST_AV1_INTERPOLATION_FILTER_EIGHTTAP_SMOOTH: Eighttap Smooth
 * @GST_AV1_INTERPOLATION_FILTER_EIGHTTAP_SHARP: Eighttap Sharp
 * @GST_AV1_INTERPOLATION_FILTER_BILINEAR: Bilinear
 * @GST_AV1_INTERPOLATION_FILTER_SWITCHABLE: Filter is switchable
 */
typedef enum {
  GST_AV1_INTERPOLATION_FILTER_EIGHTTAP = 0,
  GST_AV1_INTERPOLATION_FILTER_EIGHTTAP_SMOOTH = 1,
  GST_AV1_INTERPOLATION_FILTER_EIGHTTAP_SHARP = 2,
  GST_AV1_INTERPOLATION_FILTER_BILINEAR = 3,
  GST_AV1_INTERPOLATION_FILTER_SWITCHABLE = 4,
} GstAV1InterpolationFilter;

/**
 * GstAV1TXModes:
 * @GST_AV1_TX_MODE_ONLY_4x4: the inverse transform will use only 4x4 transforms.
 * @GST_AV1_TX_MODE_LARGEST: the inverse transform will use the largest transform
 *   size that fits inside the block.
 * @GST_AV1_TX_MODE_SELECT: the choice of transform size is specified explicitly
 *   for each block.
*/
typedef enum {
  GST_AV1_TX_MODE_ONLY_4x4 = 0,
  GST_AV1_TX_MODE_LARGEST = 1,
  GST_AV1_TX_MODE_SELECT = 2,
} GstAV1TXModes;

/**
 * GstAV1FrameRestorationType:
 * @GST_AV1_FRAME_RESTORE_NONE: no filtering is applied
 * @GST_AV1_FRAME_RESTORE_WIENER: Wiener filter process is invoked
 * @GST_AV1_FRAME_RESTORE_SGRPROJ: self guided filter process is invoked
 * @GST_AV1_FRAME_RESTORE_SWITCHABLE: restoration filter is switchable
 */
typedef enum {
  GST_AV1_FRAME_RESTORE_NONE = 0,
  GST_AV1_FRAME_RESTORE_WIENER = 1,
  GST_AV1_FRAME_RESTORE_SGRPROJ = 2,
  GST_AV1_FRAME_RESTORE_SWITCHABLE = 3,
} GstAV1FrameRestorationType;

/**
 * GstAV1ReferenceFrame:
 * @GST_AV1_REF_INTRA_FRAME: Intra Frame Reference
 * @GST_AV1_REF_LAST_FRAME: Last Reference Frame
 * @GST_AV1_REF_LAST2_FRAME: Last2 Reference Frame
 * @GST_AV1_REF_LAST3_FRAME: Last3 Reference Frame
 * @GST_AV1_REF_GOLDEN_FRAME: Golden Reference Frame
 * @GST_AV1_REF_BWDREF_FRAME: BWD Reference Frame
 * @GST_AV1_REF_ALTREF2_FRAME: Alternative2 Reference Frame
 * @GST_AV1_REF_ALTREF_FRAME: Alternative Reference Frame
 * @GST_AV1_NUM_REF_FRAMES: Total Reference Frame Number
 */
typedef enum {
  GST_AV1_REF_INTRA_FRAME = 0,
  GST_AV1_REF_LAST_FRAME = 1,
  GST_AV1_REF_LAST2_FRAME = 2,
  GST_AV1_REF_LAST3_FRAME = 3,
  GST_AV1_REF_GOLDEN_FRAME = 4,
  GST_AV1_REF_BWDREF_FRAME = 5,
  GST_AV1_REF_ALTREF2_FRAME = 6,
  GST_AV1_REF_ALTREF_FRAME = 7,
  GST_AV1_NUM_REF_FRAMES
} GstAV1ReferenceFrame;

/**
 * GstAV1WarpModelType:
 * @GST_AV1_WARP_MODEL_IDENTITY: Warp model is just an identity transform
 * @GST_AV1_WARP_MODEL_TRANSLATION: Warp model is a pure translation
 * @GST_AV1_WARP_MODEL_ROTZOOM: Warp model is a rotation + symmetric zoom
 *   + translation
 * @GST_AV1_WARP_MODEL_AFFINE: Warp model is a general affine transform
 */
typedef enum {
  GST_AV1_WARP_MODEL_IDENTITY = 0,
  GST_AV1_WARP_MODEL_TRANSLATION = 1,
  GST_AV1_WARP_MODEL_ROTZOOM = 2,
  GST_AV1_WARP_MODEL_AFFINE = 3,
} GstAV1WarpModelType;

/**
 * GstAV1OBUHeader:
 * @obu_type: the type of data structure contained in the OBU payload.
* @obu_extention_flag: indicates if the OBU header extension is present.
 * @obu_has_size_field: equal to 1 indicates that the obu_size syntax element will be
 *   present. @obu_has_size_field equal to 0 indicates that the @obu_size syntax element
 *   will not be present.
 * @obu_temporal_id: specifies the temporal level of the data contained in the OBU.
 * @obu_spatial_id: specifies the spatial level of the data contained in the OBU.
 *
 * Collects the info of the OBU header and of the OBU extension header if
 * @obu_extention_flag == 1.
 */
struct _GstAV1OBUHeader {
  GstAV1OBUType obu_type;
  gboolean obu_extention_flag;
  gboolean obu_has_size_field;
  guint8 obu_temporal_id;
  guint8 obu_spatial_id;
};

/**
 * GstAV1OBU:
 * @header: a #GstAV1OBUHeader OBU Header
 * @obu_type: the type of data structure contained in the OBU payload.
 * @data: references the current data chunk that holds the OBU
 * @obu_size: size of the OBU, not including the header size
 *
 * It is the general representation of an AV1 OBU (Open Bitstream
 * Unit). One OBU includes its header and payload.
 */
struct _GstAV1OBU {
  GstAV1OBUHeader header;
  GstAV1OBUType obu_type;
  guint8 *data;
  guint32 obu_size;
};

/**
 * GstAV1OperatingPoint:
 * @seq_level_idx: specifies the level that the coded video sequence conforms to.
 * @seq_tier: specifies the tier that the coded video sequence conforms to.
 * @idc: contains a bitmask that indicates which spatial and temporal layers should be
 *   decoded. Bit k is equal to 1 if temporal layer k should be decoded (for k between
 *   0 and 7). Bit j+8 is equal to 1 if spatial layer j should be decoded (for j between
 *   0 and 3).
 * @decoder_model_present_for_this_op: equal to one indicates that there is a decoder model
 *   associated with this operating point. @decoder_model_present_for_this_op equal to zero
 *   indicates that there is not a decoder model associated.
* @decoder_buffer_delay: specifies the time interval between the arrival of the first bit * in the smoothing buffer and the subsequent removal of the data that belongs to the * first coded frame for operating point op, measured in units of 1/90000 seconds. The * length of @decoder_buffer_delay is specified by @buffer_delay_length_minus_1 + 1, in bits. * @encoder_buffer_delay: specifies, in combination with @decoder_buffer_delay syntax element, * the first bit arrival time of frames to be decoded to the smoothing buffer. * @encoder_buffer_delay is measured in units of 1/90000 seconds. For a video sequence that * includes one or more random access points the sum of @decoder_buffer_delay and * @encoder_buffer_delay shall be kept constant. * @low_delay_mode_flag: equal to 1 indicates that the smoothing buffer operates in low-delay * mode for operating point op. In low-delay mode late decode times and buffer underflow * are both permitted. @low_delay_mode_flag equal to 0 indicates that the smoothing buffer * operates in strict mode, where buffer underflow is not allowed. * @initial_display_delay_present_for_this_op: equal to 1 indicates that * @initial_display_delay_minus_1 is specified for this operating. 0 indicates that * @initial_display_delay_minus_1 is not specified for this operating point. * @initial_display_delay_minus_1: plus 1 specifies, for operating point i, the number of * decoded frames that should be present in the buffer pool before the first presentable * frame is displayed. This will ensure that all presentable frames in the sequence can * be decoded at or before the time that they are scheduled for display. 
*/ struct _GstAV1OperatingPoint { guint8 seq_level_idx; guint8 seq_tier; guint16 idc; gboolean decoder_model_present_for_this_op; guint8 decoder_buffer_delay; guint8 encoder_buffer_delay; gboolean low_delay_mode_flag; gboolean initial_display_delay_present_for_this_op; guint8 initial_display_delay_minus_1; }; /** * GstAV1DecoderModelInfo: * @buffer_delay_length_minus_1: plus 1 specifies the length of the * @decoder_buffer_delay and the @encoder_buffer_delay syntax elements, * in bits. * @num_units_in_decoding_tick: is the number of time units of a decoding clock * operating at the frequency @time_scale Hz that corresponds to one increment * of a clock tick counter. * @buffer_removal_time_length_minus_1: plus 1 specifies the length of the * @buffer_removal_time syntax element, in bits. * @frame_presentation_time_length_minus_1: plus 1 specifies the length of the * @frame_presentation_time syntax element, in bits. */ struct _GstAV1DecoderModelInfo { guint8 buffer_delay_length_minus_1; guint32 num_units_in_decoding_tick; guint8 buffer_removal_time_length_minus_1; guint8 frame_presentation_time_length_minus_1; }; /** * GstAV1TimingInfo: * @num_units_in_display_tick: is the number of time units of a clock operating at the * frequency @time_scale Hz that corresponds to one increment of a clock tick counter. * A clock tick, in seconds, is equal to num_units_in_display_tick divided by time_scale. * It is a requirement of bitstream conformance that num_units_in_display_tick is greater * than 0. * @time_scale: is the number of time units that pass in one second. It is a requirement of * bitstream conformance that @time_scale is greater than 0. * @equal_picture_interval: equal to 1 indicates that pictures should be displayed according * to their output order with the number of ticks between two consecutive pictures (without * dropping frames) specified by @num_ticks_per_picture_minus_1 + 1. 
*   @equal_picture_interval equal to 0 indicates that the interval between two
 *   consecutive pictures is not specified.
 * @num_ticks_per_picture_minus_1: plus 1 specifies the number of clock ticks corresponding
 *   to output time between two consecutive pictures in the output order. It is a requirement
 *   of bitstream conformance that the value of @num_ticks_per_picture_minus_1 shall be in the
 *   range of 0 to (1 << 32) - 2, inclusive.
 */
struct _GstAV1TimingInfo {
  guint32 num_units_in_display_tick;
  guint32 time_scale;
  gboolean equal_picture_interval;
  guint32 num_ticks_per_picture_minus_1;
};

/**
 * GstAV1ColorConfig:
 * @high_bitdepth: syntax element which, together with @seq_profile, determines the bit depth.
 * @twelve_bit: syntax element which, together with @seq_profile and @high_bitdepth,
 *   determines the bit depth.
 * @mono_chrome: equal to 1 indicates that the video does not contain U and V color planes.
 *   @mono_chrome equal to 0 indicates that the video contains Y, U, and V color planes.
 * @color_description_present_flag: equal to 1 specifies that @color_primaries,
 *   @transfer_characteristics, and @matrix_coefficients are present.
 *   @color_description_present_flag equal to 0 specifies that @color_primaries,
 *   @transfer_characteristics and @matrix_coefficients are not present.
 * @color_primaries: is an integer that is defined by the "Color primaries" section of
 *   ISO/IEC 23091-4/ITU-T H.273.
 * @transfer_characteristics: is an integer that is defined by the "Transfer characteristics"
 *   section of ISO/IEC 23091-4/ITU-T H.273.
 * @matrix_coefficients: is an integer that is defined by the "Matrix coefficients" section
 *   of ISO/IEC 23091-4/ITU-T H.273.
 * @color_range: is a binary value that is associated with the VideoFullRangeFlag variable
 *   specified in ISO/IEC 23091-4/ITU-T H.273.
*   color range equal to 0 shall be referred to
 *   as the studio swing representation and color range equal to 1 shall be referred to as
 *   the full swing representation for all intents relating to this specification.
 * @subsampling_x, @subsampling_y: specify the chroma subsampling format. If
 *   @matrix_coefficients is equal to GST_AV1_MC_IDENTITY, it is a requirement of bitstream
 *   conformance that @subsampling_x is equal to 0 and @subsampling_y is equal to 0.
 * @chroma_sample_position: specifies the sample position for subsampled streams.
 * @separate_uv_delta_q: equal to 1 indicates that the U and V planes may have separate
 *   delta quantizer values. @separate_uv_delta_q equal to 0 indicates that the U and V
 *   planes will share the same delta quantizer value.
 */
struct _GstAV1ColorConfig {
  gboolean high_bitdepth;
  gboolean twelve_bit;
  gboolean mono_chrome;
  gboolean color_description_present_flag;
  GstAV1ColorPrimaries color_primaries;
  GstAV1TransferCharacteristics transfer_characteristics;
  GstAV1MatrixCoefficients matrix_coefficients;
  gboolean color_range;
  guint8 subsampling_x;
  guint8 subsampling_y;
  GstAV1ChromaSamplePositions chroma_sample_position;
  gboolean separate_uv_delta_q;
};

/**
 * GstAV1SequenceHeaderOBU:
 * @seq_profile: specifies the features that can be used in the coded video sequence
 * @still_picture: equal to 1 specifies that the bitstream contains only one coded frame.
 * @reduced_still_picture_header: specifies that the syntax elements not needed by a still
 *   picture are omitted.
 * @frame_width_bits_minus_1: specifies the number of bits minus 1 used for transmitting
 *   the frame width syntax elements.
 * @frame_height_bits_minus_1: specifies the number of bits minus 1 used for transmitting
 *   the frame height syntax elements.
 * @max_frame_width_minus_1: specifies the maximum frame width minus 1 for the frames
 *   represented by this sequence header.
* @max_frame_height_minus_1: specifies the maximum frame height minus 1 for the frames * represented by this sequenceheader. * @frame_id_numbers_present_flag: specifies whether frame id numbers are present in the bitstream. * @delta_frame_id_length_minus_2: specifies the number of bits minus 2 used to encode * delta_frame_id syntax elements. * @additional_frame_id_length_minus_1: is used to calculate the number of bits used to * encode the frame_id syntax element. * @use_128x128_superblock: when equal to 1, indicates that superblocks contain 128x128 luma * samples. When equal to 0, it indicates that superblocks contain 64x64 luma samples. * (The number of contained chroma samples depends on @subsampling_x and @subsampling_y). * @enable_filter_intra: equal to 1 specifies that the @use_filter_intra syntax element may * be present. @enable_filter_intra equal to 0 specifies that the @use_filter_intra syntax * element will not be present. * @enable_intra_edge_filter: specifies whether the intra edge filtering process should be enabled. * @enable_interintra_compound: equal to 1 specifies that the mode info for inter blocks may * contain the syntax element interintra. @enable_interintra_compound equal to 0 specifies * that the syntax element interintra will not be present. * @enable_masked_compound: equal to 1 specifies that the mode info for inter blocks may * contain the syntax element @compound_type. @enable_masked_compound equal to 0 specifies * that the syntax element @compound_type will not be present. * @enable_warped_motion: equal to 1 indicates that the allow_warped_motion syntax element * may be present. @enable_warped_motion equal to 0 indicates that the @allow_warped_motion * syntax element will not be present. * @enable_order_hint: equal to 1 indicates that tools based on the values of order hints * may be used. @enable_order_hint equal to 0 indicates that tools based on order hints * are disabled. 
* @enable_dual_filter: equal to 1 indicates that the inter prediction filter type may be * specified independently in the horizontal and vertical directions. If the flag is equal * to 0, only one filter type may be specified, which is then used in both directions. * @enable_jnt_comp: equal to 1 indicates that the distance weights process may be used * for inter prediction. * @enable_ref_frame_mvs: equal to 1 indicates that the @use_ref_frame_mvs syntax element * may be present. @enable_ref_frame_mvs equal to 0 indicates that the @use_ref_frame_mvs * syntax element will not be present. * @seq_choose_screen_content_tools: equal to 0 indicates that the @seq_force_screen_content_tools * syntax element will be present. @seq_choose_screen_content_tools equal to 1 indicates * that @seq_force_screen_content_tools should be set equal to SELECT_SCREEN_CONTENT_TOOLS. * @seq_force_screen_content_tools: equal to SELECT_SCREEN_CONTENT_TOOLS indicates that the * @allow_screen_content_tools syntax element will be present in the frame header. Otherwise, * @seq_force_screen_content_tools contains the value for @allow_screen_content_tools. * @seq_choose_integer_mv: equal to 0 indicates that the seq_force_integer_mv syntax element * will be present. @seq_choose_integer_mv equal to 1 indicates that @seq_force_integer_mv * should be set equal to SELECT_INTEGER_MV. * @seq_force_integer_mv: equal to SELECT_INTEGER_MV indicates that the @force_integer_mv * syntax element will be present in the frame header (providing allow_screen_content_tools * is equal to 1). Otherwise, @seq_force_integer_mv contains the value for @force_integer_mv. * @order_hint_bits_minus_1: is used to compute OrderHintBits. * @enable_superres: equal to 1 specifies that the use_superres syntax element will be present * in the uncompressed header. 
enable_superres equal to 0 specifies that the use_superres * syntax element will not be present (instead use_superres will be set to 0 in the * uncompressed header without being read). * @enable_cdef: equal to 1 specifies that cdef filtering may be enabled. enable_cdef equal * to 0 specifies that cdef filtering is disabled. * @enable_restoration: equal to 1 specifies that loop restoration filtering may be enabled. * enable_restoration equal to 0 specifies that loop restoration filtering is disabled. * @film_grain_params_present: specifies whether film grain parameters are present in the bitstream. * @operating_points_cnt_minus_1: indicates the number of operating points minus 1 present * in this bitstream. * @operating_points: specifies the corresponding operating point for a set of operating * parameters. * @decoder_model_info_present_flag: specifies whether the decoder model info is present in * the bitstream. * @decoder_model_info: holds information about the decoder model. * @initial_display_delay_present_flag: specifies whether initial display delay information * is present in the bitstream or not. * @timing_info_present_flag: specifies whether timing info is present in the bitstream. * @timing_info: holds the timing information. * @color_config: hold the color configuration. * @order_hint_bits: specifies the number of bits used for the order_hint syntax element. * @bit_depth: the bit depth of the stream. * @num_planes: the YUV plane number. 
*/
struct _GstAV1SequenceHeaderOBU {
  GstAV1Profile seq_profile;
  gboolean still_picture;
  guint8 reduced_still_picture_header;
  guint8 frame_width_bits_minus_1;
  guint8 frame_height_bits_minus_1;
  guint16 max_frame_width_minus_1;
  guint16 max_frame_height_minus_1;
  gboolean frame_id_numbers_present_flag;
  guint8 delta_frame_id_length_minus_2;
  guint8 additional_frame_id_length_minus_1;
  gboolean use_128x128_superblock;
  gboolean enable_filter_intra;
  gboolean enable_intra_edge_filter;
  gboolean enable_interintra_compound;
  gboolean enable_masked_compound;
  gboolean enable_warped_motion;
  gboolean enable_order_hint;
  gboolean enable_dual_filter;
  gboolean enable_jnt_comp;
  gboolean enable_ref_frame_mvs;
  gboolean seq_choose_screen_content_tools;
  guint8 seq_force_screen_content_tools;
  gboolean seq_choose_integer_mv;
  guint8 seq_force_integer_mv;
  /* Signed, unlike the other "minus_1" members of this structure.
   * NOTE(review): presumably so that a "not present" marker can be stored
   * when enable_order_hint is 0 - confirm against the parser. */
  gint8 order_hint_bits_minus_1;
  gboolean enable_superres;
  gboolean enable_cdef;
  gboolean enable_restoration;
  guint8 film_grain_params_present;
  guint8 operating_points_cnt_minus_1;
  /* Fixed-capacity array of GST_AV1_MAX_OPERATING_POINTS entries; the number
   * of operating points present is operating_points_cnt_minus_1 + 1. */
  GstAV1OperatingPoint operating_points[GST_AV1_MAX_OPERATING_POINTS];
  gboolean decoder_model_info_present_flag;
  GstAV1DecoderModelInfo decoder_model_info;
  guint8 initial_display_delay_present_flag;
  gboolean timing_info_present_flag;
  GstAV1TimingInfo timing_info;
  GstAV1ColorConfig color_config;

  /* Global variables calculated from the sequence header; the trailing
   * comments give the corresponding CamelCase variable names. */
  guint8 order_hint_bits; /* OrderHintBits */
  guint8 bit_depth;       /* BitDepth */
  guint8 num_planes;      /* NumPlanes */
};

/**
 * GstAV1MetadataITUT_T35:
 * @itu_t_t35_country_code: shall be a byte having a value specified as a country code by
 *   Annex A of Recommendation ITU-T T.35.
 * @itu_t_t35_country_code_extention_byte: shall be a byte having a value specified as a
 *   country code by Annex B of Recommendation ITU-T T.35. (The member name is spelled
 *   "extention" in the structure, so the documentation tag uses the same spelling.)
 * @itu_t_t35_payload_bytes: shall be bytes containing data registered as specified in
 *   Recommendation ITU-T T.35.
 *
 * ITU-T T.35 metadata.
 */
struct _GstAV1MetadataITUT_T35 {
  guint8 itu_t_t35_country_code;
  /* Spelled "extention" (sic); the name is part of the public structure, so
   * it is documented as-is rather than renamed. */
  guint8 itu_t_t35_country_code_extention_byte;
  /* itu_t_t35_payload_bytes - not specified at this spec */
  /* NOTE(review): neither the payload length nor the ownership of this
   * buffer is visible in this structure - confirm with the parser. */
  guint8 *itu_t_t35_payload_bytes;
};

/**
 * GstAV1MetadataHdrCll:
 * @max_cll: specifies the maximum content light level as specified in CEA-861.3, Appendix A.
 * @max_fall: specifies the maximum frame-average light level as specified in CEA-861.3,
 *   Appendix A.
 *
 * High Dynamic Range content light level syntax metadata.
 */
struct _GstAV1MetadataHdrCll {
  guint16 max_cll;
  guint16 max_fall;
};

/**
 * GstAV1MetadataHdrMdcv:
 * @primary_chromaticity_x: specifies a 0.16 fixed-point X chromaticity coordinate as
 *   defined by CIE 1931; array index i = 0, 1, 2 selects Red, Green, Blue respectively.
 * @primary_chromaticity_y: specifies a 0.16 fixed-point Y chromaticity coordinate as
 *   defined by CIE 1931; array index i = 0, 1, 2 selects Red, Green, Blue respectively.
 * @white_point_chromaticity_x: specifies a 0.16 fixed-point white X chromaticity coordinate
 *   as defined by CIE 1931.
 * @white_point_chromaticity_y: specifies a 0.16 fixed-point white Y chromaticity coordinate
 *   as defined by CIE 1931.
 * @luminance_max: is a 24.8 fixed-point maximum luminance, represented in candelas per
 *   square meter.
 * @luminance_min: is a 18.14 fixed-point minimum luminance, represented in candelas per
 *   square meter.
 *
 * High Dynamic Range mastering display color volume metadata.
 */
struct _GstAV1MetadataHdrMdcv {
  guint16 primary_chromaticity_x[3];
  guint16 primary_chromaticity_y[3];
  guint16 white_point_chromaticity_x;
  guint16 white_point_chromaticity_y;
  guint32 luminance_max;
  guint32 luminance_min;
};

/**
 * GstAV1MetadataScalability:
 * @scalability_mode_idc: indicates the picture prediction structure of the bitstream.
 * @spatial_layers_cnt_minus_1: indicates the number of spatial layers present in the video
 *   sequence minus one.
* @spatial_layer_description_present_flag: indicates when set to 1 that the * spatial_layer_ref_id is present for each of the (@spatial_layers_cnt_minus_1 + 1) layers, * or that it is not present when set to 0. * @spatial_layer_dimensions_present_flag: indicates when set to 1 that the * @spatial_layer_max_width and @spatial_layer_max_height parameters are present for each of * the (@spatial_layers_cnt_minus_1 + 1) layers, or that they are not present when set to 0. * @temporal_group_description_present_flag: indicates when set to 1 that the temporal * dependency information is present, or that it is not when set to 0. * @spatial_layer_max_width: specifies the maximum frame width for the frames with * @spatial_id equal to i. This number must not be larger than @max_frame_width_minus_1 + 1. * @spatial_layer_max_height: specifies the maximum frame height for the frames with * @spatial_id equal to i. This number must not be larger than @max_frame_height_minus_1 + 1. * @spatial_layer_ref_id: specifies the @spatial_id value of the frame within the current * temporal unit that the frame of layer i uses for reference. If no frame within the * current temporal unit is used for reference the value must be equal to 255. * @temporal_group_size: indicates the number of pictures in a temporal picture group. If the * @temporal_group_size is greater than 0, then the scalability structure data allows the * inter-picture temporal dependency structure of the video sequence to be specified. If the * @temporal_group_size is greater than 0, then for @temporal_group_size pictures in the * temporal group, each picture's temporal layer id (@temporal_id), switch up points * (@temporal_group_temporal_switching_up_point_flag and * @temporal_group_spatial_switching_up_point_flag), and the reference picture indices * (@temporal_group_ref_pic_diff) are specified. The first picture specified in a temporal * group must have @temporal_id equal to 0. 
If the parameter @temporal_group_size is not * present or set to 0, then either there is only one temporal layer or there is no fixed * inter-picture temporal dependency present going forward in the video sequence. Note that * for a given picture, all frames follow the same inter-picture temporal dependency * structure. However, the frame rate of each layer can be different from each other. The * specified dependency structure in the scalability structure data must be for the highest * frame rate layer. * @temporal_group_temporal_id: specifies the temporal_id value for the i-th picture in * the temporal group. * @temporal_group_temporal_switching_up_point_flag: is set to 1 if subsequent (in decoding * order) pictures with a @temporal_id higher than @temporal_group_temporal_id[i] do not * depend on any picture preceding the current picture (in coding order) with @temporal_id * higher than @temporal_group_temporal_id[ i ]. * @temporal_group_spatial_switching_up_point_flag: is set to 1 if spatial layers of the * current picture in the temporal group (i.e., pictures with a spatial_id higher than zero) * do not depend on any picture preceding the current picture in the temporal group. * @temporal_group_ref_cnt: indicates the number of reference pictures used by the i-th * picture in the temporal group. * @temporal_group_ref_pic_diff: indicates, for the i-th picture in the temporal group, * the temporal distance between the i-th picture and the j-th reference picture used by * the i-th picture. The temporal distance is measured in frames, counting only frames of * identical @spatial_id values. * * The scalability metadata OBU is intended for use by intermediate * processing entities that may perform selective layer elimination. 
*/
struct _GstAV1MetadataScalability {
  GstAV1ScalabilityModes scalability_mode_idc;
  guint8 spatial_layers_cnt_minus_1;
  gboolean spatial_layer_dimensions_present_flag;
  gboolean spatial_layer_description_present_flag;
  gboolean temporal_group_description_present_flag;
  /* Per-spatial-layer arrays.
   * NOTE(review): their capacity is GST_AV1_MAX_SPATIAL_LAYERS (defined as 2
   * and marked "correct?") while GST_AV1_MAX_NUM_SPATIAL_LAYERS is 4 -
   * confirm that (spatial_layers_cnt_minus_1 + 1) can never exceed the
   * array size when these are filled in. */
  guint16 spatial_layer_max_width[GST_AV1_MAX_SPATIAL_LAYERS];
  guint16 spatial_layer_max_height[GST_AV1_MAX_SPATIAL_LAYERS];
  guint8 spatial_layer_ref_id[GST_AV1_MAX_SPATIAL_LAYERS];
  guint8 temporal_group_size;
  /* Per-picture arrays for the temporal group.
   * NOTE(review): temporal_group_size is an 8-bit value but these arrays
   * hold GST_AV1_MAX_TEMPORAL_GROUP_SIZE entries (defined as 8 and marked
   * "correct?") - confirm that the parser bounds temporal_group_size. */
  guint8 temporal_group_temporal_id[GST_AV1_MAX_TEMPORAL_GROUP_SIZE];
  guint8 temporal_group_temporal_switching_up_point_flag[GST_AV1_MAX_TEMPORAL_GROUP_SIZE];
  guint8 temporal_group_spatial_switching_up_point_flag[GST_AV1_MAX_TEMPORAL_GROUP_SIZE];
  guint8 temporal_group_ref_cnt[GST_AV1_MAX_TEMPORAL_GROUP_SIZE];
  /* Indexed [picture in the temporal group][reference picture]. */
  guint8 temporal_group_ref_pic_diff[GST_AV1_MAX_TEMPORAL_GROUP_SIZE]
      [GST_AV1_MAX_TEMPORAL_GROUP_REFERENCES];
};

/**
 * GstAV1MetadataTimecode:
 * @counting_type: specifies the method of dropping values of the @n_frames syntax element as
 *   specified in AV1 Spec 6.1.1. @counting_type should be the same for all pictures in the
 *   coded video sequence.
 * @full_timestamp_flag: equal to 1 indicates that the @seconds_value, @minutes_value and
 *   @hours_value syntax elements will be present. @full_timestamp_flag equal to 0 indicates
 *   that there are flags to control the presence of these syntax elements.
 * @discontinuity_flag: equal to 0 indicates that the difference between the current value
 *   of clockTimestamp and the value of clockTimestamp computed from the previous set of
 *   timestamp syntax elements in output order can be interpreted as the time difference
 *   between the times of origin or capture of the associated frames or fields.
 *   @discontinuity_flag equal to 1 indicates that the difference between the current value of
 *   clockTimestamp and the value of clockTimestamp computed from the previous set of clock
 *   timestamp syntax elements in output order should not be interpreted as the time difference
 *   between the times of origin or capture of the associated frames or fields.
 * @cnt_dropped_flag: specifies the skipping of one or more values of @n_frames using the
 *   counting method specified by @counting_type.
 * @n_frames: is used to compute clockTimestamp. When @timing_info_present_flag is equal to 1,
 *   @n_frames shall be less than maxFps, where maxFps is specified by
 *   maxFps = ceil( time_scale / ( 2 * @num_units_in_display_tick ) ).
 * @seconds_flag: equal to 1 specifies that @seconds_value and @minutes_flag are present when
 *   @full_timestamp_flag is equal to 0. @seconds_flag equal to 0 specifies that @seconds_value
 *   and @minutes_flag are not present.
 * @seconds_value: is used to compute clockTimestamp and shall be in the range of 0 to 59.
 *   When @seconds_value is not present, its value is inferred to be equal to the value of
 *   @seconds_value for the previous set of clock timestamp syntax elements in decoding order,
 *   and it is required that such a previous @seconds_value shall have been present.
 * @minutes_flag: equal to 1 specifies that @minutes_value and @hours_flag are present when
 *   @full_timestamp_flag is equal to 0 and @seconds_flag is equal to 1. @minutes_flag equal to 0
 *   specifies that @minutes_value and @hours_flag are not present.
 * @minutes_value: specifies the value of mm used to compute clockTimestamp and shall be in
 *   the range of 0 to 59, inclusive. When @minutes_value is not present, its value is inferred
 *   to be equal to the value of @minutes_value for the previous set of clock timestamp syntax
 *   elements in decoding order, and it is required that such a previous @minutes_value shall
 *   have been present.
 * @hours_flag: equal to 1 specifies that @hours_value is present when @full_timestamp_flag is
 *   equal to 0 and @seconds_flag is equal to 1 and @minutes_flag is equal to 1.
 * @hours_value: is used to compute clockTimestamp and shall be in the range of 0 to 23,
 *   inclusive. When @hours_value is not present, its value is inferred to be equal to the
 *   value of @hours_value for the previous set of clock timestamp syntax elements in decoding
 *   order, and it is required that such a previous @hours_value shall have been present.
 * @time_offset_length: greater than 0 specifies the length in bits of the @time_offset_value
 *   syntax element. @time_offset_length equal to 0 specifies that the @time_offset_value syntax
 *   element is not present. @time_offset_length should be the same for all pictures in the
 *   coded video sequence.
 * @time_offset_value: is used to compute clockTimestamp. The number of bits used to represent
 *   @time_offset_value is equal to @time_offset_length. When @time_offset_value is not present,
 *   its value is inferred to be equal to 0.
 *
 * Timecode metadata.
 */
struct _GstAV1MetadataTimecode {
  guint8 counting_type; /* candidate for a separate type GstAV1TimecodeCountingType */
  gboolean full_timestamp_flag;
  gboolean discontinuity_flag;
  gboolean cnt_dropped_flag;
  /* NOTE(review): stored in 8 bits - verify this is wide enough for the
   * n_frames syntax element as defined by the AV1 specification. */
  guint8 n_frames;
  gboolean seconds_flag;
  guint8 seconds_value;
  gboolean minutes_flag;
  guint8 minutes_value;
  gboolean hours_flag;
  guint8 hours_value;
  guint8 time_offset_length;
  guint32 time_offset_value;
};

/**
 * GstAV1MetadataOBU:
 * @metadata_type: type of metadata
 * @itut_t35: ITUT T35 metadata
 * @hdr_cll: high dynamic range content light level metadata
 * @hdr_mdcv: high dynamic range mastering display color volume metadata
 * @scalability: Scalability metadata
 * @timecode: Timecode metadata
 */
struct _GstAV1MetadataOBU {
  GstAV1MetadataType metadata_type;
  /* Anonymous union: the payload members share storage.
   * NOTE(review): presumably @metadata_type tells which member is valid -
   * confirm against the parser. */
  union {
    GstAV1MetadataITUT_T35 itut_t35;
    GstAV1MetadataHdrCll hdr_cll;
    GstAV1MetadataHdrMdcv hdr_mdcv;
    GstAV1MetadataScalability scalability;
    GstAV1MetadataTimecode timecode;
  };
};

/**
 * GstAV1LoopFilterParams:
 * @loop_filter_level: is an array containing loop filter strength values. Different loop
 *   filter strength values from the array are used depending on the image plane being
 *   filtered, and the edge direction (vertical or horizontal) being filtered.
 * @loop_filter_sharpness: indicates the sharpness level. The @loop_filter_level and
 *   @loop_filter_sharpness together determine when a block edge is filtered, and by how much
 *   the filtering can change the sample values. The loop filter process is described in AV1
 *   Bitstream Spec. section 7.14.
 * @loop_filter_delta_enabled: equal to 1 means that the filter level depends on the mode and
 *   reference frame used to predict a block. @loop_filter_delta_enabled equal to 0 means that
 *   the filter level does not depend on the mode and reference frame.
 * @loop_filter_delta_update: equal to 1 means that the bitstream contains additional syntax
 *   elements that specify which mode and reference frame deltas are to be updated.
*   @loop_filter_delta_update equal to 0 means that these syntax elements are not present.
 * @loop_filter_ref_deltas: contains the adjustment needed for the filter level based on
 *   the chosen reference frame. If this syntax element is not present in the bitstream,
 *   it maintains its previous value.
 * @loop_filter_mode_deltas: contains the adjustment needed for the filter level based on
 *   the chosen mode. If this syntax element is not present in the bitstream, it maintains
 *   its previous value.
 * @delta_lf_present: specifies whether loop filter delta values are present in the bitstream.
 * @delta_lf_res: specifies the left shift which should be applied to decoded loop filter
 *   delta values.
 * @delta_lf_multi: equal to 1 specifies that separate loop filter deltas are sent for
 *   horizontal luma edges, vertical luma edges, the U edges, and the V edges. @delta_lf_multi
 *   equal to 0 specifies that the same loop filter delta is used for all edges.
 */
struct _GstAV1LoopFilterParams {
  /* Four strength values; which one applies depends on the plane and edge
   * direction being filtered (see @loop_filter_level). */
  guint8 loop_filter_level[4];
  guint8 loop_filter_sharpness;
  gboolean loop_filter_delta_enabled;
  gboolean loop_filter_delta_update;
  /* Signed adjustments: GST_AV1_TOTAL_REFS_PER_FRAME entries for the
   * reference-frame deltas and two entries for the mode deltas. */
  gint8 loop_filter_ref_deltas[GST_AV1_TOTAL_REFS_PER_FRAME];
  gint8 loop_filter_mode_deltas[2];
  gboolean delta_lf_present;
  guint8 delta_lf_res;
  /* Documented as a 0/1 flag although it is stored as guint8. */
  guint8 delta_lf_multi;
};

/**
 * GstAV1QuantizationParams:
 * @base_q_idx: indicates the base frame qindex. This is used for Y AC coefficients and as
 *   the base value for the other quantizers.
 * @diff_uv_delta: equal to 1 indicates that the U and V delta quantizer values are coded
 *   separately. @diff_uv_delta equal to 0 indicates that the U and V delta quantizer values
 *   share a common value.
 * @using_qmatrix: specifies that the quantizer matrix will be used to compute quantizers.
 * @qm_y: specifies the level in the quantizer matrix that should be used for luma plane decoding.
 * @qm_u: specifies the level in the quantizer matrix that should be used for chroma U plane decoding.
* @qm_v: specifies the level in the quantizer matrix that should be used for chroma V plane decoding.
 * @delta_q_present: specifies whether quantizer index delta values are present in the bitstream.
 * @delta_q_res: specifies the left shift which should be applied to decoded quantizer index
 *   delta values.
 * @delta_q_y_dc: indicates the Y DC quantizer relative to base_q_idx.
 * @delta_q_u_dc: indicates the U DC quantizer relative to base_q_idx.
 * @delta_q_u_ac: indicates the U AC quantizer relative to base_q_idx.
 * @delta_q_v_dc: indicates the V DC quantizer relative to base_q_idx.
 * @delta_q_v_ac: indicates the V AC quantizer relative to base_q_idx.
 */
struct _GstAV1QuantizationParams {
  guint8 base_q_idx;
  gboolean diff_uv_delta;
  gboolean using_qmatrix;
  /* Quantizer matrix level for each plane (luma, chroma U, chroma V). */
  guint8 qm_y;
  guint8 qm_u;
  guint8 qm_v;
  gboolean delta_q_present;
  guint8 delta_q_res;
  /* Signed offsets relative to base_q_idx; the trailing comments give the
   * corresponding CamelCase variable names. */
  gint8 delta_q_y_dc; /* DeltaQYDc */
  gint8 delta_q_u_dc; /* DeltaQUDc */
  gint8 delta_q_u_ac; /* DeltaQUAc */
  gint8 delta_q_v_dc; /* DeltaQVDc */
  gint8 delta_q_v_ac; /* DeltaQVAc */
};

/**
 * GstAV1SegmenationParams:
 * @segmentation_enabled: equal to 1 indicates that this frame makes use of the segmentation
 *   tool; @segmentation_enabled equal to 0 indicates that the frame does not use segmentation.
 * @segmentation_update_map: equal to 1 indicates that the segmentation map are updated during
 *   the decoding of this frame. @segmentation_update_map equal to 0 means that the segmentation
 *   map from the previous frame is used.
 * @segmentation_temporal_update: equal to 1 indicates that the updates to the segmentation map
 *   are coded relative to the existing segmentation map. @segmentation_temporal_update equal to
 *   0 indicates that the new segmentation map is coded without reference to the existing
 *   segmentation map.
 * @segmentation_update_data: equal to 1 indicates that new parameters are about to be
 *   specified for each segment.
@segmentation_update_data equal to 0 indicates that the
 *   segmentation parameters should keep their existing values.
 * @feature_enabled: set to 1 when the feature of segmentation is enabled.
 * @feature_data: the value of according segmentation feature.
 * @seg_id_pre_skip: equal to 1 indicates that the segment id will be read before the skip
 *   syntax element. @seg_id_pre_skip equal to 0 indicates that the skip syntax element will be
 *   read first.
 * @last_active_seg_id: indicates the highest numbered segment id that has some enabled feature.
 *   This is used when decoding the segment id to only decode choices corresponding to used
 *   segments.
 */
/* The tag is spelled "Segmenation" (sic); it is the name used by this header
 * and is therefore left unchanged. */
struct _GstAV1SegmenationParams {
  gboolean segmentation_enabled;
  guint8 segmentation_update_map;
  guint8 segmentation_temporal_update;
  guint8 segmentation_update_data;
  /* Both tables are indexed [segment][feature], with GST_AV1_MAX_SEGMENTS
   * rows and GST_AV1_SEG_LVL_MAX columns. */
  gint8 feature_enabled[GST_AV1_MAX_SEGMENTS][GST_AV1_SEG_LVL_MAX]; /* FeatureEnabled */
  gint16 feature_data[GST_AV1_MAX_SEGMENTS][GST_AV1_SEG_LVL_MAX]; /* FeatureData */
  guint8 seg_id_pre_skip; /* SegIdPreSkip */
  guint8 last_active_seg_id; /* LastActiveSegId */
};

/**
 * GstAV1TileInfo:
 * @uniform_tile_spacing_flag: equal to 1 means that the tiles are uniformly spaced across the
 *   frame. (In other words, all tiles are the same size except for the ones at the right and
 *   bottom edge which can be smaller.) @uniform_tile_spacing_flag equal to 0 means that the
 *   tile sizes are coded.
 * @increment_tile_rows_log2: is used to compute @tile_rows_log2.
 * @width_in_sbs_minus_1: specifies the width of a tile minus 1 in units of superblocks.
 * @height_in_sbs_minus_1: specifies the height of a tile minus 1 in units of superblocks.
 * @tile_size_bytes_minus_1: is used to compute @tile_size_bytes
 * @context_update_tile_id: specifies which tile to use for the CDF update.
 * @mi_col_starts: is an array specifying the start column (in units of 4x4 luma samples) for
 *   each tile across the image.
* @mi_row_starts: is an array specifying the start row (in units of 4x4 luma samples) for
 *   each tile down the image.
 * @tile_cols_log2: specifies the base 2 logarithm of the desired number of tiles across the frame.
 * @tile_cols: specifies the number of tiles across the frame. It is a requirement of bitstream
 *   conformance that @tile_cols is less than or equal to GST_AV1_MAX_TILE_COLS.
 * @tile_rows_log2: specifies the base 2 logarithm of the desired number of tiles down the frame.
 * @tile_rows: specifies the number of tiles down the frame. It is a requirement of bitstream
 *   conformance that @tile_rows is less than or equal to GST_AV1_MAX_TILE_ROWS.
 * @tile_size_bytes: specifies the number of bytes needed to code each tile size.
 */
struct _GstAV1TileInfo {
  guint8 uniform_tile_spacing_flag;
  gint increment_tile_rows_log2;
  /* One entry per tile column / tile row respectively. */
  gint width_in_sbs_minus_1[GST_AV1_MAX_TILE_COLS];
  gint height_in_sbs_minus_1[GST_AV1_MAX_TILE_ROWS];
  gint tile_size_bytes_minus_1;
  /* NOTE(review): stored in 8 bits while GST_AV1_MAX_TILE_COUNT is 512 -
   * confirm that a tile id can never exceed 255 here. */
  guint8 context_update_tile_id;
  /* The start arrays have one entry more than the maximum tile count in
   * their direction.
   * NOTE(review): presumably the extra slot holds the end position of the
   * last tile - confirm against the parser. */
  guint32 mi_col_starts[GST_AV1_MAX_TILE_COLS + 1]; /* MiColStarts */
  guint32 mi_row_starts[GST_AV1_MAX_TILE_ROWS + 1]; /* MiRowStarts */
  /* Derived values; the trailing comments give the corresponding CamelCase
   * variable names. */
  guint8 tile_cols_log2; /* TileColsLog2 */
  guint8 tile_cols; /* TileCols */
  guint8 tile_rows_log2; /* TileRowsLog2 */
  guint8 tile_rows; /* TileRows */
  guint8 tile_size_bytes; /* TileSizeBytes */
};

/**
 * GstAV1CDEFParams:
 * @cdef_damping: controls the amount of damping in the deringing filter.
 * @cdef_bits: specifies the number of bits needed to specify which CDEF filter to apply.
 * @cdef_y_pri_strength: specify the strength of the primary filter (Y component)
 * @cdef_uv_pri_strength: specify the strength of the primary filter (UV components).
 * @cdef_y_sec_strength: specify the strength of the secondary filter (Y component).
 * @cdef_uv_sec_strength: specify the strength of the secondary filter (UV components).
 *
 * Parameters of Constrained Directional Enhancement Filter (CDEF).
*/
struct _GstAV1CDEFParams {
  guint8 cdef_damping;
  guint8 cdef_bits;
  /* Strength tables with GST_AV1_CDEF_MAX (1 << 3) entries each.
   * NOTE(review): presumably only the first (1 << cdef_bits) entries are
   * meaningful - confirm against the parser. */
  guint8 cdef_y_pri_strength[GST_AV1_CDEF_MAX];
  guint8 cdef_y_sec_strength[GST_AV1_CDEF_MAX];
  guint8 cdef_uv_pri_strength[GST_AV1_CDEF_MAX];
  guint8 cdef_uv_sec_strength[GST_AV1_CDEF_MAX];
};

/**
 * GstAV1LoopRestorationParams:
 * @lr_unit_shift: specifies if the luma restoration size should be halved.
 * @lr_uv_shift: is only present for 4:2:0 formats and specifies if the chroma size should be
 *   half the luma size.
 * @frame_restoration_type: specifies the type of restoration used for each plane.
 * @loop_restoration_size: specifies the size of loop restoration units in units of samples in
 *   the current plane.
 * @uses_lr: indicates if any plane uses loop restoration.
 *
 * Loop restoration parameters.
 */
struct _GstAV1LoopRestorationParams {
  guint8 lr_unit_shift;
  gboolean lr_uv_shift;
  /* Per-plane arrays with GST_AV1_MAX_NUM_PLANES entries each. */
  GstAV1FrameRestorationType frame_restoration_type[GST_AV1_MAX_NUM_PLANES]; /* FrameRestorationType */
  guint32 loop_restoration_size[GST_AV1_MAX_NUM_PLANES]; /* LoopRestorationSize */
  guint8 uses_lr; /* UsesLr */
};

/**
 * GstAV1GlobalMotionParams:
 * @is_global: specifies whether global motion parameters are present for a particular
 *   reference frame.
 * @is_rot_zoom: specifies whether a particular reference frame uses rotation and zoom
 *   global motion.
 * @is_translation: specifies whether a particular reference frame uses translation
 *   global motion.
 * @gm_params: is set equal to SavedGmParams[ frame_to_show_map_idx ][ ref ][ j ] for
 *   ref = LAST_FRAME..ALTREF_FRAME, for j = 0..5.
 * @gm_type: specifies the type of global motion.
 * @invalid: whether the global motion parameters of a particular reference frame are
 *   invalid. (Since: 1.20)
 *
 * Global motion parameters; every member is an array with one entry per reference frame.
 */
/**
 * _GstAV1GlobalMotionParams.invalid:
 *
 * whether this global motion parameters is invalid.
*
 * Since: 1.20
 */
struct _GstAV1GlobalMotionParams {
  /* Every array is indexed by reference frame and has
   * GST_AV1_NUM_REF_FRAMES entries. */
  gboolean is_global[GST_AV1_NUM_REF_FRAMES];
  gboolean is_rot_zoom[GST_AV1_NUM_REF_FRAMES];
  gboolean is_translation[GST_AV1_NUM_REF_FRAMES];
  /* Six parameters (j = 0..5) per reference frame. */
  gint32 gm_params[GST_AV1_NUM_REF_FRAMES][6];
  GstAV1WarpModelType gm_type[GST_AV1_NUM_REF_FRAMES]; /* GmType */
  gboolean invalid[GST_AV1_NUM_REF_FRAMES];
};

/**
 * GstAV1FilmGrainParams:
 * @apply_grain: equal to 1 specifies that film grain should be added to this frame.
 *   @apply_grain equal to 0 specifies that film grain should not be added.
 * @grain_seed: specifies the starting value for the pseudo-random numbers used during film
 *   grain synthesis.
 * @update_grain: equal to 1 means that a new set of parameters should be sent. @update_grain
 *   equal to 0 means that the previous set of parameters should be used.
 * @film_grain_params_ref_idx: indicates which reference frame contains the film grain
 *   parameters to be used for this frame.
 * @num_y_points: specifies the number of points for the piece-wise linear scaling function
 *   of the luma component. It is a requirement of bitstream conformance that @num_y_points is
 *   less than or equal to 14.
 * @point_y_value: represents the x (luma value) coordinate for the i-th point of the
 *   piecewise linear scaling function for luma component. The values are signaled on the
 *   scale of 0..255. (In case of 10 bit video, these values correspond to luma values divided
 *   by 4. In case of 12 bit video, these values correspond to luma values divided by 16.)
 *   If i is greater than 0, it is a requirement of bitstream conformance that
 *   @point_y_value[ i ] is greater than @point_y_value[ i - 1 ] (this ensures the x coordinates
 *   are specified in increasing order).
 * @point_y_scaling: represents the scaling (output) value for the i-th point of the
 *   piecewise linear scaling function for luma component.
 * @chroma_scaling_from_luma: specifies that the chroma scaling is inferred from the luma scaling.
 * @num_cb_points: specifies the number of points for the piece-wise linear scaling function
 *   of the cb component. It is a requirement of bitstream conformance that @num_cb_points is
 *   less than or equal to 10.
 * @point_cb_value: represents the x coordinate for the i-th point of the piece-wise linear
 *   scaling function for cb component. The values are signaled on the scale of 0..255. If i
 *   is greater than 0, it is a requirement of bitstream conformance that @point_cb_value[ i ]
 *   is greater than @point_cb_value[ i - 1 ].
 * @point_cb_scaling: represents the scaling (output) value for the i-th point of the
 *   piecewise linear scaling function for cb component.
 * @num_cr_points: specifies the number of points for the piece-wise linear scaling
 *   function of the cr component. It is a requirement of bitstream conformance that
 *   @num_cr_points is less than or equal to 10. If @subsampling_x is equal to 1 and
 *   @subsampling_y is equal to 1 and @num_cb_points is equal to 0, it is a requirement of
 *   bitstream conformance that @num_cr_points is equal to 0. If @subsampling_x is equal to 1
 *   and @subsampling_y is equal to 1 and @num_cb_points is not equal to 0, it is a requirement
 *   of bitstream conformance that @num_cr_points is not equal to 0.
 * @point_cr_value: represents the x coordinate for the i-th point of the piece-wise linear
 *   scaling function for cr component. The values are signaled on the scale of 0..255. If i
 *   is greater than 0, it is a requirement of bitstream conformance that @point_cr_value[ i ]
 *   is greater than @point_cr_value[ i - 1 ].
 * @point_cr_scaling: represents the scaling (output) value for the i-th point of the
 *   piecewise linear scaling function for cr component.
 * @grain_scaling_minus_8: represents the shift - 8 applied to the values of the chroma
 *   component. The @grain_scaling_minus_8 can take values of 0..3 and determines the range and
 *   quantization step of the standard deviation of film grain.
 * @ar_coeff_lag: specifies the number of auto-regressive coefficients for luma and chroma.
 * @ar_coeffs_y_plus_128: specifies auto-regressive coefficients used for the Y plane.
 * @ar_coeffs_cb_plus_128: specifies auto-regressive coefficients used for the U plane.
 * @ar_coeffs_cr_plus_128: specifies auto-regressive coefficients used for the V plane.
 * @ar_coeff_shift_minus_6: specifies the range of the auto-regressive coefficients. Values
 *   of 0, 1, 2, and 3 correspond to the ranges for auto-regressive coefficients of [-2, 2),
 *   [-1, 1), [-0.5, 0.5) and [-0.25, 0.25) respectively.
 * @grain_scale_shift: specifies how much the Gaussian random numbers should be scaled down
 *   during the grain synthesis process.
 * @cb_mult: represents a multiplier for the cb component used in derivation of the input
 *   index to the cb component scaling function.
 * @cb_luma_mult: represents a multiplier for the average luma component used in derivation
 *   of the input index to the cb component scaling function.
 * @cb_offset: represents an offset used in derivation of the input index to the cb component
 *   scaling function.
 * @cr_mult: represents a multiplier for the cr component used in derivation of the input
 *   index to the cr component scaling function.
 * @cr_luma_mult: represents a multiplier for the average luma component used in derivation
 *   of the input index to the cr component scaling function.
 * @cr_offset: represents an offset used in derivation of the input index to the cr component
 *   scaling function.
 * @overlap_flag: equal to 1 indicates that the overlap between film grain blocks shall be
 *   applied. @overlap_flag equal to 0 indicates that the overlap between film grain blocks
 *   shall not be applied.
 * @clip_to_restricted_range: equal to 1 indicates that clipping to the restricted (studio)
 *   range shall be applied to the sample values after adding the film grain (see the
 *   semantics for color_range for an explanation of studio swing). @clip_to_restricted_range
 *   equal to 0 indicates that clipping to the full range shall be applied to the sample
 *   values after adding the film grain.
 *
 * Film grain synthesis parameters.
 */
struct _GstAV1FilmGrainParams {
  gboolean apply_grain;
  guint16 grain_seed;
  gboolean update_grain;
  guint8 film_grain_params_ref_idx;
  /* Piece-wise linear scaling function for luma: point count followed by
   * the x values and the scaling (output) values. */
  guint8 num_y_points;
  guint8 point_y_value[GST_AV1_MAX_NUM_Y_POINTS];
  guint8 point_y_scaling[GST_AV1_MAX_NUM_Y_POINTS];
  guint8 chroma_scaling_from_luma;
  /* Same layout for the cb component. */
  guint8 num_cb_points;
  guint8 point_cb_value[GST_AV1_MAX_NUM_CB_POINTS];
  guint8 point_cb_scaling[GST_AV1_MAX_NUM_CB_POINTS];
  /* Same layout for the cr component. */
  guint8 num_cr_points;
  guint8 point_cr_value[GST_AV1_MAX_NUM_CR_POINTS];
  guint8 point_cr_scaling[GST_AV1_MAX_NUM_CR_POINTS];
  guint8 grain_scaling_minus_8;
  guint8 ar_coeff_lag;
  /* Auto-regressive coefficients, stored as "value plus 128" per the member
   * names.
   * NOTE(review): the cb/cr arrays are sized with the luma constant
   * GST_AV1_MAX_NUM_POS_LUMA - confirm it is large enough for the number of
   * chroma coefficients. */
  guint8 ar_coeffs_y_plus_128[GST_AV1_MAX_NUM_POS_LUMA];
  guint8 ar_coeffs_cb_plus_128[GST_AV1_MAX_NUM_POS_LUMA];
  guint8 ar_coeffs_cr_plus_128[GST_AV1_MAX_NUM_POS_LUMA];
  guint8 ar_coeff_shift_minus_6;
  guint8 grain_scale_shift;
  /* NOTE(review): cb_offset and cr_offset are stored in 8 bits - verify this
   * matches the width of the corresponding syntax elements in the AV1
   * specification. */
  guint8 cb_mult;
  guint8 cb_luma_mult;
  guint8 cb_offset;
  guint8 cr_mult;
  guint8 cr_luma_mult;
  guint8 cr_offset;
  gboolean overlap_flag;
  gboolean clip_to_restricted_range;
};

/**
 * GstAV1FrameHeaderOBU:
 * @show_existing_frame: equal to 1, indicates the frame indexed by @frame_to_show_map_idx is
 *   to be output; @show_existing_frame equal to 0 indicates that further processing is required.
 *   If @obu_type is equal to #GST_AV1_OBU_FRAME, it is a requirement of bitstream conformance that
 *   @show_existing_frame is equal to 0.
 * @frame_to_show_map_idx: specifies the frame to be output. It is only available if
 *   @show_existing_frame is 1.
 * @frame_presentation_time: specifies the presentation time of the frame in clock ticks
 *   DispCT counted from the removal time of the last frame with frame_type equal to KEY_FRAME
 *   for the operating point that is being decoded. The syntax element is signaled as a fixed
 *   length unsigned integer with a length in bits given by
 *   @frame_presentation_time_length_minus_1 + 1.
The @frame_presentation_time is the remainder * of a modulo 1 << (@frame_presentation_time_length_minus_1 + 1) counter. * @tu_presentation_delay: is a syntax element used by the decoder model. It does not affect * the decoding process. * @display_frame_id: provides the frame id number for the frame to output. It is a requirement * of bitstream conformance that whenever @display_frame_id is read, the value matches * @ref_frame_id[ @frame_to_show_map_idx ] (the value of @current_frame_id at the time that the * frame indexed by @frame_to_show_map_idx was stored), and that * @ref_valid[ @frame_to_show_map_idx ] is equal to 1. It is a requirement of bitstream * conformance that the number of bits needed to read @display_frame_id does not exceed 16. * This is equivalent to the constraint that idLen <= 16. * @frame_type: specifies the type of the frame. * @show_frame: equal to 1 specifies that this frame should be immediately output once decoded. * show_frame equal to 0 specifies that this frame should not be immediately output. (It may * be output later if a later uncompressed header uses @show_existing_frame equal to 1). * @showable_frame: equal to 1 specifies that the frame may be output using the * @show_existing_frame mechanism. showable_frame equal to 0 specifies that this frame will * not be output using the @show_existing_frame mechanism. It is a requirement of bitstream * conformance that when @show_existing_frame is used to show a previous frame, that the * value of @showable_frame for the previous frame was equal to 1. It is a requirement of * bitstream conformance that a particular showable frame is output via the * @show_existing_frame mechanism at most once. * @error_resilient_mode: equal to 1 indicates that error resilient mode is enabled; * @error_resilient_mode equal to 0 indicates that error resilient mode is disabled. * @disable_cdf_update: specifies whether the CDF update in the symbol decoding process should * be disabled. 
 * @allow_screen_content_tools: equal to 1 indicates that intra blocks may use palette encoding;
 * @allow_screen_content_tools equal to 0 indicates that palette encoding is never used.
 * @force_integer_mv: equal to 1 specifies that motion vectors will always be integers.
 * @force_integer_mv equal to 0 specifies that motion vectors can contain fractional bits.
 * @current_frame_id: specifies the frame id number for the current frame. Frame id numbers
 * are additional information that does not affect the decoding process, but provide decoders
 * with a way of detecting missing reference frames so that appropriate action can be taken.
 * @frame_size_override_flag: equal to 0 specifies that the frame size is equal to the size in
 * the sequence header. @frame_size_override_flag equal to 1 specifies that the frame size
 * will either be specified as the size of one of the reference frames, or computed from the
 * @frame_width_minus_1 and @frame_height_minus_1 syntax elements.
 * @order_hint: is used to compute OrderHint.
 * @primary_ref_frame: specifies which reference frame contains the CDF values and other state
 * that should be loaded at the start of the frame.
 * @buffer_removal_time_present_flag: equal to 1 specifies that @buffer_removal_time is present
 * in the bitstream. @buffer_removal_time_present_flag equal to 0 specifies that
 * @buffer_removal_time is not present in the bitstream.
 * @buffer_removal_time: specifies the frame removal time in units of DecCT clock ticks
 * counted from the removal time of the last frame with frame_type equal to KEY_FRAME for
 * operating point opNum. @buffer_removal_time is signaled as a fixed length unsigned integer
 * with a length in bits given by @buffer_removal_time_length_minus_1 + 1. @buffer_removal_time
 * is the remainder of a modulo 1 << ( @buffer_removal_time_length_minus_1 + 1 ) counter.
 * @refresh_frame_flags: contains a bitmask that specifies which reference frame slots will be
 * updated with the current frame after it is decoded.
If @frame_type is equal to
 * #GST_AV1_INTRA_ONLY_FRAME, it is a requirement of bitstream conformance that
 * @refresh_frame_flags is not equal to 0xff.
 * @ref_order_hint: specifies the expected output order hint for each reference buffer.
 * @allow_intrabc: equal to 1 indicates that intra block copy may be used in this frame.
 * @allow_intrabc equal to 0 indicates that intra block copy is not allowed in this frame.
 * @frame_refs_short_signaling: equal to 1 indicates that only two reference frames are
 * explicitly signaled. @frame_refs_short_signaling equal to 0 indicates that all reference
 * frames are explicitly signaled.
 * @last_frame_idx: specifies the reference frame to use for LAST_FRAME.
 * @gold_frame_idx: specifies the reference frame to use for GOLDEN_FRAME.
 * @ref_frame_idx: specifies which reference frames are used by inter frames.
 * @delta_frame_id_minus_1 is used to calculate @delta_frame_id.
 * @allow_high_precision_mv: equal to 0 specifies that motion vectors are specified to quarter
 * pel precision; @allow_high_precision_mv equal to 1 specifies that motion vectors are
 * specified to eighth pel precision.
 * @is_motion_mode_switchable: equal to 0 specifies that only the SIMPLE motion mode will be used.
 * @use_ref_frame_mvs: equal to 1 specifies that motion vector information from a previous
 * frame can be used when decoding the current frame. @use_ref_frame_mvs equal to 0 specifies
 * that this information will not be used.
 * @disable_frame_end_update_cdf: equal to 1 indicates that the end of frame CDF update is
 * disabled; @disable_frame_end_update_cdf equal to 0 indicates that the end of frame CDF
 * update is enabled.
 * @allow_warped_motion: equal to 1 indicates that the syntax element @motion_mode may be
 * present. @allow_warped_motion equal to 0 indicates that the syntax element @motion_mode
 * will not be present (this means that LOCALWARP cannot be signaled if @allow_warped_motion
 * is equal to 0).
 * @reduced_tx_set: equal to 1 specifies that the frame is restricted to a reduced subset of
 * the full set of transform types.
 * @render_and_frame_size_different: equal to 0 means that the render width and height are
 * inferred from the frame width and height. @render_and_frame_size_different equal to 1
 * means that the render width and height are explicitly coded in the bitstream.
 * @use_superres: equal to 0 indicates that no upscaling is needed. @use_superres equal to 1
 * indicates that upscaling is needed.
 * @is_filter_switchable: equal to 1 indicates that the filter selection is signaled at the
 * block level; @is_filter_switchable equal to 0 indicates that the filter selection is
 * signaled at the frame level.
 * @interpolation_filter: a #GstAV1InterpolationFilter that specifies the filter selection used
 * for performing inter prediction.
 * @loop_filter_params: a #GstAV1LoopFilterParams holding the loop filter parameters.
 * @quantization_params: a #GstAV1QuantizationParams holding the quantization parameters.
 * @segmentation_params: a #GstAV1SegmenationParams holding the segmentation parameters.
 * @tile_info: a #GstAV1TileInfo holding the tile info.
 * @cdef_params: a #GstAV1CDEFParams holding the CDEF parameters.
 * @loop_restoration_params: a #GstAV1LoopRestorationParams holding the loop restoration parameters.
 * @tx_mode_select: is used to compute TxMode.
 * @skip_mode_present: equal to 1 specifies that the syntax element @skip_mode will be coded
 * in the bitstream. @skip_mode_present equal to 0 specifies that @skip_mode will not be used
 * for this frame.
 * @reference_select: equal to 1 specifies that the mode info for inter blocks contains the
 * syntax element comp_mode that indicates whether to use single or compound reference
 * prediction. @reference_select equal to 0 specifies that all inter blocks will use single
 * prediction.
 * @global_motion_params: a #GstAV1GlobalMotionParams holding the global motion parameters.
 * @film_grain_params: a #GstAV1FilmGrainParams holding the Film Grain parameters.
 * @superres_denom: is the denominator of a fraction that specifies the ratio between the
 * superblock width before and after upscaling.
 * @frame_is_intra: equal to 0 indicates that this frame may use inter prediction.
 * @order_hints: specifies the expected output order for each reference frame.
 * @ref_frame_sign_bias: specifies the intended direction of the motion vector in time for
 * each reference frame.
 * @coded_lossless: is a variable that is equal to 1 when all segments use lossless encoding.
 * @all_lossless: is a variable that is equal to 1 when @coded_lossless is equal to 1 and
 * @frame_width is equal to @upscaled_width. This indicates that the frame is fully lossless
 * at the upscaled resolution.
 * @lossless_array: indicates, for each segment, whether that segment is lossless.
 * @seg_qm_Level: the segmentation's qm level.
 * @upscaled_width: the upscaled width.
 * @frame_width: the frame width.
 * @frame_height: the frame height.
 * @render_width: the frame width to be rendered.
 * @render_height: the frame height to be rendered.
 * @tx_mode: specifies how the transform size is determined.
 * @skip_mode_frame: specifies the frames to use for compound prediction when @skip_mode is 1.
*/ struct _GstAV1FrameHeaderOBU { gboolean show_existing_frame; gint8 frame_to_show_map_idx; guint32 frame_presentation_time; guint32 tu_presentation_delay; guint32 display_frame_id; GstAV1FrameType frame_type; gboolean show_frame; gboolean showable_frame; gboolean error_resilient_mode; gboolean disable_cdf_update; guint8 allow_screen_content_tools; gboolean force_integer_mv; guint32 current_frame_id; gboolean frame_size_override_flag; guint32 order_hint; guint8 primary_ref_frame; gboolean buffer_removal_time_present_flag; guint32 buffer_removal_time[GST_AV1_MAX_OPERATING_POINTS]; guint8 refresh_frame_flags; guint32 ref_order_hint[GST_AV1_NUM_REF_FRAMES]; gboolean allow_intrabc; gboolean frame_refs_short_signaling; guint8 last_frame_idx; gint8 gold_frame_idx; gint8 ref_frame_idx[GST_AV1_REFS_PER_FRAME]; gboolean allow_high_precision_mv; gboolean is_motion_mode_switchable; gboolean use_ref_frame_mvs; gboolean disable_frame_end_update_cdf; gboolean allow_warped_motion; gboolean reduced_tx_set; gboolean render_and_frame_size_different; gboolean use_superres; gboolean is_filter_switchable; GstAV1InterpolationFilter interpolation_filter; GstAV1LoopFilterParams loop_filter_params; GstAV1QuantizationParams quantization_params; GstAV1SegmenationParams segmentation_params; GstAV1TileInfo tile_info; GstAV1CDEFParams cdef_params; GstAV1LoopRestorationParams loop_restoration_params; gboolean tx_mode_select; gboolean skip_mode_present; gboolean reference_select; GstAV1GlobalMotionParams global_motion_params; GstAV1FilmGrainParams film_grain_params; /* Global vars set by frame header */ guint32 superres_denom; /* SuperresDenom */ guint8 frame_is_intra; /* FrameIsIntra */ guint32 order_hints[GST_AV1_NUM_REF_FRAMES]; /* OrderHints */ guint32 ref_frame_sign_bias[GST_AV1_NUM_REF_FRAMES]; /* RefFrameSignBias */ guint8 coded_lossless; /* CodedLossless */ guint8 all_lossless; /* AllLossless */ guint8 lossless_array[GST_AV1_MAX_SEGMENTS]; /* LosslessArray */ guint8 
seg_qm_Level[3][GST_AV1_MAX_SEGMENTS]; /* SegQMLevel */ guint32 upscaled_width; /* UpscaledWidth */ guint32 frame_width; /* FrameWidth */ guint32 frame_height; /* FrameHeight */ guint32 render_width; /* RenderWidth */ guint32 render_height; /* RenderHeight */ GstAV1TXModes tx_mode; /* TxMode */ guint8 skip_mode_frame[2]; /* SkipModeFrame */ }; /** * GstAV1ReferenceFrameInfo: * * All the info related to a reference frames. */ struct _GstAV1ReferenceFrameInfo { struct { gboolean ref_valid; /* RefValid */ guint32 ref_frame_id; /* RefFrameId */ guint32 ref_upscaled_width; /* RefUpscaledWidth */ guint32 ref_frame_width; /* RefFrameWidth */ guint32 ref_frame_height; /* RefFrameHeight */ guint32 ref_render_width; /* RefRenderWidth */ guint32 ref_render_height; /* RefRenderHeight */ guint32 ref_mi_cols; /* RefMiCols */ guint32 ref_mi_rows; /* RefMiRows */ GstAV1FrameType ref_frame_type; /* RefFrameType */ guint8 ref_subsampling_x; /* RefSubsamplingX */ guint8 ref_subsampling_y; /* RefSubsamplingY */ guint8 ref_bit_depth; /* RefBitDepth */ guint32 ref_order_hint; /* RefOrderHint */ GstAV1SegmenationParams ref_segmentation_params; GstAV1GlobalMotionParams ref_global_motion_params; GstAV1LoopFilterParams ref_lf_params; GstAV1FilmGrainParams ref_film_grain_params; GstAV1TileInfo ref_tile_info; } entry[GST_AV1_NUM_REF_FRAMES]; }; /** * GstAV1TileListOBU: * @output_frame_width_in_tiles_minus_1: plus one is the width of the output frame, in tile units. * @output_frame_height_in_tiles_minus_1: plus one is the height of the output frame, in tile units. * @tile_count_minus_1: plus one is the number of @tile_list_entry in the list. It is a requirement * of bitstream conformance that @tile_count_minus_1 is less than or equal to 511. * @anchor_frame_idx: is the index into an array AnchorFrames of the frames that the tile uses * for prediction. The AnchorFrames array is provided by external means and may change for * each tile list OBU. 
The process for creating the AnchorFrames array is outside of the * scope of this specification. It is a requirement of bitstream conformance that * @anchor_frame_idx is less than or equal to 127. * @anchor_tile_row: the row coordinate of the tile in the frame that it belongs, in tile * units. It is a requirement of bitstream conformance that @anchor_tile_row is less than @tile_rows. * @anchor_tile_col: is the column coordinate of the tile in the frame that it belongs, in tile * units. It is a requirement of bitstream conformance that @anchor_tile_col is less than @tile_cols. * @tile_data_size_minus_1: plus one is the size of the coded tile data, @coded_tile_data, in bytes. * @coded_tile_data: are the @tile_data_size_minus_1 + 1 bytes of the coded tile. */ struct _GstAV1TileListOBU { guint8 output_frame_width_in_tiles_minus_1; guint8 output_frame_height_in_tiles_minus_1; guint16 tile_count_minus_1; struct { gint8 anchor_frame_idx; guint8 anchor_tile_row; guint8 anchor_tile_col; guint16 tile_data_size_minus_1; /* Just refer to obu's data, invalid after OBU data released */ guint8 *coded_tile_data; } entry[GST_AV1_MAX_TILE_COUNT]; }; /** * GstAV1TileListOBU: * @tile_start_and_end_present_flag: specifies whether @tg_start and @tg_end are present * in the bitstream. If @tg_start and @tg_end are not present in the bitstream, this * tile group covers the entire frame. If @obu_type is equal to #GST_AV1_OBU_FRAME, it is a * requirement of bitstream conformance that the value of @tile_start_and_end_present_flag * is equal to 0. * @tg_start: specifies the zero-based index of the first tile in the current tile group. * It is a requirement of bitstream conformance that the value of @tg_start is equal to * the value of TileNum at the point that tile_group_obu is invoked. * @tg_end: specifies the zero-based index of the last tile in the current tile group. * It is a requirement of bitstream conformance that the value of tg_end is greater * than or equal to tg_start. 
It is a requirement of bitstream conformance that the * value of tg_end for the last tile group in each frame is equal to num_tiles-1. * @mi_row_start: start position in mi rows * @mi_row_end: end position in mi rows * @mi_col_start: start position in mi cols * @mi_col_end: end position in mi cols * @num_tiles: specifies the total number of tiles in the frame. */ struct _GstAV1TileGroupOBU { gboolean tile_start_and_end_present_flag; guint8 tg_start; guint8 tg_end; struct { /* global varialbes */ guint32 mi_row_start; /* MiRowStart */ guint32 mi_row_end; /* MiRowEnd */ guint32 mi_col_start; /* MiColStart */ guint32 mi_col_end; /* MiColEnd */ } entry[GST_AV1_MAX_TILE_COUNT]; guint32 num_tiles; /* NumTiles */ }; /** * GstAV1FrameOBU: * @frame_header: a #GstAV1FrameHeaderOBU holding frame_header data. * @tile_group: a #GstAV1TileGroupOBU holding tile_group data. */ struct _GstAV1FrameOBU { GstAV1TileGroupOBU tile_group; GstAV1FrameHeaderOBU frame_header; }; /** * GstAV1Parser: * * #GstAV1Parser opaque structure * * Instantiante it with gst_av1_parser_new() and destroy it with * gst_av1_parser_free() */ struct _GstAV1Parser { /*< private >*/ struct { guint32 operating_point; /* Set by choose_operating_point() */ guint8 seen_frame_header; /* SeenFrameHeader */ guint32 operating_point_idc; /* OperatingPointIdc */ gboolean sequence_changed; /* Received a new sequence */ gboolean begin_first_frame; /* already find the first frame */ /* frame */ guint32 upscaled_width; /* UpscaledWidth */ guint32 frame_width; /* FrameWidth */ guint32 frame_height; /* FrameHeight */ guint32 mi_cols; /* MiCols */ guint32 mi_rows; /* MiRows */ guint32 render_width; /* RenderWidth */ guint32 render_height; /* RenderHeight */ guint32 prev_frame_id; /* PrevFrameID */ guint32 current_frame_id; /* the current frame ID */ GstAV1ReferenceFrameInfo ref_info; /* RefInfo */ guint32 mi_col_starts[GST_AV1_MAX_TILE_COLS + 1]; /* MiColStarts */ guint32 mi_row_starts[GST_AV1_MAX_TILE_ROWS + 1]; /* MiRowStarts 
*/ guint8 tile_cols_log2; /* TileColsLog2 */ guint8 tile_cols; /* TileCols */ guint8 tile_rows_log2; /* TileRowsLog2 */ guint8 tile_rows; /* TileRows */ guint8 tile_size_bytes; /* TileSizeBytes */ } state; gboolean annex_b; guint32 temporal_unit_size; /* consumed of this temporal unit */ guint32 temporal_unit_consumed; guint32 frame_unit_size; /* consumed of this frame unit */ guint32 frame_unit_consumed; GstAV1SequenceHeaderOBU *seq_header; }; GST_CODEC_PARSERS_API void gst_av1_parser_reset (GstAV1Parser * parser, gboolean annex_b); GST_CODEC_PARSERS_API GstAV1ParserResult gst_av1_parser_identify_one_obu (GstAV1Parser * parser, const guint8 * data, guint32 size, GstAV1OBU * obu, guint32 * consumed); GST_CODEC_PARSERS_API GstAV1ParserResult gst_av1_parser_parse_sequence_header_obu (GstAV1Parser * parser, GstAV1OBU * obu, GstAV1SequenceHeaderOBU * seq_header); GST_CODEC_PARSERS_API GstAV1ParserResult gst_av1_parser_parse_temporal_delimiter_obu (GstAV1Parser * parser, GstAV1OBU * obu); GST_CODEC_PARSERS_API GstAV1ParserResult gst_av1_parser_parse_metadata_obu (GstAV1Parser * parser, GstAV1OBU * obu, GstAV1MetadataOBU * metadata); GST_CODEC_PARSERS_API GstAV1ParserResult gst_av1_parser_parse_tile_list_obu (GstAV1Parser * parser, GstAV1OBU * obu, GstAV1TileListOBU * tile_list); GST_CODEC_PARSERS_API GstAV1ParserResult gst_av1_parser_parse_tile_group_obu (GstAV1Parser * parser, GstAV1OBU * obu, GstAV1TileGroupOBU * tile_group); GST_CODEC_PARSERS_API GstAV1ParserResult gst_av1_parser_parse_frame_header_obu (GstAV1Parser * parser, GstAV1OBU * obu, GstAV1FrameHeaderOBU * frame_header); GST_CODEC_PARSERS_API GstAV1ParserResult gst_av1_parser_parse_frame_obu (GstAV1Parser * parser, GstAV1OBU * obu, GstAV1FrameOBU * frame); GST_CODEC_PARSERS_API GstAV1ParserResult gst_av1_parser_reference_frame_loading (GstAV1Parser * parser, GstAV1FrameHeaderOBU * frame_header); GST_CODEC_PARSERS_API GstAV1ParserResult gst_av1_parser_reference_frame_update (GstAV1Parser * parser, 
GstAV1FrameHeaderOBU * frame_header); GST_CODEC_PARSERS_API GstAV1Parser * gst_av1_parser_new (void); GST_CODEC_PARSERS_API void gst_av1_parser_free (GstAV1Parser * parser); G_END_DECLS #endif /* __GST_AV1_PARSER_H__ */