/* GStreamer AAC parser plugin * Copyright (C) 2008 Nokia Corporation. All rights reserved. * * Contact: Stefan Kost * * This library is free software; you can redistribute it and/or * modify it under the terms of the GNU Library General Public * License as published by the Free Software Foundation; either * version 2 of the License, or (at your option) any later version. * * This library is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU * Library General Public License for more details. * * You should have received a copy of the GNU Library General Public * License along with this library; if not, write to the * Free Software Foundation, Inc., 51 Franklin St, Fifth Floor, * Boston, MA 02110-1301, USA. */ /** * SECTION:element-aacparse * @short_description: AAC parser * @see_also: #GstAmrParse * * This is an AAC parser which handles both ADIF and ADTS stream formats. * * As ADIF format is not framed, it is not seekable and stream duration cannot * be determined either. However, ADTS format AAC clips can be seeked, and parser * can also estimate playback position and clip duration. * * * Example launch line * |[ * gst-launch-1.0 filesrc location=abc.aac ! aacparse ! faad ! audioresample ! audioconvert ! alsasink * ]| * */ #ifdef HAVE_CONFIG_H #include "config.h" #endif #include #include #include #include "gstaacparse.h" static GstStaticPadTemplate src_template = GST_STATIC_PAD_TEMPLATE ("src", GST_PAD_SRC, GST_PAD_ALWAYS, GST_STATIC_CAPS ("audio/mpeg, " "framed = (boolean) true, " "mpegversion = (int) { 2, 4 }, " "stream-format = (string) { raw, adts, adif, loas };")); static GstStaticPadTemplate sink_template = GST_STATIC_PAD_TEMPLATE ("sink", GST_PAD_SINK, GST_PAD_ALWAYS, GST_STATIC_CAPS ("audio/mpeg, mpegversion = (int) { 2, 4 };")); GST_DEBUG_CATEGORY_STATIC (aacparse_debug); #define GST_CAT_DEFAULT aacparse_debug #define ADIF_MAX_SIZE 40 /* Should be enough */ #define ADTS_MAX_SIZE 10 /* Should be enough */ #define LOAS_MAX_SIZE 3 /* Should be enough */ #define AAC_FRAME_DURATION(parse) (GST_SECOND/parse->frames_per_sec) static const gint loas_sample_rate_table[32] = { 96000, 88200, 64000, 48000, 44100, 32000, 24000, 22050, 16000, 12000, 11025, 8000, 7350, 0, 0, 0 }; static const gint loas_channels_table[32] = { 0, 1, 2, 3, 4, 5, 6, 8, 0, 0, 0, 0, 0, 0, 0, 0 }; static gboolean gst_aac_parse_start (GstBaseParse * parse); static gboolean gst_aac_parse_stop (GstBaseParse * parse); static gboolean gst_aac_parse_sink_setcaps (GstBaseParse * parse, GstCaps * caps); static GstCaps *gst_aac_parse_sink_getcaps (GstBaseParse * parse, GstCaps * filter); static GstFlowReturn gst_aac_parse_handle_frame (GstBaseParse * parse, GstBaseParseFrame * frame, gint * skipsize); static GstFlowReturn gst_aac_parse_pre_push_frame (GstBaseParse * parse, GstBaseParseFrame * frame); G_DEFINE_TYPE (GstAacParse, gst_aac_parse, GST_TYPE_BASE_PARSE); /** * gst_aac_parse_class_init: * @klass: #GstAacParseClass. * */ static void gst_aac_parse_class_init (GstAacParseClass * klass) { GstElementClass *element_class = GST_ELEMENT_CLASS (klass); GstBaseParseClass *parse_class = GST_BASE_PARSE_CLASS (klass); GST_DEBUG_CATEGORY_INIT (aacparse_debug, "aacparse", 0, "AAC audio stream parser"); gst_element_class_add_pad_template (element_class, gst_static_pad_template_get (&sink_template)); gst_element_class_add_pad_template (element_class, gst_static_pad_template_get (&src_template)); gst_element_class_set_static_metadata (element_class, "AAC audio stream parser", "Codec/Parser/Audio", "Advanced Audio Coding parser", "Stefan Kost "); parse_class->start = GST_DEBUG_FUNCPTR (gst_aac_parse_start); parse_class->stop = GST_DEBUG_FUNCPTR (gst_aac_parse_stop); parse_class->set_sink_caps = GST_DEBUG_FUNCPTR (gst_aac_parse_sink_setcaps); parse_class->get_sink_caps = GST_DEBUG_FUNCPTR (gst_aac_parse_sink_getcaps); parse_class->handle_frame = GST_DEBUG_FUNCPTR (gst_aac_parse_handle_frame); parse_class->pre_push_frame = GST_DEBUG_FUNCPTR (gst_aac_parse_pre_push_frame); } /** * gst_aac_parse_init: * @aacparse: #GstAacParse. * @klass: #GstAacParseClass. * */ static void gst_aac_parse_init (GstAacParse * aacparse) { GST_DEBUG ("initialized"); } /** * gst_aac_parse_set_src_caps: * @aacparse: #GstAacParse. * @sink_caps: (proposed) caps of sink pad * * Set source pad caps according to current knowledge about the * audio stream. * * Returns: TRUE if caps were successfully set. */ static gboolean gst_aac_parse_set_src_caps (GstAacParse * aacparse, GstCaps * sink_caps) { GstStructure *s; GstCaps *src_caps = NULL, *allowed; gboolean res = FALSE; const gchar *stream_format; GstBuffer *codec_data; guint16 codec_data_data; GST_DEBUG_OBJECT (aacparse, "sink caps: %" GST_PTR_FORMAT, sink_caps); if (sink_caps) src_caps = gst_caps_copy (sink_caps); else src_caps = gst_caps_new_empty_simple ("audio/mpeg"); gst_caps_set_simple (src_caps, "framed", G_TYPE_BOOLEAN, TRUE, "mpegversion", G_TYPE_INT, aacparse->mpegversion, NULL); aacparse->output_header_type = aacparse->header_type; switch (aacparse->header_type) { case DSPAAC_HEADER_NONE: stream_format = "raw"; break; case DSPAAC_HEADER_ADTS: stream_format = "adts"; break; case DSPAAC_HEADER_ADIF: stream_format = "adif"; break; case DSPAAC_HEADER_LOAS: stream_format = "loas"; break; default: stream_format = NULL; } s = gst_caps_get_structure (src_caps, 0); if (aacparse->sample_rate > 0) gst_structure_set (s, "rate", G_TYPE_INT, aacparse->sample_rate, NULL); if (aacparse->channels > 0) gst_structure_set (s, "channels", G_TYPE_INT, aacparse->channels, NULL); if (stream_format) gst_structure_set (s, "stream-format", G_TYPE_STRING, stream_format, NULL); allowed = gst_pad_get_allowed_caps (GST_BASE_PARSE (aacparse)->srcpad); if (!gst_caps_can_intersect (src_caps, allowed)) { GST_DEBUG_OBJECT (GST_BASE_PARSE (aacparse)->srcpad, "Caps can not intersect"); if (aacparse->header_type == DSPAAC_HEADER_ADTS) { GST_DEBUG_OBJECT (GST_BASE_PARSE (aacparse)->srcpad, "Input is ADTS, trying raw"); gst_caps_set_simple (src_caps, "stream-format", G_TYPE_STRING, "raw", NULL); if (gst_caps_can_intersect (src_caps, allowed)) { GstMapInfo map; int idx; idx = gst_codec_utils_aac_get_index_from_sample_rate (aacparse->sample_rate); if (idx < 0) goto not_a_known_rate; GST_DEBUG_OBJECT (GST_BASE_PARSE (aacparse)->srcpad, "Caps can intersect, we will drop the ADTS layer"); aacparse->output_header_type = DSPAAC_HEADER_NONE; /* The codec_data data is according to AudioSpecificConfig, ISO/IEC 14496-3, 1.6.2.1 */ codec_data = gst_buffer_new_and_alloc (2); gst_buffer_map (codec_data, &map, GST_MAP_WRITE); codec_data_data = (aacparse->object_type << 11) | (idx << 7) | (aacparse->channels << 3); GST_WRITE_UINT16_BE (map.data, codec_data_data); gst_buffer_unmap (codec_data, &map); gst_caps_set_simple (src_caps, "codec_data", GST_TYPE_BUFFER, codec_data, NULL); } } } gst_caps_unref (allowed); GST_DEBUG_OBJECT (aacparse, "setting src caps: %" GST_PTR_FORMAT, src_caps); res = gst_pad_set_caps (GST_BASE_PARSE (aacparse)->srcpad, src_caps); gst_caps_unref (src_caps); return res; not_a_known_rate: gst_caps_unref (allowed); gst_caps_unref (src_caps); return FALSE; } /** * gst_aac_parse_sink_setcaps: * @sinkpad: GstPad * @caps: GstCaps * * Implementation of "set_sink_caps" vmethod in #GstBaseParse class. * * Returns: TRUE on success. */ static gboolean gst_aac_parse_sink_setcaps (GstBaseParse * parse, GstCaps * caps) { GstAacParse *aacparse; GstStructure *structure; gchar *caps_str; const GValue *value; aacparse = GST_AAC_PARSE (parse); structure = gst_caps_get_structure (caps, 0); caps_str = gst_caps_to_string (caps); GST_DEBUG_OBJECT (aacparse, "setcaps: %s", caps_str); g_free (caps_str); /* This is needed at least in case of RTP * Parses the codec_data information to get ObjectType, * number of channels and samplerate */ value = gst_structure_get_value (structure, "codec_data"); if (value) { GstBuffer *buf = gst_value_get_buffer (value); if (buf) { GstMapInfo map; guint sr_idx; gst_buffer_map (buf, &map, GST_MAP_READ); sr_idx = ((map.data[0] & 0x07) << 1) | ((map.data[1] & 0x80) >> 7); aacparse->object_type = (map.data[0] & 0xf8) >> 3; aacparse->sample_rate = gst_codec_utils_aac_get_sample_rate_from_index (sr_idx); aacparse->channels = (map.data[1] & 0x78) >> 3; aacparse->header_type = DSPAAC_HEADER_NONE; aacparse->mpegversion = 4; aacparse->frame_samples = (map.data[1] & 4) ? 960 : 1024; gst_buffer_unmap (buf, &map); GST_DEBUG ("codec_data: object_type=%d, sample_rate=%d, channels=%d, " "samples=%d", aacparse->object_type, aacparse->sample_rate, aacparse->channels, aacparse->frame_samples); /* arrange for metadata and get out of the way */ gst_aac_parse_set_src_caps (aacparse, caps); gst_base_parse_set_passthrough (parse, TRUE); } else return FALSE; /* caps info overrides */ gst_structure_get_int (structure, "rate", &aacparse->sample_rate); gst_structure_get_int (structure, "channels", &aacparse->channels); } else { aacparse->sample_rate = 0; aacparse->channels = 0; aacparse->header_type = DSPAAC_HEADER_NOT_PARSED; gst_base_parse_set_passthrough (parse, FALSE); } return TRUE; } /** * gst_aac_parse_adts_get_frame_len: * @data: block of data containing an ADTS header. * * This function calculates ADTS frame length from the given header. * * Returns: size of the ADTS frame. */ static inline guint gst_aac_parse_adts_get_frame_len (const guint8 * data) { return ((data[3] & 0x03) << 11) | (data[4] << 3) | ((data[5] & 0xe0) >> 5); } /** * gst_aac_parse_check_adts_frame: * @aacparse: #GstAacParse. * @data: Data to be checked. * @avail: Amount of data passed. * @framesize: If valid ADTS frame was found, this will be set to tell the * found frame size in bytes. * @needed_data: If frame was not found, this may be set to tell how much * more data is needed in the next round to detect the frame * reliably. This may happen when a frame header candidate * is found but it cannot be guaranteed to be the header without * peeking the following data. * * Check if the given data contains contains ADTS frame. The algorithm * will examine ADTS frame header and calculate the frame size. Also, another * consecutive ADTS frame header need to be present after the found frame. * Otherwise the data is not considered as a valid ADTS frame. However, this * "extra check" is omitted when EOS has been received. In this case it is * enough when data[0] contains a valid ADTS header. * * This function may set the #needed_data to indicate that a possible frame * candidate has been found, but more data (#needed_data bytes) is needed to * be absolutely sure. When this situation occurs, FALSE will be returned. * * When a valid frame is detected, this function will use * gst_base_parse_set_min_frame_size() function from #GstBaseParse class * to set the needed bytes for next frame.This way next data chunk is already * of correct size. * * Returns: TRUE if the given data contains a valid ADTS header. */ static gboolean gst_aac_parse_check_adts_frame (GstAacParse * aacparse, const guint8 * data, const guint avail, gboolean drain, guint * framesize, guint * needed_data) { *needed_data = 0; if (G_UNLIKELY (avail < 2)) return FALSE; if ((data[0] == 0xff) && ((data[1] & 0xf6) == 0xf0)) { *framesize = gst_aac_parse_adts_get_frame_len (data); /* In EOS mode this is enough. No need to examine the data further. We also relax the check when we have sync, on the assumption that if we're not looking at random data, we have a much higher chance to get the correct sync, and this avoids losing two frames when a single bit corruption happens. */ if (drain || !GST_BASE_PARSE_LOST_SYNC (aacparse)) { return TRUE; } if (*framesize + ADTS_MAX_SIZE > avail) { /* We have found a possible frame header candidate, but can't be sure since we don't have enough data to check the next frame */ GST_DEBUG ("NEED MORE DATA: we need %d, available %d", *framesize + ADTS_MAX_SIZE, avail); *needed_data = *framesize + ADTS_MAX_SIZE; gst_base_parse_set_min_frame_size (GST_BASE_PARSE (aacparse), *framesize + ADTS_MAX_SIZE); return FALSE; } if ((data[*framesize] == 0xff) && ((data[*framesize + 1] & 0xf6) == 0xf0)) { guint nextlen = gst_aac_parse_adts_get_frame_len (data + (*framesize)); GST_LOG ("ADTS frame found, len: %d bytes", *framesize); gst_base_parse_set_min_frame_size (GST_BASE_PARSE (aacparse), nextlen + ADTS_MAX_SIZE); return TRUE; } } return FALSE; } static gboolean gst_aac_parse_latm_get_value (GstAacParse * aacparse, GstBitReader * br, guint32 * value) { guint8 bytes, i, byte; *value = 0; if (!gst_bit_reader_get_bits_uint8 (br, &bytes, 2)) return FALSE; for (i = 0; i < bytes; ++i) { *value <<= 8; if (!gst_bit_reader_get_bits_uint8 (br, &byte, 8)) return FALSE; *value += byte; } return TRUE; } static gboolean gst_aac_parse_get_audio_object_type (GstAacParse * aacparse, GstBitReader * br, guint8 * audio_object_type) { if (!gst_bit_reader_get_bits_uint8 (br, audio_object_type, 5)) return FALSE; if (*audio_object_type == 31) { if (!gst_bit_reader_get_bits_uint8 (br, audio_object_type, 6)) return FALSE; *audio_object_type += 32; } GST_LOG_OBJECT (aacparse, "audio object type %u", *audio_object_type); return TRUE; } static gboolean gst_aac_parse_get_audio_sample_rate (GstAacParse * aacparse, GstBitReader * br, gint * sample_rate) { guint8 sampling_frequency_index; if (!gst_bit_reader_get_bits_uint8 (br, &sampling_frequency_index, 4)) return FALSE; GST_LOG_OBJECT (aacparse, "sampling_frequency_index: %u", sampling_frequency_index); if (sampling_frequency_index == 0xf) { guint32 sampling_rate; if (!gst_bit_reader_get_bits_uint32 (br, &sampling_rate, 24)) return FALSE; *sample_rate = sampling_rate; } else { *sample_rate = loas_sample_rate_table[sampling_frequency_index]; if (!*sample_rate) return FALSE; } return TRUE; } /* See table 1.13 in ISO/IEC 14496-3 */ static gboolean gst_aac_parse_read_loas_audio_specific_config (GstAacParse * aacparse, GstBitReader * br, gint * sample_rate, gint * channels, guint32 * bits) { guint8 audio_object_type, channel_configuration; if (!gst_aac_parse_get_audio_object_type (aacparse, br, &audio_object_type)) return FALSE; if (!gst_aac_parse_get_audio_sample_rate (aacparse, br, sample_rate)) return FALSE; if (!gst_bit_reader_get_bits_uint8 (br, &channel_configuration, 4)) return FALSE; GST_LOG_OBJECT (aacparse, "channel_configuration: %d", channel_configuration); *channels = loas_channels_table[channel_configuration]; if (!*channels) return FALSE; if (audio_object_type == 5) { GST_LOG_OBJECT (aacparse, "Audio object type 5, so rereading sampling rate..."); if (!gst_aac_parse_get_audio_sample_rate (aacparse, br, sample_rate)) return FALSE; } GST_INFO_OBJECT (aacparse, "Found LOAS config: %d Hz, %d channels", *sample_rate, *channels); /* There's LOTS of stuff next, but we ignore it for now as we have what we want (sample rate and number of channels */ GST_DEBUG_OBJECT (aacparse, "Need more code to parse humongous LOAS data, currently ignored"); if (bits) *bits = 0; return TRUE; } static gboolean gst_aac_parse_read_loas_config (GstAacParse * aacparse, const guint8 * data, guint avail, gint * sample_rate, gint * channels, gint * version) { GstBitReader br; guint8 u8, v, vA; /* No version in the bitstream, but the spec has LOAS in the MPEG-4 section */ if (version) *version = 4; gst_bit_reader_init (&br, data, avail); /* skip sync word (11 bits) and size (13 bits) */ if (!gst_bit_reader_skip (&br, 11 + 13)) return FALSE; /* First bit is "use last config" */ if (!gst_bit_reader_get_bits_uint8 (&br, &u8, 1)) return FALSE; if (u8) { GST_DEBUG_OBJECT (aacparse, "Frame uses previous config"); if (!aacparse->sample_rate || !aacparse->channels) { GST_WARNING_OBJECT (aacparse, "No previous config to use"); } *sample_rate = aacparse->sample_rate; *channels = aacparse->channels; return TRUE; } GST_DEBUG_OBJECT (aacparse, "Frame contains new config"); if (!gst_bit_reader_get_bits_uint8 (&br, &v, 1)) return FALSE; if (v) { if (!gst_bit_reader_get_bits_uint8 (&br, &vA, 1)) return FALSE; } else vA = 0; GST_LOG_OBJECT (aacparse, "v %d, vA %d", v, vA); if (vA == 0) { guint8 same_time, subframes, num_program, prog; if (v == 1) { guint32 value; if (!gst_aac_parse_latm_get_value (aacparse, &br, &value)) return FALSE; } if (!gst_bit_reader_get_bits_uint8 (&br, &same_time, 1)) return FALSE; if (!gst_bit_reader_get_bits_uint8 (&br, &subframes, 6)) return FALSE; if (!gst_bit_reader_get_bits_uint8 (&br, &num_program, 4)) return FALSE; GST_LOG_OBJECT (aacparse, "same_time %d, subframes %d, num_program %d", same_time, subframes, num_program); for (prog = 0; prog <= num_program; ++prog) { guint8 num_layer, layer; if (!gst_bit_reader_get_bits_uint8 (&br, &num_layer, 3)) return FALSE; GST_LOG_OBJECT (aacparse, "Program %d: %d layers", prog, num_layer); for (layer = 0; layer <= num_layer; ++layer) { guint8 use_same_config; if (prog == 0 && layer == 0) { use_same_config = 0; } else { if (!gst_bit_reader_get_bits_uint8 (&br, &use_same_config, 1)) return FALSE; } if (!use_same_config) { if (v == 0) { if (!gst_aac_parse_read_loas_audio_specific_config (aacparse, &br, sample_rate, channels, NULL)) return FALSE; } else { guint32 bits, asc_len; if (!gst_aac_parse_latm_get_value (aacparse, &br, &asc_len)) return FALSE; if (!gst_aac_parse_read_loas_audio_specific_config (aacparse, &br, sample_rate, channels, &bits)) return FALSE; asc_len -= bits; if (!gst_bit_reader_skip (&br, asc_len)) return FALSE; } } } } GST_LOG_OBJECT (aacparse, "More data ignored"); } else { GST_WARNING_OBJECT (aacparse, "Spec says \"TBD\"..."); } return TRUE; } /** * gst_aac_parse_loas_get_frame_len: * @data: block of data containing a LOAS header. * * This function calculates LOAS frame length from the given header. * * Returns: size of the LOAS frame. */ static inline guint gst_aac_parse_loas_get_frame_len (const guint8 * data) { return (((data[1] & 0x1f) << 8) | data[2]) + 3; } /** * gst_aac_parse_check_loas_frame: * @aacparse: #GstAacParse. * @data: Data to be checked. * @avail: Amount of data passed. * @framesize: If valid LOAS frame was found, this will be set to tell the * found frame size in bytes. * @needed_data: If frame was not found, this may be set to tell how much * more data is needed in the next round to detect the frame * reliably. This may happen when a frame header candidate * is found but it cannot be guaranteed to be the header without * peeking the following data. * * Check if the given data contains contains LOAS frame. The algorithm * will examine LOAS frame header and calculate the frame size. Also, another * consecutive LOAS frame header need to be present after the found frame. * Otherwise the data is not considered as a valid LOAS frame. However, this * "extra check" is omitted when EOS has been received. In this case it is * enough when data[0] contains a valid LOAS header. * * This function may set the #needed_data to indicate that a possible frame * candidate has been found, but more data (#needed_data bytes) is needed to * be absolutely sure. When this situation occurs, FALSE will be returned. * * When a valid frame is detected, this function will use * gst_base_parse_set_min_frame_size() function from #GstBaseParse class * to set the needed bytes for next frame.This way next data chunk is already * of correct size. * * LOAS can have three different formats, if I read the spec correctly. Only * one of them is supported here, as the two samples I have use this one. * * Returns: TRUE if the given data contains a valid LOAS header. */ static gboolean gst_aac_parse_check_loas_frame (GstAacParse * aacparse, const guint8 * data, const guint avail, gboolean drain, guint * framesize, guint * needed_data) { *needed_data = 0; /* 3 byte header */ if (G_UNLIKELY (avail < 3)) return FALSE; if ((data[0] == 0x56) && ((data[1] & 0xe0) == 0xe0)) { *framesize = gst_aac_parse_loas_get_frame_len (data); GST_DEBUG_OBJECT (aacparse, "Found %u byte LOAS frame", *framesize); /* In EOS mode this is enough. No need to examine the data further. We also relax the check when we have sync, on the assumption that if we're not looking at random data, we have a much higher chance to get the correct sync, and this avoids losing two frames when a single bit corruption happens. */ if (drain || !GST_BASE_PARSE_LOST_SYNC (aacparse)) { return TRUE; } if (*framesize + LOAS_MAX_SIZE > avail) { /* We have found a possible frame header candidate, but can't be sure since we don't have enough data to check the next frame */ GST_DEBUG ("NEED MORE DATA: we need %d, available %d", *framesize + LOAS_MAX_SIZE, avail); *needed_data = *framesize + LOAS_MAX_SIZE; gst_base_parse_set_min_frame_size (GST_BASE_PARSE (aacparse), *framesize + LOAS_MAX_SIZE); return FALSE; } if ((data[*framesize] == 0x56) && ((data[*framesize + 1] & 0xe0) == 0xe0)) { guint nextlen = gst_aac_parse_loas_get_frame_len (data + (*framesize)); GST_LOG ("LOAS frame found, len: %d bytes", *framesize); gst_base_parse_set_min_frame_size (GST_BASE_PARSE (aacparse), nextlen + LOAS_MAX_SIZE); return TRUE; } } return FALSE; } /* caller ensure sufficient data */ static inline void gst_aac_parse_parse_adts_header (GstAacParse * aacparse, const guint8 * data, gint * rate, gint * channels, gint * object, gint * version) { if (rate) { gint sr_idx = (data[2] & 0x3c) >> 2; *rate = gst_codec_utils_aac_get_sample_rate_from_index (sr_idx); } if (channels) *channels = ((data[2] & 0x01) << 2) | ((data[3] & 0xc0) >> 6); if (version) *version = (data[1] & 0x08) ? 2 : 4; if (object) *object = ((data[2] & 0xc0) >> 6) + 1; } /** * gst_aac_parse_detect_stream: * @aacparse: #GstAacParse. * @data: A block of data that needs to be examined for stream characteristics. * @avail: Size of the given datablock. * @framesize: If valid stream was found, this will be set to tell the * first frame size in bytes. * @skipsize: If valid stream was found, this will be set to tell the first * audio frame position within the given data. * * Examines the given piece of data and try to detect the format of it. It * checks for "ADIF" header (in the beginning of the clip) and ADTS frame * header. If the stream is detected, TRUE will be returned and #framesize * is set to indicate the found frame size. Additionally, #skipsize might * be set to indicate the number of bytes that need to be skipped, a.k.a. the * position of the frame inside given data chunk. * * Returns: TRUE on success. */ static gboolean gst_aac_parse_detect_stream (GstAacParse * aacparse, const guint8 * data, const guint avail, gboolean drain, guint * framesize, gint * skipsize) { gboolean found = FALSE; guint need_data_adts = 0, need_data_loas; guint i = 0; GST_DEBUG_OBJECT (aacparse, "Parsing header data"); /* FIXME: No need to check for ADIF if we are not in the beginning of the stream */ /* Can we even parse the header? */ if (avail < MAX (ADTS_MAX_SIZE, LOAS_MAX_SIZE)) { GST_DEBUG_OBJECT (aacparse, "Not enough data to check"); return FALSE; } for (i = 0; i < avail - 4; i++) { if (((data[i] == 0xff) && ((data[i + 1] & 0xf6) == 0xf0)) || ((data[0] == 0x56) && ((data[1] & 0xe0) == 0xe0)) || strncmp ((char *) data + i, "ADIF", 4) == 0) { GST_DEBUG_OBJECT (aacparse, "Found signature at offset %u", i); found = TRUE; if (i) { /* Trick: tell the parent class that we didn't find the frame yet, but make it skip 'i' amount of bytes. Next time we arrive here we have full frame in the beginning of the data. */ *skipsize = i; return FALSE; } break; } } if (!found) { if (i) *skipsize = i; return FALSE; } if (gst_aac_parse_check_adts_frame (aacparse, data, avail, drain, framesize, &need_data_adts)) { gint rate, channels; GST_INFO ("ADTS ID: %d, framesize: %d", (data[1] & 0x08) >> 3, *framesize); gst_aac_parse_parse_adts_header (aacparse, data, &rate, &channels, &aacparse->object_type, &aacparse->mpegversion); if (!channels || !framesize) { GST_DEBUG_OBJECT (aacparse, "impossible ADTS configuration"); return FALSE; } aacparse->header_type = DSPAAC_HEADER_ADTS; gst_base_parse_set_frame_rate (GST_BASE_PARSE (aacparse), rate, aacparse->frame_samples, 2, 2); GST_DEBUG ("ADTS: samplerate %d, channels %d, objtype %d, version %d", rate, channels, aacparse->object_type, aacparse->mpegversion); gst_base_parse_set_syncable (GST_BASE_PARSE (aacparse), TRUE); return TRUE; } if (gst_aac_parse_check_loas_frame (aacparse, data, avail, drain, framesize, &need_data_loas)) { gint rate, channels; GST_INFO ("LOAS, framesize: %d", *framesize); aacparse->header_type = DSPAAC_HEADER_LOAS; if (!gst_aac_parse_read_loas_config (aacparse, data, avail, &rate, &channels, &aacparse->mpegversion)) { GST_WARNING_OBJECT (aacparse, "Error reading LOAS config"); return FALSE; } if (rate && channels) { gst_base_parse_set_frame_rate (GST_BASE_PARSE (aacparse), rate, aacparse->frame_samples, 2, 2); GST_DEBUG ("LOAS: samplerate %d, channels %d, objtype %d, version %d", rate, channels, aacparse->object_type, aacparse->mpegversion); aacparse->sample_rate = rate; aacparse->channels = channels; } gst_base_parse_set_syncable (GST_BASE_PARSE (aacparse), TRUE); return TRUE; } if (need_data_adts || need_data_loas) { /* This tells the parent class not to skip any data */ *skipsize = 0; return FALSE; } if (avail < ADIF_MAX_SIZE) return FALSE; if (memcmp (data + i, "ADIF", 4) == 0) { const guint8 *adif; int skip_size = 0; int bitstream_type; int sr_idx; GstCaps *sinkcaps; aacparse->header_type = DSPAAC_HEADER_ADIF; aacparse->mpegversion = 4; /* Skip the "ADIF" bytes */ adif = data + i + 4; /* copyright string */ if (adif[0] & 0x80) skip_size += 9; /* skip 9 bytes */ bitstream_type = adif[0 + skip_size] & 0x10; aacparse->bitrate = ((unsigned int) (adif[0 + skip_size] & 0x0f) << 19) | ((unsigned int) adif[1 + skip_size] << 11) | ((unsigned int) adif[2 + skip_size] << 3) | ((unsigned int) adif[3 + skip_size] & 0xe0); /* CBR */ if (bitstream_type == 0) { #if 0 /* Buffer fullness parsing. Currently not needed... */ guint num_elems = 0; guint fullness = 0; num_elems = (adif[3 + skip_size] & 0x1e); GST_INFO ("ADIF num_config_elems: %d", num_elems); fullness = ((unsigned int) (adif[3 + skip_size] & 0x01) << 19) | ((unsigned int) adif[4 + skip_size] << 11) | ((unsigned int) adif[5 + skip_size] << 3) | ((unsigned int) (adif[6 + skip_size] & 0xe0) >> 5); GST_INFO ("ADIF buffer fullness: %d", fullness); #endif aacparse->object_type = ((adif[6 + skip_size] & 0x01) << 1) | ((adif[7 + skip_size] & 0x80) >> 7); sr_idx = (adif[7 + skip_size] & 0x78) >> 3; } /* VBR */ else { aacparse->object_type = (adif[4 + skip_size] & 0x18) >> 3; sr_idx = ((adif[4 + skip_size] & 0x07) << 1) | ((adif[5 + skip_size] & 0x80) >> 7); } /* FIXME: This gives totally wrong results. Duration calculation cannot be based on this */ aacparse->sample_rate = gst_codec_utils_aac_get_sample_rate_from_index (sr_idx); /* baseparse is not given any fps, * so it will give up on timestamps, seeking, etc */ /* FIXME: Can we assume this? */ aacparse->channels = 2; GST_INFO ("ADIF: br=%d, samplerate=%d, objtype=%d", aacparse->bitrate, aacparse->sample_rate, aacparse->object_type); gst_base_parse_set_min_frame_size (GST_BASE_PARSE (aacparse), 512); /* arrange for metadata and get out of the way */ sinkcaps = gst_pad_get_current_caps (GST_BASE_PARSE_SINK_PAD (aacparse)); gst_aac_parse_set_src_caps (aacparse, sinkcaps); if (sinkcaps) gst_caps_unref (sinkcaps); /* not syncable, not easily seekable (unless we push data from start */ gst_base_parse_set_syncable (GST_BASE_PARSE_CAST (aacparse), FALSE); gst_base_parse_set_passthrough (GST_BASE_PARSE_CAST (aacparse), TRUE); gst_base_parse_set_average_bitrate (GST_BASE_PARSE_CAST (aacparse), 0); *framesize = avail; return TRUE; } /* This should never happen */ return FALSE; } /** * gst_aac_parse_check_valid_frame: * @parse: #GstBaseParse. * @frame: #GstBaseParseFrame. * @skipsize: How much data parent class should skip in order to find the * frame header. * * Implementation of "handle_frame" vmethod in #GstBaseParse class. * * Also determines frame overhead. * ADTS streams have a 7 byte header in each frame. MP4 and ADIF streams don't have * a per-frame header. LOAS has 3 bytes. * * We're making a couple of simplifying assumptions: * * 1. We count Program Configuration Elements rather than searching for them * in the streams to discount them - the overhead is negligible. * * 2. We ignore CRC. This has a worst-case impact of (num_raw_blocks + 1)*16 * bits, which should still not be significant enough to warrant the * additional parsing through the headers * * Returns: a #GstFlowReturn. */ static GstFlowReturn gst_aac_parse_handle_frame (GstBaseParse * parse, GstBaseParseFrame * frame, gint * skipsize) { GstMapInfo map; GstAacParse *aacparse; gboolean ret = FALSE; gboolean lost_sync; GstBuffer *buffer; guint framesize; gint rate, channels; aacparse = GST_AAC_PARSE (parse); buffer = frame->buffer; gst_buffer_map (buffer, &map, GST_MAP_READ); *skipsize = -1; lost_sync = GST_BASE_PARSE_LOST_SYNC (parse); if (aacparse->header_type == DSPAAC_HEADER_ADIF || aacparse->header_type == DSPAAC_HEADER_NONE) { /* There is nothing to parse */ framesize = map.size; ret = TRUE; } else if (aacparse->header_type == DSPAAC_HEADER_NOT_PARSED || lost_sync) { ret = gst_aac_parse_detect_stream (aacparse, map.data, map.size, GST_BASE_PARSE_DRAINING (parse), &framesize, skipsize); } else if (aacparse->header_type == DSPAAC_HEADER_ADTS) { guint needed_data = 1024; ret = gst_aac_parse_check_adts_frame (aacparse, map.data, map.size, GST_BASE_PARSE_DRAINING (parse), &framesize, &needed_data); if (!ret) { GST_DEBUG ("buffer didn't contain valid frame"); gst_base_parse_set_min_frame_size (GST_BASE_PARSE (aacparse), needed_data); } } else if (aacparse->header_type == DSPAAC_HEADER_LOAS) { guint needed_data = 1024; ret = gst_aac_parse_check_loas_frame (aacparse, map.data, map.size, GST_BASE_PARSE_DRAINING (parse), &framesize, &needed_data); if (!ret) { GST_DEBUG ("buffer didn't contain valid frame"); gst_base_parse_set_min_frame_size (GST_BASE_PARSE (aacparse), needed_data); } } else { GST_DEBUG ("buffer didn't contain valid frame"); gst_base_parse_set_min_frame_size (GST_BASE_PARSE (aacparse), ADTS_MAX_SIZE); } if (G_UNLIKELY (!ret)) goto exit; if (aacparse->header_type == DSPAAC_HEADER_ADTS) { /* see above */ frame->overhead = 7; gst_aac_parse_parse_adts_header (aacparse, map.data, &rate, &channels, NULL, NULL); GST_LOG_OBJECT (aacparse, "rate: %d, chans: %d", rate, channels); if (G_UNLIKELY (rate != aacparse->sample_rate || channels != aacparse->channels)) { aacparse->sample_rate = rate; aacparse->channels = channels; if (!gst_aac_parse_set_src_caps (aacparse, NULL)) { /* If linking fails, we need to return appropriate error */ ret = GST_FLOW_NOT_LINKED; } gst_base_parse_set_frame_rate (GST_BASE_PARSE (aacparse), aacparse->sample_rate, aacparse->frame_samples, 2, 2); } } else if (aacparse->header_type == DSPAAC_HEADER_LOAS) { gboolean setcaps = FALSE; /* see above */ frame->overhead = 3; if (!gst_aac_parse_read_loas_config (aacparse, map.data, map.size, &rate, &channels, NULL)) { GST_WARNING_OBJECT (aacparse, "Error reading LOAS config"); } else if (G_UNLIKELY (rate != aacparse->sample_rate || channels != aacparse->channels)) { aacparse->sample_rate = rate; aacparse->channels = channels; setcaps = TRUE; GST_INFO_OBJECT (aacparse, "New LOAS config: %d Hz, %d channels", rate, channels); } /* We want to set caps both at start, and when rate/channels change. Since only some LOAS frames have that info, we may receive frames before knowing about rate/channels. */ if (setcaps || !gst_pad_has_current_caps (GST_BASE_PARSE_SRC_PAD (aacparse))) { if (!gst_aac_parse_set_src_caps (aacparse, NULL)) { /* If linking fails, we need to return appropriate error */ ret = GST_FLOW_NOT_LINKED; } gst_base_parse_set_frame_rate (GST_BASE_PARSE (aacparse), aacparse->sample_rate, aacparse->frame_samples, 2, 2); } } exit: gst_buffer_unmap (buffer, &map); if (ret) { /* found, skip if needed */ if (*skipsize > 0) return GST_FLOW_OK; *skipsize = 0; } else { if (*skipsize < 0) *skipsize = 1; } if (ret && framesize <= map.size) { return gst_base_parse_finish_frame (parse, frame, framesize); } return GST_FLOW_OK; } static GstFlowReturn gst_aac_parse_pre_push_frame (GstBaseParse * parse, GstBaseParseFrame * frame) { GstAacParse *aacparse = GST_AAC_PARSE (parse); /* As a special case, we can remove the ADTS framing and output raw AAC. */ if (aacparse->header_type == DSPAAC_HEADER_ADTS && aacparse->output_header_type == DSPAAC_HEADER_NONE) { guint header_size; GstMapInfo map; gst_buffer_map (frame->buffer, &map, GST_MAP_READ); header_size = (map.data[1] & 1) ? 7 : 9; /* optional CRC */ gst_buffer_unmap (frame->buffer, &map); gst_buffer_resize (frame->buffer, header_size, gst_buffer_get_size (frame->buffer) - header_size); } return GST_FLOW_OK; } /** * gst_aac_parse_start: * @parse: #GstBaseParse. * * Implementation of "start" vmethod in #GstBaseParse class. * * Returns: TRUE if startup succeeded. */ static gboolean gst_aac_parse_start (GstBaseParse * parse) { GstAacParse *aacparse; aacparse = GST_AAC_PARSE (parse); GST_DEBUG ("start"); aacparse->frame_samples = 1024; gst_base_parse_set_min_frame_size (GST_BASE_PARSE (aacparse), ADTS_MAX_SIZE); return TRUE; } /** * gst_aac_parse_stop: * @parse: #GstBaseParse. * * Implementation of "stop" vmethod in #GstBaseParse class. * * Returns: TRUE is stopping succeeded. */ static gboolean gst_aac_parse_stop (GstBaseParse * parse) { GST_DEBUG ("stop"); return TRUE; } static GstCaps * gst_aac_parse_sink_getcaps (GstBaseParse * parse, GstCaps * filter) { GstCaps *peercaps, *templ; GstCaps *res; templ = gst_pad_get_pad_template_caps (GST_BASE_PARSE_SINK_PAD (parse)); peercaps = gst_pad_peer_query_caps (GST_BASE_PARSE_SRC_PAD (parse), filter); if (peercaps) { guint i, n; /* Remove the framed field */ peercaps = gst_caps_make_writable (peercaps); n = gst_caps_get_size (peercaps); for (i = 0; i < n; i++) { GstStructure *s = gst_caps_get_structure (peercaps, i); gst_structure_remove_field (s, "framed"); } res = gst_caps_intersect_full (peercaps, templ, GST_CAPS_INTERSECT_FIRST); gst_caps_unref (peercaps); res = gst_caps_make_writable (res); /* Append the template caps because we still want to accept * caps without any fields in the case upstream does not * know anything. */ gst_caps_append (res, templ); } else { res = templ; } if (filter) { GstCaps *intersection; intersection = gst_caps_intersect_full (filter, res, GST_CAPS_INTERSECT_FIRST); gst_caps_unref (res); res = intersection; } return res; }