mirror of
https://gitlab.freedesktop.org/gstreamer/gstreamer.git
synced 2025-01-18 05:16:05 +00:00
5861f366a0
Original commit message from CVS: * gst/audioconvert/gstaudioconvert.c: (find_suitable_channel_layout), (gst_audio_convert_fixate_channels), (gst_audio_convert_fixate_caps): Preserve channel layout when fixating the number of channels in the output caps, or make sure there's a suitable channel position layout set on the caps if required. Fixes #430677.
1049 lines
33 KiB
C
1049 lines
33 KiB
C
/* GStreamer
|
|
* Copyright (C) 2003 Benjamin Otte <in7y118@public.uni-hamburg.de>
|
|
* Copyright (C) 2005 Thomas Vander Stichele <thomas at apestaart dot org>
|
|
* Copyright (C) 2005 Wim Taymans <wim at fluendo dot com>
|
|
*
|
|
* gstaudioconvert.c: Convert audio to different audio formats automatically
|
|
*
|
|
* This library is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU Library General Public
|
|
* License as published by the Free Software Foundation; either
|
|
* version 2 of the License, or (at your option) any later version.
|
|
*
|
|
* This library is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
* Library General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Library General Public
|
|
* License along with this library; if not, write to the
|
|
* Free Software Foundation, Inc., 59 Temple Place - Suite 330,
|
|
* Boston, MA 02111-1307, USA.
|
|
*/
|
|
|
|
/**
|
|
* SECTION:element-audioconvert
|
|
*
|
|
* <refsect2>
|
|
* <para>
|
|
* Audioconvert converts raw audio buffers between various possible formats.
|
|
* It supports integer to float conversion, width/depth conversion,
|
|
* signedness and endianness conversion.
|
|
* </para>
|
|
* <para>
|
|
* Some format conversion are not carried out in an optimal way right now.
|
|
* E.g. converting from double to float would cause a loss of precision.
|
|
* </para>
|
|
* <title>Example launch line</title>
|
|
* <para>
|
|
* <programlisting>
|
|
* gst-launch -v -m audiotestsrc ! audioconvert ! audio/x-raw-int,channels=2,width=8,depth=8 ! level ! fakesink silent=TRUE
|
|
* </programlisting>
|
|
* This pipeline converts audio to 8-bit. The level element shows that
|
|
* the output levels still match the one for a sine wave.
|
|
* </para>
|
|
* <para>
|
|
* <programlisting>
|
|
* gst-launch -v -m audiotestsrc ! audioconvert ! vorbisenc ! fakesink silent=TRUE
|
|
* </programlisting>
|
|
* The vorbis encoder takes float audio data instead of the integer data
|
|
* generated by audiotestsrc.
|
|
* </para>
|
|
* </refsect2>
|
|
*
|
|
* Last reviewed on 2006-03-02 (0.10.4)
|
|
*/
|
|
|
|
/*
|
|
* design decisions:
|
|
* - audioconvert converts buffers in a set of supported caps. If it supports
|
|
* a caps, it supports conversion from these caps to any other caps it
|
|
* supports. (example: if it does A=>B and A=>C, it also does B=>C)
|
|
* - audioconvert does not save state between buffers. Every incoming buffer is
|
|
* converted and the converted buffer is pushed out.
|
|
* conclusion:
|
|
* audioconvert is not supposed to be a one-element-does-anything solution for
|
|
* audio conversions.
|
|
*/
|
|
|
|
#ifdef HAVE_CONFIG_H
|
|
#include "config.h"
|
|
#endif
|
|
|
|
#include <string.h>
|
|
|
|
#include "gstaudioconvert.h"
|
|
#include "gstchannelmix.h"
|
|
#include "gstaudioquantize.h"
|
|
#include "plugin.h"
|
|
|
|
GST_DEBUG_CATEGORY (audio_convert_debug);
|
|
|
|
/*** DEFINITIONS **************************************************************/
|
|
|
|
static const GstElementDetails audio_convert_details =
|
|
GST_ELEMENT_DETAILS ("Audio converter",
|
|
"Filter/Converter/Audio",
|
|
"Convert audio to different formats",
|
|
"Benjamin Otte <in7y118@public.uni-hamburg.de>");
|
|
|
|
/* type functions */
|
|
static void gst_audio_convert_dispose (GObject * obj);
|
|
|
|
/* gstreamer functions */
|
|
static gboolean gst_audio_convert_get_unit_size (GstBaseTransform * base,
|
|
GstCaps * caps, guint * size);
|
|
static GstCaps *gst_audio_convert_transform_caps (GstBaseTransform * base,
|
|
GstPadDirection direction, GstCaps * caps);
|
|
static void gst_audio_convert_fixate_caps (GstBaseTransform * base,
|
|
GstPadDirection direction, GstCaps * caps, GstCaps * othercaps);
|
|
static gboolean gst_audio_convert_set_caps (GstBaseTransform * base,
|
|
GstCaps * incaps, GstCaps * outcaps);
|
|
static GstFlowReturn gst_audio_convert_transform (GstBaseTransform * base,
|
|
GstBuffer * inbuf, GstBuffer * outbuf);
|
|
static GstFlowReturn gst_audio_convert_transform_ip (GstBaseTransform * base,
|
|
GstBuffer * buf);
|
|
static void gst_audio_convert_set_property (GObject * object, guint prop_id,
|
|
const GValue * value, GParamSpec * pspec);
|
|
static void gst_audio_convert_get_property (GObject * object, guint prop_id,
|
|
GValue * value, GParamSpec * pspec);
|
|
|
|
|
|
/* AudioConvert signals and args */
|
|
enum
|
|
{
|
|
/* FILL ME */
|
|
LAST_SIGNAL
|
|
};
|
|
|
|
enum
|
|
{
|
|
ARG_0,
|
|
ARG_DITHERING,
|
|
ARG_NOISE_SHAPING,
|
|
};
|
|
|
|
#define DEBUG_INIT(bla) \
|
|
GST_DEBUG_CATEGORY_INIT (audio_convert_debug, "audioconvert", 0, "audio conversion element");
|
|
|
|
GST_BOILERPLATE_FULL (GstAudioConvert, gst_audio_convert, GstBaseTransform,
|
|
GST_TYPE_BASE_TRANSFORM, DEBUG_INIT);
|
|
|
|
/*** GSTREAMER PROTOTYPES *****************************************************/
|
|
|
|
#define STATIC_CAPS \
|
|
GST_STATIC_CAPS ( \
|
|
"audio/x-raw-float, " \
|
|
"rate = (int) [ 1, MAX ], " \
|
|
"channels = (int) [ 1, 8 ], " \
|
|
"endianness = (int) { LITTLE_ENDIAN, BIG_ENDIAN }, " \
|
|
"width = (int) 64;" \
|
|
"audio/x-raw-float, " \
|
|
"rate = (int) [ 1, MAX ], " \
|
|
"channels = (int) [ 1, 8 ], " \
|
|
"endianness = (int) { LITTLE_ENDIAN, BIG_ENDIAN }, " \
|
|
"width = (int) 32;" \
|
|
"audio/x-raw-int, " \
|
|
"rate = (int) [ 1, MAX ], " \
|
|
"channels = (int) [ 1, 8 ], " \
|
|
"endianness = (int) { LITTLE_ENDIAN, BIG_ENDIAN }, " \
|
|
"width = (int) 32, " \
|
|
"depth = (int) [ 1, 32 ], " \
|
|
"signed = (boolean) { true, false }; " \
|
|
"audio/x-raw-int, " \
|
|
"rate = (int) [ 1, MAX ], " \
|
|
"channels = (int) [ 1, 8 ], " \
|
|
"endianness = (int) { LITTLE_ENDIAN, BIG_ENDIAN }, " \
|
|
"width = (int) 24, " \
|
|
"depth = (int) [ 1, 24 ], " "signed = (boolean) { true, false }; " \
|
|
"audio/x-raw-int, " \
|
|
"rate = (int) [ 1, MAX ], " \
|
|
"channels = (int) [ 1, 8 ], " \
|
|
"endianness = (int) { LITTLE_ENDIAN, BIG_ENDIAN }, " \
|
|
"width = (int) 16, " \
|
|
"depth = (int) [ 1, 16 ], " \
|
|
"signed = (boolean) { true, false }; " \
|
|
"audio/x-raw-int, " \
|
|
"rate = (int) [ 1, MAX ], " \
|
|
"channels = (int) [ 1, 8 ], " \
|
|
"endianness = (int) { LITTLE_ENDIAN, BIG_ENDIAN }, " \
|
|
"width = (int) 8, " \
|
|
"depth = (int) [ 1, 8 ], " \
|
|
"signed = (boolean) { true, false } " \
|
|
)
|
|
|
|
static GstAudioChannelPosition *supported_positions;
|
|
|
|
static GstStaticPadTemplate gst_audio_convert_src_template =
|
|
GST_STATIC_PAD_TEMPLATE ("src",
|
|
GST_PAD_SRC,
|
|
GST_PAD_ALWAYS,
|
|
STATIC_CAPS);
|
|
|
|
static GstStaticPadTemplate gst_audio_convert_sink_template =
|
|
GST_STATIC_PAD_TEMPLATE ("sink",
|
|
GST_PAD_SINK,
|
|
GST_PAD_ALWAYS,
|
|
STATIC_CAPS);
|
|
|
|
#define GST_TYPE_AUDIO_CONVERT_DITHERING (gst_audio_convert_dithering_get_type ())
|
|
static GType
|
|
gst_audio_convert_dithering_get_type (void)
|
|
{
|
|
static GType gtype = 0;
|
|
|
|
if (gtype == 0) {
|
|
static const GEnumValue values[] = {
|
|
{DITHER_NONE, "No dithering",
|
|
"none"},
|
|
{DITHER_RPDF, "Rectangular dithering", "rpdf"},
|
|
{DITHER_TPDF, "Triangular dithering (default)", "tpdf"},
|
|
{DITHER_TPDF_HF, "High frequency triangular dithering", "tpdf-hf"},
|
|
{0, NULL, NULL}
|
|
};
|
|
|
|
gtype = g_enum_register_static ("GstAudioConvertDithering", values);
|
|
}
|
|
return gtype;
|
|
}
|
|
|
|
#define GST_TYPE_AUDIO_CONVERT_NOISE_SHAPING (gst_audio_convert_ns_get_type ())
|
|
static GType
|
|
gst_audio_convert_ns_get_type (void)
|
|
{
|
|
static GType gtype = 0;
|
|
|
|
if (gtype == 0) {
|
|
static const GEnumValue values[] = {
|
|
{NOISE_SHAPING_NONE, "No noise shaping (default)",
|
|
"none"},
|
|
{NOISE_SHAPING_ERROR_FEEDBACK, "Error feedback", "error-feedback"},
|
|
{NOISE_SHAPING_SIMPLE, "Simple 2-pole noise shaping", "simple"},
|
|
{NOISE_SHAPING_MEDIUM, "Medium 5-pole noise shaping", "medium"},
|
|
{NOISE_SHAPING_HIGH, "High 8-pole noise shaping", "high"},
|
|
{0, NULL, NULL}
|
|
};
|
|
|
|
gtype = g_enum_register_static ("GstAudioConvertNoiseShaping", values);
|
|
}
|
|
return gtype;
|
|
}
|
|
|
|
|
|
/*** TYPE FUNCTIONS ***********************************************************/
|
|
|
|
static void
|
|
gst_audio_convert_base_init (gpointer g_class)
|
|
{
|
|
GstElementClass *element_class = GST_ELEMENT_CLASS (g_class);
|
|
|
|
gst_element_class_add_pad_template (element_class,
|
|
gst_static_pad_template_get (&gst_audio_convert_src_template));
|
|
gst_element_class_add_pad_template (element_class,
|
|
gst_static_pad_template_get (&gst_audio_convert_sink_template));
|
|
gst_element_class_set_details (element_class, &audio_convert_details);
|
|
}
|
|
|
|
static void
|
|
gst_audio_convert_class_init (GstAudioConvertClass * klass)
|
|
{
|
|
GObjectClass *gobject_class = G_OBJECT_CLASS (klass);
|
|
GstBaseTransformClass *basetransform_class = GST_BASE_TRANSFORM_CLASS (klass);
|
|
gint i;
|
|
|
|
gobject_class->dispose = gst_audio_convert_dispose;
|
|
gobject_class->set_property = gst_audio_convert_set_property;
|
|
gobject_class->get_property = gst_audio_convert_get_property;
|
|
|
|
supported_positions = g_new0 (GstAudioChannelPosition,
|
|
GST_AUDIO_CHANNEL_POSITION_NUM);
|
|
for (i = 0; i < GST_AUDIO_CHANNEL_POSITION_NUM; i++)
|
|
supported_positions[i] = i;
|
|
|
|
g_object_class_install_property (gobject_class, ARG_DITHERING,
|
|
g_param_spec_enum ("dithering", "Dithering",
|
|
"Selects between different dithering methods.",
|
|
GST_TYPE_AUDIO_CONVERT_DITHERING, DITHER_TPDF, G_PARAM_READWRITE));
|
|
|
|
g_object_class_install_property (gobject_class, ARG_NOISE_SHAPING,
|
|
g_param_spec_enum ("noise-shaping", "Noise shaping",
|
|
"Selects between different noise shaping methods.",
|
|
GST_TYPE_AUDIO_CONVERT_NOISE_SHAPING, NOISE_SHAPING_NONE,
|
|
G_PARAM_READWRITE));
|
|
|
|
basetransform_class->get_unit_size =
|
|
GST_DEBUG_FUNCPTR (gst_audio_convert_get_unit_size);
|
|
basetransform_class->transform_caps =
|
|
GST_DEBUG_FUNCPTR (gst_audio_convert_transform_caps);
|
|
basetransform_class->fixate_caps =
|
|
GST_DEBUG_FUNCPTR (gst_audio_convert_fixate_caps);
|
|
basetransform_class->set_caps =
|
|
GST_DEBUG_FUNCPTR (gst_audio_convert_set_caps);
|
|
basetransform_class->transform_ip =
|
|
GST_DEBUG_FUNCPTR (gst_audio_convert_transform_ip);
|
|
basetransform_class->transform =
|
|
GST_DEBUG_FUNCPTR (gst_audio_convert_transform);
|
|
|
|
basetransform_class->passthrough_on_same_caps = TRUE;
|
|
}
|
|
|
|
static void
|
|
gst_audio_convert_init (GstAudioConvert * this, GstAudioConvertClass * g_class)
|
|
{
|
|
this->dither = DITHER_TPDF;
|
|
this->ns = NOISE_SHAPING_NONE;
|
|
memset (&this->ctx, 0, sizeof (AudioConvertCtx));
|
|
}
|
|
|
|
static void
|
|
gst_audio_convert_dispose (GObject * obj)
|
|
{
|
|
GstAudioConvert *this = GST_AUDIO_CONVERT (obj);
|
|
|
|
audio_convert_clean_context (&this->ctx);
|
|
|
|
G_OBJECT_CLASS (parent_class)->dispose (obj);
|
|
}
|
|
|
|
/*** GSTREAMER FUNCTIONS ******************************************************/
|
|
|
|
/* convert the given GstCaps to our format */
|
|
static gboolean
|
|
gst_audio_convert_parse_caps (const GstCaps * caps, AudioConvertFmt * fmt)
|
|
{
|
|
GstStructure *structure = gst_caps_get_structure (caps, 0);
|
|
|
|
GST_DEBUG ("parse caps %p and %" GST_PTR_FORMAT, caps, caps);
|
|
|
|
g_return_val_if_fail (gst_caps_is_fixed (caps), FALSE);
|
|
g_return_val_if_fail (fmt != NULL, FALSE);
|
|
|
|
/* cleanup old */
|
|
audio_convert_clean_fmt (fmt);
|
|
|
|
fmt->endianness = G_BYTE_ORDER;
|
|
fmt->is_int =
|
|
(strcmp (gst_structure_get_name (structure), "audio/x-raw-int") == 0);
|
|
|
|
/* parse common fields */
|
|
if (!gst_structure_get_int (structure, "channels", &fmt->channels))
|
|
goto no_values;
|
|
if (!(fmt->pos = gst_audio_get_channel_positions (structure)))
|
|
goto no_values;
|
|
if (!gst_structure_get_int (structure, "width", &fmt->width))
|
|
goto no_values;
|
|
if (!gst_structure_get_int (structure, "rate", &fmt->rate))
|
|
goto no_values;
|
|
/* width != 8 needs an endianness field */
|
|
if (fmt->width != 8) {
|
|
if (!gst_structure_get_int (structure, "endianness", &fmt->endianness))
|
|
goto no_values;
|
|
}
|
|
|
|
if (fmt->is_int) {
|
|
/* int specific fields */
|
|
if (!gst_structure_get_boolean (structure, "signed", &fmt->sign))
|
|
goto no_values;
|
|
if (!gst_structure_get_int (structure, "depth", &fmt->depth))
|
|
goto no_values;
|
|
|
|
/* depth cannot be bigger than the width */
|
|
if (fmt->depth > fmt->width)
|
|
goto not_allowed;
|
|
}
|
|
|
|
fmt->unit_size = (fmt->width * fmt->channels) / 8;
|
|
|
|
return TRUE;
|
|
|
|
/* ERRORS */
|
|
no_values:
|
|
{
|
|
GST_DEBUG ("could not get some values from structure");
|
|
audio_convert_clean_fmt (fmt);
|
|
return FALSE;
|
|
}
|
|
not_allowed:
|
|
{
|
|
GST_DEBUG ("width > depth, not allowed - make us advertise correct fmt");
|
|
audio_convert_clean_fmt (fmt);
|
|
return FALSE;
|
|
}
|
|
}
|
|
|
|
/* BaseTransform vmethods */
|
|
static gboolean
|
|
gst_audio_convert_get_unit_size (GstBaseTransform * base, GstCaps * caps,
|
|
guint * size)
|
|
{
|
|
AudioConvertFmt fmt = { 0 };
|
|
|
|
g_assert (size);
|
|
|
|
if (!gst_audio_convert_parse_caps (caps, &fmt))
|
|
goto parse_error;
|
|
|
|
GST_INFO_OBJECT (base, "unit_size = %u", fmt.unit_size);
|
|
*size = fmt.unit_size;
|
|
|
|
audio_convert_clean_fmt (&fmt);
|
|
|
|
return TRUE;
|
|
|
|
parse_error:
|
|
{
|
|
GST_INFO_OBJECT (base, "failed to parse caps to get unit_size");
|
|
return FALSE;
|
|
}
|
|
}
|
|
|
|
/* Set widths (a list); multiples of 8 between min and max */
|
|
static void
|
|
set_structure_widths (GstStructure * s, int min, int max)
|
|
{
|
|
GValue list = { 0 };
|
|
GValue val = { 0 };
|
|
int width;
|
|
|
|
if (min == max) {
|
|
gst_structure_set (s, "width", G_TYPE_INT, min, NULL);
|
|
return;
|
|
}
|
|
|
|
g_value_init (&list, GST_TYPE_LIST);
|
|
g_value_init (&val, G_TYPE_INT);
|
|
for (width = min; width <= max; width += 8) {
|
|
g_value_set_int (&val, width);
|
|
gst_value_list_append_value (&list, &val);
|
|
}
|
|
gst_structure_set_value (s, "width", &list);
|
|
g_value_unset (&val);
|
|
g_value_unset (&list);
|
|
}
|
|
|
|
/* Set widths of 32 bits and 64 bits (as list) */
|
|
static void
|
|
set_structure_widths_32_and_64 (GstStructure * s)
|
|
{
|
|
GValue list = { 0 };
|
|
GValue val = { 0 };
|
|
|
|
g_value_init (&list, GST_TYPE_LIST);
|
|
g_value_init (&val, G_TYPE_INT);
|
|
g_value_set_int (&val, 32);
|
|
gst_value_list_append_value (&list, &val);
|
|
g_value_set_int (&val, 64);
|
|
gst_value_list_append_value (&list, &val);
|
|
gst_structure_set_value (s, "width", &list);
|
|
g_value_unset (&val);
|
|
g_value_unset (&list);
|
|
}
|
|
|
|
/* Modify the structure so that things that must always have a single
|
|
* value (for float), or can always be losslessly converted (for int), have
|
|
* appropriate values.
|
|
*/
|
|
static GstStructure *
|
|
make_lossless_changes (GstStructure * s, gboolean isfloat)
|
|
{
|
|
GValue list = { 0 };
|
|
GValue val = { 0 };
|
|
int i;
|
|
const gint endian[] = { G_LITTLE_ENDIAN, G_BIG_ENDIAN };
|
|
const gboolean booleans[] = { TRUE, FALSE };
|
|
|
|
g_value_init (&list, GST_TYPE_LIST);
|
|
g_value_init (&val, G_TYPE_INT);
|
|
for (i = 0; i < 2; i++) {
|
|
g_value_set_int (&val, endian[i]);
|
|
gst_value_list_append_value (&list, &val);
|
|
}
|
|
gst_structure_set_value (s, "endianness", &list);
|
|
g_value_unset (&val);
|
|
g_value_unset (&list);
|
|
|
|
if (isfloat) {
|
|
/* float doesn't have a depth or signedness field and only supports
|
|
* widths of 32 and 64 bits */
|
|
gst_structure_remove_field (s, "depth");
|
|
gst_structure_remove_field (s, "signed");
|
|
set_structure_widths_32_and_64 (s);
|
|
} else {
|
|
/* int supports signed and unsigned. GValues are a pain */
|
|
g_value_init (&list, GST_TYPE_LIST);
|
|
g_value_init (&val, G_TYPE_BOOLEAN);
|
|
for (i = 0; i < 2; i++) {
|
|
g_value_set_boolean (&val, booleans[i]);
|
|
gst_value_list_append_value (&list, &val);
|
|
}
|
|
gst_structure_set_value (s, "signed", &list);
|
|
g_value_unset (&val);
|
|
g_value_unset (&list);
|
|
}
|
|
|
|
return s;
|
|
}
|
|
|
|
static void
|
|
strip_width_64 (GstStructure * s)
|
|
{
|
|
const GValue *v = gst_structure_get_value (s, "width");
|
|
GValue widths = { 0 };
|
|
|
|
if (GST_VALUE_HOLDS_LIST (v)) {
|
|
int i;
|
|
int len = gst_value_list_get_size (v);
|
|
|
|
g_value_init (&widths, GST_TYPE_LIST);
|
|
|
|
for (i = 0; i < len; i++) {
|
|
const GValue *width = gst_value_list_get_value (v, i);
|
|
|
|
if (g_value_get_int (width) != 64)
|
|
gst_value_list_append_value (&widths, width);
|
|
}
|
|
gst_structure_set_value (s, "width", &widths);
|
|
g_value_unset (&widths);
|
|
}
|
|
}
|
|
|
|
/* Little utility function to create a related structure for float/int */
|
|
static void
|
|
append_with_other_format (GstCaps * caps, GstStructure * s, gboolean isfloat)
|
|
{
|
|
GstStructure *s2;
|
|
|
|
if (isfloat) {
|
|
s2 = gst_structure_copy (s);
|
|
gst_structure_set_name (s2, "audio/x-raw-int");
|
|
s = make_lossless_changes (s2, FALSE);
|
|
/* If 64 bit float was allowed; remove width 64: we don't support it for
|
|
* integer*/
|
|
strip_width_64 (s);
|
|
gst_caps_append_structure (caps, s2);
|
|
} else {
|
|
s2 = gst_structure_copy (s);
|
|
gst_structure_set_name (s2, "audio/x-raw-float");
|
|
s = make_lossless_changes (s2, TRUE);
|
|
gst_caps_append_structure (caps, s2);
|
|
}
|
|
}
|
|
|
|
/* Audioconvert can perform all conversions on audio except for resampling.
|
|
* However, there are some conversions we _prefer_ not to do. For example, it's
|
|
* better to convert format (float<->int, endianness, etc) than the number of
|
|
* channels, as the latter conversion is not lossless.
|
|
*
|
|
* So, we return, in order (assuming input caps have only one structure;
|
|
* which is enforced by basetransform):
|
|
* - input caps with a different format (lossless conversions).
|
|
* - input caps with a different format (slightly lossy conversions).
|
|
* - input caps with a different number of channels (very lossy!)
|
|
*/
|
|
static GstCaps *
|
|
gst_audio_convert_transform_caps (GstBaseTransform * base,
|
|
GstPadDirection direction, GstCaps * caps)
|
|
{
|
|
GstCaps *ret;
|
|
GstStructure *s, *structure;
|
|
gboolean isfloat;
|
|
gint width, depth, channels;
|
|
const gchar *fields_used[] = {
|
|
"width", "depth", "rate", "channels", "endianness", "signed"
|
|
};
|
|
const gchar *structure_name;
|
|
int i;
|
|
|
|
g_return_val_if_fail (GST_CAPS_IS_SIMPLE (caps), NULL);
|
|
|
|
structure = gst_caps_get_structure (caps, 0);
|
|
structure_name = gst_structure_get_name (structure);
|
|
|
|
isfloat = strcmp (structure_name, "audio/x-raw-float") == 0;
|
|
|
|
/* We operate on a version of the original structure with any additional
|
|
* fields absent */
|
|
s = gst_structure_empty_new (structure_name);
|
|
for (i = 0; i < sizeof (fields_used) / sizeof (*fields_used); i++) {
|
|
if (gst_structure_has_field (structure, fields_used[i]))
|
|
gst_structure_set_value (s, fields_used[i],
|
|
gst_structure_get_value (structure, fields_used[i]));
|
|
}
|
|
|
|
if (!isfloat) {
|
|
/* Commonly, depth is left out: set it equal to width if we have a fixed
|
|
* width, if so */
|
|
if (!gst_structure_has_field (s, "depth") &&
|
|
gst_structure_get_int (s, "width", &width))
|
|
gst_structure_set (s, "depth", G_TYPE_INT, width, NULL);
|
|
}
|
|
|
|
ret = gst_caps_new_empty ();
|
|
|
|
/* All lossless conversions */
|
|
s = make_lossless_changes (s, isfloat);
|
|
gst_caps_append_structure (ret, s);
|
|
|
|
/* Same, plus a float<->int conversion */
|
|
append_with_other_format (ret, s, isfloat);
|
|
GST_DEBUG_OBJECT (base, " step1: (%d) %" GST_PTR_FORMAT,
|
|
gst_caps_get_size (ret), ret);
|
|
|
|
/* We don't mind increasing width/depth/channels, but reducing them is
|
|
* Very Bad. Only available if width, depth, channels are already fixed. */
|
|
s = gst_structure_copy (s);
|
|
if (!isfloat) {
|
|
if (gst_structure_get_int (structure, "width", &width))
|
|
set_structure_widths (s, width, 32);
|
|
if (gst_structure_get_int (structure, "depth", &depth)) {
|
|
if (depth == 32)
|
|
gst_structure_set (s, "depth", G_TYPE_INT, 32, NULL);
|
|
else
|
|
gst_structure_set (s, "depth", GST_TYPE_INT_RANGE, depth, 32, NULL);
|
|
}
|
|
}
|
|
|
|
if (gst_structure_get_int (structure, "channels", &channels)) {
|
|
if (channels == 8)
|
|
gst_structure_set (s, "channels", G_TYPE_INT, 8, NULL);
|
|
else
|
|
gst_structure_set (s, "channels", GST_TYPE_INT_RANGE, channels, 8, NULL);
|
|
}
|
|
gst_caps_append_structure (ret, s);
|
|
|
|
/* Same, plus a float<->int conversion */
|
|
append_with_other_format (ret, s, isfloat);
|
|
|
|
/* We'll reduce depth if we must. We reduce as low as 16 bits (for integer);
|
|
* reducing to less than this is even worse than dropping channels. We only
|
|
* do this if we haven't already done the equivalent above. */
|
|
if (!gst_structure_get_int (structure, "width", &width) || width > 16) {
|
|
if (isfloat) {
|
|
GstStructure *s2 = gst_structure_copy (s);
|
|
|
|
set_structure_widths_32_and_64 (s2);
|
|
append_with_other_format (ret, s2, TRUE);
|
|
gst_structure_free (s2);
|
|
} else {
|
|
s = gst_structure_copy (s);
|
|
set_structure_widths (s, 16, 32);
|
|
gst_structure_set (s, "depth", GST_TYPE_INT_RANGE, 16, 32, NULL);
|
|
gst_caps_append_structure (ret, s);
|
|
}
|
|
}
|
|
|
|
/* Channel conversions to fewer channels is only done if needed - generally
|
|
* it's very bad to drop channels entirely.
|
|
*/
|
|
s = gst_structure_copy (s);
|
|
gst_structure_set (s, "channels", GST_TYPE_INT_RANGE, 1, 8, NULL);
|
|
gst_caps_append_structure (ret, s);
|
|
|
|
/* Same, plus a float<->int conversion */
|
|
append_with_other_format (ret, s, isfloat);
|
|
|
|
/* And, finally, for integer only, we allow conversion to any width/depth we
|
|
* support: this should be equivalent to our (non-float) template caps. (the
|
|
* floating point case should be being handled just above) */
|
|
s = gst_structure_copy (s);
|
|
set_structure_widths (s, 8, 32);
|
|
gst_structure_set (s, "depth", GST_TYPE_INT_RANGE, 1, 32, NULL);
|
|
|
|
if (isfloat) {
|
|
append_with_other_format (ret, s, TRUE);
|
|
gst_structure_free (s);
|
|
} else
|
|
gst_caps_append_structure (ret, s);
|
|
|
|
GST_DEBUG_OBJECT (base, "Caps transformed to %" GST_PTR_FORMAT, ret);
|
|
|
|
return ret;
|
|
}
|
|
|
|
static const GstAudioChannelPosition default_positions[8][8] = {
|
|
/* 1 channel */
|
|
{
|
|
GST_AUDIO_CHANNEL_POSITION_FRONT_MONO,
|
|
},
|
|
/* 2 channels */
|
|
{
|
|
GST_AUDIO_CHANNEL_POSITION_FRONT_LEFT,
|
|
GST_AUDIO_CHANNEL_POSITION_FRONT_RIGHT,
|
|
},
|
|
/* 3 channels (2.1) */
|
|
{
|
|
GST_AUDIO_CHANNEL_POSITION_FRONT_LEFT,
|
|
GST_AUDIO_CHANNEL_POSITION_FRONT_RIGHT,
|
|
GST_AUDIO_CHANNEL_POSITION_LFE, /* or FRONT_CENTER for 3.0? */
|
|
},
|
|
/* 4 channels (4.0 or 3.1?) */
|
|
{
|
|
GST_AUDIO_CHANNEL_POSITION_FRONT_LEFT,
|
|
GST_AUDIO_CHANNEL_POSITION_FRONT_RIGHT,
|
|
GST_AUDIO_CHANNEL_POSITION_REAR_LEFT,
|
|
GST_AUDIO_CHANNEL_POSITION_REAR_RIGHT,
|
|
},
|
|
/* 5 channels */
|
|
{
|
|
GST_AUDIO_CHANNEL_POSITION_FRONT_LEFT,
|
|
GST_AUDIO_CHANNEL_POSITION_FRONT_RIGHT,
|
|
GST_AUDIO_CHANNEL_POSITION_REAR_LEFT,
|
|
GST_AUDIO_CHANNEL_POSITION_REAR_RIGHT,
|
|
GST_AUDIO_CHANNEL_POSITION_FRONT_CENTER,
|
|
},
|
|
/* 6 channels */
|
|
{
|
|
GST_AUDIO_CHANNEL_POSITION_FRONT_LEFT,
|
|
GST_AUDIO_CHANNEL_POSITION_FRONT_RIGHT,
|
|
GST_AUDIO_CHANNEL_POSITION_REAR_LEFT,
|
|
GST_AUDIO_CHANNEL_POSITION_REAR_RIGHT,
|
|
GST_AUDIO_CHANNEL_POSITION_FRONT_CENTER,
|
|
GST_AUDIO_CHANNEL_POSITION_LFE,
|
|
},
|
|
/* 7 channels */
|
|
{
|
|
GST_AUDIO_CHANNEL_POSITION_FRONT_LEFT,
|
|
GST_AUDIO_CHANNEL_POSITION_FRONT_RIGHT,
|
|
GST_AUDIO_CHANNEL_POSITION_REAR_LEFT,
|
|
GST_AUDIO_CHANNEL_POSITION_REAR_RIGHT,
|
|
GST_AUDIO_CHANNEL_POSITION_FRONT_CENTER,
|
|
GST_AUDIO_CHANNEL_POSITION_LFE,
|
|
GST_AUDIO_CHANNEL_POSITION_REAR_CENTER,
|
|
},
|
|
/* 8 channels */
|
|
{
|
|
GST_AUDIO_CHANNEL_POSITION_FRONT_LEFT,
|
|
GST_AUDIO_CHANNEL_POSITION_FRONT_RIGHT,
|
|
GST_AUDIO_CHANNEL_POSITION_REAR_LEFT,
|
|
GST_AUDIO_CHANNEL_POSITION_REAR_RIGHT,
|
|
GST_AUDIO_CHANNEL_POSITION_FRONT_CENTER,
|
|
GST_AUDIO_CHANNEL_POSITION_LFE,
|
|
GST_AUDIO_CHANNEL_POSITION_SIDE_LEFT,
|
|
GST_AUDIO_CHANNEL_POSITION_SIDE_RIGHT,
|
|
}
|
|
};
|
|
|
|
const GValue *
|
|
find_suitable_channel_layout (const GValue * val, guint chans)
|
|
{
|
|
/* if output layout is fixed already and looks sane, we're done */
|
|
if (GST_VALUE_HOLDS_ARRAY (val) && gst_value_array_get_size (val) == chans)
|
|
return val;
|
|
|
|
/* if it's a list, go through it recursively and return the first
|
|
* sane-enough looking value we find */
|
|
if (GST_VALUE_HOLDS_LIST (val)) {
|
|
gint i;
|
|
|
|
for (i = 0; i < gst_value_list_get_size (val); ++i) {
|
|
const GValue *v, *ret;
|
|
|
|
v = gst_value_list_get_value (val, i);
|
|
if ((ret = find_suitable_channel_layout (v, chans)))
|
|
return ret;
|
|
}
|
|
}
|
|
|
|
return NULL;
|
|
}
|
|
|
|
static void
|
|
gst_audio_convert_fixate_channels (GstBaseTransform * base, GstStructure * ins,
|
|
GstStructure * outs)
|
|
{
|
|
const GValue *out_layout;
|
|
gint in_chans, out_chans;
|
|
|
|
if (!gst_structure_get_int (ins, "channels", &in_chans))
|
|
return; /* this shouldn't really happen, should it? */
|
|
|
|
if (!gst_structure_has_field (outs, "channels")) {
|
|
/* we could try to get the implied number of channels from the layout,
|
|
* but that seems overdoing it for a somewhat exotic corner case */
|
|
gst_structure_remove_field (outs, "channel-positions");
|
|
return;
|
|
}
|
|
|
|
/* ok, let's fixate the channels if they are not fixated yet */
|
|
gst_structure_fixate_field_nearest_int (outs, "channels", in_chans);
|
|
|
|
if (!gst_structure_get_int (outs, "channels", &out_chans)) {
|
|
/* shouldn't really happen ... */
|
|
gst_structure_remove_field (outs, "channel-positions");
|
|
return;
|
|
}
|
|
|
|
/* check if the output has a channel layout (or a list of layouts) */
|
|
out_layout = gst_structure_get_value (outs, "channel-positions");
|
|
|
|
if (out_layout == NULL) {
|
|
if (out_chans <= 2)
|
|
return; /* nothing to do, default layout will be assumed */
|
|
GST_WARNING_OBJECT (base, "downstream caps contain no channel layout");
|
|
}
|
|
|
|
if (in_chans == out_chans) {
|
|
const GValue *in_layout;
|
|
GValue res = { 0, };
|
|
|
|
in_layout = gst_structure_get_value (ins, "channel-positions");
|
|
g_return_if_fail (in_layout != NULL);
|
|
|
|
/* same number of channels and no output layout: just use input layout */
|
|
if (out_layout == NULL) {
|
|
gst_structure_set_value (outs, "channel-positions", in_layout);
|
|
return;
|
|
}
|
|
|
|
/* if output layout is fixed already and looks sane, we're done */
|
|
if (GST_VALUE_HOLDS_ARRAY (out_layout) &&
|
|
gst_value_array_get_size (out_layout) == out_chans) {
|
|
return;
|
|
}
|
|
|
|
/* if the output layout is not fixed, check if the output layout contains
|
|
* the input layout */
|
|
if (gst_value_intersect (&res, in_layout, out_layout)) {
|
|
gst_structure_set_value (outs, "channel-positions", in_layout);
|
|
g_value_unset (&res);
|
|
return;
|
|
}
|
|
|
|
/* output layout is not fixed and does not contain the input layout, so
|
|
* just pick the first layout in the list (it should be a list ...) */
|
|
if ((out_layout = find_suitable_channel_layout (out_layout, out_chans))) {
|
|
gst_structure_set_value (outs, "channel-positions", out_layout);
|
|
return;
|
|
}
|
|
|
|
/* ... else fall back to default layout (NB: out_layout is NULL here) */
|
|
GST_WARNING_OBJECT (base, "unexpected output channel layout");
|
|
}
|
|
|
|
/* number of input channels != number of output channels:
|
|
* if this value contains a list of channel layouts (or even worse: a list
|
|
* with another list), just pick the first value and repeat until we find a
|
|
* channel position array or something else that's not a list; we assume
|
|
* the input if half-way sane and don't try to fall back on other list items
|
|
* if the first one is something unexpected or non-channel-pos-array-y */
|
|
if (out_layout != NULL && GST_VALUE_HOLDS_LIST (out_layout))
|
|
out_layout = find_suitable_channel_layout (out_layout, out_chans);
|
|
|
|
if (out_layout != NULL) {
|
|
if (GST_VALUE_HOLDS_ARRAY (out_layout) &&
|
|
gst_value_array_get_size (out_layout) == out_chans) {
|
|
/* looks sane enough, let's use it */
|
|
gst_structure_set_value (outs, "channel-positions", out_layout);
|
|
return;
|
|
}
|
|
|
|
/* what now?! Just ignore what we're given and use default positions */
|
|
GST_WARNING_OBJECT (base, "invalid or unexpected channel-positions");
|
|
}
|
|
|
|
/* missing or invalid output layout and we can't use the input layout for
|
|
* one reason or another, so just pick a default layout (we could be smarter
|
|
* and try to add/remove channels from the input layout, or pick a default
|
|
* layout based on LFE-presence in input layout, but let's save that for
|
|
* another day) */
|
|
if (out_chans > 0 && out_chans < G_N_ELEMENTS (default_positions[0])) {
|
|
GST_DEBUG_OBJECT (base, "using default channel layout as fallback");
|
|
gst_audio_set_channel_positions (outs, default_positions[out_chans - 1]);
|
|
}
|
|
}
|
|
|
|
/* try to keep as many of the structure members the same by fixating the
|
|
* possible ranges; this way we convert the least amount of things as possible
|
|
*/
|
|
static void
|
|
gst_audio_convert_fixate_caps (GstBaseTransform * base,
|
|
GstPadDirection direction, GstCaps * caps, GstCaps * othercaps)
|
|
{
|
|
GstStructure *ins, *outs;
|
|
gint rate, endianness, depth, width;
|
|
gboolean signedness;
|
|
|
|
g_return_if_fail (gst_caps_is_fixed (caps));
|
|
|
|
GST_DEBUG_OBJECT (base, "trying to fixate othercaps %" GST_PTR_FORMAT
|
|
" based on caps %" GST_PTR_FORMAT, othercaps, caps);
|
|
|
|
ins = gst_caps_get_structure (caps, 0);
|
|
outs = gst_caps_get_structure (othercaps, 0);
|
|
|
|
gst_audio_convert_fixate_channels (base, ins, outs);
|
|
|
|
if (gst_structure_get_int (ins, "rate", &rate)) {
|
|
if (gst_structure_has_field (outs, "rate")) {
|
|
gst_structure_fixate_field_nearest_int (outs, "rate", rate);
|
|
}
|
|
}
|
|
if (gst_structure_get_int (ins, "endianness", &endianness)) {
|
|
if (gst_structure_has_field (outs, "endianness")) {
|
|
gst_structure_fixate_field_nearest_int (outs, "endianness", endianness);
|
|
}
|
|
}
|
|
if (gst_structure_get_int (ins, "width", &width)) {
|
|
if (gst_structure_has_field (outs, "width")) {
|
|
gst_structure_fixate_field_nearest_int (outs, "width", width);
|
|
}
|
|
} else {
|
|
/* this is not allowed */
|
|
}
|
|
|
|
if (gst_structure_get_int (ins, "depth", &depth)) {
|
|
if (gst_structure_has_field (outs, "depth")) {
|
|
gst_structure_fixate_field_nearest_int (outs, "depth", depth);
|
|
}
|
|
} else {
|
|
/* set depth as width */
|
|
if (gst_structure_has_field (outs, "depth")) {
|
|
gst_structure_fixate_field_nearest_int (outs, "depth", width);
|
|
}
|
|
}
|
|
|
|
if (gst_structure_get_boolean (ins, "signed", &signedness)) {
|
|
if (gst_structure_has_field (outs, "signed")) {
|
|
gst_structure_fixate_field_boolean (outs, "signed", signedness);
|
|
}
|
|
}
|
|
|
|
GST_DEBUG_OBJECT (base, "fixated othercaps to %" GST_PTR_FORMAT, othercaps);
|
|
}
|
|
|
|
static gboolean
|
|
gst_audio_convert_set_caps (GstBaseTransform * base, GstCaps * incaps,
|
|
GstCaps * outcaps)
|
|
{
|
|
AudioConvertFmt in_ac_caps = { 0 };
|
|
AudioConvertFmt out_ac_caps = { 0 };
|
|
GstAudioConvert *this = GST_AUDIO_CONVERT (base);
|
|
|
|
GST_DEBUG_OBJECT (base, "incaps %" GST_PTR_FORMAT ", outcaps %"
|
|
GST_PTR_FORMAT, incaps, outcaps);
|
|
|
|
if (!gst_audio_convert_parse_caps (incaps, &in_ac_caps))
|
|
return FALSE;
|
|
if (!gst_audio_convert_parse_caps (outcaps, &out_ac_caps))
|
|
return FALSE;
|
|
|
|
if (!audio_convert_prepare_context (&this->ctx, &in_ac_caps, &out_ac_caps,
|
|
this->dither, this->ns))
|
|
goto no_converter;
|
|
|
|
return TRUE;
|
|
|
|
no_converter:
|
|
{
|
|
return FALSE;
|
|
}
|
|
}
|
|
|
|
static GstFlowReturn
|
|
gst_audio_convert_transform_ip (GstBaseTransform * base, GstBuffer * buf)
|
|
{
|
|
/* nothing to do here */
|
|
return GST_FLOW_OK;
|
|
}
|
|
|
|
static GstFlowReturn
|
|
gst_audio_convert_transform (GstBaseTransform * base, GstBuffer * inbuf,
|
|
GstBuffer * outbuf)
|
|
{
|
|
GstAudioConvert *this = GST_AUDIO_CONVERT (base);
|
|
gboolean res;
|
|
gint insize, outsize;
|
|
gint samples;
|
|
gpointer src, dst;
|
|
|
|
/* get amount of samples to convert. */
|
|
samples = GST_BUFFER_SIZE (inbuf) / this->ctx.in.unit_size;
|
|
|
|
/* get in/output sizes, to see if the buffers we got are of correct
|
|
* sizes */
|
|
if (!(res = audio_convert_get_sizes (&this->ctx, samples, &insize, &outsize)))
|
|
goto error;
|
|
|
|
if (insize == 0 || outsize == 0)
|
|
return GST_FLOW_OK;
|
|
|
|
/* check in and outsize */
|
|
if (GST_BUFFER_SIZE (inbuf) < insize)
|
|
goto wrong_size;
|
|
if (GST_BUFFER_SIZE (outbuf) < outsize)
|
|
goto wrong_size;
|
|
|
|
/* get src and dst data */
|
|
src = GST_BUFFER_DATA (inbuf);
|
|
dst = GST_BUFFER_DATA (outbuf);
|
|
|
|
/* and convert the samples */
|
|
if (!(res = audio_convert_convert (&this->ctx, src, dst,
|
|
samples, gst_buffer_is_writable (inbuf))))
|
|
goto convert_error;
|
|
|
|
GST_BUFFER_SIZE (outbuf) = outsize;
|
|
|
|
return GST_FLOW_OK;
|
|
|
|
/* ERRORS */
|
|
error:
|
|
{
|
|
GST_ELEMENT_ERROR (this, STREAM, FORMAT,
|
|
(NULL), ("cannot get input/output sizes for %d samples", samples));
|
|
return GST_FLOW_ERROR;
|
|
}
|
|
wrong_size:
|
|
{
|
|
GST_ELEMENT_ERROR (this, STREAM, FORMAT,
|
|
(NULL),
|
|
("input/output buffers are of wrong size in: %d < %d or out: %d < %d",
|
|
GST_BUFFER_SIZE (inbuf), insize, GST_BUFFER_SIZE (outbuf),
|
|
outsize));
|
|
return GST_FLOW_ERROR;
|
|
}
|
|
convert_error:
|
|
{
|
|
GST_ELEMENT_ERROR (this, STREAM, FORMAT,
|
|
(NULL), ("error while converting"));
|
|
return GST_FLOW_ERROR;
|
|
}
|
|
}
|
|
|
|
static void
|
|
gst_audio_convert_set_property (GObject * object, guint prop_id,
|
|
const GValue * value, GParamSpec * pspec)
|
|
{
|
|
GstAudioConvert *this = GST_AUDIO_CONVERT (object);
|
|
|
|
switch (prop_id) {
|
|
case ARG_DITHERING:
|
|
this->dither = g_value_get_enum (value);
|
|
break;
|
|
case ARG_NOISE_SHAPING:
|
|
this->ns = g_value_get_enum (value);
|
|
break;
|
|
default:
|
|
G_OBJECT_WARN_INVALID_PROPERTY_ID (object, prop_id, pspec);
|
|
break;
|
|
}
|
|
}
|
|
|
|
static void
|
|
gst_audio_convert_get_property (GObject * object, guint prop_id,
|
|
GValue * value, GParamSpec * pspec)
|
|
{
|
|
GstAudioConvert *this = GST_AUDIO_CONVERT (object);
|
|
|
|
switch (prop_id) {
|
|
case ARG_DITHERING:
|
|
g_value_set_enum (value, this->dither);
|
|
break;
|
|
case ARG_NOISE_SHAPING:
|
|
g_value_set_enum (value, this->ns);
|
|
break;
|
|
default:
|
|
G_OBJECT_WARN_INVALID_PROPERTY_ID (object, prop_id, pspec);
|
|
break;
|
|
}
|
|
}
|