mirror of
https://gitlab.freedesktop.org/gstreamer/gstreamer.git
synced 2024-12-01 06:01:04 +00:00
8d223d75d0
Original commit message from CVS: 2005-11-22 Andy Wingo <wingo@pobox.com> * Update for gst_tag_setter API changes.
1158 lines
32 KiB
C
1158 lines
32 KiB
C
/* GStreamer
|
|
* Copyright (C) <1999> Erik Walthinsen <omega@cse.ogi.edu>
|
|
*
|
|
* This library is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU Library General Public
|
|
* License as published by the Free Software Foundation; either
|
|
* version 2 of the License, or (at your option) any later version.
|
|
*
|
|
* This library is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
* Library General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Library General Public
|
|
* License along with this library; if not, write to the
|
|
* Free Software Foundation, Inc., 59 Temple Place - Suite 330,
|
|
* Boston, MA 02111-1307, USA.
|
|
*/
|
|
|
|
|
|
#ifdef HAVE_CONFIG_H
|
|
#include "config.h"
|
|
#endif
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
#include <time.h>
|
|
#include <math.h>
|
|
#include <speex/speex.h>
|
|
#include <speex/speex_stereo.h>
|
|
|
|
#include <gst/gsttagsetter.h>
|
|
#include <gst/tag/tag.h>
|
|
#include "gstspeexenc.h"
|
|
|
|
GST_DEBUG_CATEGORY (speexenc_debug);
|
|
#define GST_CAT_DEFAULT speexenc_debug
|
|
|
|
static GstPadTemplate *gst_speexenc_src_template, *gst_speexenc_sink_template;
|
|
|
|
/* elementfactory information */
|
|
GstElementDetails speexenc_details = {
|
|
"Speex encoder",
|
|
"Codec/Encoder/Audio",
|
|
"Encodes audio in Speex format",
|
|
"Wim Taymans <wim@fluendo.com>",
|
|
};
|
|
|
|
/* GstSpeexEnc signals and args */
|
|
enum
|
|
{
|
|
/* FILL ME */
|
|
LAST_SIGNAL
|
|
};
|
|
|
|
#define DEFAULT_QUALITY 8.0
|
|
#define DEFAULT_BITRATE 0
|
|
#define DEFAULT_VBR FALSE
|
|
#define DEFAULT_ABR 0
|
|
#define DEFAULT_VAD FALSE
|
|
#define DEFAULT_DTX FALSE
|
|
#define DEFAULT_COMPLEXITY 3
|
|
#define DEFAULT_NFRAMES 1
|
|
|
|
enum
|
|
{
|
|
ARG_0,
|
|
ARG_QUALITY,
|
|
ARG_BITRATE,
|
|
ARG_VBR,
|
|
ARG_ABR,
|
|
ARG_VAD,
|
|
ARG_DTX,
|
|
ARG_COMPLEXITY,
|
|
ARG_NFRAMES,
|
|
ARG_LAST_MESSAGE
|
|
};
|
|
|
|
#if 0
|
|
static const GstFormat *
|
|
gst_speexenc_get_formats (GstPad * pad)
|
|
{
|
|
static const GstFormat src_formats[] = {
|
|
GST_FORMAT_BYTES,
|
|
GST_FORMAT_TIME,
|
|
0
|
|
};
|
|
static const GstFormat sink_formats[] = {
|
|
GST_FORMAT_BYTES,
|
|
GST_FORMAT_DEFAULT,
|
|
GST_FORMAT_TIME,
|
|
0
|
|
};
|
|
|
|
return (GST_PAD_IS_SRC (pad) ? src_formats : sink_formats);
|
|
}
|
|
#endif
|
|
|
|
static void gst_speexenc_base_init (gpointer g_class);
|
|
static void gst_speexenc_class_init (GstSpeexEncClass * klass);
|
|
static void gst_speexenc_init (GstSpeexEnc * speexenc);
|
|
|
|
static gboolean gst_speexenc_sinkevent (GstPad * pad, GstEvent * event);
|
|
static GstFlowReturn gst_speexenc_chain (GstPad * pad, GstBuffer * buf);
|
|
static gboolean gst_speexenc_setup (GstSpeexEnc * speexenc);
|
|
|
|
static void gst_speexenc_get_property (GObject * object, guint prop_id,
|
|
GValue * value, GParamSpec * pspec);
|
|
static void gst_speexenc_set_property (GObject * object, guint prop_id,
|
|
const GValue * value, GParamSpec * pspec);
|
|
static GstStateChangeReturn gst_speexenc_change_state (GstElement * element,
|
|
GstStateChange transition);
|
|
|
|
static GstElementClass *parent_class = NULL;
|
|
|
|
/*static guint gst_speexenc_signals[LAST_SIGNAL] = { 0 }; */
|
|
|
|
GType
|
|
gst_speexenc_get_type (void)
|
|
{
|
|
static GType speexenc_type = 0;
|
|
|
|
if (!speexenc_type) {
|
|
static const GTypeInfo speexenc_info = {
|
|
sizeof (GstSpeexEncClass),
|
|
gst_speexenc_base_init,
|
|
NULL,
|
|
(GClassInitFunc) gst_speexenc_class_init,
|
|
NULL,
|
|
NULL,
|
|
sizeof (GstSpeexEnc),
|
|
0,
|
|
(GInstanceInitFunc) gst_speexenc_init,
|
|
};
|
|
static const GInterfaceInfo tag_setter_info = {
|
|
NULL,
|
|
NULL,
|
|
NULL
|
|
};
|
|
|
|
speexenc_type =
|
|
g_type_register_static (GST_TYPE_ELEMENT, "GstSpeexEnc", &speexenc_info,
|
|
0);
|
|
|
|
g_type_add_interface_static (speexenc_type, GST_TYPE_TAG_SETTER,
|
|
&tag_setter_info);
|
|
|
|
GST_DEBUG_CATEGORY_INIT (speexenc_debug, "speexenc", 0, "Speex encoder");
|
|
}
|
|
return speexenc_type;
|
|
}
|
|
|
|
static GstCaps *
|
|
speex_caps_factory (void)
|
|
{
|
|
return gst_caps_new_simple ("audio/x-speex", NULL);
|
|
}
|
|
|
|
static GstCaps *
|
|
raw_caps_factory (void)
|
|
{
|
|
return
|
|
gst_caps_new_simple ("audio/x-raw-int",
|
|
"rate", GST_TYPE_INT_RANGE, 6000, 48000,
|
|
"channels", GST_TYPE_INT_RANGE, 1, 2,
|
|
"endianness", G_TYPE_INT, G_BYTE_ORDER,
|
|
"signed", G_TYPE_BOOLEAN, TRUE,
|
|
"width", G_TYPE_INT, 16, "depth", G_TYPE_INT, 16, NULL);
|
|
}
|
|
|
|
static void
|
|
gst_speexenc_base_init (gpointer g_class)
|
|
{
|
|
GstElementClass *element_class = GST_ELEMENT_CLASS (g_class);
|
|
GstCaps *raw_caps, *speex_caps;
|
|
|
|
raw_caps = raw_caps_factory ();
|
|
speex_caps = speex_caps_factory ();
|
|
|
|
gst_speexenc_sink_template = gst_pad_template_new ("sink", GST_PAD_SINK,
|
|
GST_PAD_ALWAYS, raw_caps);
|
|
gst_speexenc_src_template = gst_pad_template_new ("src", GST_PAD_SRC,
|
|
GST_PAD_ALWAYS, speex_caps);
|
|
gst_element_class_add_pad_template (element_class,
|
|
gst_speexenc_sink_template);
|
|
gst_element_class_add_pad_template (element_class, gst_speexenc_src_template);
|
|
gst_element_class_set_details (element_class, &speexenc_details);
|
|
}
|
|
|
|
static void
|
|
gst_speexenc_class_init (GstSpeexEncClass * klass)
|
|
{
|
|
GObjectClass *gobject_class;
|
|
GstElementClass *gstelement_class;
|
|
|
|
gobject_class = (GObjectClass *) klass;
|
|
gstelement_class = (GstElementClass *) klass;
|
|
|
|
gobject_class->set_property = gst_speexenc_set_property;
|
|
gobject_class->get_property = gst_speexenc_get_property;
|
|
|
|
g_object_class_install_property (G_OBJECT_CLASS (klass), ARG_QUALITY,
|
|
g_param_spec_float ("quality", "Quality", "Encoding quality",
|
|
0.0, 10.0, DEFAULT_QUALITY, G_PARAM_READWRITE));
|
|
g_object_class_install_property (G_OBJECT_CLASS (klass), ARG_BITRATE,
|
|
g_param_spec_int ("bitrate", "Encoding Bit-rate",
|
|
"Specify an encoding bit-rate (in bps). (0 = automatic)",
|
|
0, G_MAXINT, DEFAULT_BITRATE, G_PARAM_READWRITE));
|
|
g_object_class_install_property (G_OBJECT_CLASS (klass), ARG_VBR,
|
|
g_param_spec_boolean ("vbr", "VBR",
|
|
"Enable variable bit-rate", DEFAULT_VBR, G_PARAM_READWRITE));
|
|
g_object_class_install_property (G_OBJECT_CLASS (klass), ARG_ABR,
|
|
g_param_spec_int ("abr", "ABR",
|
|
"Enable average bit-rate (0 = disabled)",
|
|
0, G_MAXINT, DEFAULT_ABR, G_PARAM_READWRITE));
|
|
g_object_class_install_property (G_OBJECT_CLASS (klass), ARG_VAD,
|
|
g_param_spec_boolean ("vad", "VAD",
|
|
"Enable voice activity detection", DEFAULT_VAD, G_PARAM_READWRITE));
|
|
g_object_class_install_property (G_OBJECT_CLASS (klass), ARG_DTX,
|
|
g_param_spec_boolean ("dtx", "DTX",
|
|
"Enable discontinuous transmission", DEFAULT_DTX, G_PARAM_READWRITE));
|
|
g_object_class_install_property (G_OBJECT_CLASS (klass), ARG_COMPLEXITY,
|
|
g_param_spec_int ("complexity", "Complexity",
|
|
"Set encoding complexity",
|
|
0, G_MAXINT, DEFAULT_COMPLEXITY, G_PARAM_READWRITE));
|
|
g_object_class_install_property (G_OBJECT_CLASS (klass), ARG_NFRAMES,
|
|
g_param_spec_int ("nframes", "NFrames",
|
|
"Number of frames per buffer",
|
|
0, G_MAXINT, DEFAULT_NFRAMES, G_PARAM_READWRITE));
|
|
g_object_class_install_property (G_OBJECT_CLASS (klass), ARG_LAST_MESSAGE,
|
|
g_param_spec_string ("last-message", "last-message",
|
|
"The last status message", NULL, G_PARAM_READABLE));
|
|
|
|
parent_class = g_type_class_ref (GST_TYPE_ELEMENT);
|
|
|
|
gstelement_class->change_state = gst_speexenc_change_state;
|
|
}
|
|
|
|
static gboolean
|
|
gst_speexenc_sink_setcaps (GstPad * pad, GstCaps * caps)
|
|
{
|
|
GstSpeexEnc *speexenc;
|
|
GstStructure *structure;
|
|
|
|
speexenc = GST_SPEEXENC (GST_PAD_PARENT (pad));
|
|
speexenc->setup = FALSE;
|
|
|
|
structure = gst_caps_get_structure (caps, 0);
|
|
gst_structure_get_int (structure, "channels", &speexenc->channels);
|
|
gst_structure_get_int (structure, "rate", &speexenc->rate);
|
|
|
|
gst_speexenc_setup (speexenc);
|
|
|
|
if (speexenc->setup)
|
|
return TRUE;
|
|
|
|
return FALSE;
|
|
}
|
|
|
|
static gboolean
|
|
gst_speexenc_convert_src (GstPad * pad, GstFormat src_format, gint64 src_value,
|
|
GstFormat * dest_format, gint64 * dest_value)
|
|
{
|
|
gboolean res = TRUE;
|
|
GstSpeexEnc *speexenc;
|
|
gint64 avg;
|
|
|
|
speexenc = GST_SPEEXENC (GST_PAD_PARENT (pad));
|
|
|
|
if (speexenc->samples_in == 0 ||
|
|
speexenc->bytes_out == 0 || speexenc->rate == 0)
|
|
return FALSE;
|
|
|
|
avg = (speexenc->bytes_out * speexenc->rate) / (speexenc->samples_in);
|
|
|
|
switch (src_format) {
|
|
case GST_FORMAT_BYTES:
|
|
switch (*dest_format) {
|
|
case GST_FORMAT_TIME:
|
|
*dest_value = src_value * GST_SECOND / avg;
|
|
break;
|
|
default:
|
|
res = FALSE;
|
|
}
|
|
break;
|
|
case GST_FORMAT_TIME:
|
|
switch (*dest_format) {
|
|
case GST_FORMAT_BYTES:
|
|
*dest_value = src_value * avg / GST_SECOND;
|
|
break;
|
|
default:
|
|
res = FALSE;
|
|
}
|
|
break;
|
|
default:
|
|
res = FALSE;
|
|
}
|
|
return res;
|
|
}
|
|
|
|
static gboolean
|
|
gst_speexenc_convert_sink (GstPad * pad, GstFormat src_format,
|
|
gint64 src_value, GstFormat * dest_format, gint64 * dest_value)
|
|
{
|
|
gboolean res = TRUE;
|
|
guint scale = 1;
|
|
gint bytes_per_sample;
|
|
GstSpeexEnc *speexenc;
|
|
|
|
speexenc = GST_SPEEXENC (GST_PAD_PARENT (pad));
|
|
|
|
bytes_per_sample = speexenc->channels * 2;
|
|
|
|
switch (src_format) {
|
|
case GST_FORMAT_BYTES:
|
|
switch (*dest_format) {
|
|
case GST_FORMAT_DEFAULT:
|
|
if (bytes_per_sample == 0)
|
|
return FALSE;
|
|
*dest_value = src_value / bytes_per_sample;
|
|
break;
|
|
case GST_FORMAT_TIME:
|
|
{
|
|
gint byterate = bytes_per_sample * speexenc->rate;
|
|
|
|
if (byterate == 0)
|
|
return FALSE;
|
|
*dest_value = src_value * GST_SECOND / byterate;
|
|
break;
|
|
}
|
|
default:
|
|
res = FALSE;
|
|
}
|
|
break;
|
|
case GST_FORMAT_DEFAULT:
|
|
switch (*dest_format) {
|
|
case GST_FORMAT_BYTES:
|
|
*dest_value = src_value * bytes_per_sample;
|
|
break;
|
|
case GST_FORMAT_TIME:
|
|
if (speexenc->rate == 0)
|
|
return FALSE;
|
|
*dest_value = src_value * GST_SECOND / speexenc->rate;
|
|
break;
|
|
default:
|
|
res = FALSE;
|
|
}
|
|
break;
|
|
case GST_FORMAT_TIME:
|
|
switch (*dest_format) {
|
|
case GST_FORMAT_BYTES:
|
|
scale = bytes_per_sample;
|
|
/* fallthrough */
|
|
case GST_FORMAT_DEFAULT:
|
|
*dest_value = src_value * scale * speexenc->rate / GST_SECOND;
|
|
break;
|
|
default:
|
|
res = FALSE;
|
|
}
|
|
break;
|
|
default:
|
|
res = FALSE;
|
|
}
|
|
return res;
|
|
}
|
|
|
|
static const GstQueryType *
|
|
gst_speexenc_get_query_types (GstPad * pad)
|
|
{
|
|
static const GstQueryType gst_speexenc_src_query_types[] = {
|
|
GST_QUERY_POSITION,
|
|
GST_QUERY_DURATION,
|
|
GST_QUERY_CONVERT,
|
|
0
|
|
};
|
|
|
|
return gst_speexenc_src_query_types;
|
|
}
|
|
|
|
static gboolean
|
|
gst_speexenc_src_query (GstPad * pad, GstQuery * query)
|
|
{
|
|
gboolean res = TRUE;
|
|
GstSpeexEnc *speexenc;
|
|
GstPad *peerpad;
|
|
|
|
speexenc = GST_SPEEXENC (gst_pad_get_parent (pad));
|
|
peerpad = gst_pad_get_peer (GST_PAD (speexenc->sinkpad));
|
|
|
|
switch (GST_QUERY_TYPE (query)) {
|
|
case GST_QUERY_POSITION:
|
|
{
|
|
GstFormat fmt, req_fmt;
|
|
gint64 pos, val;
|
|
|
|
gst_query_parse_position (query, &req_fmt, NULL);
|
|
if ((res = gst_pad_query_position (peerpad, &req_fmt, &val))) {
|
|
gst_query_set_position (query, req_fmt, val);
|
|
break;
|
|
}
|
|
|
|
fmt = GST_FORMAT_TIME;
|
|
if (!(res = gst_pad_query_position (peerpad, &fmt, &pos)))
|
|
break;
|
|
|
|
if ((res = gst_pad_query_convert (peerpad, fmt, pos, &req_fmt, &val)))
|
|
gst_query_set_position (query, req_fmt, val);
|
|
|
|
break;
|
|
}
|
|
case GST_QUERY_DURATION:
|
|
{
|
|
GstFormat fmt, req_fmt;
|
|
gint64 dur, val;
|
|
|
|
gst_query_parse_duration (query, &req_fmt, NULL);
|
|
if ((res = gst_pad_query_duration (peerpad, &req_fmt, &val))) {
|
|
gst_query_set_duration (query, req_fmt, val);
|
|
break;
|
|
}
|
|
|
|
fmt = GST_FORMAT_TIME;
|
|
if (!(res = gst_pad_query_duration (peerpad, &fmt, &dur)))
|
|
break;
|
|
|
|
if ((res = gst_pad_query_convert (peerpad, fmt, dur, &req_fmt, &val))) {
|
|
gst_query_set_duration (query, req_fmt, val);
|
|
}
|
|
break;
|
|
}
|
|
case GST_QUERY_CONVERT:
|
|
{
|
|
GstFormat src_fmt, dest_fmt;
|
|
gint64 src_val, dest_val;
|
|
|
|
gst_query_parse_convert (query, &src_fmt, &src_val, &dest_fmt, &dest_val);
|
|
if (!(res = gst_speexenc_convert_src (pad, src_fmt, src_val, &dest_fmt,
|
|
&dest_val)))
|
|
goto error;
|
|
gst_query_set_convert (query, src_fmt, src_val, dest_fmt, dest_val);
|
|
break;
|
|
}
|
|
default:
|
|
res = FALSE;
|
|
break;
|
|
}
|
|
|
|
error:
|
|
gst_object_unref (peerpad);
|
|
gst_object_unref (speexenc);
|
|
return res;
|
|
}
|
|
|
|
static gboolean
|
|
gst_speexenc_sink_query (GstPad * pad, GstQuery * query)
|
|
{
|
|
gboolean res = TRUE;
|
|
GstSpeexEnc *speexenc;
|
|
|
|
speexenc = GST_SPEEXENC (GST_PAD_PARENT (pad));
|
|
|
|
switch (GST_QUERY_TYPE (query)) {
|
|
case GST_QUERY_CONVERT:
|
|
{
|
|
GstFormat src_fmt, dest_fmt;
|
|
gint64 src_val, dest_val;
|
|
|
|
gst_query_parse_convert (query, &src_fmt, &src_val, &dest_fmt, &dest_val);
|
|
if (!(res =
|
|
gst_speexenc_convert_sink (pad, src_fmt, src_val, &dest_fmt,
|
|
&dest_val)))
|
|
goto error;
|
|
gst_query_set_convert (query, src_fmt, src_val, dest_fmt, dest_val);
|
|
break;
|
|
}
|
|
default:
|
|
res = FALSE;
|
|
break;
|
|
}
|
|
|
|
error:
|
|
return res;
|
|
}
|
|
|
|
static void
|
|
gst_speexenc_init (GstSpeexEnc * speexenc)
|
|
{
|
|
speexenc->sinkpad =
|
|
gst_pad_new_from_template (gst_speexenc_sink_template, "sink");
|
|
gst_element_add_pad (GST_ELEMENT (speexenc), speexenc->sinkpad);
|
|
gst_pad_set_event_function (speexenc->sinkpad, gst_speexenc_sinkevent);
|
|
gst_pad_set_chain_function (speexenc->sinkpad, gst_speexenc_chain);
|
|
gst_pad_set_setcaps_function (speexenc->sinkpad, gst_speexenc_sink_setcaps);
|
|
gst_pad_set_query_function (speexenc->sinkpad,
|
|
GST_DEBUG_FUNCPTR (gst_speexenc_sink_query));
|
|
|
|
speexenc->srcpad =
|
|
gst_pad_new_from_template (gst_speexenc_src_template, "src");
|
|
gst_pad_set_query_function (speexenc->srcpad,
|
|
GST_DEBUG_FUNCPTR (gst_speexenc_src_query));
|
|
gst_pad_set_query_type_function (speexenc->srcpad,
|
|
GST_DEBUG_FUNCPTR (gst_speexenc_get_query_types));
|
|
gst_element_add_pad (GST_ELEMENT (speexenc), speexenc->srcpad);
|
|
|
|
speexenc->channels = -1;
|
|
speexenc->rate = -1;
|
|
|
|
speexenc->quality = DEFAULT_QUALITY;
|
|
speexenc->bitrate = DEFAULT_BITRATE;
|
|
speexenc->vbr = DEFAULT_VBR;
|
|
speexenc->abr = DEFAULT_ABR;
|
|
speexenc->vad = DEFAULT_VAD;
|
|
speexenc->dtx = DEFAULT_DTX;
|
|
speexenc->complexity = DEFAULT_COMPLEXITY;
|
|
speexenc->nframes = DEFAULT_NFRAMES;
|
|
|
|
speexenc->setup = FALSE;
|
|
speexenc->header_sent = FALSE;
|
|
|
|
speexenc->adapter = gst_adapter_new ();
|
|
}
|
|
|
|
|
|
/* FIXME: why are we not using the from/to vorbiscomment
|
|
* functions that are in -lgsttagedit-0.9 here? */
|
|
|
|
static gchar *
|
|
gst_speexenc_get_tag_value (const GstTagList * list, const gchar * tag,
|
|
int index)
|
|
{
|
|
GType tag_type;
|
|
gchar *speexvalue = NULL;
|
|
|
|
if (tag == NULL)
|
|
return NULL;
|
|
|
|
tag_type = gst_tag_get_type (tag);
|
|
|
|
/* get tag name right */
|
|
if ((strcmp (tag, GST_TAG_TRACK_NUMBER) == 0)
|
|
|| (strcmp (tag, GST_TAG_ALBUM_VOLUME_NUMBER) == 0)
|
|
|| (strcmp (tag, GST_TAG_TRACK_COUNT) == 0)
|
|
|| (strcmp (tag, GST_TAG_ALBUM_VOLUME_COUNT) == 0)) {
|
|
guint track_no;
|
|
|
|
if (gst_tag_list_get_uint_index (list, tag, index, &track_no)) {
|
|
speexvalue = g_strdup_printf ("%u", track_no);
|
|
} else {
|
|
GST_WARNING ("Failed to extract int tag %d for '%s'", index, tag);
|
|
}
|
|
} else if (tag_type == GST_TYPE_DATE) {
|
|
/* FIXME: how are dates represented in speex files? */
|
|
GDate *date;
|
|
|
|
if (gst_tag_list_get_date_index (list, tag, index, &date)) {
|
|
speexvalue =
|
|
g_strdup_printf ("%04d-%02d-%02d", (gint) g_date_get_year (date),
|
|
(gint) g_date_get_month (date), (gint) g_date_get_day (date));
|
|
g_date_free (date);
|
|
} else {
|
|
GST_WARNING ("Failed to extract date tag %d for '%s'", index, tag);
|
|
}
|
|
} else if (tag_type == G_TYPE_STRING) {
|
|
if (!gst_tag_list_get_string_index (list, tag, index, &speexvalue))
|
|
GST_WARNING ("Failed to extract string tag %d for '%s'", index, tag);
|
|
}
|
|
|
|
return speexvalue;
|
|
}
|
|
|
|
/*
|
|
* Comments will be stored in the Vorbis style.
|
|
* It is describled in the "Structure" section of
|
|
* http://www.xiph.org/ogg/vorbis/doc/v-comment.html
|
|
*
|
|
* The comment header is decoded as follows:
|
|
* 1) [vendor_length] = read an unsigned integer of 32 bits
|
|
* 2) [vendor_string] = read a UTF-8 vector as [vendor_length] octets
|
|
* 3) [user_comment_list_length] = read an unsigned integer of 32 bits
|
|
* 4) iterate [user_comment_list_length] times {
|
|
* 5) [length] = read an unsigned integer of 32 bits
|
|
* 6) this iteration's user comment = read a UTF-8 vector as [length] octets
|
|
* }
|
|
* 7) [framing_bit] = read a single bit as boolean
|
|
* 8) if ( [framing_bit] unset or end of packet ) then ERROR
|
|
* 9) done.
|
|
*
|
|
* If you have troubles, please write to ymnk@jcraft.com.
|
|
*/
|
|
static void
|
|
comment_init (guint8 ** comments, int *length, char *vendor_string)
|
|
{
|
|
int vendor_length = strlen (vendor_string);
|
|
int user_comment_list_length = 0;
|
|
int len = 4 + vendor_length + 4;
|
|
guint8 *p = g_malloc (len);
|
|
|
|
GST_WRITE_UINT32_LE (p, vendor_length);
|
|
memcpy (p + 4, vendor_string, vendor_length);
|
|
GST_WRITE_UINT32_LE (p + 4 + vendor_length, user_comment_list_length);
|
|
*length = len;
|
|
*comments = p;
|
|
}
|
|
static void
|
|
comment_add (guint8 ** comments, int *length, const char *tag, char *val)
|
|
{
|
|
guint8 *p = *comments;
|
|
int vendor_length = GST_READ_UINT32_LE (p);
|
|
int user_comment_list_length = GST_READ_UINT32_LE (p + 4 + vendor_length);
|
|
int tag_len = (tag ? strlen (tag) : 0);
|
|
int val_len = strlen (val);
|
|
int len = (*length) + 4 + tag_len + val_len;
|
|
|
|
p = g_realloc (p, len);
|
|
|
|
GST_WRITE_UINT32_LE (p + *length, tag_len + val_len); /* length of comment */
|
|
if (tag)
|
|
memcpy (p + *length + 4, (guint8 *) tag, tag_len); /* comment */
|
|
memcpy (p + *length + 4 + tag_len, val, val_len); /* comment */
|
|
GST_WRITE_UINT32_LE (p + 4 + vendor_length, user_comment_list_length + 1);
|
|
|
|
*comments = p;
|
|
*length = len;
|
|
}
|
|
|
|
static void
|
|
gst_speexenc_metadata_set1 (const GstTagList * list, const gchar * tag,
|
|
gpointer speexenc)
|
|
{
|
|
const gchar *speextag = NULL;
|
|
gchar *speexvalue = NULL;
|
|
guint i, count;
|
|
GstSpeexEnc *enc = GST_SPEEXENC (speexenc);
|
|
|
|
speextag = gst_tag_to_vorbis_tag (tag);
|
|
if (speextag == NULL) {
|
|
return;
|
|
}
|
|
|
|
count = gst_tag_list_get_tag_size (list, tag);
|
|
for (i = 0; i < count; i++) {
|
|
speexvalue = gst_speexenc_get_tag_value (list, tag, i);
|
|
|
|
if (speexvalue != NULL) {
|
|
comment_add (&enc->comments, &enc->comment_len, speextag, speexvalue);
|
|
}
|
|
}
|
|
}
|
|
|
|
static void
|
|
gst_speexenc_set_metadata (GstSpeexEnc * speexenc)
|
|
{
|
|
GstTagList *copy;
|
|
const GstTagList *user_tags;
|
|
|
|
user_tags = gst_tag_setter_get_tag_list (GST_TAG_SETTER (speexenc));
|
|
if (!(speexenc->tags || user_tags))
|
|
return;
|
|
|
|
comment_init (&speexenc->comments, &speexenc->comment_len,
|
|
"Encoded with GStreamer Speexenc");
|
|
copy =
|
|
gst_tag_list_merge (user_tags, speexenc->tags,
|
|
gst_tag_setter_get_tag_merge_mode (GST_TAG_SETTER (speexenc)));
|
|
gst_tag_list_foreach (copy, gst_speexenc_metadata_set1, speexenc);
|
|
gst_tag_list_free (copy);
|
|
}
|
|
|
|
static gboolean
|
|
gst_speexenc_setup (GstSpeexEnc * speexenc)
|
|
{
|
|
speexenc->setup = FALSE;
|
|
|
|
switch (speexenc->mode) {
|
|
case GST_SPEEXENC_MODE_UWB:
|
|
speexenc->speex_mode = (SpeexMode *) & speex_uwb_mode;
|
|
break;
|
|
case GST_SPEEXENC_MODE_WB:
|
|
speexenc->speex_mode = (SpeexMode *) & speex_wb_mode;
|
|
break;
|
|
case GST_SPEEXENC_MODE_NB:
|
|
speexenc->speex_mode = (SpeexMode *) & speex_nb_mode;
|
|
break;
|
|
case GST_SPEEXENC_MODE_AUTO:
|
|
/* fall through */
|
|
default:
|
|
break;
|
|
}
|
|
|
|
if (speexenc->rate > 25000) {
|
|
if (speexenc->mode == GST_SPEEXENC_MODE_AUTO) {
|
|
speexenc->speex_mode = (SpeexMode *) & speex_uwb_mode;
|
|
} else {
|
|
if (speexenc->speex_mode != &speex_uwb_mode) {
|
|
speexenc->last_message =
|
|
g_strdup_printf
|
|
("Warning: suggest to use ultra wide band mode for this rate");
|
|
g_object_notify (G_OBJECT (speexenc), "last_message");
|
|
}
|
|
}
|
|
} else if (speexenc->rate > 12500) {
|
|
if (speexenc->mode == GST_SPEEXENC_MODE_AUTO) {
|
|
speexenc->speex_mode = (SpeexMode *) & speex_wb_mode;
|
|
} else {
|
|
if (speexenc->speex_mode != &speex_wb_mode) {
|
|
speexenc->last_message =
|
|
g_strdup_printf
|
|
("Warning: suggest to use wide band mode for this rate");
|
|
g_object_notify (G_OBJECT (speexenc), "last_message");
|
|
}
|
|
}
|
|
} else {
|
|
if (speexenc->mode == GST_SPEEXENC_MODE_AUTO) {
|
|
speexenc->speex_mode = (SpeexMode *) & speex_nb_mode;
|
|
} else {
|
|
if (speexenc->speex_mode != &speex_nb_mode) {
|
|
speexenc->last_message =
|
|
g_strdup_printf
|
|
("Warning: suggest to use narrow band mode for this rate");
|
|
g_object_notify (G_OBJECT (speexenc), "last_message");
|
|
}
|
|
}
|
|
}
|
|
|
|
if (speexenc->rate != 8000 && speexenc->rate != 16000
|
|
&& speexenc->rate != 32000) {
|
|
speexenc->last_message =
|
|
g_strdup_printf ("Warning: speex is optimized for 8, 16 and 32 KHz");
|
|
g_object_notify (G_OBJECT (speexenc), "last_message");
|
|
}
|
|
|
|
speex_init_header (&speexenc->header, speexenc->rate, 1,
|
|
speexenc->speex_mode);
|
|
speexenc->header.frames_per_packet = speexenc->nframes;
|
|
speexenc->header.vbr = speexenc->vbr;
|
|
speexenc->header.nb_channels = speexenc->channels;
|
|
|
|
/*Initialize Speex encoder */
|
|
speexenc->state = speex_encoder_init (speexenc->speex_mode);
|
|
|
|
speex_encoder_ctl (speexenc->state, SPEEX_GET_FRAME_SIZE,
|
|
&speexenc->frame_size);
|
|
speex_encoder_ctl (speexenc->state, SPEEX_SET_COMPLEXITY,
|
|
&speexenc->complexity);
|
|
speex_encoder_ctl (speexenc->state, SPEEX_SET_SAMPLING_RATE, &speexenc->rate);
|
|
|
|
if (speexenc->vbr)
|
|
speex_encoder_ctl (speexenc->state, SPEEX_SET_VBR_QUALITY,
|
|
&speexenc->quality);
|
|
else {
|
|
gint tmp = floor (speexenc->quality);
|
|
|
|
speex_encoder_ctl (speexenc->state, SPEEX_SET_QUALITY, &tmp);
|
|
}
|
|
if (speexenc->bitrate) {
|
|
if (speexenc->quality >= 0.0 && speexenc->vbr) {
|
|
speexenc->last_message =
|
|
g_strdup_printf ("Warning: bitrate option is overriding quality");
|
|
g_object_notify (G_OBJECT (speexenc), "last_message");
|
|
}
|
|
speex_encoder_ctl (speexenc->state, SPEEX_SET_BITRATE, &speexenc->bitrate);
|
|
}
|
|
if (speexenc->vbr) {
|
|
gint tmp = 1;
|
|
|
|
speex_encoder_ctl (speexenc->state, SPEEX_SET_VBR, &tmp);
|
|
} else if (speexenc->vad) {
|
|
gint tmp = 1;
|
|
|
|
speex_encoder_ctl (speexenc->state, SPEEX_SET_VAD, &tmp);
|
|
}
|
|
|
|
if (speexenc->dtx) {
|
|
gint tmp = 1;
|
|
|
|
speex_encoder_ctl (speexenc->state, SPEEX_SET_DTX, &tmp);
|
|
}
|
|
|
|
if (speexenc->dtx && !(speexenc->vbr || speexenc->abr || speexenc->vad)) {
|
|
speexenc->last_message =
|
|
g_strdup_printf ("Warning: dtx is useless without vad, vbr or abr");
|
|
g_object_notify (G_OBJECT (speexenc), "last_message");
|
|
} else if ((speexenc->vbr || speexenc->abr) && (speexenc->vad)) {
|
|
speexenc->last_message =
|
|
g_strdup_printf ("Warning: vad is already implied by vbr or abr");
|
|
g_object_notify (G_OBJECT (speexenc), "last_message");
|
|
}
|
|
|
|
if (speexenc->abr) {
|
|
speex_encoder_ctl (speexenc->state, SPEEX_SET_ABR, &speexenc->abr);
|
|
}
|
|
|
|
speex_encoder_ctl (speexenc->state, SPEEX_GET_LOOKAHEAD,
|
|
&speexenc->lookahead);
|
|
|
|
speexenc->setup = TRUE;
|
|
|
|
return TRUE;
|
|
}
|
|
|
|
/* prepare a buffer for transmission */
|
|
static GstBuffer *
|
|
gst_speexenc_buffer_from_data (GstSpeexEnc * speexenc, guchar * data,
|
|
gint data_len, guint64 granulepos)
|
|
{
|
|
GstBuffer *outbuf;
|
|
|
|
outbuf = gst_buffer_new_and_alloc (data_len);
|
|
memcpy (GST_BUFFER_DATA (outbuf), data, data_len);
|
|
GST_BUFFER_OFFSET (outbuf) = speexenc->bytes_out;
|
|
GST_BUFFER_OFFSET_END (outbuf) = granulepos;
|
|
|
|
GST_DEBUG ("encoded buffer of %d bytes", GST_BUFFER_SIZE (outbuf));
|
|
return outbuf;
|
|
}
|
|
|
|
|
|
/* push out the buffer and do internal bookkeeping */
|
|
static GstFlowReturn
|
|
gst_speexenc_push_buffer (GstSpeexEnc * speexenc, GstBuffer * buffer)
|
|
{
|
|
speexenc->bytes_out += GST_BUFFER_SIZE (buffer);
|
|
|
|
return gst_pad_push (speexenc->srcpad, buffer);
|
|
|
|
}
|
|
|
|
static GstCaps *
|
|
gst_speexenc_set_header_on_caps (GstCaps * caps, GstBuffer * buf1,
|
|
GstBuffer * buf2)
|
|
{
|
|
caps = gst_caps_make_writable (caps);
|
|
GstStructure *structure = gst_caps_get_structure (caps, 0);
|
|
GValue list = { 0 };
|
|
GValue value = { 0 };
|
|
|
|
/* mark buffers */
|
|
GST_BUFFER_FLAG_SET (buf1, GST_BUFFER_FLAG_IN_CAPS);
|
|
GST_BUFFER_FLAG_SET (buf2, GST_BUFFER_FLAG_IN_CAPS);
|
|
|
|
/* put buffers in a fixed list */
|
|
g_value_init (&list, GST_TYPE_ARRAY);
|
|
g_value_init (&value, GST_TYPE_BUFFER);
|
|
gst_value_set_buffer (&value, buf1);
|
|
gst_value_list_append_value (&list, &value);
|
|
g_value_unset (&value);
|
|
g_value_init (&value, GST_TYPE_BUFFER);
|
|
gst_value_set_buffer (&value, buf2);
|
|
gst_value_list_append_value (&list, &value);
|
|
gst_structure_set_value (structure, "streamheader", &list);
|
|
g_value_unset (&value);
|
|
g_value_unset (&list);
|
|
|
|
return caps;
|
|
}
|
|
|
|
|
|
static gboolean
|
|
gst_speexenc_sinkevent (GstPad * pad, GstEvent * event)
|
|
{
|
|
gboolean res = TRUE;
|
|
GstSpeexEnc *speexenc;
|
|
|
|
speexenc = GST_SPEEXENC (GST_PAD_PARENT (pad));
|
|
|
|
switch (GST_EVENT_TYPE (event)) {
|
|
case GST_EVENT_EOS:
|
|
speexenc->eos = TRUE;
|
|
res = gst_pad_event_default (pad, event);
|
|
break;
|
|
case GST_EVENT_TAG:
|
|
{
|
|
GstTagList *list;
|
|
|
|
gst_event_parse_tag (event, &list);
|
|
if (speexenc->tags) {
|
|
gst_tag_list_insert (speexenc->tags, list,
|
|
gst_tag_setter_get_tag_merge_mode (GST_TAG_SETTER (speexenc)));
|
|
} else {
|
|
g_assert_not_reached ();
|
|
}
|
|
res = gst_pad_event_default (pad, event);
|
|
break;
|
|
}
|
|
default:
|
|
res = gst_pad_event_default (pad, event);
|
|
break;
|
|
}
|
|
return res;
|
|
}
|
|
|
|
|
|
static GstFlowReturn
|
|
gst_speexenc_chain (GstPad * pad, GstBuffer * buf)
|
|
{
|
|
GstSpeexEnc *speexenc;
|
|
GstFlowReturn ret = GST_FLOW_OK;
|
|
|
|
speexenc = GST_SPEEXENC (gst_pad_get_parent (pad));
|
|
|
|
if (!speexenc->setup) {
|
|
gst_buffer_unref (buf);
|
|
GST_ELEMENT_ERROR (speexenc, CORE, NEGOTIATION, (NULL),
|
|
("encoder not initialized (input is not audio?)"));
|
|
ret = GST_FLOW_UNEXPECTED;
|
|
goto error;
|
|
}
|
|
|
|
if (!speexenc->header_sent) {
|
|
/* Speex streams begin with two headers; the initial header (with
|
|
most of the codec setup parameters) which is mandated by the Ogg
|
|
bitstream spec. The second header holds any comment fields.
|
|
We merely need to make the headers, then pass them to libspeex
|
|
one at a time; libspeex handles the additional Ogg bitstream
|
|
constraints */
|
|
GstBuffer *buf1, *buf2;
|
|
GstCaps *caps;
|
|
guchar *data;
|
|
gint data_len;
|
|
|
|
gst_speexenc_set_metadata (speexenc);
|
|
|
|
/* create header buffer */
|
|
data = (guint8 *) speex_header_to_packet (&speexenc->header, &data_len);
|
|
buf1 = gst_speexenc_buffer_from_data (speexenc, data, data_len, 0);
|
|
|
|
/* create comment buffer */
|
|
buf2 =
|
|
gst_speexenc_buffer_from_data (speexenc, speexenc->comments,
|
|
speexenc->comment_len, 0);
|
|
|
|
/* mark and put on caps */
|
|
caps = gst_pad_get_caps (speexenc->srcpad);
|
|
caps = gst_speexenc_set_header_on_caps (caps, buf1, buf2);
|
|
|
|
/* negotiate with these caps */
|
|
GST_DEBUG ("here are the caps: %" GST_PTR_FORMAT, caps);
|
|
gst_pad_set_caps (speexenc->srcpad, caps);
|
|
|
|
gst_buffer_set_caps (buf1, caps);
|
|
gst_buffer_set_caps (buf2, caps);
|
|
|
|
/* push out buffers */
|
|
ret = gst_speexenc_push_buffer (speexenc, buf1);
|
|
|
|
if ((GST_FLOW_OK != ret) && (GST_FLOW_NOT_LINKED != ret)) {
|
|
gst_buffer_unref (buf1);
|
|
goto error;
|
|
}
|
|
|
|
ret = gst_speexenc_push_buffer (speexenc, buf2);
|
|
|
|
if ((GST_FLOW_OK != ret) && (GST_FLOW_NOT_LINKED != ret)) {
|
|
|
|
gst_buffer_unref (buf2);
|
|
goto error;
|
|
}
|
|
|
|
speex_bits_init (&speexenc->bits);
|
|
speex_bits_reset (&speexenc->bits);
|
|
|
|
speexenc->header_sent = TRUE;
|
|
}
|
|
|
|
{
|
|
gint frame_size = speexenc->frame_size;
|
|
gint bytes = frame_size * 2 * speexenc->channels;
|
|
|
|
/* push buffer to adapter */
|
|
gst_adapter_push (speexenc->adapter, buf);
|
|
|
|
while (gst_adapter_available (speexenc->adapter) >= bytes) {
|
|
gint16 *data;
|
|
gint i;
|
|
gint outsize, written;
|
|
GstBuffer *outbuf;
|
|
|
|
data = (gint16 *) gst_adapter_peek (speexenc->adapter, bytes);
|
|
|
|
for (i = 0; i < frame_size * speexenc->channels; i++) {
|
|
speexenc->input[i] = (gfloat) data[i];
|
|
}
|
|
gst_adapter_flush (speexenc->adapter, bytes);
|
|
|
|
speexenc->samples_in += frame_size;
|
|
|
|
if (speexenc->channels == 2) {
|
|
speex_encode_stereo (speexenc->input, frame_size, &speexenc->bits);
|
|
}
|
|
speex_encode (speexenc->state, speexenc->input, &speexenc->bits);
|
|
|
|
speexenc->frameno++;
|
|
|
|
if ((speexenc->frameno % speexenc->nframes) != 0)
|
|
continue;
|
|
|
|
speex_bits_insert_terminator (&speexenc->bits);
|
|
outsize = speex_bits_nbytes (&speexenc->bits);
|
|
|
|
ret = gst_pad_alloc_buffer (speexenc->srcpad,
|
|
GST_BUFFER_OFFSET_NONE, outsize, GST_PAD_CAPS (speexenc->srcpad),
|
|
&outbuf);
|
|
|
|
if ((GST_FLOW_OK != ret)) {
|
|
goto error;
|
|
}
|
|
|
|
written = speex_bits_write (&speexenc->bits,
|
|
(gchar *) GST_BUFFER_DATA (outbuf), outsize);
|
|
g_assert (written == outsize);
|
|
speex_bits_reset (&speexenc->bits);
|
|
|
|
GST_BUFFER_TIMESTAMP (outbuf) =
|
|
(speexenc->frameno * frame_size -
|
|
speexenc->lookahead) * GST_SECOND / speexenc->rate;
|
|
GST_BUFFER_DURATION (outbuf) = frame_size * GST_SECOND / speexenc->rate;
|
|
GST_BUFFER_OFFSET (outbuf) = speexenc->bytes_out;
|
|
GST_BUFFER_OFFSET_END (outbuf) =
|
|
speexenc->frameno * frame_size - speexenc->lookahead;
|
|
|
|
ret = gst_speexenc_push_buffer (speexenc, outbuf);
|
|
|
|
if ((GST_FLOW_OK != ret) && (GST_FLOW_NOT_LINKED != ret)) {
|
|
gst_buffer_unref (outbuf);
|
|
goto error;
|
|
}
|
|
}
|
|
}
|
|
|
|
error:
|
|
|
|
gst_object_unref (speexenc);
|
|
return ret;
|
|
}
|
|
|
|
|
|
static void
|
|
gst_speexenc_get_property (GObject * object, guint prop_id, GValue * value,
|
|
GParamSpec * pspec)
|
|
{
|
|
GstSpeexEnc *speexenc;
|
|
|
|
g_return_if_fail (GST_IS_SPEEXENC (object));
|
|
|
|
speexenc = GST_SPEEXENC (object);
|
|
|
|
switch (prop_id) {
|
|
case ARG_QUALITY:
|
|
g_value_set_float (value, speexenc->quality);
|
|
break;
|
|
case ARG_BITRATE:
|
|
g_value_set_int (value, speexenc->bitrate);
|
|
break;
|
|
case ARG_VBR:
|
|
g_value_set_boolean (value, speexenc->vbr);
|
|
break;
|
|
case ARG_ABR:
|
|
g_value_set_int (value, speexenc->abr);
|
|
break;
|
|
case ARG_VAD:
|
|
g_value_set_boolean (value, speexenc->vad);
|
|
break;
|
|
case ARG_DTX:
|
|
g_value_set_boolean (value, speexenc->dtx);
|
|
break;
|
|
case ARG_COMPLEXITY:
|
|
g_value_set_int (value, speexenc->complexity);
|
|
break;
|
|
case ARG_NFRAMES:
|
|
g_value_set_int (value, speexenc->nframes);
|
|
break;
|
|
case ARG_LAST_MESSAGE:
|
|
g_value_set_string (value, speexenc->last_message);
|
|
break;
|
|
default:
|
|
G_OBJECT_WARN_INVALID_PROPERTY_ID (object, prop_id, pspec);
|
|
break;
|
|
}
|
|
}
|
|
|
|
static void
|
|
gst_speexenc_set_property (GObject * object, guint prop_id,
|
|
const GValue * value, GParamSpec * pspec)
|
|
{
|
|
GstSpeexEnc *speexenc;
|
|
|
|
g_return_if_fail (GST_IS_SPEEXENC (object));
|
|
|
|
speexenc = GST_SPEEXENC (object);
|
|
|
|
switch (prop_id) {
|
|
case ARG_QUALITY:
|
|
speexenc->quality = g_value_get_float (value);
|
|
break;
|
|
case ARG_BITRATE:
|
|
speexenc->bitrate = g_value_get_int (value);
|
|
break;
|
|
case ARG_VBR:
|
|
speexenc->vbr = g_value_get_boolean (value);
|
|
break;
|
|
case ARG_ABR:
|
|
speexenc->abr = g_value_get_int (value);
|
|
break;
|
|
case ARG_VAD:
|
|
speexenc->vad = g_value_get_boolean (value);
|
|
break;
|
|
case ARG_DTX:
|
|
speexenc->dtx = g_value_get_boolean (value);
|
|
break;
|
|
case ARG_COMPLEXITY:
|
|
speexenc->complexity = g_value_get_int (value);
|
|
break;
|
|
case ARG_NFRAMES:
|
|
speexenc->nframes = g_value_get_int (value);
|
|
break;
|
|
default:
|
|
G_OBJECT_WARN_INVALID_PROPERTY_ID (object, prop_id, pspec);
|
|
break;
|
|
}
|
|
}
|
|
|
|
static GstStateChangeReturn
|
|
gst_speexenc_change_state (GstElement * element, GstStateChange transition)
|
|
{
|
|
GstSpeexEnc *speexenc = GST_SPEEXENC (element);
|
|
GstStateChangeReturn res;
|
|
|
|
switch (transition) {
|
|
case GST_STATE_CHANGE_NULL_TO_READY:
|
|
speexenc->tags = gst_tag_list_new ();
|
|
break;
|
|
case GST_STATE_CHANGE_READY_TO_PAUSED:
|
|
speexenc->frameno = 0;
|
|
speexenc->samples_in = 0;
|
|
break;
|
|
case GST_STATE_CHANGE_PAUSED_TO_PLAYING:
|
|
/* fall through */
|
|
default:
|
|
break;
|
|
}
|
|
|
|
res = GST_ELEMENT_CLASS (parent_class)->change_state (element, transition);
|
|
|
|
switch (transition) {
|
|
case GST_STATE_CHANGE_PLAYING_TO_PAUSED:
|
|
break;
|
|
case GST_STATE_CHANGE_PAUSED_TO_READY:
|
|
speexenc->setup = FALSE;
|
|
speexenc->header_sent = FALSE;
|
|
break;
|
|
case GST_STATE_CHANGE_READY_TO_NULL:
|
|
gst_tag_list_free (speexenc->tags);
|
|
speexenc->tags = NULL;
|
|
default:
|
|
break;
|
|
}
|
|
|
|
return res;
|
|
}
|