OGM text support, Matroska UTF-8 text support, deadlock fixes all over the place, subtitle awareness in decodebin/pla...
Original commit message from CVS:
* configure.ac:
* ext/ogg/gstoggdemux.c: (gst_ogg_pad_new):
* ext/ogg/gstogmparse.c: (gst_ogm_text_parse_get_type),
(gst_ogm_text_parse_base_init), (gst_ogm_text_parse_init),
(gst_ogm_parse_get_sink_querytypes), (gst_ogm_parse_sink_convert),
(gst_ogm_parse_sink_query), (gst_ogm_parse_chain),
(gst_ogm_parse_plugin_init):
* ext/pango/gsttextoverlay.c: (gst_textoverlay_linkedpads),
(gst_textoverlay_link), (gst_textoverlay_getcaps),
(gst_textoverlay_event), (gst_textoverlay_video_chain),
(gst_textoverlay_loop), (gst_textoverlay_init), (plugin_init):
* ext/pango/gsttextoverlay.h:
* gst/matroska/matroska-demux.c: (gst_matroska_demux_add_stream),
(gst_matroska_demux_handle_seek_event),
(gst_matroska_demux_sync_streams),
(gst_matroska_demux_parse_blockgroup),
(gst_matroska_demux_subtitle_caps),
(gst_matroska_demux_plugin_init):
* gst/matroska/matroska-ids.h:
* gst/playback/gstdecodebin.c: (close_pad_link):
* gst/playback/gstplaybasebin.c: (gst_play_base_bin_init),
(gen_preroll_element), (remove_groups), (add_stream),
(new_decoded_pad), (setup_subtitles), (gen_source_element),
(setup_source):
* gst/playback/gstplaybasebin.h:
* gst/playback/gstplaybin.c: (gen_text_element), (setup_sinks):
* gst/subparse/Makefile.am:
* gst/subparse/gstsubparse.c: (gst_subparse_get_type),
(gst_subparse_base_init), (gst_subparse_class_init),
(gst_subparse_init), (gst_subparse_formats),
(gst_subparse_eventmask), (gst_subparse_event),
(gst_subparse_handle_event), (convert_encoding), (get_next_line),
(parse_mdvdsub), (parse_mdvdsub_init), (parse_subrip),
(parse_subrip_deinit), (parse_subrip_init), (parse_mpsub),
(parse_mpsub_deinit), (parse_mpsub_init),
(gst_subparse_buffer_format_autodetect),
(gst_subparse_format_autodetect), (gst_subparse_loop),
(gst_subparse_change_state), (gst_subparse_type_find),
(plugin_init):
* gst/subparse/gstsubparse.h:
* gst/typefind/gsttypefindfunctions.c: (ogmtext_type_find),
(plugin_init):
Add subtitle support, .sub parser (supports SRT and MPsub),
OGM text support, Matroska UTF-8 text support, deadlock fixes
all over the place, subtitle awareness in decodebin/playbin
and some fixes to textoverlay to handle subtitles in a stream
correctly. Fixes #100931.
2005-01-08 18:22:41 +00:00
|
|
|
/* GStreamer
|
|
|
|
* Copyright (C) <1999> Erik Walthinsen <omega@cse.ogi.edu>
|
|
|
|
* Copyright (c) 2004 Ronald S. Bultje <rbultje@ronald.bitfreak.net>
|
|
|
|
*
|
|
|
|
* This library is free software; you can redistribute it and/or
|
|
|
|
* modify it under the terms of the GNU Library General Public
|
|
|
|
* License as published by the Free Software Foundation; either
|
|
|
|
* version 2 of the License, or (at your option) any later version.
|
|
|
|
*
|
|
|
|
* This library is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
|
|
* Library General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU Library General Public
|
|
|
|
* License along with this library; if not, write to the
|
|
|
|
* Free Software Foundation, Inc., 59 Temple Place - Suite 330,
|
|
|
|
* Boston, MA 02111-1307, USA.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#ifdef HAVE_CONFIG_H
|
|
|
|
#include "config.h"
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#include <string.h>
|
|
|
|
#include <stdlib.h>
|
|
|
|
#include <regex.h>
|
|
|
|
|
|
|
|
#include "gstsubparse.h"
|
|
|
|
|
|
|
|
/* Debug category used by every GST_DEBUG/GST_LOG/GST_WARNING call in this
 * file; it is registered in plugin_init(). */
GST_DEBUG_CATEGORY_STATIC (subparse_debug);
#define GST_CAT_DEFAULT subparse_debug
|
|
|
|
|
|
|
|
/* Subtitle file formats the autodetection code can report. */
typedef enum
{
  GST_SUB_PARSE_FORMAT_UNKNOWN = 0,     /* nothing detected (yet) */
  GST_SUB_PARSE_FORMAT_MDVDSUB,         /* MicroDVD, frame based */
  GST_SUB_PARSE_FORMAT_SUBRIP,          /* SubRip, time based */
  GST_SUB_PARSE_FORMAT_MPSUB            /* MPSub, time based */
} GstSubParseFormat;
|
|
|
|
|
|
|
|
static GstStaticPadTemplate sink_templ = GST_STATIC_PAD_TEMPLATE ("sink",
|
|
|
|
GST_PAD_SINK,
|
|
|
|
GST_PAD_ALWAYS,
|
|
|
|
GST_STATIC_CAPS ("application/x-subtitle")
|
|
|
|
);
|
|
|
|
|
|
|
|
static GstStaticPadTemplate src_templ = GST_STATIC_PAD_TEMPLATE ("src",
|
|
|
|
GST_PAD_SRC,
|
|
|
|
GST_PAD_ALWAYS,
|
|
|
|
GST_STATIC_CAPS ("text/plain; text/x-pango-markup")
|
|
|
|
);
|
|
|
|
|
|
|
|
static void gst_subparse_base_init (GstSubparseClass * klass);
|
|
|
|
static void gst_subparse_class_init (GstSubparseClass * klass);
|
|
|
|
static void gst_subparse_init (GstSubparse * subparse);
|
|
|
|
|
|
|
|
static const GstFormat *gst_subparse_formats (GstPad * pad);
|
|
|
|
static const GstEventMask *gst_subparse_eventmask (GstPad * pad);
|
|
|
|
static gboolean gst_subparse_event (GstPad * pad, GstEvent * event);
|
|
|
|
|
|
|
|
static GstElementStateReturn gst_subparse_change_state (GstElement * element);
|
|
|
|
static void gst_subparse_loop (GstElement * element);
|
|
|
|
|
|
|
|
#if 0
|
|
|
|
static GstCaps *gst_subparse_type_find (GstBuffer * buf, gpointer private);
|
|
|
|
#endif
|
|
|
|
|
|
|
|
static GstElementClass *parent_class = NULL;
|
|
|
|
|
|
|
|
GType
|
|
|
|
gst_subparse_get_type (void)
|
|
|
|
{
|
|
|
|
static GType subparse_type = 0;
|
|
|
|
|
|
|
|
if (!subparse_type) {
|
|
|
|
static const GTypeInfo subparse_info = {
|
|
|
|
sizeof (GstSubparseClass),
|
|
|
|
(GBaseInitFunc) gst_subparse_base_init,
|
|
|
|
NULL,
|
|
|
|
(GClassInitFunc) gst_subparse_class_init,
|
|
|
|
NULL,
|
|
|
|
NULL,
|
|
|
|
sizeof (GstSubparse),
|
|
|
|
0,
|
|
|
|
(GInstanceInitFunc) gst_subparse_init,
|
|
|
|
};
|
|
|
|
|
|
|
|
subparse_type = g_type_register_static (GST_TYPE_ELEMENT,
|
|
|
|
"GstSubparse", &subparse_info, 0);
|
|
|
|
}
|
|
|
|
|
|
|
|
return subparse_type;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
gst_subparse_base_init (GstSubparseClass * klass)
|
|
|
|
{
|
|
|
|
GstElementClass *element_class = GST_ELEMENT_CLASS (klass);
|
|
|
|
static GstElementDetails subparse_details = {
|
|
|
|
"Subtitle parsers",
|
|
|
|
"Codec/Parser/Subtitle",
|
|
|
|
"Parses subtitle (.sub) files into text streams",
|
|
|
|
"Gustavo J. A. M. Carneiro <gjc@inescporto.pt>\n"
|
|
|
|
"Ronald S. Bultje <rbultje@ronald.bitfreak.net>"
|
|
|
|
};
|
|
|
|
|
|
|
|
gst_element_class_add_pad_template (element_class,
|
|
|
|
gst_static_pad_template_get (&sink_templ));
|
|
|
|
gst_element_class_add_pad_template (element_class,
|
|
|
|
gst_static_pad_template_get (&src_templ));
|
|
|
|
gst_element_class_set_details (element_class, &subparse_details);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
gst_subparse_class_init (GstSubparseClass * klass)
|
|
|
|
{
|
|
|
|
GstElementClass *element_class = GST_ELEMENT_CLASS (klass);
|
|
|
|
|
|
|
|
parent_class = g_type_class_ref (GST_TYPE_ELEMENT);
|
|
|
|
|
|
|
|
element_class->change_state = gst_subparse_change_state;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
gst_subparse_init (GstSubparse * subparse)
|
|
|
|
{
|
|
|
|
subparse->sinkpad =
|
|
|
|
gst_pad_new_from_template (gst_static_pad_template_get (&sink_templ),
|
|
|
|
"sink");
|
|
|
|
gst_element_add_pad (GST_ELEMENT (subparse), subparse->sinkpad);
|
|
|
|
|
|
|
|
subparse->srcpad =
|
|
|
|
gst_pad_new_from_template (gst_static_pad_template_get (&src_templ),
|
|
|
|
"src");
|
|
|
|
gst_pad_use_explicit_caps (subparse->srcpad);
|
|
|
|
gst_pad_set_formats_function (subparse->srcpad, gst_subparse_formats);
|
|
|
|
gst_pad_set_event_function (subparse->srcpad, gst_subparse_event);
|
|
|
|
gst_pad_set_event_mask_function (subparse->srcpad, gst_subparse_eventmask);
|
|
|
|
gst_element_add_pad (GST_ELEMENT (subparse), subparse->srcpad);
|
|
|
|
|
|
|
|
gst_element_set_loop_function (GST_ELEMENT (subparse), gst_subparse_loop);
|
|
|
|
|
|
|
|
subparse->textbuf = g_string_new (NULL);
|
|
|
|
subparse->parser.type = GST_SUB_PARSE_FORMAT_UNKNOWN;
|
|
|
|
subparse->parser_detected = FALSE;
|
|
|
|
subparse->seek_time = GST_CLOCK_TIME_NONE;
|
|
|
|
subparse->flush = FALSE;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Source pad functions.
|
|
|
|
*/
|
|
|
|
|
|
|
|
static const GstFormat *
|
|
|
|
gst_subparse_formats (GstPad * pad)
|
|
|
|
{
|
|
|
|
static const GstFormat formats[] = {
|
|
|
|
GST_FORMAT_TIME,
|
|
|
|
0
|
|
|
|
};
|
|
|
|
|
|
|
|
return formats;
|
|
|
|
}
|
|
|
|
|
|
|
|
static const GstEventMask *
|
|
|
|
gst_subparse_eventmask (GstPad * pad)
|
|
|
|
{
|
|
|
|
static const GstEventMask masks[] = {
|
|
|
|
{GST_EVENT_SEEK, GST_SEEK_METHOD_SET},
|
|
|
|
{0, 0}
|
|
|
|
};
|
|
|
|
|
|
|
|
return masks;
|
|
|
|
}
|
|
|
|
|
|
|
|
static gboolean
|
|
|
|
gst_subparse_event (GstPad * pad, GstEvent * event)
|
|
|
|
{
|
|
|
|
GstSubparse *self = GST_SUBPARSE (gst_pad_get_parent (pad));
|
|
|
|
gboolean res = FALSE;
|
|
|
|
|
|
|
|
switch (GST_EVENT_TYPE (event)) {
|
|
|
|
case GST_EVENT_SEEK:
|
|
|
|
if (!(GST_EVENT_SEEK_FORMAT (event) == GST_FORMAT_TIME &&
|
|
|
|
GST_EVENT_SEEK_METHOD (event) == GST_SEEK_METHOD_SET))
|
|
|
|
break;
|
|
|
|
self->seek_time = GST_EVENT_SEEK_OFFSET (event);
|
|
|
|
res = TRUE;
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
gst_event_unref (event);
|
|
|
|
|
|
|
|
return res;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* TRUE = continue, FALSE = stop.
|
|
|
|
*/
|
|
|
|
|
|
|
|
static gboolean
|
|
|
|
gst_subparse_handle_event (GstSubparse * self, GstEvent * event)
|
|
|
|
{
|
|
|
|
gboolean res = TRUE;
|
|
|
|
|
|
|
|
switch (GST_EVENT_TYPE (event)) {
|
|
|
|
case GST_EVENT_INTERRUPT:
|
|
|
|
gst_event_unref (event);
|
|
|
|
res = FALSE;
|
|
|
|
break;
|
|
|
|
case GST_EVENT_EOS:
|
|
|
|
res = FALSE;
|
|
|
|
/* fall-through */
|
|
|
|
default:
|
|
|
|
gst_pad_event_default (self->sinkpad, event);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
return res;
|
|
|
|
}
|
|
|
|
|
|
|
|
static gchar *
|
|
|
|
convert_encoding (GstSubparse * self, const gchar * str, gsize len)
|
|
|
|
{
|
|
|
|
gsize bytes_read, bytes_written;
|
|
|
|
gchar *rv;
|
|
|
|
GString *converted;
|
|
|
|
|
|
|
|
converted = g_string_new (NULL);
|
|
|
|
while (len) {
|
|
|
|
GST_DEBUG ("Trying to convert '%s'", g_strndup (str, len));
|
|
|
|
rv = g_locale_to_utf8 (str, len, &bytes_read, &bytes_written, NULL);
|
|
|
|
g_string_append_len (converted, rv, bytes_written);
|
|
|
|
len -= bytes_read;
|
|
|
|
str += bytes_read;
|
|
|
|
if (len) {
|
|
|
|
/* conversion error ocurred => skip one char */
|
|
|
|
len--;
|
|
|
|
str++;
|
|
|
|
g_string_append_c (converted, '?');
|
|
|
|
}
|
|
|
|
}
|
|
|
|
rv = converted->str;
|
|
|
|
g_string_free (converted, FALSE);
|
|
|
|
GST_DEBUG ("Converted to '%s'", rv);
|
|
|
|
return rv;
|
|
|
|
}
|
|
|
|
|
|
|
|
static gchar *
|
|
|
|
get_next_line (GstSubparse * self)
|
|
|
|
{
|
|
|
|
GstBuffer *buf;
|
|
|
|
const char *line_end;
|
|
|
|
int line_len;
|
|
|
|
gboolean have_r = FALSE;
|
|
|
|
gchar *line;
|
|
|
|
|
|
|
|
if ((line_end = strchr (self->textbuf->str, '\n')) == NULL) {
|
|
|
|
/* end-of-line not found; try to get more data */
|
|
|
|
buf = NULL;
|
|
|
|
do {
|
|
|
|
GstData *data = gst_pad_pull (self->sinkpad);
|
|
|
|
|
|
|
|
if (GST_IS_EVENT (data)) {
|
|
|
|
if (!gst_subparse_handle_event (self, GST_EVENT (data)))
|
|
|
|
return NULL;
|
|
|
|
} else {
|
|
|
|
buf = GST_BUFFER (data);
|
|
|
|
}
|
|
|
|
} while (!buf);
|
|
|
|
self->textbuf = g_string_append_len (self->textbuf,
|
|
|
|
GST_BUFFER_DATA (buf), GST_BUFFER_SIZE (buf));
|
|
|
|
gst_buffer_unref (buf);
|
|
|
|
/* search for end-of-line again */
|
|
|
|
line_end = strchr (self->textbuf->str, '\n');
|
|
|
|
}
|
|
|
|
/* get rid of '\r' */
|
|
|
|
if ((int) (line_end - self->textbuf->str) > 0 &&
|
|
|
|
self->textbuf->str[(int) (line_end - self->textbuf->str) - 1] == '\r') {
|
|
|
|
line_end--;
|
|
|
|
have_r = TRUE;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (line_end) {
|
|
|
|
line_len = line_end - self->textbuf->str;
|
|
|
|
line = convert_encoding (self, self->textbuf->str, line_len);
|
|
|
|
self->textbuf = g_string_erase (self->textbuf, 0,
|
|
|
|
line_len + (have_r ? 2 : 1));
|
|
|
|
return line;
|
|
|
|
}
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
static gchar *
|
|
|
|
parse_mdvdsub (GstSubparse * self, guint64 * out_start_time,
|
|
|
|
guint64 * out_end_time, gboolean after_seek)
|
|
|
|
{
|
|
|
|
gchar *line, *line_start, *line_split, *line_chunk;
|
|
|
|
guint start_frame, end_frame;
|
|
|
|
|
|
|
|
/* FIXME: hardcoded for now, but detecting the correct value is
|
|
|
|
* not going to be easy, I suspect... */
|
2005-01-14 12:27:22 +00:00
|
|
|
const double frames_per_sec = 24000 / 1001;
|
OGM text support, Matroska UTF-8 text support, deadlock fixes all over the place, subtitle awareness in decodebin/pla...
Original commit message from CVS:
* configure.ac:
* ext/ogg/gstoggdemux.c: (gst_ogg_pad_new):
* ext/ogg/gstogmparse.c: (gst_ogm_text_parse_get_type),
(gst_ogm_text_parse_base_init), (gst_ogm_text_parse_init),
(gst_ogm_parse_get_sink_querytypes), (gst_ogm_parse_sink_convert),
(gst_ogm_parse_sink_query), (gst_ogm_parse_chain),
(gst_ogm_parse_plugin_init):
* ext/pango/gsttextoverlay.c: (gst_textoverlay_linkedpads),
(gst_textoverlay_link), (gst_textoverlay_getcaps),
(gst_textoverlay_event), (gst_textoverlay_video_chain),
(gst_textoverlay_loop), (gst_textoverlay_init), (plugin_init):
* ext/pango/gsttextoverlay.h:
* gst/matroska/matroska-demux.c: (gst_matroska_demux_add_stream),
(gst_matroska_demux_handle_seek_event),
(gst_matroska_demux_sync_streams),
(gst_matroska_demux_parse_blockgroup),
(gst_matroska_demux_subtitle_caps),
(gst_matroska_demux_plugin_init):
* gst/matroska/matroska-ids.h:
* gst/playback/gstdecodebin.c: (close_pad_link):
* gst/playback/gstplaybasebin.c: (gst_play_base_bin_init),
(gen_preroll_element), (remove_groups), (add_stream),
(new_decoded_pad), (setup_subtitles), (gen_source_element),
(setup_source):
* gst/playback/gstplaybasebin.h:
* gst/playback/gstplaybin.c: (gen_text_element), (setup_sinks):
* gst/subparse/Makefile.am:
* gst/subparse/gstsubparse.c: (gst_subparse_get_type),
(gst_subparse_base_init), (gst_subparse_class_init),
(gst_subparse_init), (gst_subparse_formats),
(gst_subparse_eventmask), (gst_subparse_event),
(gst_subparse_handle_event), (convert_encoding), (get_next_line),
(parse_mdvdsub), (parse_mdvdsub_init), (parse_subrip),
(parse_subrip_deinit), (parse_subrip_init), (parse_mpsub),
(parse_mpsub_deinit), (parse_mpsub_init),
(gst_subparse_buffer_format_autodetect),
(gst_subparse_format_autodetect), (gst_subparse_loop),
(gst_subparse_change_state), (gst_subparse_type_find),
(plugin_init):
* gst/subparse/gstsubparse.h:
* gst/typefind/gsttypefindfunctions.c: (ogmtext_type_find),
(plugin_init):
Add subtitle support, .sub parser (supports SRT and MPsub),
OGM text support, Matroska UTF-8 text support, deadlock fixes
all over the place, subtitle awareness in decodebin/playbin
and some fixes to textoverlay to handle subtitles in a stream
correctly. Fixes #100931.
2005-01-08 18:22:41 +00:00
|
|
|
GString *markup;
|
|
|
|
gchar *rv;
|
|
|
|
|
|
|
|
/* style variables */
|
|
|
|
gboolean italic;
|
|
|
|
gboolean bold;
|
|
|
|
guint fontsize;
|
|
|
|
|
|
|
|
line = line_start = get_next_line (self);
|
|
|
|
if (!line)
|
|
|
|
return NULL;
|
|
|
|
|
|
|
|
if (sscanf (line, "{%u}{%u}", &start_frame, &end_frame) != 2) {
|
|
|
|
g_warning ("Parse of the following line, assumed to be in microdvd .sub"
|
|
|
|
" format, failed:\n%s", line);
|
|
|
|
g_free (line_start);
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
*out_start_time = (start_frame - 1000) / frames_per_sec * GST_SECOND;
|
|
|
|
*out_end_time = (end_frame - 1000) / frames_per_sec * GST_SECOND;
|
|
|
|
/* skip the {%u}{%u} part */
|
|
|
|
line = strchr (line, '}') + 1;
|
|
|
|
line = strchr (line, '}') + 1;
|
|
|
|
|
|
|
|
markup = g_string_new (NULL);
|
|
|
|
while (1) {
|
|
|
|
italic = FALSE;
|
|
|
|
bold = FALSE;
|
|
|
|
fontsize = 0;
|
|
|
|
/* parse style markup */
|
|
|
|
if (strncmp (line, "{y:i}", 5) == 0) {
|
|
|
|
italic = TRUE;
|
|
|
|
line = strchr (line, '}') + 1;
|
|
|
|
}
|
|
|
|
if (strncmp (line, "{y:b}", 5) == 0) {
|
|
|
|
bold = TRUE;
|
|
|
|
line = strchr (line, '}') + 1;
|
|
|
|
}
|
|
|
|
if (sscanf (line, "{s:%u}", &fontsize) == 1) {
|
|
|
|
line = strchr (line, '}') + 1;
|
|
|
|
}
|
|
|
|
if ((line_split = strchr (line, '|')))
|
|
|
|
line_chunk = g_markup_escape_text (line, line_split - line);
|
|
|
|
else
|
|
|
|
line_chunk = g_markup_escape_text (line, strlen (line));
|
|
|
|
markup = g_string_append (markup, "<span");
|
|
|
|
if (italic)
|
|
|
|
g_string_append (markup, " style=\"italic\"");
|
|
|
|
if (bold)
|
|
|
|
g_string_append (markup, " weight=\"bold\"");
|
|
|
|
if (fontsize)
|
|
|
|
g_string_append_printf (markup, " size=\"%u\"", fontsize * 1000);
|
|
|
|
g_string_append_printf (markup, ">%s</span>", line_chunk);
|
|
|
|
g_free (line_chunk);
|
|
|
|
if (line_split) {
|
|
|
|
g_string_append (markup, "\n");
|
|
|
|
line = line_split + 1;
|
|
|
|
} else
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
rv = markup->str;
|
|
|
|
g_string_free (markup, FALSE);
|
|
|
|
g_free (line_start);
|
|
|
|
GST_DEBUG ("parse_mdvdsub returning (start=%f, end=%f): %s",
|
|
|
|
*out_start_time / (double) GST_SECOND,
|
|
|
|
*out_end_time / (double) GST_SECOND, rv);
|
|
|
|
return rv;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
parse_mdvdsub_init (GstSubparse * self)
|
|
|
|
{
|
|
|
|
self->parser.deinit = NULL;
|
|
|
|
self->parser.parse = parse_mdvdsub;
|
|
|
|
}
|
|
|
|
|
|
|
|
static gchar *
|
|
|
|
parse_subrip (GstSubparse * self, guint64 * out_start_time,
|
|
|
|
guint64 * out_end_time, gboolean after_seek)
|
|
|
|
{
|
|
|
|
gchar *line;
|
|
|
|
guint h1, m1, s1, ms1;
|
|
|
|
guint h2, m2, s2, ms2;
|
|
|
|
int subnum;
|
|
|
|
|
|
|
|
while (1) {
|
|
|
|
switch (self->state.subrip.state) {
|
|
|
|
case 0:
|
|
|
|
/* looking for a single integer */
|
|
|
|
line = get_next_line (self);
|
|
|
|
if (!line)
|
|
|
|
return NULL;
|
|
|
|
if (sscanf (line, "%u", &subnum) == 1)
|
|
|
|
self->state.subrip.state = 1;
|
|
|
|
g_free (line);
|
|
|
|
break;
|
|
|
|
case 1:
|
|
|
|
/* looking for start_time --> end_time */
|
|
|
|
line = get_next_line (self);
|
|
|
|
if (!line)
|
|
|
|
return NULL;
|
|
|
|
if (sscanf (line, "%u:%u:%u,%u --> %u:%u:%u,%u",
|
|
|
|
&h1, &m1, &s1, &ms1, &h2, &m2, &s2, &ms2) == 8) {
|
|
|
|
self->state.subrip.state = 2;
|
|
|
|
self->state.subrip.time1 =
|
|
|
|
(((guint64) h1) * 3600 + m1 * 60 + s1) * GST_SECOND +
|
|
|
|
ms1 * GST_MSECOND;
|
|
|
|
self->state.subrip.time2 =
|
|
|
|
(((guint64) h2) * 3600 + m2 * 60 + s2) * GST_SECOND +
|
|
|
|
ms2 * GST_MSECOND;
|
|
|
|
} else {
|
|
|
|
GST_DEBUG (0, "error parsing subrip time line");
|
|
|
|
self->state.subrip.state = 0;
|
|
|
|
}
|
|
|
|
g_free (line);
|
|
|
|
break;
|
|
|
|
case 2:
|
|
|
|
/* looking for subtitle text; empty line ends this
|
|
|
|
* subtitle entry */
|
|
|
|
line = get_next_line (self);
|
|
|
|
if (!line)
|
|
|
|
return NULL;
|
|
|
|
if (self->state.subrip.buf->len)
|
|
|
|
g_string_append_c (self->state.subrip.buf, '\n');
|
|
|
|
g_string_append (self->state.subrip.buf, line);
|
|
|
|
if (strlen (line) == 0) {
|
|
|
|
gchar *rv;
|
|
|
|
|
|
|
|
g_free (line);
|
|
|
|
*out_start_time = self->state.subrip.time1;
|
|
|
|
*out_end_time = self->state.subrip.time2;
|
|
|
|
rv = g_markup_escape_text (self->state.subrip.buf->str,
|
|
|
|
self->state.subrip.buf->len);
|
|
|
|
rv = g_strdup (self->state.subrip.buf->str);
|
|
|
|
g_string_truncate (self->state.subrip.buf, 0);
|
|
|
|
self->state.subrip.state = 0;
|
|
|
|
return rv;
|
|
|
|
}
|
|
|
|
g_free (line);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
parse_subrip_deinit (GstSubparse * self)
|
|
|
|
{
|
|
|
|
g_string_free (self->state.subrip.buf, TRUE);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
parse_subrip_init (GstSubparse * self)
|
|
|
|
{
|
|
|
|
self->state.subrip.state = 0;
|
|
|
|
self->state.subrip.buf = g_string_new (NULL);
|
|
|
|
self->parser.parse = parse_subrip;
|
|
|
|
self->parser.deinit = parse_subrip_deinit;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static gchar *
|
|
|
|
parse_mpsub (GstSubparse * self, guint64 * out_start_time,
|
|
|
|
guint64 * out_end_time, gboolean after_seek)
|
|
|
|
{
|
|
|
|
gchar *line;
|
|
|
|
float t1, t2;
|
|
|
|
|
|
|
|
if (after_seek) {
|
|
|
|
self->state.mpsub.time = 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
while (1) {
|
|
|
|
switch (self->state.mpsub.state) {
|
|
|
|
case 0:
|
|
|
|
/* looking for two floats (offset, duration) */
|
|
|
|
line = get_next_line (self);
|
|
|
|
if (!line)
|
|
|
|
return NULL;
|
|
|
|
if (sscanf (line, "%f %f", &t1, &t2) == 2) {
|
|
|
|
self->state.mpsub.state = 1;
|
|
|
|
self->state.mpsub.time += GST_SECOND * t1;
|
|
|
|
}
|
|
|
|
g_free (line);
|
|
|
|
break;
|
|
|
|
case 1:
|
|
|
|
/* looking for subtitle text; empty line ends this
|
|
|
|
* subtitle entry */
|
|
|
|
line = get_next_line (self);
|
|
|
|
if (!line)
|
|
|
|
return NULL;
|
|
|
|
if (self->state.mpsub.buf->len)
|
|
|
|
g_string_append_c (self->state.mpsub.buf, '\n');
|
|
|
|
g_string_append (self->state.mpsub.buf, line);
|
|
|
|
if (strlen (line) == 0) {
|
|
|
|
gchar *rv;
|
|
|
|
|
|
|
|
g_free (line);
|
|
|
|
*out_start_time = self->state.mpsub.time;
|
|
|
|
*out_end_time = self->state.mpsub.time + t2 * GST_SECOND;
|
|
|
|
self->state.mpsub.time += t2 * GST_SECOND;
|
|
|
|
rv = g_markup_escape_text (self->state.mpsub.buf->str,
|
|
|
|
self->state.mpsub.buf->len);
|
|
|
|
rv = g_strdup (self->state.mpsub.buf->str);
|
|
|
|
g_string_truncate (self->state.mpsub.buf, 0);
|
|
|
|
self->state.mpsub.state = 0;
|
|
|
|
return rv;
|
|
|
|
}
|
|
|
|
g_free (line);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
parse_mpsub_deinit (GstSubparse * self)
|
|
|
|
{
|
|
|
|
g_string_free (self->state.mpsub.buf, TRUE);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
parse_mpsub_init (GstSubparse * self)
|
|
|
|
{
|
|
|
|
self->state.mpsub.state = 0;
|
|
|
|
self->state.mpsub.buf = g_string_new (NULL);
|
|
|
|
self->parser.deinit = parse_mpsub_deinit;
|
|
|
|
self->parser.parse = parse_mpsub;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* FIXME: maybe we should pass along a second argument, the preceding
|
|
|
|
* text buffer, because that is how this originally worked, even though
|
|
|
|
* I don't really see the use of that.
|
|
|
|
*/
|
|
|
|
|
|
|
|
static GstSubParseFormat
|
|
|
|
gst_subparse_buffer_format_autodetect (GstBuffer * buf)
|
|
|
|
{
|
|
|
|
static gboolean need_init_regexps = TRUE;
|
|
|
|
static regex_t mdvd_rx;
|
|
|
|
static regex_t subrip_rx;
|
|
|
|
const gchar *str = GST_BUFFER_DATA (buf);
|
|
|
|
|
|
|
|
/* initialize the regexps used the first time around */
|
|
|
|
if (need_init_regexps) {
|
|
|
|
int err;
|
|
|
|
char errstr[128];
|
|
|
|
|
|
|
|
need_init_regexps = FALSE;
|
|
|
|
regcomp (&mdvd_rx, "^\\{[0-9]+\\}\\{[0-9]+\\}",
|
|
|
|
REG_EXTENDED | REG_NEWLINE | REG_NOSUB);
|
|
|
|
if ((err = regcomp (&subrip_rx, "^1\x0d\x0a"
|
|
|
|
"[0-9][0-9]:[0-9][0-9]:[0-9][0-9],[0-9]{3}"
|
|
|
|
" --> [0-9][0-9]:[0-9][0-9]:[0-9][0-9],[0-9]{3}",
|
|
|
|
REG_EXTENDED | REG_NEWLINE | REG_NOSUB)) != 0) {
|
|
|
|
regerror (err, &subrip_rx, errstr, 127);
|
|
|
|
GST_WARNING ("Compilation of subrip regex failed: %s", errstr);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (regexec (&mdvd_rx, str, 0, NULL, 0) == 0) {
|
|
|
|
GST_LOG ("subparse: MicroDVD (frame based) format detected");
|
|
|
|
return GST_SUB_PARSE_FORMAT_MDVDSUB;
|
|
|
|
}
|
|
|
|
if (regexec (&subrip_rx, str, 0, NULL, 0) == 0) {
|
|
|
|
GST_LOG ("subparse: SubRip (time based) format detected");
|
|
|
|
return GST_SUB_PARSE_FORMAT_SUBRIP;
|
|
|
|
}
|
|
|
|
if (!strncmp (str, "FORMAT=TIME", 11)) {
|
|
|
|
GST_LOG ("subparse: MPSub (time based) format detected");
|
|
|
|
return GST_SUB_PARSE_FORMAT_MPSUB;
|
|
|
|
}
|
|
|
|
GST_WARNING ("subparse: subtitle format autodetection failed!");
|
|
|
|
return GST_SUB_PARSE_FORMAT_UNKNOWN;
|
|
|
|
}
|
|
|
|
|
|
|
|
static gboolean
|
|
|
|
gst_subparse_format_autodetect (GstSubparse * self)
|
|
|
|
{
|
|
|
|
GstBuffer *buf = NULL;
|
|
|
|
GstSubParseFormat format;
|
|
|
|
gboolean res = TRUE;
|
|
|
|
|
|
|
|
do {
|
|
|
|
GstData *data = gst_pad_pull (self->sinkpad);
|
|
|
|
|
|
|
|
if (GST_IS_EVENT (data)) {
|
|
|
|
if (!gst_subparse_handle_event (self, GST_EVENT (data)))
|
|
|
|
return FALSE;
|
|
|
|
} else {
|
|
|
|
buf = GST_BUFFER (data);
|
|
|
|
}
|
|
|
|
} while (!buf);
|
|
|
|
self->textbuf = g_string_append_len (self->textbuf, GST_BUFFER_DATA (buf),
|
|
|
|
GST_BUFFER_SIZE (buf));
|
|
|
|
format = gst_subparse_buffer_format_autodetect (buf);
|
|
|
|
gst_buffer_unref (buf);
|
|
|
|
self->parser_detected = TRUE;
|
|
|
|
self->parser.type = format;
|
|
|
|
switch (format) {
|
|
|
|
case GST_SUB_PARSE_FORMAT_MDVDSUB:
|
|
|
|
GST_DEBUG ("MicroDVD format detected");
|
|
|
|
parse_mdvdsub_init (self);
|
|
|
|
res = gst_pad_set_explicit_caps (self->srcpad,
|
|
|
|
gst_caps_new_simple ("text/x-pango-markup", NULL));
|
|
|
|
break;
|
|
|
|
case GST_SUB_PARSE_FORMAT_SUBRIP:
|
|
|
|
GST_DEBUG ("SubRip format detected");
|
|
|
|
parse_subrip_init (self);
|
|
|
|
res = gst_pad_set_explicit_caps (self->srcpad,
|
|
|
|
gst_caps_new_simple ("text/plain", NULL));
|
|
|
|
break;
|
|
|
|
case GST_SUB_PARSE_FORMAT_MPSUB:
|
|
|
|
GST_DEBUG ("MPSub format detected");
|
|
|
|
parse_mpsub_init (self);
|
|
|
|
res = gst_pad_set_explicit_caps (self->srcpad,
|
|
|
|
gst_caps_new_simple ("text/plain", NULL));
|
|
|
|
break;
|
|
|
|
case GST_SUB_PARSE_FORMAT_UNKNOWN:
|
|
|
|
default:
|
|
|
|
GST_DEBUG ("no subtitle format detected");
|
|
|
|
GST_ELEMENT_ERROR (self, STREAM, WRONG_TYPE,
|
|
|
|
("The input is not a valid/supported subtitle file"), (NULL));
|
|
|
|
res = FALSE;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
return res;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* parse input, getting a start and end time
|
|
|
|
* then parse next input, and if next start time > current end time, send
|
|
|
|
* clear buffer.
|
|
|
|
*/
|
|
|
|
|
|
|
|
static void
|
|
|
|
gst_subparse_loop (GstElement * element)
|
|
|
|
{
|
|
|
|
GstSubparse *self;
|
|
|
|
GstBuffer *buf;
|
|
|
|
guint64 start_time, end_time, need_time = GST_CLOCK_TIME_NONE;
|
|
|
|
gchar *subtitle;
|
|
|
|
gboolean after_seek = FALSE;
|
|
|
|
|
|
|
|
GST_DEBUG ("gst_subparse_loop");
|
|
|
|
self = GST_SUBPARSE (element);
|
|
|
|
|
|
|
|
/* make sure we know the format */
|
|
|
|
if (!self->parser_detected) {
|
|
|
|
if (!gst_subparse_format_autodetect (self))
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* handle seeks */
|
|
|
|
if (GST_CLOCK_TIME_IS_VALID (self->seek_time)) {
|
|
|
|
GstEvent *seek;
|
|
|
|
|
|
|
|
seek = gst_event_new_seek (GST_SEEK_FLAG_FLUSH | GST_FORMAT_BYTES |
|
|
|
|
GST_SEEK_METHOD_SET, 0);
|
|
|
|
if (gst_pad_send_event (GST_PAD_PEER (self->sinkpad), seek)) {
|
|
|
|
need_time = self->seek_time;
|
|
|
|
after_seek = TRUE;
|
|
|
|
|
|
|
|
if (self->flush) {
|
|
|
|
gst_pad_push (self->srcpad, GST_DATA (gst_event_new (GST_EVENT_FLUSH)));
|
|
|
|
self->flush = FALSE;
|
|
|
|
}
|
|
|
|
gst_pad_push (self->srcpad,
|
|
|
|
GST_DATA (gst_event_new_discontinuous (FALSE,
|
|
|
|
GST_FORMAT_TIME, need_time, GST_FORMAT_UNDEFINED)));
|
|
|
|
}
|
|
|
|
|
|
|
|
self->seek_time = GST_CLOCK_TIME_NONE;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* get a next buffer */
|
|
|
|
GST_INFO ("getting text buffer");
|
|
|
|
if (!self->parser.parse || self->parser.type == GST_SUB_PARSE_FORMAT_UNKNOWN) {
|
|
|
|
GST_ELEMENT_ERROR (self, LIBRARY, INIT, (NULL), (NULL));
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
do {
|
|
|
|
subtitle = self->parser.parse (self, &start_time, &end_time, after_seek);
|
|
|
|
if (!subtitle)
|
|
|
|
return;
|
|
|
|
after_seek = FALSE;
|
|
|
|
|
|
|
|
if (GST_CLOCK_TIME_IS_VALID (need_time) && end_time < need_time) {
|
|
|
|
g_free (subtitle);
|
|
|
|
} else {
|
|
|
|
need_time = GST_CLOCK_TIME_NONE;
|
|
|
|
GST_DEBUG ("subparse: loop: text %s, start %lld, end %lld\n",
|
|
|
|
subtitle, start_time, end_time);
|
|
|
|
|
|
|
|
buf = gst_buffer_new ();
|
|
|
|
GST_BUFFER_DATA (buf) = subtitle;
|
|
|
|
GST_BUFFER_SIZE (buf) = strlen (subtitle);
|
|
|
|
GST_BUFFER_TIMESTAMP (buf) = start_time;
|
|
|
|
GST_BUFFER_DURATION (buf) = end_time - start_time;
|
|
|
|
GST_DEBUG ("sending text buffer %s at %lld", subtitle, start_time);
|
|
|
|
gst_pad_push (self->srcpad, GST_DATA (buf));
|
|
|
|
}
|
|
|
|
} while (GST_CLOCK_TIME_IS_VALID (need_time));
|
|
|
|
}
|
|
|
|
|
|
|
|
static GstElementStateReturn
|
|
|
|
gst_subparse_change_state (GstElement * element)
|
|
|
|
{
|
|
|
|
GstSubparse *self = GST_SUBPARSE (element);
|
|
|
|
|
|
|
|
switch (GST_STATE_TRANSITION (element)) {
|
|
|
|
case GST_STATE_PAUSED_TO_READY:
|
|
|
|
self->parser.deinit (self);
|
|
|
|
self->parser.type = GST_SUB_PARSE_FORMAT_UNKNOWN;
|
|
|
|
self->parser_detected = FALSE;
|
|
|
|
self->seek_time = GST_CLOCK_TIME_NONE;
|
|
|
|
self->flush = FALSE;
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
return parent_class->change_state (element);
|
|
|
|
}
|
|
|
|
|
|
|
|
#if 0
/* typefinding stuff; compiled out */
static GstTypeDefinition subparse_definition = {
  "subparse/x-text",
  "text/plain",
  ".sub",
  gst_subparse_type_find,
};

/* Reports text/plain caps if buf is detected as MicroDVD or SubRip data,
 * NULL otherwise. */
static GstCaps *
gst_subparse_type_find (GstBuffer * buf, gpointer private)
{
  GstSubParseFormat format;

  format = gst_subparse_buffer_format_autodetect (buf);
  switch (format) {
    case GST_SUB_PARSE_FORMAT_MDVDSUB:
      GST_DEBUG (GST_CAT_PLUGIN_INFO, "MicroDVD format detected");
      return gst_caps_new ("subparse_type_find", "text/plain", NULL);
    case GST_SUB_PARSE_FORMAT_SUBRIP:
      GST_DEBUG (GST_CAT_PLUGIN_INFO, "SubRip format detected");
      return gst_caps_new ("subparse_type_find", "text/plain", NULL);
    case GST_SUB_PARSE_FORMAT_UNKNOWN:
      GST_DEBUG (GST_CAT_PLUGIN_INFO, "no subtitle format detected");
      break;
  }
  /* don't know which this is */
  return NULL;
}
#endif
|
|
|
|
|
|
|
|
static gboolean
|
|
|
|
plugin_init (GstPlugin * plugin)
|
|
|
|
{
|
|
|
|
GST_DEBUG_CATEGORY_INIT (subparse_debug, "subparse", 0, ".sub parser");
|
|
|
|
|
|
|
|
return gst_element_register (plugin, "subparse",
|
|
|
|
GST_RANK_PRIMARY, GST_TYPE_SUBPARSE);
|
|
|
|
}
|
|
|
|
|
|
|
|
GST_PLUGIN_DEFINE (GST_VERSION_MAJOR,
|
|
|
|
GST_VERSION_MINOR,
|
|
|
|
"subparse",
|
|
|
|
"Subtitle (.sub) file parsing",
|
|
|
|
plugin_init, VERSION, "LGPL", GST_PACKAGE, GST_ORIGIN)
|