mirror of
https://gitlab.freedesktop.org/gstreamer/gstreamer.git
synced 2025-02-24 15:06:38 +00:00
Adding new h264ccextractor element. This element will extract closed caption meta from H.264 stream, and output in display order. For the frame reordering, this element is implemented as a subclass of h264decoder but without actual frame decoding. Part-of: <https://gitlab.freedesktop.org/gstreamer/gstreamer/-/merge_requests/6580>
460 lines
15 KiB
C
460 lines
15 KiB
C
/* GStreamer
|
|
* Copyright (C) 2024 Seungha Yang <seungha@centricular.com>
|
|
*
|
|
* This library is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU Library General Public
|
|
* License as published by the Free Software Foundation; either
|
|
* version 2 of the License, or (at your option) any later version.
|
|
*
|
|
* This library is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
* Library General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Library General Public
|
|
* License along with this library; if not, write to the
|
|
* Free Software Foundation, Inc., 51 Franklin St, Fifth Floor,
|
|
* Boston, MA 02110-1301, USA.
|
|
*/
|
|
|
|
/**
|
|
* SECTION:element-h264ccextractor
|
|
* @title: h264ccextractor
|
|
*
|
|
* Extracts closed caption data from H.264 stream and outputs in display order
|
|
*
|
|
* Since: 1.26
|
|
*/
|
|
|
|
#ifdef HAVE_CONFIG_H
|
|
#include "config.h"
|
|
#endif
|
|
|
|
#include "gsth264ccextractor.h"
|
|
#include <gst/base/gstqueuearray.h>
|
|
|
|
GST_DEBUG_CATEGORY_STATIC (gst_h264_cc_extractor_debug);
|
|
#define GST_CAT_DEFAULT gst_h264_cc_extractor_debug
|
|
|
|
static GstStaticPadTemplate sink_template = GST_STATIC_PAD_TEMPLATE ("sink",
|
|
GST_PAD_SINK,
|
|
GST_PAD_ALWAYS,
|
|
GST_STATIC_CAPS ("video/x-h264, alignment=(string) au, "
|
|
"parsed=(boolean) true"));
|
|
|
|
static GstStaticPadTemplate src_template = GST_STATIC_PAD_TEMPLATE ("src",
|
|
GST_PAD_SRC,
|
|
GST_PAD_ALWAYS,
|
|
GST_STATIC_CAPS
|
|
("closedcaption/x-cea-608,format={ (string) raw, (string) s334-1a}; "
|
|
"closedcaption/x-cea-708,format={ (string) cc_data, (string) cdp }"));
|
|
|
|
static void gst_h264_cc_extractor_finalize (GObject * object);
|
|
|
|
static gboolean gst_h264_cc_extractor_set_format (GstVideoDecoder * decoder,
|
|
GstVideoCodecState * state);
|
|
static gboolean gst_h264_cc_extractor_negotiate (GstVideoDecoder * decoder);
|
|
static gboolean gst_h264_cc_extractor_transform_meta (GstVideoDecoder * decoder,
|
|
GstVideoCodecFrame * frame, GstMeta * meta);
|
|
static GstFlowReturn
|
|
gst_h264_cc_extractor_handle_frame (GstVideoDecoder * decoder,
|
|
GstVideoCodecFrame * frame);
|
|
static GstFlowReturn gst_h264_cc_extractor_finish (GstVideoDecoder * decoder);
|
|
|
|
static GstFlowReturn
|
|
gst_h264_cc_extractor_new_sequence (GstH264Decoder * decoder,
|
|
const GstH264SPS * sps, gint max_dpb_size);
|
|
static GstFlowReturn
|
|
gst_h264_cc_extractor_new_picture (GstH264Decoder * decoder,
|
|
GstVideoCodecFrame * frame, GstH264Picture * picture);
|
|
static GstFlowReturn
|
|
gst_h264_cc_extractor_new_field_picture (GstH264Decoder * decoder,
|
|
GstH264Picture * first_field, GstH264Picture * second_field);
|
|
static GstFlowReturn
|
|
gst_h264_cc_extractor_start_picture (GstH264Decoder * decoder,
|
|
GstH264Picture * picture, GstH264Slice * slice, GstH264Dpb * dpb);
|
|
static GstFlowReturn
|
|
gst_h264_cc_extractor_decode_slice (GstH264Decoder * decoder,
|
|
GstH264Picture * picture, GstH264Slice * slice, GArray * ref_pic_list0,
|
|
GArray * ref_pic_list1);
|
|
static GstFlowReturn
|
|
gst_h264_cc_extractor_output_picture (GstH264Decoder * decoder,
|
|
GstVideoCodecFrame * frame, GstH264Picture * picture);
|
|
|
|
typedef struct _CaptionData
|
|
{
|
|
GstVideoCaptionType caption_type;
|
|
GstBuffer *buffer;
|
|
} CaptionData;
|
|
|
|
struct _GstH264CCExtractor
|
|
{
|
|
GstH264Decoder parent;
|
|
|
|
GstVideoCaptionType caption_type;
|
|
GstQueueArray *cur_data;
|
|
GstQueueArray *out_data;
|
|
gboolean on_eos;
|
|
gint fps_n;
|
|
gint fps_d;
|
|
};
|
|
|
|
#define gst_h264_cc_extractor_parent_class parent_class
|
|
G_DEFINE_TYPE (GstH264CCExtractor, gst_h264_cc_extractor,
|
|
GST_TYPE_H264_DECODER);
|
|
|
|
GST_ELEMENT_REGISTER_DEFINE (h264ccextractor, "h264ccextractor",
|
|
GST_RANK_NONE, GST_TYPE_H264_CC_EXTRACTOR);
|
|
|
|
static void
|
|
gst_h264_cc_extractor_class_init (GstH264CCExtractorClass * klass)
|
|
{
|
|
GObjectClass *object_class = G_OBJECT_CLASS (klass);
|
|
GstElementClass *element_class = GST_ELEMENT_CLASS (klass);
|
|
GstVideoDecoderClass *decoder_class = GST_VIDEO_DECODER_CLASS (klass);
|
|
GstH264DecoderClass *h264_class = GST_H264_DECODER_CLASS (klass);
|
|
|
|
object_class->finalize = gst_h264_cc_extractor_finalize;
|
|
|
|
gst_element_class_set_static_metadata (element_class,
|
|
"H.264 Closed Caption Extractor",
|
|
"Codec/Video/Filter",
|
|
"Extract GstVideoCaptionMeta from input H.264 stream",
|
|
"Seungha Yang <seungha@centricular.com>");
|
|
|
|
gst_element_class_add_static_pad_template (element_class, &sink_template);
|
|
gst_element_class_add_static_pad_template (element_class, &src_template);
|
|
|
|
decoder_class->set_format =
|
|
GST_DEBUG_FUNCPTR (gst_h264_cc_extractor_set_format);
|
|
decoder_class->negotiate =
|
|
GST_DEBUG_FUNCPTR (gst_h264_cc_extractor_negotiate);
|
|
decoder_class->transform_meta =
|
|
GST_DEBUG_FUNCPTR (gst_h264_cc_extractor_transform_meta);
|
|
decoder_class->handle_frame =
|
|
GST_DEBUG_FUNCPTR (gst_h264_cc_extractor_handle_frame);
|
|
decoder_class->finish = GST_DEBUG_FUNCPTR (gst_h264_cc_extractor_finish);
|
|
|
|
h264_class->new_sequence =
|
|
GST_DEBUG_FUNCPTR (gst_h264_cc_extractor_new_sequence);
|
|
h264_class->new_picture =
|
|
GST_DEBUG_FUNCPTR (gst_h264_cc_extractor_new_picture);
|
|
h264_class->new_field_picture =
|
|
GST_DEBUG_FUNCPTR (gst_h264_cc_extractor_new_field_picture);
|
|
h264_class->start_picture =
|
|
GST_DEBUG_FUNCPTR (gst_h264_cc_extractor_start_picture);
|
|
h264_class->decode_slice =
|
|
GST_DEBUG_FUNCPTR (gst_h264_cc_extractor_decode_slice);
|
|
h264_class->output_picture =
|
|
GST_DEBUG_FUNCPTR (gst_h264_cc_extractor_output_picture);
|
|
|
|
GST_DEBUG_CATEGORY_INIT (gst_h264_cc_extractor_debug, "h264ccextractor",
|
|
0, "h264ccextractor");
|
|
}
|
|
|
|
static void
|
|
caption_data_clear_func (CaptionData * data)
|
|
{
|
|
data->caption_type = GST_VIDEO_CAPTION_TYPE_UNKNOWN;
|
|
gst_clear_buffer (&data->buffer);
|
|
}
|
|
|
|
static GstQueueArray *
|
|
caption_data_queue_new (void)
|
|
{
|
|
GstQueueArray *array =
|
|
gst_queue_array_new_for_struct (sizeof (CaptionData), 2);
|
|
gst_queue_array_set_clear_func (array,
|
|
(GDestroyNotify) caption_data_clear_func);
|
|
return array;
|
|
}
|
|
|
|
static void
|
|
gst_h264_cc_extractor_init (GstH264CCExtractor * self)
|
|
{
|
|
self->cur_data = caption_data_queue_new ();
|
|
self->out_data = gst_queue_array_new_for_struct (sizeof (CaptionData), 2);
|
|
self->caption_type = GST_VIDEO_CAPTION_TYPE_UNKNOWN;
|
|
self->fps_n = 0;
|
|
self->fps_d = 1;
|
|
}
|
|
|
|
static void
|
|
gst_h264_cc_extractor_finalize (GObject * object)
|
|
{
|
|
GstH264CCExtractor *self = GST_H264_CC_EXTRACTOR (object);
|
|
|
|
if (self->cur_data)
|
|
gst_queue_array_free (self->cur_data);
|
|
|
|
gst_queue_array_free (self->out_data);
|
|
|
|
G_OBJECT_CLASS (parent_class)->finalize (object);
|
|
}
|
|
|
|
static gboolean
|
|
gst_h264_cc_extractor_set_format (GstVideoDecoder * decoder,
|
|
GstVideoCodecState * state)
|
|
{
|
|
GstH264CCExtractor *self = GST_H264_CC_EXTRACTOR (decoder);
|
|
GstVideoCodecState *out_state;
|
|
GstCaps *caps;
|
|
gboolean ret;
|
|
|
|
/* Assume caption type is cea708 raw which is common cc type
|
|
* embedded in SEI */
|
|
if (self->caption_type == GST_VIDEO_CAPTION_TYPE_UNKNOWN)
|
|
self->caption_type = GST_VIDEO_CAPTION_TYPE_CEA708_RAW;
|
|
|
|
/* Create dummy output state. Otherwise decoder baseclass will try to create
|
|
* video caps on GAP event */
|
|
out_state = gst_video_decoder_set_output_state (decoder,
|
|
GST_VIDEO_FORMAT_NV12, state->info.width, state->info.height, NULL);
|
|
caps = gst_video_caption_type_to_caps (self->caption_type);
|
|
gst_caps_set_simple (caps, "framerate", GST_TYPE_FRACTION,
|
|
state->info.fps_n, state->info.fps_d, NULL);
|
|
out_state->caps = caps;
|
|
gst_video_codec_state_unref (out_state);
|
|
|
|
ret = GST_VIDEO_DECODER_CLASS (parent_class)->set_format (decoder, state);
|
|
|
|
gst_video_decoder_negotiate (decoder);
|
|
|
|
return ret;
|
|
}
|
|
|
|
static gboolean
|
|
gst_h264_cc_extractor_negotiate (GstVideoDecoder * decoder)
|
|
{
|
|
GstH264CCExtractor *self = GST_H264_CC_EXTRACTOR (decoder);
|
|
GstCaps *caps = gst_video_caption_type_to_caps (self->caption_type);
|
|
|
|
gst_caps_set_simple (caps,
|
|
"framerate", GST_TYPE_FRACTION, self->fps_n, self->fps_d, NULL);
|
|
|
|
gst_pad_set_caps (decoder->srcpad, caps);
|
|
gst_caps_unref (caps);
|
|
|
|
return TRUE;
|
|
}
|
|
|
|
static gboolean
|
|
gst_h264_cc_extractor_transform_meta (GstVideoDecoder * decoder,
|
|
GstVideoCodecFrame * frame, GstMeta * meta)
|
|
{
|
|
/* do not copy any meta */
|
|
return FALSE;
|
|
}
|
|
|
|
static GstFlowReturn
|
|
gst_h264_cc_extractor_handle_frame (GstVideoDecoder * decoder,
|
|
GstVideoCodecFrame * frame)
|
|
{
|
|
GstH264CCExtractor *self = GST_H264_CC_EXTRACTOR (decoder);
|
|
GstVideoTimeCodeMeta *tc_meta;
|
|
GstVideoCaptionMeta *cc_meta;
|
|
gpointer iter = NULL;
|
|
GstFlowReturn ret;
|
|
|
|
if (self->cur_data)
|
|
gst_queue_array_clear (self->cur_data);
|
|
|
|
tc_meta = gst_buffer_get_video_time_code_meta (frame->input_buffer);
|
|
|
|
while ((cc_meta = (GstVideoCaptionMeta *)
|
|
gst_buffer_iterate_meta_filtered (frame->input_buffer, &iter,
|
|
GST_VIDEO_CAPTION_META_API_TYPE))) {
|
|
CaptionData data;
|
|
data.caption_type = cc_meta->caption_type;
|
|
data.buffer = gst_buffer_new_memdup (cc_meta->data, cc_meta->size);
|
|
GST_BUFFER_DTS (data.buffer) = GST_CLOCK_TIME_NONE;
|
|
GST_BUFFER_PTS (data.buffer) = GST_BUFFER_PTS (frame->input_buffer);
|
|
GST_BUFFER_DURATION (data.buffer) =
|
|
GST_BUFFER_DURATION (frame->input_buffer);
|
|
|
|
if (tc_meta)
|
|
gst_buffer_add_video_time_code_meta (data.buffer, &tc_meta->tc);
|
|
|
|
if (!self->cur_data)
|
|
self->cur_data = caption_data_queue_new ();
|
|
|
|
gst_queue_array_push_tail_struct (self->cur_data, &data);
|
|
}
|
|
|
|
GST_DEBUG_OBJECT (self, "Queued captions %u",
|
|
self->cur_data ? gst_queue_array_get_length (self->cur_data) : 0);
|
|
|
|
ret = GST_VIDEO_DECODER_CLASS (parent_class)->handle_frame (decoder, frame);
|
|
|
|
if (self->cur_data)
|
|
gst_queue_array_clear (self->cur_data);
|
|
|
|
return ret;
|
|
}
|
|
|
|
static GstFlowReturn
|
|
gst_h264_cc_extractor_finish (GstVideoDecoder * decoder)
|
|
{
|
|
GST_VIDEO_DECODER_CLASS (parent_class)->finish (decoder);
|
|
|
|
/* baseclass will post error message if there was no output buffer
|
|
* and subclass returns OK. Return flow EOS to avoid the error message */
|
|
return GST_FLOW_EOS;
|
|
}
|
|
|
|
static GstFlowReturn
|
|
gst_h264_cc_extractor_new_sequence (GstH264Decoder * decoder,
|
|
const GstH264SPS * sps, gint max_dpb_size)
|
|
{
|
|
return GST_FLOW_OK;
|
|
}
|
|
|
|
static GstFlowReturn
|
|
gst_h264_cc_extractor_new_picture (GstH264Decoder * decoder,
|
|
GstVideoCodecFrame * frame, GstH264Picture * picture)
|
|
{
|
|
return GST_FLOW_OK;
|
|
}
|
|
|
|
static GstFlowReturn
|
|
gst_h264_cc_extractor_new_field_picture (GstH264Decoder * decoder,
|
|
GstH264Picture * first_field, GstH264Picture * second_field)
|
|
{
|
|
return GST_FLOW_OK;
|
|
}
|
|
|
|
static GstFlowReturn
|
|
gst_h264_cc_extractor_start_picture (GstH264Decoder * decoder,
|
|
GstH264Picture * picture, GstH264Slice * slice, GstH264Dpb * dpb)
|
|
{
|
|
GstH264CCExtractor *self = GST_H264_CC_EXTRACTOR (decoder);
|
|
GstH264Picture *target_pic = picture;
|
|
GstQueueArray *pic_data;
|
|
|
|
GST_LOG_OBJECT (self, "Start %s field picture", picture->second_field ?
|
|
"second" : "first");
|
|
|
|
if (!self->cur_data || !gst_queue_array_get_length (self->cur_data))
|
|
return GST_FLOW_OK;
|
|
|
|
/* Baseclass will output only the first field's codec frame.
|
|
* If this second field picture's codec frame is different from
|
|
* the first one, attach */
|
|
if (picture->second_field && picture->other_field &&
|
|
GST_CODEC_PICTURE_FRAME_NUMBER (picture) !=
|
|
GST_CODEC_PICTURE_FRAME_NUMBER (picture->other_field)) {
|
|
target_pic = picture->other_field;
|
|
GST_DEBUG_OBJECT (self, "Found second field picture");
|
|
}
|
|
|
|
pic_data = gst_h264_picture_get_user_data (target_pic);
|
|
if (!pic_data) {
|
|
GST_DEBUG_OBJECT (self, "Creating new picture data, caption size: %u",
|
|
gst_queue_array_get_length (self->cur_data));
|
|
gst_h264_picture_set_user_data (target_pic,
|
|
g_steal_pointer (&self->cur_data),
|
|
(GDestroyNotify) gst_queue_array_free);
|
|
} else {
|
|
gpointer caption_data;
|
|
|
|
GST_DEBUG_OBJECT (self, "Appending %u caption buffers, prev size: %u",
|
|
gst_queue_array_get_length (self->cur_data),
|
|
gst_queue_array_get_length (pic_data));
|
|
|
|
while ((caption_data = gst_queue_array_pop_head_struct (self->cur_data)))
|
|
gst_queue_array_push_tail_struct (pic_data, caption_data);
|
|
}
|
|
|
|
return GST_FLOW_OK;
|
|
}
|
|
|
|
static GstFlowReturn
|
|
gst_h264_cc_extractor_decode_slice (GstH264Decoder * decoder,
|
|
GstH264Picture * picture, GstH264Slice * slice, GArray * ref_pic_list0,
|
|
GArray * ref_pic_list1)
|
|
{
|
|
return GST_FLOW_OK;
|
|
}
|
|
|
|
static GstFlowReturn
|
|
gst_h264_cc_extractor_output_picture (GstH264Decoder * decoder,
|
|
GstVideoCodecFrame * frame, GstH264Picture * picture)
|
|
{
|
|
GstVideoDecoder *videodec = GST_VIDEO_DECODER (decoder);
|
|
GstH264CCExtractor *self = GST_H264_CC_EXTRACTOR (decoder);
|
|
gint fps_n = 0;
|
|
gint fps_d = 1;
|
|
gboolean updated = FALSE;
|
|
GstCodecPicture *codec_pic = GST_CODEC_PICTURE (picture);
|
|
GstQueueArray *pic_data;
|
|
CaptionData *caption_data = NULL;
|
|
GstBuffer *front_buf = NULL;
|
|
GstClockTime pts, dur;
|
|
GstFlowReturn ret = GST_FLOW_OK;
|
|
|
|
pic_data = gst_h264_picture_get_user_data (picture);
|
|
|
|
/* Move caption buffer to our temporary storage */
|
|
if (pic_data) {
|
|
while ((caption_data = gst_queue_array_pop_head_struct (pic_data)))
|
|
gst_queue_array_push_tail_struct (self->out_data, caption_data);
|
|
}
|
|
|
|
fps_n = decoder->input_state->info.fps_n;
|
|
fps_d = decoder->input_state->info.fps_d;
|
|
|
|
if (codec_pic->discont_state) {
|
|
fps_n = codec_pic->discont_state->info.fps_n;
|
|
fps_d = codec_pic->discont_state->info.fps_d;
|
|
}
|
|
|
|
if (fps_n != self->fps_n || fps_d != self->fps_d) {
|
|
updated = TRUE;
|
|
self->fps_n = fps_n;
|
|
self->fps_d = fps_d;
|
|
}
|
|
|
|
GST_DEBUG_OBJECT (self, "picture is holding %u caption buffers",
|
|
gst_queue_array_get_length (self->out_data));
|
|
|
|
if (gst_queue_array_get_length (self->out_data)) {
|
|
caption_data = gst_queue_array_pop_head_struct (self->out_data);
|
|
front_buf = caption_data->buffer;
|
|
if (caption_data->caption_type != self->caption_type) {
|
|
GST_DEBUG_OBJECT (self, "Caption type changed, need new caps");
|
|
self->caption_type = caption_data->caption_type;
|
|
updated = TRUE;
|
|
}
|
|
}
|
|
|
|
if (updated)
|
|
gst_video_decoder_negotiate (videodec);
|
|
|
|
gst_h264_picture_unref (picture);
|
|
|
|
pts = GST_BUFFER_PTS (frame->input_buffer);
|
|
dur = GST_BUFFER_DURATION (frame->input_buffer);
|
|
|
|
if (!front_buf) {
|
|
GstEvent *gap;
|
|
|
|
GST_VIDEO_CODEC_FRAME_SET_DECODE_ONLY (frame);
|
|
ret = gst_video_decoder_finish_frame (videodec, frame);
|
|
gap = gst_event_new_gap (pts, dur);
|
|
gst_pad_push_event (videodec->srcpad, gap);
|
|
return ret;
|
|
}
|
|
|
|
frame->output_buffer = front_buf;
|
|
ret = gst_video_decoder_finish_frame (videodec, frame);
|
|
|
|
/* Drain other caption data */
|
|
while ((caption_data = gst_queue_array_pop_head_struct (self->out_data))) {
|
|
if (ret == GST_FLOW_OK)
|
|
ret = gst_pad_push (videodec->srcpad, caption_data->buffer);
|
|
else
|
|
gst_buffer_unref (caption_data->buffer);
|
|
}
|
|
|
|
return ret;
|
|
}
|