jsontovtt: Add an element for fragmented WebVTT

This element converts the CC JSON format to fragmented WebVTT.

Co-authored by Mathieu Duponchelle <mathieu@centricular.com>
This commit is contained in:
Jan Schmidt 2021-07-17 01:54:45 +10:00 committed by Sebastian Dröge
parent bc587a09f8
commit 3260651671
5 changed files with 780 additions and 3 deletions

View file

@ -0,0 +1,38 @@
// Copyright (C) 2021 Jan Schmidt <jan@centricular.com>
//
// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
// option. This file may not be copied, modified, or distributed
// except according to those terms.
use std::cmp::Ordering;
/// A queued force-key-unit request.
///
/// Holds the values copied out of an upstream force-key-unit event by
/// `ForceKeyUnitRequest::new_from_event`.
#[derive(Copy, Clone, Eq, PartialEq)]
pub struct ForceKeyUnitRequest {
/// Running time copied from the event.
pub running_time: gst::ClockTime,
/// `all_headers` value copied from the event.
pub all_headers: bool,
/// `count` value copied from the event.
pub count: u32,
}
impl Ord for ForceKeyUnitRequest {
    /// Orders requests by running time first.
    ///
    /// `all_headers` and `count` only act as tie-breakers. They make `cmp`
    /// return `Ordering::Equal` exactly when the derived `PartialEq`/`Eq`
    /// consider two requests equal, which the `Ord` contract requires.
    fn cmp(&self, other: &Self) -> Ordering {
        self.running_time
            .cmp(&other.running_time)
            .then_with(|| self.all_headers.cmp(&other.all_headers))
            .then_with(|| self.count.cmp(&other.count))
    }
}
impl PartialOrd for ForceKeyUnitRequest {
// Delegates to `Ord::cmp`, so the result is always `Some` and agrees with
// the total order.
fn partial_cmp(&self, other: &Self) -> Option<Ordering> {
Some(self.cmp(other))
}
}
impl ForceKeyUnitRequest {
    /// Builds a request from a parsed upstream force-key-unit event.
    ///
    /// # Panics
    ///
    /// Panics if the event carries no running time; callers must check
    /// `fku.running_time` before calling this.
    pub fn new_from_event(fku: &gst_video::UpstreamForceKeyUnitEvent) -> ForceKeyUnitRequest {
        let running_time = fku.running_time.unwrap();

        Self {
            running_time,
            all_headers: fku.all_headers,
            count: fku.count,
        }
    }
}

View file

@ -0,0 +1,706 @@
// Copyright (C) 2021 Mathieu Duponchelle <mathieu@centricular.com>
// Copyright (C) 2021 Jan Schmidt <jan@centricular.com>
//
// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
// option. This file may not be copied, modified, or distributed
// except according to those terms.
use gst::glib;
use gst::prelude::*;
use gst::subclass::prelude::*;
use gst::{element_error, gst_debug, gst_error, gst_log, gst_trace, gst_warning};
use crate::jsontovtt::fku::ForceKeyUnitRequest;
use crate::ttutils::Lines;
use once_cell::sync::Lazy;
use std::collections::{BinaryHeap, VecDeque};
use std::sync::Mutex;
/// A parsed `Lines` payload together with the timing of the cue it becomes.
#[derive(Clone, Debug)]
struct TimestampedLines {
// Text content deserialized from the input buffer.
lines: Lines,
// Start position of the cue, after clamping to the segment in `handle_buffer`.
pts: gst::ClockTime,
// Cue duration; `State::drain` recomputes it when the cue is drained.
duration: gst::ClockTime,
}
/// Mutable streaming state of the element, kept behind `JsonToVtt::state`.
struct State {
// Cues queued by `handle_buffer` that have not been output yet.
pending: VecDeque<TimestampedLines>,
// True until `check_initial_header` has produced the first header buffer.
need_initial_header: bool,
// End position of the most recent buffer or gap; `drain` uses it as the end
// of the last cue when called without a running time.
last_pts: Option<gst::ClockTime>,
// Force-key-unit requests received on the source pad and not yet served.
keyunit_requests: BinaryHeap<ForceKeyUnitRequest>,
// Most recent time segment received on the sink pad.
segment: gst::FormattedSegment<gst::ClockTime>,
}
impl Default for State {
    /// Fresh state: nothing queued, no requests, a new segment, and the
    /// initial header still to be sent.
    fn default() -> Self {
        Self {
            need_initial_header: true,
            last_pts: None,
            pending: VecDeque::default(),
            keyunit_requests: BinaryHeap::default(),
            segment: gst::FormattedSegment::new(),
        }
    }
}
/// Private implementation struct of the `jsontovtt` element.
pub struct JsonToVtt {
// Source pad on which the generated buffers are pushed.
srcpad: gst::Pad,
// Sink pad receiving the JSON buffers and downstream events.
sinkpad: gst::Pad,
// Streaming state, shared between the sink and source pad functions.
state: Mutex<State>,
}
// Debug category ("jsontovtt") passed to the gst_* logging macros in this file;
// created lazily on first use.
static CAT: Lazy<gst::DebugCategory> = Lazy::new(|| {
gst::DebugCategory::new(
"jsontovtt",
gst::DebugColorFlags::empty(),
Some("JSON to WebVTT"),
)
});
/// Clips the interval `[pts, pts + duration]` to the start/stop of `segment`.
///
/// Returns `None` when the interval ends before the segment start or begins
/// after the segment stop. Otherwise returns the (possibly moved) start and the
/// (possibly shortened) duration; a `None` duration is passed through as-is.
fn clamp(
    segment: &gst::FormattedSegment<gst::ClockTime>,
    mut pts: gst::ClockTime,
    mut duration: Option<gst::ClockTime>,
) -> Option<(gst::ClockTime, Option<gst::ClockTime>)> {
    // The end is computed once, from the unclipped input.
    let end_pts = match duration {
        Some(duration) => pts + duration,
        None => pts,
    };

    if let Some(segment_start) = segment.start() {
        if end_pts < segment_start {
            return None;
        }

        if pts < segment_start {
            // Cut off the part that lies before the segment start.
            let cut = segment_start - pts;
            duration = duration.map(|duration| duration.saturating_sub(cut));
            pts = segment_start;
        }
    }

    if let Some(segment_stop) = segment.stop() {
        if pts > segment_stop {
            return None;
        }

        if end_pts > segment_stop {
            // Cut off the part that lies after the segment stop.
            let cut = end_pts - segment_stop;
            duration = duration.map(|duration| duration.saturating_sub(cut));
        }
    }

    Some((pts, duration))
}
impl State {
/// Creates a buffer holding the `WEBVTT` file header, stamped with `timestamp`.
///
/// No duration and no flags are set on the header buffer.
fn create_vtt_header(timestamp: gst::ClockTime) -> gst::Buffer {
    let mut header = gst::Buffer::from_slice(b"WEBVTT\n\n".to_vec());
    // The buffer was just created, so it is uniquely owned and writable.
    header.get_mut().unwrap().set_pts(timestamp);
    header
}
/// Splits a clock time into `(hours, minutes, seconds, milliseconds)`.
///
/// Sub-millisecond precision is truncated.
fn split_time(time: gst::ClockTime) -> (u64, u8, u8, u16) {
    const NS_PER_SECOND: u64 = 1_000_000_000;
    const NS_PER_MILLISECOND: u64 = 1_000_000;

    let total_ns: u64 = time.nseconds();
    let total_seconds = total_ns / NS_PER_SECOND;
    let total_minutes = total_seconds / 60;

    let hours = total_minutes / 60;
    let minutes = (total_minutes % 60) as u8;
    let seconds = (total_seconds % 60) as u8;
    let millis = ((total_ns % NS_PER_SECOND) / NS_PER_MILLISECOND) as u16;

    (hours, minutes, seconds, millis)
}
/// Creates one WebVTT cue buffer.
///
/// The payload is the `start --> end` timing line followed by `text` and a
/// newline. The buffer carries `timestamp` as PTS, `duration` as duration and
/// is flagged `DELTA_UNIT`.
fn create_vtt_buffer(
    timestamp: gst::ClockTime,
    duration: gst::ClockTime,
    text: String,
) -> gst::Buffer {
    let (h1, m1, s1, ms1) = Self::split_time(timestamp);
    let (h2, m2, s2, ms2) = Self::split_time(timestamp + duration);

    let mut cue = format!(
        "{:02}:{:02}:{:02}.{:03} --> {:02}:{:02}:{:02}.{:03}",
        h1, m1, s1, ms1, h2, m2, s2, ms2
    );
    cue.push('\n');
    cue.push_str(&text);
    cue.push('\n');

    let mut buffer = gst::Buffer::from_mut_slice(cue.into_bytes());
    {
        // The buffer was just created, so it is uniquely owned and writable.
        let buffer_ref = buffer.get_mut().unwrap();
        buffer_ref.set_pts(timestamp);
        buffer_ref.set_duration(duration);
        buffer_ref.set_flags(gst::BufferFlags::DELTA_UNIT);
    }
    buffer
}
/// Returns the header buffer the first time it is called, `None` afterwards.
///
/// The header is stamped with `pts`.
fn check_initial_header(&mut self, pts: gst::ClockTime) -> Option<gst::Buffer> {
    if !self.need_initial_header {
        return None;
    }

    let header = Self::create_vtt_header(pts);
    self.need_initial_header = false;
    Some(header)
}
// Serves queued force-key-unit requests, appending the resulting buffers to
// `buffers`.
//
// A request is served when `running_time` is `None` or when the request's
// running time is not later than `running_time`. Serving a request outputs the
// pending cues up to the request's running time, opens the next fragment with
// a header buffer (if the request maps to a position inside the segment) and
// removes the request from the heap.
//
// NOTE(review): `BinaryHeap::peek` yields the greatest element, i.e. the
// request with the largest running time is looked at first.
//
// Panics: `self.last_pts.unwrap()` if `running_time` is `None`, a cue was
// drained and `last_pts` was never set; `self.segment.stop().unwrap()` if the
// request's running time does not map to a segment position and the segment
// has no stop.
fn drain(&mut self, buffers: &mut Vec<gst::Buffer>, running_time: Option<gst::ClockTime>) {
/* We don't output anything until we've received the first request, we trigger
* that first request by sending a first header buffer for each new fragment.
*
* In practice, we will never hold more than one request at a time, but handling
* queuing gracefully doesn't hurt.
*/
while let Some(fku) = self
.keyunit_requests
.peek()
.filter(|fku| match running_time {
None => true,
Some(running_time) => fku.running_time <= running_time,
})
{
let mut drained_lines: VecDeque<TimestampedLines> = VecDeque::new();
/* Collect cues, fixing up their duration based on the next cue */
while let Some(lines) = self.pending.front() {
// The previously drained cue ends where the next pending cue starts; this
// is applied even if that next cue ends up not being drained.
if let Some(mut drained_line) = drained_lines.back_mut() {
drained_line.duration = lines.pts - drained_line.pts;
}
// Without a running time every pending cue is drained; otherwise only the
// cues whose running time is not past the request.
if running_time.is_none()
|| self.segment.to_running_time(lines.pts) <= Some(fku.running_time)
{
drained_lines.push_back(self.pending.pop_front().unwrap());
} else {
break;
}
}
/* cues that end a fragment must be clipped and cloned for the next fragment */
if let Some(mut drained_line) = drained_lines.back_mut() {
/* Clip to either the requested PTS, or segment stop if specified */
let end_pts = if running_time.is_none() {
self.last_pts.unwrap()
} else {
self.segment
.position_from_running_time(fku.running_time)
.unwrap_or_else(|| self.segment.stop().unwrap())
};
// The copy restarts at the fragment boundary and goes back to the front of
// the queue so it is output again with the next fragment.
if running_time.is_some() {
let mut cloned = drained_line.clone();
cloned.pts = end_pts;
self.pending.push_front(cloned);
}
drained_line.duration = end_pts - drained_line.pts;
}
/* We have gathered, clipped and timestamped all cues, output them now */
for lines in drained_lines {
// Concatenate the chunk texts of every line, one output line per input line.
let mut output_text = String::new();
for line in &lines.lines.lines {
for chunk in &line.chunks {
output_text += &chunk.text;
}
output_text += "\n";
}
// No need to output an explicit cue for eg clear buffers
if !output_text.is_empty() {
buffers.push(Self::create_vtt_buffer(
lines.pts,
lines.duration,
output_text,
));
}
}
// Now open the next fragment, if it lies inside the segment
if let Some(pts) = self.segment.position_from_running_time(fku.running_time) {
buffers.push(Self::create_vtt_header(pts));
}
self.keyunit_requests.pop();
}
}
fn handle_buffer(
&mut self,
pad: &gst::Pad,
buffer: gst::Buffer,
) -> Result<Vec<gst::Buffer>, gst::FlowError> {
let mut ret = vec![];
let data = buffer.map_readable().map_err(|_| {
gst_error!(CAT, obj: pad, "Can't map buffer readable");
gst::FlowError::Error
})?;
let lines: Lines = serde_json::from_slice(&data).map_err(|err| {
gst_error!(CAT, obj: pad, "Failed to parse input as json: {}", err);
gst::FlowError::Error
})?;
let pts = buffer.pts().ok_or_else(|| {
gst_error!(CAT, obj: pad, "Require timestamped buffers");
gst::FlowError::Error
})?;
let duration = buffer.duration().ok_or_else(|| {
gst_error!(CAT, obj: pad, "Require buffers with duration");
gst::FlowError::Error
})?;
let (pts, duration) = match clamp(&self.segment, pts, Some(duration)) {
Some((pts, duration)) => (pts, duration.unwrap()),
None => {
gst_warning!(
CAT,
obj: pad,
"Dropping buffer outside segment: {:?}",
buffer
);
return Ok(ret);
}
};
if let Some(buffer) = self.check_initial_header(pts) {
ret.push(buffer);
}
self.pending.push_back(TimestampedLines {
lines,
pts,
duration,
});
self.drain(&mut ret, self.segment.to_running_time(pts));
self.last_pts = Some(pts + duration);
Ok(ret)
}
/// Advances the stream position for a gap event and returns the buffers that
/// became ready as a result.
///
/// A gap outside the segment is ignored with a warning.
fn handle_gap(&mut self, gap: gst::event::Gap) -> Vec<gst::Buffer> {
    let mut output = Vec::new();

    let (gap_pts, gap_duration) = gap.get();
    let (pts, duration) = match clamp(&self.segment, gap_pts, gap_duration) {
        Some(clamped) => clamped,
        None => {
            gst_warning!(CAT, "Ignoring gap outside segment");
            return output;
        }
    };

    // Emits the header first if none has been sent yet.
    output.extend(self.check_initial_header(pts));

    let running_time = self.segment.to_running_time(pts);
    self.drain(&mut output, running_time);

    // The gap ends at `pts + duration`, or at `pts` when it has no duration.
    self.last_pts = Some(match duration {
        Some(duration) => pts + duration,
        None => pts,
    });

    output
}
/// Drains with no running-time limit and returns the resulting buffers.
fn handle_eos(&mut self) -> Vec<gst::Buffer> {
    gst_log!(CAT, "handling EOS, {}", self.pending.len());

    let mut flushed = Vec::new();
    self.drain(&mut flushed, None);
    flushed
}
}
impl JsonToVtt {
/// Chain function of the sink pad: converts the buffer and pushes the result.
///
/// The state lock is released before anything is pushed downstream.
fn sink_chain(
    &self,
    pad: &gst::Pad,
    _element: &super::JsonToVtt,
    buffer: gst::Buffer,
) -> Result<gst::FlowSuccess, gst::FlowError> {
    gst_trace!(CAT, obj: pad, "Handling buffer {:?}", buffer);

    let buffers = {
        let mut state = self.state.lock().unwrap();
        state.handle_buffer(pad, buffer)?
    };

    self.output(buffers)
}
/// Queues a force-key-unit request; it is served by a later `State::drain`.
fn handle_fku(&self, fku: ForceKeyUnitRequest) {
    self.state.lock().unwrap().keyunit_requests.push(fku);
}
/// Event function of the source pad.
///
/// Upstream force-key-unit events that carry a running time are queued as
/// requests. Every custom upstream event is then passed to the default
/// handler and reported as handled; all other events return the default
/// handler's result.
fn src_event(&self, pad: &gst::Pad, element: &super::JsonToVtt, event: gst::Event) -> bool {
    use gst::EventView;

    gst_log!(CAT, obj: pad, "Handling event {:?}", event);

    match event.view() {
        EventView::CustomUpstream(ref ev) => {
            if gst_video::ForceKeyUnitEvent::is(ev) {
                if let Ok(fku_event) = gst_video::UpstreamForceKeyUnitEvent::parse(ev) {
                    gst_log!(CAT, obj: pad, "Handling fku {:?}", fku_event);

                    // Requests without a running time are not queued.
                    if fku_event.running_time.is_some() {
                        let request = ForceKeyUnitRequest::new_from_event(&fku_event);
                        self.handle_fku(request);
                    }
                } else {
                    gst_warning!(
                        CAT,
                        obj: element,
                        "Invalid force-key-unit event received from downstream: {:?}",
                        &ev
                    )
                }
            }

            // The default handler's result is deliberately not propagated.
            let _ = pad.event_default(Some(element), event);
            true
        }
        _ => pad.event_default(Some(element), event),
    }
}
/// Event function of the sink pad.
///
/// * EOS: drains everything that is still pending, pushes it, then forwards
///   the event.
/// * Caps: replaces the event with fragmented WebVTT caps on the source pad.
/// * Segment: stores the time segment in the state, then forwards the event.
///   A non-time segment posts an element error and returns `false`.
/// * Gap: converted into drained output; the event itself is not forwarded.
/// * Everything else goes to the default handler.
///
/// The state mutex is never held while buffers or events are sent downstream.
/// Downstream may react synchronously with an upstream force-key-unit event,
/// and `handle_fku` locks the same mutex on the same thread.
fn sink_event(&self, pad: &gst::Pad, element: &super::JsonToVtt, event: gst::Event) -> bool {
    use gst::EventView;

    gst_log!(CAT, obj: pad, "Handling event {:?}", event);

    match event.view() {
        EventView::Eos(..) => {
            gst_log!(CAT, obj: pad, "Handling EOS");
            // The guard is a temporary and is released at the end of this statement.
            let buffers = self.state.lock().unwrap().handle_eos();
            // Best effort: EOS is forwarded even if pushing the last buffers fails.
            let _ = self.output(buffers);
            pad.event_default(Some(element), event)
        }
        EventView::Caps(..) => {
            let mut downstream_caps = match self.srcpad.allowed_caps() {
                None => self.srcpad.pad_template_caps(),
                Some(caps) => caps,
            };

            if downstream_caps.is_empty() {
                gst_error!(CAT, obj: pad, "Empty downstream caps");
                return false;
            }

            downstream_caps.fixate();

            gst_debug!(
                CAT,
                obj: pad,
                "Negotiating for downstream caps {}",
                downstream_caps
            );

            let s = downstream_caps.structure(0).unwrap();
            let new_caps = if s.name() == "application/x-subtitle-vtt-fragmented" {
                gst::Caps::builder("application/x-subtitle-vtt-fragmented")
                    .field("inline-headers", true)
                    .build()
            } else {
                // The source pad template only offers the fragmented VTT caps.
                unreachable!();
            };

            let new_event = gst::event::Caps::new(&new_caps);
            self.srcpad.push_event(new_event)
        }
        EventView::Segment(ev) => {
            match ev.segment().clone().downcast::<gst::format::Time>() {
                Ok(s) => {
                    // Lock only for the assignment, so the mutex is free again
                    // before the event is forwarded below.
                    self.state.lock().unwrap().segment = s;
                }
                Err(err) => {
                    element_error!(
                        element,
                        gst::StreamError::Failed,
                        ["Time segment needed: {:?}", err]
                    );
                    return false;
                }
            }

            /* FIXME: Handle segment updates by draining? */
            pad.event_default(Some(element), event)
        }
        EventView::Gap(ev) => {
            gst_log!(CAT, obj: pad, "Handling gap {:?}", ev);
            // The guard is a temporary and is released at the end of this statement.
            let buffers = self.state.lock().unwrap().handle_gap(ev);
            // Best effort: a push failure does not fail the gap event.
            let _ = self.output(buffers);
            true
        }
        _ => pad.event_default(Some(element), event),
    }
}
/// Pushes `buffers` on the source pad in order.
///
/// Stops at the first failing push and returns its error; the remaining
/// buffers are dropped.
fn output(&self, buffers: Vec<gst::Buffer>) -> Result<gst::FlowSuccess, gst::FlowError> {
    buffers
        .into_iter()
        .try_for_each(|buf| self.srcpad.push(buf).map(drop))
        .map(|()| gst::FlowSuccess::Ok)
}
}
#[glib::object_subclass]
impl ObjectSubclass for JsonToVtt {
    const NAME: &'static str = "JsonToVtt";
    type Type = super::JsonToVtt;
    type ParentType = gst::Element;

    /// Builds both pads from the class pad templates and wires their chain
    /// and event functions to the methods of this type.
    fn with_class(klass: &Self::Class) -> Self {
        let sink_templ = klass.pad_template("sink").unwrap();
        let sinkpad = gst::Pad::builder_with_template(&sink_templ, Some("sink"))
            .chain_function(|pad, parent, buffer| {
                JsonToVtt::catch_panic_pad_function(
                    parent,
                    || Err(gst::FlowError::Error),
                    |imp, elem| imp.sink_chain(pad, elem, buffer),
                )
            })
            .event_function(|pad, parent, event| {
                JsonToVtt::catch_panic_pad_function(
                    parent,
                    || false,
                    |imp, elem| imp.sink_event(pad, elem, event),
                )
            })
            .flags(gst::PadFlags::FIXED_CAPS)
            .build();

        let src_templ = klass.pad_template("src").unwrap();
        let srcpad = gst::Pad::builder_with_template(&src_templ, Some("src"))
            .flags(gst::PadFlags::FIXED_CAPS)
            .event_function(|pad, parent, event| {
                JsonToVtt::catch_panic_pad_function(
                    parent,
                    || false,
                    |imp, elem| imp.src_event(pad, elem, event),
                )
            })
            .build();

        let state = Mutex::new(State::default());

        Self {
            srcpad,
            sinkpad,
            state,
        }
    }
}
impl ObjectImpl for JsonToVtt {
    /// Adds the sink pad and then the source pad to the newly constructed element.
    fn constructed(&self, obj: &Self::Type) {
        self.parent_constructed(obj);

        for pad in &[&self.sinkpad, &self.srcpad] {
            obj.add_pad(*pad).unwrap();
        }
    }
}
impl ElementImpl for JsonToVtt {
// Returns the element metadata; it is built once, on first use.
fn metadata() -> Option<&'static gst::subclass::ElementMetadata> {
static ELEMENT_METADATA: Lazy<gst::subclass::ElementMetadata> = Lazy::new(|| {
gst::subclass::ElementMetadata::new(
"JSON to WebVTT",
"Generic",
"Converts JSON to WebVTT",
"Jan Schmidt <jan@centricular.com>",
)
});
Some(&*ELEMENT_METADATA)
}
/// Returns the pad templates, built once on first use.
///
/// The always-present sink pad takes `application/x-json` with
/// `format=cea608`. The always-present source pad produces
/// `application/x-subtitle-vtt-fragmented` with `inline-headers=true`.
fn pad_templates() -> &'static [gst::PadTemplate] {
    static PAD_TEMPLATES: Lazy<Vec<gst::PadTemplate>> = Lazy::new(|| {
        let sink_caps = gst::Caps::builder("application/x-json")
            .field("format", "cea608")
            .build();
        let src_caps = gst::Caps::builder("application/x-subtitle-vtt-fragmented")
            .field("inline-headers", true)
            .build();

        let sink_pad_template = gst::PadTemplate::new(
            "sink",
            gst::PadDirection::Sink,
            gst::PadPresence::Always,
            &sink_caps,
        )
        .unwrap();
        let src_pad_template = gst::PadTemplate::new(
            "src",
            gst::PadDirection::Src,
            gst::PadPresence::Always,
            &src_caps,
        )
        .unwrap();

        vec![src_pad_template, sink_pad_template]
    });

    PAD_TEMPLATES.as_ref()
}
/// Resets the streaming state on `ReadyToPaused`, then chains up to the
/// parent class.
fn change_state(
    &self,
    element: &Self::Type,
    transition: gst::StateChange,
) -> Result<gst::StateChangeSuccess, gst::StateChangeError> {
    gst_trace!(CAT, obj: element, "Changing state {:?}", transition);

    if transition == gst::StateChange::ReadyToPaused {
        // The guard is a temporary; the lock is released before chaining up.
        *self.state.lock().unwrap() = State::default();
    }

    self.parent_change_state(element, transition)
}
}
#[cfg(test)]
mod tests {
    use super::*;

    /// Shorthand for a clock time of `n` nanoseconds.
    fn ns(n: u64) -> gst::ClockTime {
        gst::ClockTime::from_nseconds(n)
    }

    /// New time segment; start and/or stop are only set when given.
    fn segment_with(
        start: Option<u64>,
        stop: Option<u64>,
    ) -> gst::FormattedSegment<gst::ClockTime> {
        let mut segment = gst::FormattedSegment::<gst::ClockTime>::new();
        if let Some(start) = start {
            segment.set_start(Some(ns(start)));
        }
        if let Some(stop) = stop {
            segment.set_stop(Some(ns(stop)));
        }
        segment
    }

    // Every test clamps the interval [0, 10) unless stated otherwise.

    #[test]
    fn test_no_clamp() {
        gst::init().unwrap();

        let segment = segment_with(None, None);

        assert_eq!(
            clamp(&segment, ns(0), Some(ns(10))),
            Some((ns(0), Some(ns(10))))
        );
    }

    #[test]
    fn test_clamp_start() {
        gst::init().unwrap();

        let segment = segment_with(Some(2), None);

        assert_eq!(
            clamp(&segment, ns(0), Some(ns(10))),
            Some((ns(2), Some(ns(8))))
        );
    }

    #[test]
    fn test_clamp_stop() {
        gst::init().unwrap();

        let segment = segment_with(None, Some(7));

        assert_eq!(
            clamp(&segment, ns(0), Some(ns(10))),
            Some((ns(0), Some(ns(7))))
        );
    }

    #[test]
    fn test_clamp_start_stop() {
        gst::init().unwrap();

        let segment = segment_with(Some(2), Some(7));

        assert_eq!(
            clamp(&segment, ns(0), Some(ns(10))),
            Some((ns(2), Some(ns(5))))
        );
    }

    #[test]
    fn test_clamp_before() {
        gst::init().unwrap();

        let segment = segment_with(Some(15), None);

        assert_eq!(clamp(&segment, ns(0), Some(ns(10))), None);
    }

    #[test]
    fn test_clamp_after() {
        gst::init().unwrap();

        let segment = segment_with(None, Some(10));

        // Interval [15, 25) starts after the segment stop.
        assert_eq!(clamp(&segment, ns(15), Some(ns(10))), None);
    }
}

View file

@ -0,0 +1,31 @@
// Copyright (C) 2021 Jan Schmidt <jan@centricular.com>
//
// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
// option. This file may not be copied, modified, or distributed
// except according to those terms.
use gst::glib;
use gst::prelude::*;
mod fku;
mod imp;
// Public wrapper type for the element; the implementation lives in
// `imp::JsonToVtt`.
glib::wrapper! {
pub struct JsonToVtt(ObjectSubclass<imp::JsonToVtt>) @extends gst::Element, gst::Object;
}
// GStreamer elements need to be thread-safe. For the private implementation this is automatically
// enforced but for the public wrapper type we need to specify this manually.
//
// SAFETY: NOTE(review): this relies on `imp::JsonToVtt` being `Send + Sync`
// (its mutable state sits behind a `Mutex`) and on the wrapped GObject being
// safe to share across threads. Confirm if non-thread-safe fields are added.
unsafe impl Send for JsonToVtt {}
unsafe impl Sync for JsonToVtt {}
/// Registers the element with `plugin` under the name `jsontovtt`, with rank
/// `None`.
pub fn register(plugin: &gst::Plugin) -> Result<(), glib::BoolError> {
    let element_type = JsonToVtt::static_type();

    gst::Element::register(Some(plugin), "jsontovtt", gst::Rank::None, element_type)
}

View file

@ -30,6 +30,7 @@ mod ccutils;
mod cea608overlay; mod cea608overlay;
mod cea608tojson; mod cea608tojson;
mod cea608tott; mod cea608tott;
mod jsontovtt;
mod line_reader; mod line_reader;
mod mcc_enc; mod mcc_enc;
mod mcc_parse; mod mcc_parse;
@ -52,6 +53,7 @@ fn plugin_init(plugin: &gst::Plugin) -> Result<(), glib::BoolError> {
ccdetect::register(plugin)?; ccdetect::register(plugin)?;
tttojson::register(plugin)?; tttojson::register(plugin)?;
cea608tojson::register(plugin)?; cea608tojson::register(plugin)?;
jsontovtt::register(plugin)?;
transcriberbin::register(plugin)?; transcriberbin::register(plugin)?;
Ok(()) Ok(())
} }

View file

@ -60,14 +60,14 @@ impl From<u32> for TextStyle {
} }
// TODO allow indenting chunks // TODO allow indenting chunks
#[derive(Serialize, Deserialize, Debug)] #[derive(Clone, Serialize, Deserialize, Debug)]
pub struct Chunk { pub struct Chunk {
pub style: TextStyle, pub style: TextStyle,
pub underline: bool, pub underline: bool,
pub text: String, pub text: String,
} }
#[derive(Serialize, Deserialize, Debug)] #[derive(Clone, Serialize, Deserialize, Debug)]
pub struct Line { pub struct Line {
pub column: Option<u32>, pub column: Option<u32>,
pub row: Option<u32>, pub row: Option<u32>,
@ -77,7 +77,7 @@ pub struct Line {
pub carriage_return: Option<bool>, pub carriage_return: Option<bool>,
} }
#[derive(Serialize, Deserialize, Debug)] #[derive(Clone, Serialize, Deserialize, Debug)]
pub struct Lines { pub struct Lines {
pub lines: Vec<Line>, pub lines: Vec<Line>,
pub mode: Option<Cea608Mode>, pub mode: Option<Cea608Mode>,