gst-plugins-rs/mux/mp4/tests/tests.rs
Brad Hards 2130c3bfbe mux/mp4: add image sequence mode
Image sequence is defined in ISO/IEC 23008-12 (HEIF), as a variant of
video. The key difference is that image sequence timing is advisory.

Part-of: <https://gitlab.freedesktop.org/gstreamer/gst-plugins-rs/-/merge_requests/2101>
2025-02-26 13:56:09 +00:00

643 lines
18 KiB
Rust

// Copyright (C) 2022 Sebastian Dröge <sebastian@centricular.com>
//
// This Source Code Form is subject to the terms of the Mozilla Public License, v2.0.
// If a copy of the MPL was not distributed with this file, You can obtain one at
// <https://mozilla.org/MPL/2.0/>.
//
// SPDX-License-Identifier: MPL-2.0
//
use std::{
fs,
io::{Cursor, Read},
path::Path,
};
use gst_pbutils::prelude::*;
fn init() {
use std::sync::Once;
static INIT: Once = Once::new();
INIT.call_once(|| {
gst::init().unwrap();
gstmp4::plugin_register_static().unwrap();
});
}
struct Pipeline(gst::Pipeline);
impl std::ops::Deref for Pipeline {
type Target = gst::Pipeline;
fn deref(&self) -> &Self::Target {
&self.0
}
}
impl Drop for Pipeline {
fn drop(&mut self) {
let _ = self.0.set_state(gst::State::Null);
}
}
impl Pipeline {
fn into_completion(self) {
self.set_state(gst::State::Playing)
.expect("Unable to set the pipeline to the `Playing` state");
for msg in self.bus().unwrap().iter_timed(gst::ClockTime::NONE) {
use gst::MessageView;
match msg.view() {
MessageView::Eos(..) => break,
MessageView::Error(err) => {
panic!(
"Error from {:?}: {} ({:?})",
err.src().map(|s| s.path_string()),
err.error(),
err.debug()
);
}
_ => (),
}
}
self.set_state(gst::State::Null)
.expect("Unable to set the pipeline to the `Null` state");
}
}
struct FileTypeBox {
major_brand: [u8; 4],
minor_version: u32,
compatible_brands: Vec<[u8; 4]>,
}
impl FileTypeBox {
fn read(mut reader: Cursor<&[u8]>) -> std::io::Result<FileTypeBox> {
let mut box_size_buf = [0u8; 4];
reader.read_exact(&mut box_size_buf)?;
let box_size = u32::from_be_bytes(box_size_buf);
let mut four_cc = [0u8; 4];
reader.read_exact(&mut four_cc)?;
assert_eq!(four_cc, *b"ftyp");
let mut major_brand = [0u8; 4];
reader.read_exact(&mut major_brand)?;
let mut minor_version_buf = [0u8; 4];
reader.read_exact(&mut minor_version_buf)?;
let minor_version = u32::from_be_bytes(minor_version_buf);
let num_brands = (box_size - 16) / 4;
let mut compatible_brands = Vec::with_capacity(num_brands.try_into().unwrap());
for _ in 0..num_brands {
let mut compatible_brand = [0u8; 4];
reader.read_exact(&mut compatible_brand)?;
compatible_brands.push(compatible_brand);
}
Ok(FileTypeBox {
major_brand,
minor_version,
compatible_brands,
})
}
}
fn test_basic_with(video_enc: &str, audio_enc: &str, cb: impl FnOnce(&Path)) {
let Ok(pipeline) = gst::parse::launch(&format!(
"videotestsrc num-buffers=99 ! {video_enc} ! mux. \
audiotestsrc num-buffers=140 ! {audio_enc} ! mux. \
isomp4mux name=mux ! filesink name=sink"
)) else {
println!("could not build encoding pipeline");
return;
};
let pipeline = Pipeline(pipeline.downcast::<gst::Pipeline>().unwrap());
let dir = tempfile::TempDir::new().unwrap();
let mut location = dir.path().to_owned();
location.push("test.mp4");
let sink = pipeline.by_name("sink").unwrap();
sink.set_property("location", location.to_str().expect("Non-UTF8 filename"));
pipeline.into_completion();
cb(&location)
}
#[test]
fn test_basic_x264_aac() {
init();
test_basic_with("x264enc", "fdkaacenc", |location| {
let discoverer = gst_pbutils::Discoverer::new(gst::ClockTime::from_seconds(5))
.expect("Failed to create discoverer");
let info = discoverer
.discover_uri(
url::Url::from_file_path(location)
.expect("Failed to convert filename to URL")
.as_str(),
)
.expect("Failed to discover MP4 file");
assert_eq!(info.duration(), Some(gst::ClockTime::from_mseconds(3_300)));
let audio_streams = info.audio_streams();
assert_eq!(audio_streams.len(), 1);
let audio_stream = &audio_streams[0];
assert_eq!(audio_stream.channels(), 1);
assert_eq!(audio_stream.sample_rate(), 44_100);
let caps = audio_stream.caps().unwrap();
assert!(
caps.can_intersect(
&gst::Caps::builder("audio/mpeg")
.any_features()
.field("mpegversion", 4i32)
.build()
),
"Unexpected audio caps {caps:?}"
);
let video_streams = info.video_streams();
assert_eq!(video_streams.len(), 1);
let video_stream = &video_streams[0];
assert_eq!(video_stream.width(), 320);
assert_eq!(video_stream.height(), 240);
assert_eq!(video_stream.framerate(), gst::Fraction::new(30, 1));
assert_eq!(video_stream.par(), gst::Fraction::new(1, 1));
assert!(!video_stream.is_interlaced());
let caps = video_stream.caps().unwrap();
assert!(
caps.can_intersect(&gst::Caps::builder("video/x-h264").any_features().build()),
"Unexpected video caps {caps:?}"
);
})
}
#[test]
fn test_roundtrip_vp9_flac() {
init();
test_basic_with("vp9enc ! vp9parse", "flacenc ! flacparse", |location| {
let Ok(pipeline) = gst::parse::launch(
"filesrc name=src ! qtdemux name=demux \
demux.audio_0 ! queue ! flacdec ! fakesink \
demux.video_0 ! queue ! vp9dec ! fakesink",
) else {
panic!("could not build decoding pipeline")
};
let pipeline = Pipeline(pipeline.downcast::<gst::Pipeline>().unwrap());
pipeline
.by_name("src")
.unwrap()
.set_property("location", location.display().to_string());
pipeline.into_completion();
})
}
#[test]
fn test_roundtrip_av1_aac() {
init();
test_basic_with("av1enc ! av1parse", "avenc_aac ! aacparse", |location| {
let Ok(pipeline) = gst::parse::launch(
"filesrc name=src ! qtdemux name=demux \
demux.audio_0 ! queue ! avdec_aac ! fakesink \
demux.video_0 ! queue ! av1dec ! fakesink",
) else {
panic!("could not build decoding pipeline")
};
let pipeline = Pipeline(pipeline.downcast::<gst::Pipeline>().unwrap());
pipeline
.by_name("src")
.unwrap()
.set_property("location", location.display().to_string());
pipeline.into_completion();
})
}
fn test_uncompressed_with(format: &str, width: u32, height: u32, cb: impl FnOnce(&Path)) {
let Ok(pipeline) = gst::parse::launch(&format!(
"videotestsrc num-buffers=99 ! video/x-raw,format={format},width={width},height={height} ! mux. \
isomp4mux name=mux ! filesink name=sink"
)) else {
println!("could not build encoding pipeline");
return;
};
let pipeline = Pipeline(pipeline.downcast::<gst::Pipeline>().unwrap());
let dir = tempfile::TempDir::new().unwrap();
let mut location = dir.path().to_owned();
location.push("test.mp4");
let sink = pipeline.by_name("sink").unwrap();
sink.set_property("location", location.to_str().expect("Non-UTF8 filename"));
pipeline.into_completion();
cb(&location)
}
fn test_roundtrip_uncompressed(video_format: &str, width: u32, height: u32) {
test_uncompressed_with(video_format, width, height, |location| {
let Ok(pipeline) = gst::parse::launch(
"filesrc name=src ! qtdemux name=demux \
demux.video_0 ! queue ! fakesink",
) else {
panic!("could not build decoding pipeline")
};
let pipeline = Pipeline(pipeline.downcast::<gst::Pipeline>().unwrap());
pipeline
.by_name("src")
.unwrap()
.set_property("location", location.display().to_string());
pipeline.into_completion();
})
}
fn test_encode_uncompressed(video_format: &str, width: u32, height: u32) {
let filename = format!("{video_format}_{width}x{height}.mp4");
let pipeline_text = format!("videotestsrc num-buffers=250 ! video/x-raw,format={video_format},width={width},height={height} ! isomp4mux ! filesink location={filename}");
let Ok(pipeline) = gst::parse::launch(&pipeline_text) else {
panic!("could not build encoding pipeline")
};
pipeline
.set_state(gst::State::Playing)
.expect("Unable to set the pipeline to the `Playing` state");
for msg in pipeline.bus().unwrap().iter_timed(gst::ClockTime::NONE) {
use gst::MessageView;
match msg.view() {
MessageView::Eos(..) => break,
MessageView::Error(err) => {
panic!(
"Error from {:?}: {} ({:?})",
err.src().map(|s| s.path_string()),
err.error(),
err.debug()
);
}
_ => (),
}
}
pipeline
.set_state(gst::State::Null)
.expect("Unable to set the pipeline to the `Null` state");
test_expected_uncompressed_output(filename);
}
fn test_expected_uncompressed_output(filename: String) {
let check_data: Vec<u8> = fs::read(filename).unwrap();
let cursor = Cursor::new(check_data.as_ref());
test_default_mpeg_file_type_box(cursor);
}
fn test_expected_file_type_box(
expected_major_brand: &[u8; 4],
expected_minor_version: u32,
expected_compatible_brands: Vec<[u8; 4]>,
cursor: Cursor<&[u8]>,
) {
let ftyp = FileTypeBox::read(cursor).unwrap();
assert_eq!(ftyp.major_brand, *expected_major_brand);
assert_eq!(ftyp.minor_version, expected_minor_version);
let mut sorted_compatible_brands = ftyp.compatible_brands.clone();
sorted_compatible_brands.sort();
let mut sorted_expected_compatible_brands = expected_compatible_brands.clone();
sorted_expected_compatible_brands.sort();
assert_eq!(sorted_compatible_brands, sorted_expected_compatible_brands);
}
#[test]
fn encode_uncompressed_iyu2() {
init();
test_encode_uncompressed("IYU2", 1275, 713);
}
#[test]
fn encode_uncompressed_rgb() {
init();
test_encode_uncompressed("RGB", 1275, 713);
}
#[test]
fn encode_uncompressed_rgb_row_align_0() {
init();
test_encode_uncompressed("RGB", 1280, 720);
test_roundtrip_uncompressed("RGB", 1280, 720);
}
#[test]
fn encode_uncompressed_bgr() {
init();
test_encode_uncompressed("BGR", 1275, 713);
}
#[test]
fn encode_uncompressed_bgr_row_align_0() {
init();
test_encode_uncompressed("BGR", 1280, 720);
test_roundtrip_uncompressed("BGR", 1280, 720);
}
#[test]
fn encode_uncompressed_nv12() {
init();
test_encode_uncompressed("NV12", 1275, 714);
}
#[test]
fn encode_uncompressed_nv21() {
init();
test_encode_uncompressed("NV21", 1275, 714);
}
#[test]
fn encode_uncompressed_rgba() {
init();
test_encode_uncompressed("RGBA", 1275, 713);
}
#[test]
fn encode_uncompressed_rgba_row_align_0() {
init();
test_encode_uncompressed("RGBA", 1280, 720);
test_roundtrip_uncompressed("RGBA", 1280, 720);
}
#[test]
fn encode_uncompressed_argb() {
init();
test_encode_uncompressed("ARGB", 1275, 713);
}
#[test]
fn encode_uncompressed_abgr() {
init();
test_encode_uncompressed("ABGR", 1275, 713);
}
#[test]
fn encode_uncompressed_abgr_row_align_0() {
init();
test_encode_uncompressed("ABGR", 1280, 720);
test_roundtrip_uncompressed("ABGR", 1280, 720);
}
#[test]
fn encode_uncompressed_bgra() {
init();
test_encode_uncompressed("BGRA", 1275, 713);
}
#[test]
fn encode_uncompressed_rgbx() {
init();
test_encode_uncompressed("RGBx", 1275, 713);
}
#[test]
fn encode_uncompressed_bgrx() {
init();
test_encode_uncompressed("BGRx", 1275, 713);
}
#[test]
fn encode_uncompressed_y444() {
init();
test_encode_uncompressed("Y444", 1275, 713);
}
#[test]
fn encode_uncompressed_i420() {
init();
test_encode_uncompressed("I420", 1280, 720);
}
#[test]
fn encode_uncompressed_yv12() {
init();
test_encode_uncompressed("YV12", 1280, 720);
}
#[test]
fn encode_uncompressed_yuy2() {
init();
test_encode_uncompressed("YUY2", 320, 120);
}
#[test]
fn encode_uncompressed_yvyu() {
init();
test_encode_uncompressed("YVYU", 320, 120);
}
#[test]
fn encode_uncompressed_vyuy() {
init();
test_encode_uncompressed("VYUY", 320, 120);
}
#[test]
fn encode_uncompressed_uyvy() {
init();
test_encode_uncompressed("UYVY", 320, 120);
}
/*
TODO: report YA4p unknown pixel format to GPAC
*/
#[test]
fn encode_uncompressed_ayuv() {
init();
test_encode_uncompressed("AYUV", 1275, 713);
}
#[test]
fn encode_uncompressed_y41b() {
init();
test_encode_uncompressed("Y41B", 1280, 713);
}
#[test]
fn encode_uncompressed_y42b() {
init();
test_encode_uncompressed("Y42B", 1280, 713);
}
#[test]
fn encode_uncompressed_v308() {
init();
test_encode_uncompressed("v308", 1275, 713);
}
#[test]
fn encode_uncompressed_gray8() {
init();
test_encode_uncompressed("GRAY8", 1275, 713);
}
#[test]
fn encode_uncompressed_gray8_row_align_0() {
init();
test_encode_uncompressed("GRAY8", 1280, 720);
test_roundtrip_uncompressed("GRAY8", 1280, 720);
}
#[test]
fn encode_uncompressed_gray16_be() {
init();
test_encode_uncompressed("GRAY16_BE", 1275, 713);
}
#[test]
fn encode_uncompressed_r210() {
init();
test_encode_uncompressed("r210", 1275, 713);
}
#[test]
fn encode_uncompressed_nv16() {
init();
test_encode_uncompressed("NV16", 1280, 713);
}
#[test]
fn encode_uncompressed_nv61() {
init();
test_encode_uncompressed("NV61", 1280, 713);
}
#[test]
fn encode_uncompressed_gbr() {
init();
test_encode_uncompressed("GBR", 1275, 713);
}
#[test]
fn encode_uncompressed_rgbp() {
init();
test_encode_uncompressed("RGBP", 1275, 713);
}
#[test]
fn encode_uncompressed_bgrp() {
init();
test_encode_uncompressed("BGRP", 1275, 713);
}
fn test_encode_uncompressed_image_sequence(video_format: &str, width: u32, height: u32) {
let filename = format!("{video_format}_{width}x{height}.heifs");
let pipeline_text = format!("videotestsrc num-buffers=10 ! video/x-raw,format={video_format},width={width},height={height} ! isomp4mux name=mux ! filesink location={filename}");
let Ok(pipeline) = gst::parse::launch(&pipeline_text) else {
panic!("could not build encoding pipeline")
};
let pipeline = Pipeline(pipeline.downcast::<gst::Pipeline>().unwrap());
let mux = pipeline.by_name("mux").unwrap();
let sink_pad = &mux.sink_pads()[0];
sink_pad.set_property("image-sequence", true);
pipeline
.set_state(gst::State::Playing)
.expect("Unable to set the pipeline to the `Playing` state");
for msg in pipeline.bus().unwrap().iter_timed(gst::ClockTime::NONE) {
use gst::MessageView;
match msg.view() {
MessageView::Eos(..) => break,
MessageView::Error(err) => {
panic!(
"Error from {:?}: {} ({:?})",
err.src().map(|s| s.path_string()),
err.error(),
err.debug()
);
}
_ => (),
}
}
pipeline
.set_state(gst::State::Null)
.expect("Unable to set the pipeline to the `Null` state");
test_expected_image_sequence_output(filename);
}
fn test_expected_image_sequence_output(filename: String) {
let check_data: Vec<u8> = fs::read(filename).unwrap();
let cursor = Cursor::new(check_data.as_ref());
test_expected_image_sequence_file_type_box_content(cursor);
}
fn test_expected_image_sequence_file_type_box_content(cursor: Cursor<&[u8]>) {
let expected_major_brand = b"msf1";
let expected_minor_version = 0;
let expected_compatible_brands: Vec<[u8; 4]> = vec![*b"iso8", *b"msf1", *b"unif"];
test_expected_file_type_box(
expected_major_brand,
expected_minor_version,
expected_compatible_brands,
cursor,
);
}
#[test]
fn encode_uncompressed_image_sequence_rgb() {
init();
test_encode_uncompressed_image_sequence("RGB", 1275, 713);
}
#[test]
fn encode_uncompressed_image_sequence_nv12() {
init();
test_encode_uncompressed_image_sequence("NV12", 1275, 714);
}
#[test]
fn test_encode_audio_trak() {
init();
let filename = "audio_only.mp4".to_string();
let pipeline_text = format!("audiotestsrc num-buffers=100 ! audioconvert ! opusenc ! isomp4mux ! filesink location={filename}");
let Ok(pipeline) = gst::parse::launch(&pipeline_text) else {
panic!("could not build encoding pipeline")
};
pipeline
.set_state(gst::State::Playing)
.expect("Unable to set the pipeline to the `Playing` state");
for msg in pipeline.bus().unwrap().iter_timed(gst::ClockTime::NONE) {
use gst::MessageView;
match msg.view() {
MessageView::Eos(..) => break,
MessageView::Error(err) => {
panic!(
"Error from {:?}: {} ({:?})",
err.src().map(|s| s.path_string()),
err.error(),
err.debug()
);
}
_ => (),
}
}
pipeline
.set_state(gst::State::Null)
.expect("Unable to set the pipeline to the `Null` state");
test_audio_only_output(filename);
}
fn test_audio_only_output(filename: String) {
let check_data: Vec<u8> = fs::read(filename).unwrap();
let cursor = Cursor::new(check_data.as_ref());
test_default_mpeg_file_type_box(cursor);
}
fn test_default_mpeg_file_type_box(cursor: Cursor<&[u8]>) {
let expected_major_brand = b"iso4";
let expected_minor_version = 0;
let expected_compatible_brands: Vec<[u8; 4]> = vec![*b"isom", *b"mp41", *b"mp42"];
test_expected_file_type_box(
expected_major_brand,
expected_minor_version,
expected_compatible_brands,
cursor,
);
}