nvdecoder: Add support for HEVC GBR output

... and use P012 format for 12bits instead of P016

Fixes: https://gitlab.freedesktop.org/gstreamer/gstreamer/-/issues/2991
Part-of: <https://gitlab.freedesktop.org/gstreamer/gstreamer/-/merge_requests/5375>
This commit is contained in:
Seungha Yang 2023-09-21 22:18:56 +09:00 committed by GStreamer Marge Bot
parent 907c507680
commit c5bd0faee3
4 changed files with 130 additions and 81 deletions

View file

@ -459,6 +459,7 @@ gst_nv_dec_object_export_surface (GstNvDecObject * object,
switch (GST_VIDEO_INFO_FORMAT (&info)) { switch (GST_VIDEO_INFO_FORMAT (&info)) {
case GST_VIDEO_FORMAT_NV12: case GST_VIDEO_FORMAT_NV12:
case GST_VIDEO_FORMAT_P010_10LE: case GST_VIDEO_FORMAT_P010_10LE:
case GST_VIDEO_FORMAT_P012_LE:
case GST_VIDEO_FORMAT_P016_LE: case GST_VIDEO_FORMAT_P016_LE:
info.stride[0] = surface->pitch; info.stride[0] = surface->pitch;
info.stride[1] = surface->pitch; info.stride[1] = surface->pitch;
@ -468,6 +469,8 @@ gst_nv_dec_object_export_surface (GstNvDecObject * object,
break; break;
case GST_VIDEO_FORMAT_Y444: case GST_VIDEO_FORMAT_Y444:
case GST_VIDEO_FORMAT_Y444_16LE: case GST_VIDEO_FORMAT_Y444_16LE:
case GST_VIDEO_FORMAT_GBR:
case GST_VIDEO_FORMAT_GBR_16LE:
info.stride[0] = surface->pitch; info.stride[0] = surface->pitch;
info.stride[1] = surface->pitch; info.stride[1] = surface->pitch;
info.stride[2] = surface->pitch; info.stride[2] = surface->pitch;

View file

@ -55,6 +55,8 @@
#include <gst/cuda/gstcudastream.h> #include <gst/cuda/gstcudastream.h>
#include "gstnvdecoder.h" #include "gstnvdecoder.h"
#include <string.h> #include <string.h>
#include <string>
#include <set>
extern "C" extern "C"
{ {
@ -157,13 +159,13 @@ chroma_format_from_video_format (GstVideoFormat format)
switch (format) { switch (format) {
case GST_VIDEO_FORMAT_NV12: case GST_VIDEO_FORMAT_NV12:
case GST_VIDEO_FORMAT_P010_10LE: case GST_VIDEO_FORMAT_P010_10LE:
case GST_VIDEO_FORMAT_P010_10BE: case GST_VIDEO_FORMAT_P012_LE:
case GST_VIDEO_FORMAT_P016_LE: case GST_VIDEO_FORMAT_P016_LE:
case GST_VIDEO_FORMAT_P016_BE:
return cudaVideoChromaFormat_420; return cudaVideoChromaFormat_420;
case GST_VIDEO_FORMAT_Y444: case GST_VIDEO_FORMAT_Y444:
case GST_VIDEO_FORMAT_Y444_16LE: case GST_VIDEO_FORMAT_Y444_16LE:
case GST_VIDEO_FORMAT_Y444_16BE: case GST_VIDEO_FORMAT_GBR:
case GST_VIDEO_FORMAT_GBR_16LE:
return cudaVideoChromaFormat_444; return cudaVideoChromaFormat_444;
default: default:
g_assert_not_reached (); g_assert_not_reached ();
@ -180,14 +182,14 @@ output_format_from_video_format (GstVideoFormat format)
case GST_VIDEO_FORMAT_NV12: case GST_VIDEO_FORMAT_NV12:
return cudaVideoSurfaceFormat_NV12; return cudaVideoSurfaceFormat_NV12;
case GST_VIDEO_FORMAT_P010_10LE: case GST_VIDEO_FORMAT_P010_10LE:
case GST_VIDEO_FORMAT_P010_10BE: case GST_VIDEO_FORMAT_P012_LE:
case GST_VIDEO_FORMAT_P016_LE: case GST_VIDEO_FORMAT_P016_LE:
case GST_VIDEO_FORMAT_P016_BE:
return cudaVideoSurfaceFormat_P016; return cudaVideoSurfaceFormat_P016;
case GST_VIDEO_FORMAT_Y444: case GST_VIDEO_FORMAT_Y444:
case GST_VIDEO_FORMAT_GBR:
return cudaVideoSurfaceFormat_YUV444; return cudaVideoSurfaceFormat_YUV444;
case GST_VIDEO_FORMAT_Y444_16LE: case GST_VIDEO_FORMAT_Y444_16LE:
case GST_VIDEO_FORMAT_Y444_16BE: case GST_VIDEO_FORMAT_GBR_16LE:
return cudaVideoSurfaceFormat_YUV444_16Bit; return cudaVideoSurfaceFormat_YUV444_16Bit;
default: default:
g_assert_not_reached (); g_assert_not_reached ();
@ -1067,7 +1069,6 @@ gst_nv_decoder_check_device_caps (CUcontext cuda_ctx, cudaVideoCodec codec,
guint bitdepth_minus8[3] = { 0, 2, 4 }; guint bitdepth_minus8[3] = { 0, 2, 4 };
GstNvDecoderFormatFlags format_flags = (GstNvDecoderFormatFlags) 0; GstNvDecoderFormatFlags format_flags = (GstNvDecoderFormatFlags) 0;
guint c_idx, b_idx; guint c_idx, b_idx;
guint num_support = 0;
cudaVideoChromaFormat chroma_list[] = { cudaVideoChromaFormat chroma_list[] = {
#if 0 #if 0
/* FIXME: support monochrome */ /* FIXME: support monochrome */
@ -1078,12 +1079,11 @@ gst_nv_decoder_check_device_caps (CUcontext cuda_ctx, cudaVideoCodec codec,
cudaVideoChromaFormat_420, cudaVideoChromaFormat_420,
cudaVideoChromaFormat_444, cudaVideoChromaFormat_444,
}; };
GValue format_list = G_VALUE_INIT;
GValue format = G_VALUE_INIT;
GValue profile_list = G_VALUE_INIT; GValue profile_list = G_VALUE_INIT;
const GstNvdecoderCodecMap *codec_map = nullptr; const GstNvdecoderCodecMap *codec_map = nullptr;
guint i; guint i;
gboolean ret = FALSE; gboolean ret = FALSE;
std::set < std::string > formats;
for (i = 0; i < G_N_ELEMENTS (codec_map_list); i++) { for (i = 0; i < G_N_ELEMENTS (codec_map_list); i++) {
if (codec_map_list[i].codec == codec) { if (codec_map_list[i].codec == codec) {
@ -1127,8 +1127,6 @@ gst_nv_decoder_check_device_caps (CUcontext cuda_ctx, cudaVideoCodec codec,
return TRUE; return TRUE;
} }
g_value_init (&format_list, GST_TYPE_LIST);
g_value_init (&format, G_TYPE_STRING);
g_value_init (&profile_list, GST_TYPE_LIST); g_value_init (&profile_list, GST_TYPE_LIST);
if (CuCtxPushCurrent (cuda_ctx) != CUDA_SUCCESS) if (CuCtxPushCurrent (cuda_ctx) != CUDA_SUCCESS)
@ -1180,25 +1178,15 @@ gst_nv_decoder_check_device_caps (CUcontext cuda_ctx, cudaVideoCodec codec,
switch (chroma_list[c_idx]) { switch (chroma_list[c_idx]) {
case cudaVideoChromaFormat_420: case cudaVideoChromaFormat_420:
if (bitdepth_minus8[b_idx] == 0) { if (bitdepth_minus8[b_idx] == 0) {
g_value_set_string (&format, "NV12"); formats.insert ("NV12");
} else if (bitdepth_minus8[b_idx] == 2) { } else if (bitdepth_minus8[b_idx] == 2) {
#if G_BYTE_ORDER == G_LITTLE_ENDIAN formats.insert ("P010_10LE");
g_value_set_string (&format, "P010_10LE");
#else
g_value_set_string (&format, "P010_10BE");
#endif
} else if (bitdepth_minus8[b_idx] == 4) { } else if (bitdepth_minus8[b_idx] == 4) {
#if G_BYTE_ORDER == G_LITTLE_ENDIAN formats.insert ("P012_LE");
g_value_set_string (&format, "P016_LE");
#else
g_value_set_string (&format, "P016_BE");
#endif
} else { } else {
GST_WARNING ("unhandled bitdepth %d", bitdepth_minus8[b_idx] + 8); GST_WARNING ("unhandled bitdepth %d", bitdepth_minus8[b_idx] + 8);
break; break;
} }
num_support++;
gst_value_list_append_value (&format_list, &format);
break; break;
case cudaVideoChromaFormat_444: case cudaVideoChromaFormat_444:
if (cudaVideoCodec_JPEG == codec) { if (cudaVideoCodec_JPEG == codec) {
@ -1208,19 +1196,17 @@ gst_nv_decoder_check_device_caps (CUcontext cuda_ctx, cudaVideoCodec codec,
} }
if (bitdepth_minus8[b_idx] == 0) { if (bitdepth_minus8[b_idx] == 0) {
g_value_set_string (&format, "Y444"); formats.insert ("Y444");
if (codec == cudaVideoCodec_HEVC)
formats.insert ("GBR");
} else if (bitdepth_minus8[b_idx] == 2 || bitdepth_minus8[b_idx] == 4) { } else if (bitdepth_minus8[b_idx] == 2 || bitdepth_minus8[b_idx] == 4) {
#if G_BYTE_ORDER == G_LITTLE_ENDIAN formats.insert ("Y444_16LE");
g_value_set_string (&format, "Y444_16LE"); if (codec == cudaVideoCodec_HEVC)
#else formats.insert ("GBR_16LE");
g_value_set_string (&format, "Y444_16BE");
#endif
} else { } else {
GST_WARNING ("unhandled bitdepth %d", bitdepth_minus8[b_idx] + 8); GST_WARNING ("unhandled bitdepth %d", bitdepth_minus8[b_idx] + 8);
break; break;
} }
num_support++;
gst_value_list_append_value (&format_list, &format);
break; break;
default: default:
break; break;
@ -1228,35 +1214,74 @@ gst_nv_decoder_check_device_caps (CUcontext cuda_ctx, cudaVideoCodec codec,
} }
} }
if (num_support == 0) { if (formats.empty ()) {
GST_INFO ("device can not support %s", codec_map->codec_name); GST_INFO ("device can not support %s", codec_map->codec_name);
goto done; goto done;
} }
#define APPEND_STRING(dst,set,str) G_STMT_START { \
src_templ = gst_caps_new_simple ("video/x-raw", if (set.find(str) != set.end()) { \
"width", GST_TYPE_INT_RANGE, min_width, max_width, if (!first) \
"height", GST_TYPE_INT_RANGE, min_height, max_height, dst += ", "; \
"framerate", GST_TYPE_FRACTION_RANGE, 0, 1, G_MAXINT, 1, nullptr); dst += str; \
first = false; \
gst_caps_set_value (src_templ, "format", &format_list); } \
} G_STMT_END
{ {
GstCaps *cuda_caps = gst_caps_copy (src_templ); std::string format_str;
gst_caps_set_features_simple (cuda_caps, if (formats.size () == 1) {
format_str += *(formats.begin ());
} else {
bool first = true;
format_str += "{ ";
APPEND_STRING (format_str, formats, "NV12");
APPEND_STRING (format_str, formats, "P010_10LE");
APPEND_STRING (format_str, formats, "P012_LE");
APPEND_STRING (format_str, formats, "Y444");
APPEND_STRING (format_str, formats, "Y444_16LE");
APPEND_STRING (format_str, formats, "GBR");
APPEND_STRING (format_str, formats, "GBR_16LE");
format_str += " }";
}
std::string src_caps_string =
"video/x-raw, format = (string) " + format_str;
GstCaps *raw_caps = gst_caps_from_string (src_caps_string.c_str ());
src_templ = gst_caps_copy (raw_caps);
gst_caps_set_features_simple (src_templ,
gst_caps_features_from_string (GST_CAPS_FEATURE_MEMORY_CUDA_MEMORY)); gst_caps_features_from_string (GST_CAPS_FEATURE_MEMORY_CUDA_MEMORY));
/* OpenGL specific */ /* OpenGL specific */
#ifdef HAVE_CUDA_GST_GL #ifdef HAVE_CUDA_GST_GL
{ format_str.clear ();
GstCaps *gl_caps = gst_caps_copy (src_templ);
if (formats.size () == 1) {
format_str += *(formats.begin ());
} else {
bool first = true;
format_str += "{ ";
APPEND_STRING (format_str, formats, "NV12");
APPEND_STRING (format_str, formats, "P010_10LE");
APPEND_STRING (format_str, formats, "P012_LE");
APPEND_STRING (format_str, formats, "Y444");
APPEND_STRING (format_str, formats, "GBR");
format_str += " }";
}
src_caps_string = "video/x-raw, format = (string) " + format_str;
GstCaps *gl_caps = gst_caps_from_string (src_caps_string.c_str ());
gst_caps_set_features_simple (gl_caps, gst_caps_set_features_simple (gl_caps,
gst_caps_features_from_string (GST_CAPS_FEATURE_MEMORY_GL_MEMORY)); gst_caps_features_from_string (GST_CAPS_FEATURE_MEMORY_GL_MEMORY));
gst_caps_append (src_templ, gl_caps); gst_caps_append (src_templ, gl_caps);
}
#endif #endif
gst_caps_append (src_templ, raw_caps);
gst_caps_append (src_templ, cuda_caps);
} }
#undef APPEND_STRING
gst_caps_set_simple (src_templ,
"width", GST_TYPE_INT_RANGE, min_width, max_width,
"height", GST_TYPE_INT_RANGE, min_height, max_height, nullptr);
sink_templ = gst_caps_from_string (codec_map->sink_caps_string); sink_templ = gst_caps_from_string (codec_map->sink_caps_string);
gst_caps_set_simple (sink_templ, gst_caps_set_simple (sink_templ,
@ -1274,8 +1299,6 @@ gst_nv_decoder_check_device_caps (CUcontext cuda_ctx, cudaVideoCodec codec,
CuCtxPopCurrent (nullptr); CuCtxPopCurrent (nullptr);
done: done:
g_value_unset (&format_list);
g_value_unset (&format);
g_value_unset (&profile_list); g_value_unset (&profile_list);
if (!sink_templ || !src_templ) { if (!sink_templ || !src_templ) {
@ -1487,7 +1510,10 @@ gst_nv_decoder_negotiate (GstNvDecoder * decoder,
break; break;
} }
#ifdef HAVE_CUDA_GST_GL #ifdef HAVE_CUDA_GST_GL
if (features && gst_caps_features_contains (features, /* TODO: gl does not support Y444_16 and GBR_16 */
if (GST_VIDEO_INFO_FORMAT (info) != GST_VIDEO_FORMAT_Y444_16LE &&
GST_VIDEO_INFO_FORMAT (info) != GST_VIDEO_FORMAT_GBR_16LE &&
features && gst_caps_features_contains (features,
GST_CAPS_FEATURE_MEMORY_GL_MEMORY)) { GST_CAPS_FEATURE_MEMORY_GL_MEMORY)) {
GST_DEBUG_OBJECT (videodec, "found GL memory feature"); GST_DEBUG_OBJECT (videodec, "found GL memory feature");
have_gl = TRUE; have_gl = TRUE;

View file

@ -127,6 +127,8 @@ typedef struct _GstNvH265Dec
guint init_max_width; guint init_max_width;
guint init_max_height; guint init_max_height;
gint max_display_delay; gint max_display_delay;
GstVideoFormat out_format;
} GstNvH265Dec; } GstNvH265Dec;
typedef struct _GstNvH265DecClass typedef struct _GstNvH265DecClass
@ -559,6 +561,9 @@ gst_nv_h265_dec_new_sequence (GstH265Decoder * decoder, const GstH265SPS * sps,
guint crop_width, crop_height; guint crop_width, crop_height;
gboolean modified = FALSE; gboolean modified = FALSE;
guint max_width, max_height; guint max_width, max_height;
GstVideoFormat out_format = GST_VIDEO_FORMAT_UNKNOWN;
gboolean is_gbr = FALSE;
const GstH265VUIParams *vui = &sps->vui_params;
GST_LOG_OBJECT (self, "new sequence"); GST_LOG_OBJECT (self, "new sequence");
@ -600,44 +605,59 @@ gst_nv_h265_dec_new_sequence (GstH265Decoder * decoder, const GstH265SPS * sps,
modified = TRUE; modified = TRUE;
} }
if (modified || !gst_nv_decoder_is_configured (self->decoder)) { if (sps->chroma_format_idc == 3 && vui->colour_description_present_flag &&
GstVideoInfo info; gst_video_color_matrix_from_iso (vui->matrix_coefficients) ==
GstVideoFormat out_format = GST_VIDEO_FORMAT_UNKNOWN; GST_VIDEO_COLOR_MATRIX_RGB) {
is_gbr = TRUE;
if (self->bitdepth == 8) {
if (self->chroma_format_idc == 1) {
out_format = GST_VIDEO_FORMAT_NV12;
} else if (self->chroma_format_idc == 3) {
out_format = GST_VIDEO_FORMAT_Y444;
} else {
GST_FIXME_OBJECT (self, "8 bits supports only 4:2:0 or 4:4:4 format");
} }
} else if (self->bitdepth == 10) {
switch (self->bitdepth) {
case 8:
if (self->chroma_format_idc == 1)
out_format = GST_VIDEO_FORMAT_NV12;
else if (self->chroma_format_idc == 3)
out_format = is_gbr ? GST_VIDEO_FORMAT_GBR : GST_VIDEO_FORMAT_Y444;
break;
case 10:
if (self->chroma_format_idc == 1) { if (self->chroma_format_idc == 1) {
out_format = GST_VIDEO_FORMAT_P010_10LE; out_format = GST_VIDEO_FORMAT_P010_10LE;
} else if (self->chroma_format_idc == 3) { } else if (self->chroma_format_idc == 3) {
out_format = GST_VIDEO_FORMAT_Y444_16LE; out_format = is_gbr ?
} else { GST_VIDEO_FORMAT_GBR_16LE : GST_VIDEO_FORMAT_Y444_16LE;
GST_FIXME_OBJECT (self, "10 bits supports only 4:2:0 or 4:4:4 format");
} }
} else if (self->bitdepth == 12 || self->bitdepth == 16) { break;
case 12:
if (self->chroma_format_idc == 1) { if (self->chroma_format_idc == 1) {
out_format = GST_VIDEO_FORMAT_P016_LE; out_format = GST_VIDEO_FORMAT_P012_LE;
} else if (self->chroma_format_idc == 3) { } else if (self->chroma_format_idc == 3) {
out_format = GST_VIDEO_FORMAT_Y444_16LE; out_format = is_gbr ?
} else { GST_VIDEO_FORMAT_GBR_16LE : GST_VIDEO_FORMAT_Y444_16LE;
GST_FIXME_OBJECT (self, "%d bits supports only 4:2:0 or 4:4:4 format",
self->bitdepth);
} }
break;
default:
break;
} }
if (out_format == GST_VIDEO_FORMAT_UNKNOWN) { if (out_format == GST_VIDEO_FORMAT_UNKNOWN) {
GST_ERROR_OBJECT (self, "Could not support bitdepth/chroma format"); GST_ERROR_OBJECT (self,
"Could not support bitdepth (%d) / chroma (%d) format", self->bitdepth,
self->chroma_format_idc);
return GST_FLOW_NOT_NEGOTIATED; return GST_FLOW_NOT_NEGOTIATED;
} }
gst_video_info_set_format (&info, out_format, GST_ROUND_UP_2 (self->width), if (self->out_format != out_format) {
GST_ROUND_UP_2 (self->height)); GST_INFO_OBJECT (self, "Output format changed %s -> %s",
gst_video_format_to_string (self->out_format),
gst_video_format_to_string (out_format));
self->out_format = out_format;
modified = TRUE;
}
if (modified || !gst_nv_decoder_is_configured (self->decoder)) {
GstVideoInfo info;
gst_video_info_set_format (&info, self->out_format,
GST_ROUND_UP_2 (self->width), GST_ROUND_UP_2 (self->height));
self->max_dpb_size = max_dpb_size; self->max_dpb_size = max_dpb_size;
max_width = gst_nv_decoder_get_max_output_size (self->coded_width, max_width = gst_nv_decoder_get_max_output_size (self->coded_width,

View file

@ -483,7 +483,7 @@ gst_nv_vp9_dec_new_sequence (GstVp9Decoder * decoder,
if (frame_hdr->bit_depth == 10) { if (frame_hdr->bit_depth == 10) {
out_format = GST_VIDEO_FORMAT_P010_10LE; out_format = GST_VIDEO_FORMAT_P010_10LE;
} else { } else {
out_format = GST_VIDEO_FORMAT_P016_LE; out_format = GST_VIDEO_FORMAT_P012_LE;
} }
} }