vah265enc: Let FORCE_KEYFRAME be IDR frame rather than just I frame

The FORCE_KEYFRAME frame which has GST_VIDEO_CODEC_FRAME_FLAG_FORCE_KEYFRAME
bit set should be the sync point. So we should let it be an IDR frame to begin
a new GOP, rather than just promote it to an I frame.

Part-of: <https://gitlab.freedesktop.org/gstreamer/gstreamer/-/merge_requests/6857>
This commit is contained in:
He Junyan 2024-04-12 21:48:13 +08:00 committed by Backport Bot
parent 5e24324f4f
commit 7526919fb3

View file

@ -307,6 +307,8 @@ struct _GstVaH265Enc
guint num_reorder_frames; guint num_reorder_frames;
guint max_dpb_size; guint max_dpb_size;
GstVideoCodecFrame *last_keyframe;
} gop; } gop;
struct struct
@ -2025,55 +2027,92 @@ _h265_push_one_frame (GstVaBaseEnc * base, GstVideoCodecFrame * gst_frame,
{ {
GstVaH265Enc *self = GST_VA_H265_ENC (base); GstVaH265Enc *self = GST_VA_H265_ENC (base);
GstVaH265EncFrame *frame; GstVaH265EncFrame *frame;
gboolean add_cached_key_frame = FALSE;
g_return_val_if_fail (self->gop.cur_frame_index <= self->gop.idr_period, g_return_val_if_fail (self->gop.cur_frame_index <= self->gop.idr_period,
FALSE); FALSE);
if (gst_frame) { if (gst_frame) {
/* Begin a new GOP, should have a empty reorder_list. */
if (self->gop.cur_frame_index == self->gop.idr_period) {
g_assert (g_queue_is_empty (&base->reorder_list));
self->gop.cur_frame_index = 0;
}
frame = _enc_frame (gst_frame); frame = _enc_frame (gst_frame);
frame->poc = self->gop.cur_frame_index;
g_assert (self->gop.cur_frame_index <= self->gop.max_pic_order_cnt);
if (self->gop.cur_frame_index == 0) { /* Force to insert the key frame inside a GOP, just end the current
g_assert (frame->poc == 0); GOP and start a new one. */
GST_LOG_OBJECT (self, "system_frame_number: %d, an IDR frame, starts" if (GST_VIDEO_CODEC_FRAME_IS_FORCE_KEYFRAME (gst_frame) &&
" a new GOP", gst_frame->system_frame_number); !(self->gop.cur_frame_index == 0 ||
self->gop.cur_frame_index == self->gop.idr_period)) {
GST_DEBUG_OBJECT (base, "system_frame_number: %d is a force key "
"frame(IDR), begin a new GOP.", gst_frame->system_frame_number);
frame->poc = 0;
frame->type = self->gop.frame_types[0].slice_type;
frame->is_ref = self->gop.frame_types[0].is_ref;
frame->pyramid_level = self->gop.frame_types[0].pyramid_level;
frame->left_ref_poc_diff = self->gop.frame_types[0].left_ref_poc_diff;
frame->right_ref_poc_diff = self->gop.frame_types[0].right_ref_poc_diff;
/* The previous key frame should be already be poped out. */
g_assert (self->gop.last_keyframe == NULL);
/* An empty reorder list, start the new GOP immediately. */
if (g_queue_is_empty (&base->reorder_list)) {
self->gop.cur_frame_index = 1;
g_queue_clear_full (&base->ref_list,
(GDestroyNotify) gst_video_codec_frame_unref);
last = FALSE;
} else {
/* Cache the key frame and end the current GOP.
Next time calling this push() without frame, start the new GOP. */
self->gop.last_keyframe = gst_frame;
last = TRUE;
}
add_cached_key_frame = TRUE;
} else {
/* Begin a new GOP, should have a empty reorder_list. */
if (self->gop.cur_frame_index == self->gop.idr_period) {
g_assert (g_queue_is_empty (&base->reorder_list));
self->gop.cur_frame_index = 0;
}
frame->poc = self->gop.cur_frame_index;
g_assert (self->gop.cur_frame_index <= self->gop.max_pic_order_cnt);
if (self->gop.cur_frame_index == 0) {
g_assert (frame->poc == 0);
GST_LOG_OBJECT (self, "system_frame_number: %d, an IDR frame, starts"
" a new GOP", gst_frame->system_frame_number);
g_queue_clear_full (&base->ref_list,
(GDestroyNotify) gst_video_codec_frame_unref);
}
frame->type = self->gop.frame_types[self->gop.cur_frame_index].slice_type;
frame->is_ref = self->gop.frame_types[self->gop.cur_frame_index].is_ref;
frame->pyramid_level =
self->gop.frame_types[self->gop.cur_frame_index].pyramid_level;
frame->left_ref_poc_diff =
self->gop.frame_types[self->gop.cur_frame_index].left_ref_poc_diff;
frame->right_ref_poc_diff =
self->gop.frame_types[self->gop.cur_frame_index].right_ref_poc_diff;
GST_LOG_OBJECT (self, "Push frame, system_frame_number: %d, poc %d, "
"frame type %s", gst_frame->system_frame_number, frame->poc,
_h265_slice_type_name (frame->type));
self->gop.cur_frame_index++;
g_queue_push_tail (&base->reorder_list,
gst_video_codec_frame_ref (gst_frame));
}
} else if (self->gop.last_keyframe) {
g_assert (self->gop.last_keyframe ==
g_queue_peek_tail (&base->reorder_list));
if (g_queue_get_length (&base->reorder_list) == 1) {
/* The last cached key frame begins a new GOP */
self->gop.cur_frame_index = 1;
self->gop.last_keyframe = NULL;
g_queue_clear_full (&base->ref_list, g_queue_clear_full (&base->ref_list,
(GDestroyNotify) gst_video_codec_frame_unref); (GDestroyNotify) gst_video_codec_frame_unref);
} }
frame->type = self->gop.frame_types[self->gop.cur_frame_index].slice_type;
frame->is_ref = self->gop.frame_types[self->gop.cur_frame_index].is_ref;
frame->pyramid_level =
self->gop.frame_types[self->gop.cur_frame_index].pyramid_level;
frame->left_ref_poc_diff =
self->gop.frame_types[self->gop.cur_frame_index].left_ref_poc_diff;
frame->right_ref_poc_diff =
self->gop.frame_types[self->gop.cur_frame_index].right_ref_poc_diff;
if (GST_VIDEO_CODEC_FRAME_IS_FORCE_KEYFRAME (gst_frame)) {
GST_DEBUG_OBJECT (self, "system_frame_number: %d, a force key frame,"
" promote its type from %s to %s", gst_frame->system_frame_number,
_h265_slice_type_name (frame->type),
_h265_slice_type_name (GST_H265_I_SLICE));
frame->type = GST_H265_I_SLICE;
frame->is_ref = TRUE;
}
GST_LOG_OBJECT (self, "Push frame, system_frame_number: %d, poc %d, "
"frame type %s", gst_frame->system_frame_number, frame->poc,
_h265_slice_type_name (frame->type));
self->gop.cur_frame_index++;
g_queue_push_tail (&base->reorder_list,
gst_video_codec_frame_ref (gst_frame));
} }
/* ensure the last one a non-B and end the GOP. */ /* ensure the last one a non-B and end the GOP. */
@ -2093,6 +2132,12 @@ _h265_push_one_frame (GstVaBaseEnc * base, GstVideoCodecFrame * gst_frame,
} }
} }
/* Insert the cached next key frame after ending the current GOP. */
if (add_cached_key_frame) {
g_queue_push_tail (&base->reorder_list,
gst_video_codec_frame_ref (gst_frame));
}
return TRUE; return TRUE;
} }
@ -2114,7 +2159,7 @@ _count_backward_ref_num (gpointer data, gpointer user_data)
} }
static GstVideoCodecFrame * static GstVideoCodecFrame *
_h265_pop_pyramid_b_frame (GstVaH265Enc * self) _h265_pop_pyramid_b_frame (GstVaH265Enc * self, guint gop_len)
{ {
GstVaBaseEnc *base = GST_VA_BASE_ENC (self); GstVaBaseEnc *base = GST_VA_BASE_ENC (self);
guint i; guint i;
@ -2129,7 +2174,7 @@ _h265_pop_pyramid_b_frame (GstVaH265Enc * self)
b_vaframe = NULL; b_vaframe = NULL;
/* Find the highest level with smallest poc. */ /* Find the highest level with smallest poc. */
for (i = 0; i < g_queue_get_length (&base->reorder_list); i++) { for (i = 0; i < gop_len; i++) {
GstVaH265EncFrame *vaf; GstVaH265EncFrame *vaf;
GstVideoCodecFrame *f; GstVideoCodecFrame *f;
@ -2161,7 +2206,7 @@ again:
/* Check whether its refs are already poped. */ /* Check whether its refs are already poped. */
g_assert (b_vaframe->left_ref_poc_diff != 0); g_assert (b_vaframe->left_ref_poc_diff != 0);
g_assert (b_vaframe->right_ref_poc_diff != 0); g_assert (b_vaframe->right_ref_poc_diff != 0);
for (i = 0; i < g_queue_get_length (&base->reorder_list); i++) { for (i = 0; i < gop_len; i++) {
GstVaH265EncFrame *vaf; GstVaH265EncFrame *vaf;
GstVideoCodecFrame *f; GstVideoCodecFrame *f;
@ -2203,6 +2248,7 @@ _h265_pop_one_frame (GstVaBaseEnc * base, GstVideoCodecFrame ** out_frame)
GstVaH265Enc *self = GST_VA_H265_ENC (base); GstVaH265Enc *self = GST_VA_H265_ENC (base);
GstVaH265EncFrame *vaframe; GstVaH265EncFrame *vaframe;
GstVideoCodecFrame *frame; GstVideoCodecFrame *frame;
guint gop_len;
struct RefFramesCount count; struct RefFramesCount count;
g_return_val_if_fail (self->gop.cur_frame_index <= self->gop.idr_period, g_return_val_if_fail (self->gop.cur_frame_index <= self->gop.idr_period,
@ -2213,16 +2259,21 @@ _h265_pop_one_frame (GstVaBaseEnc * base, GstVideoCodecFrame ** out_frame)
if (g_queue_is_empty (&base->reorder_list)) if (g_queue_is_empty (&base->reorder_list))
return TRUE; return TRUE;
gop_len = g_queue_get_length (&base->reorder_list);
if (self->gop.last_keyframe && gop_len > 1)
gop_len--;
/* Return the last pushed non-B immediately. */ /* Return the last pushed non-B immediately. */
frame = g_queue_peek_tail (&base->reorder_list); frame = g_queue_peek_nth (&base->reorder_list, gop_len - 1);
vaframe = _enc_frame (frame); vaframe = _enc_frame (frame);
if (vaframe->type != GST_H265_B_SLICE) { if (vaframe->type != GST_H265_B_SLICE) {
frame = g_queue_pop_tail (&base->reorder_list); frame = g_queue_pop_nth (&base->reorder_list, gop_len - 1);
goto get_one; goto get_one;
} }
if (self->gop.b_pyramid) { if (self->gop.b_pyramid) {
frame = _h265_pop_pyramid_b_frame (self); frame = _h265_pop_pyramid_b_frame (self, gop_len);
if (frame == NULL) if (frame == NULL)
return TRUE; return TRUE;
@ -2526,6 +2577,7 @@ gst_va_h265_enc_reset_state (GstVaBaseEnc * base)
self->gop.backward_ref_num = 0; self->gop.backward_ref_num = 0;
self->gop.num_reorder_frames = 0; self->gop.num_reorder_frames = 0;
self->gop.max_dpb_size = 0; self->gop.max_dpb_size = 0;
self->gop.last_keyframe = NULL;
self->rc.max_bitrate = 0; self->rc.max_bitrate = 0;
self->rc.target_bitrate = 0; self->rc.target_bitrate = 0;
@ -4600,6 +4652,7 @@ gst_va_h265_enc_flush (GstVideoEncoder * venc)
/* begin from an IDR after flush. */ /* begin from an IDR after flush. */
self->gop.cur_frame_index = 0; self->gop.cur_frame_index = 0;
self->gop.last_keyframe = NULL;
return GST_VIDEO_ENCODER_CLASS (parent_class)->flush (venc); return GST_VIDEO_ENCODER_CLASS (parent_class)->flush (venc);
} }