/* GStreamer H264 encoder plugin * Copyright (C) 2005 Michal Benes * Copyright (C) 2005 Josef Zlomek * Copyright (C) 2008 Mark Nauwelaerts * * This library is free software; you can redistribute it and/or * modify it under the terms of the GNU Library General Public * License as published by the Free Software Foundation; either * version 2 of the License, or (at your option) any later version. * * This library is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU * Library General Public License for more details. * * You should have received a copy of the GNU Library General Public * License along with this library; if not, write to the * Free Software Foundation, Inc., 59 Temple Place - Suite 330, * Boston, MA 02111-1307, USA. */ /** * SECTION:element-x264enc * @see_also: faac * * This element encodes raw video into H264 compressed data, * also otherwise known as MPEG-4 AVC (Advanced Video Codec). * * The #GstX264Enc:pass property controls the type of encoding. In case of Constant * Bitrate Encoding (actually ABR), the #GstX264Enc:bitrate will determine the quality * of the encoding. This will similarly be the case if this target bitrate * is to obtained in multiple (2 or 3) pass encoding. * Alternatively, one may choose to perform Constant Quantizer or Quality encoding, * in which case the #GstX264Enc:quantizer property controls much of the outcome, in that case #GstX264Enc:bitrate is the maximum bitrate. * * The H264 profile that is eventually used depends on a few settings. * If #GstX264Enc:dct8x8 is enabled, then High profile is used. * Otherwise, if #GstX264Enc:cabac entropy coding is enabled or #GstX264Enc:bframes * are allowed, then Main Profile is in effect, and otherwise Baseline profile * applies. The main profile is imposed by default, * which is fine for most software players and settings, * but in some cases (e.g. hardware platforms) a more restricted profile/level * may be necessary. The recommended way to set a profile is to set it in the * downstream caps. * * If a preset/tuning are specified then these will define the default values and * the property defaults will be ignored. After this the option-string property is * applied, followed by the user-set properties, fast first pass restrictions and * finally the profile restrictions. * * Some settings, including the default settings, may lead to quite * some latency (i.e. frame buffering) in the encoder. This may cause problems * with pipeline stalling in non-trivial pipelines, because the encoder latency * is often considerably higher than the default size of a simple queue * element. Such problems are caused by one of the queues in the other * non-x264enc streams/branches filling up and blocking upstream. They can * be fixed by relaxing the default time/size/buffer limits on the queue * elements in the non-x264 branches, or using a (single) multiqueue element * for all branches. Also see the last example below. * * * * Example pipeline * |[ * gst-launch -v videotestsrc num-buffers=1000 ! x264enc qp-min=18 ! \ * avimux ! filesink location=videotestsrc.avi * ]| This example pipeline will encode a test video source to H264 muxed in an * AVI container, while ensuring a sane minimum quantization factor to avoid * some (excessive) waste. * |[ * gst-launch -v videotestsrc num-buffers=1000 ! x264enc pass=quant ! \ * matroskamux ! filesink location=videotestsrc.avi * ]| This example pipeline will encode a test video source to H264 using fixed * quantization, and muxes it in a Matroska container. * |[ * gst-launch -v videotestsrc num-buffers=1000 ! x264enc pass=5 quantizer=25 speed-preset=6 ! video/x-h264, profile=baseline ! \ * qtmux ! filesink location=videotestsrc.mov * ]| This example pipeline will encode a test video source to H264 using * constant quality at around Q25 using the 'medium' speed/quality preset and * restricting the options used so that the output is H.264 Baseline Profile * compliant and finally multiplexing the output in Quicktime mov format. * |[ * gst-launch -v videotestsrc num-buffers=1000 ! tee name=t ! queue ! xvimagesink \ * t. ! queue ! x264enc rc-lookahead=5 ! fakesink * ]| This example pipeline will encode a test video source to H264 while * displaying the input material at the same time. As mentioned above, * specific settings are needed in this case to avoid pipeline stalling. * Depending on goals and context, other approaches are possible, e.g. * tune=zerolatency might be configured, or queue sizes increased. * */ #ifdef HAVE_CONFIG_H # include "config.h" #endif #include "gstx264enc.h" #include #include #if X264_BUILD >= 71 #define X264_DELAYED_FRAMES_API #endif #if X264_BUILD >= 76 #define X264_ENC_NALS 1 #endif #if X264_BUILD >= 69 #define X264_MB_RC #endif #if X264_BUILD >= 78 /* b-pyramid was available before but was changed from boolean here */ #define X264_B_PYRAMID #endif #if X264_BUILD >= 80 #define X264_ENH_THREADING #endif #if X264_BUILD >= 82 #define X264_INTRA_REFRESH #endif #if X264_BUILD >= 86 #define X264_PRESETS #endif #if X264_BUILD >= 95 #define FORCE_INTRA_API #endif #include #include GST_DEBUG_CATEGORY_STATIC (x264_enc_debug); #define GST_CAT_DEFAULT x264_enc_debug enum { ARG_0, ARG_THREADS, ARG_SLICED_THREADS, ARG_SYNC_LOOKAHEAD, ARG_PASS, ARG_QUANTIZER, ARG_STATS_FILE, ARG_MULTIPASS_CACHE_FILE, ARG_BYTE_STREAM, ARG_BITRATE, ARG_INTRA_REFRESH, ARG_VBV_BUF_CAPACITY, ARG_ME, ARG_SUBME, ARG_ANALYSE, ARG_DCT8x8, ARG_REF, ARG_BFRAMES, ARG_B_ADAPT, ARG_B_PYRAMID, ARG_WEIGHTB, ARG_SPS_ID, ARG_AU_NALU, ARG_TRELLIS, ARG_KEYINT_MAX, ARG_CABAC, ARG_QP_MIN, ARG_QP_MAX, ARG_QP_STEP, ARG_IP_FACTOR, ARG_PB_FACTOR, ARG_RC_MB_TREE, ARG_RC_LOOKAHEAD, ARG_NR, ARG_INTERLACED, ARG_OPTION_STRING, ARG_PROFILE, ARG_SPEED_PRESET, ARG_PSY_TUNE, ARG_TUNE, }; #define ARG_THREADS_DEFAULT 0 /* 0 means 'auto' which is 1.5x number of CPU cores */ #define ARG_PASS_DEFAULT 0 #define ARG_QUANTIZER_DEFAULT 21 #define ARG_MULTIPASS_CACHE_FILE_DEFAULT "x264.log" #define ARG_STATS_FILE_DEFAULT ARG_MULTIPASS_CACHE_FILE_DEFAULT #define ARG_BYTE_STREAM_DEFAULT FALSE #define ARG_BITRATE_DEFAULT (2 * 1024) #define ARG_VBV_BUF_CAPACITY_DEFAULT 600 #define ARG_ME_DEFAULT X264_ME_HEX #define ARG_SUBME_DEFAULT 1 #define ARG_ANALYSE_DEFAULT 0 #define ARG_DCT8x8_DEFAULT FALSE #define ARG_REF_DEFAULT 1 #define ARG_BFRAMES_DEFAULT 0 #define ARG_B_ADAPT_DEFAULT TRUE #define ARG_B_PYRAMID_DEFAULT FALSE #define ARG_WEIGHTB_DEFAULT FALSE #define ARG_SPS_ID_DEFAULT 0 #define ARG_AU_NALU_DEFAULT TRUE #define ARG_TRELLIS_DEFAULT TRUE #define ARG_KEYINT_MAX_DEFAULT 0 #define ARG_CABAC_DEFAULT TRUE #define ARG_QP_MIN_DEFAULT 10 #define ARG_QP_MAX_DEFAULT 51 #define ARG_QP_STEP_DEFAULT 4 #define ARG_IP_FACTOR_DEFAULT 1.4 #define ARG_PB_FACTOR_DEFAULT 1.3 #define ARG_NR_DEFAULT 0 #define ARG_INTERLACED_DEFAULT FALSE #define ARG_SLICED_THREADS_DEFAULT FALSE #define ARG_SYNC_LOOKAHEAD_DEFAULT -1 #define ARG_RC_MB_TREE_DEFAULT TRUE #define ARG_RC_LOOKAHEAD_DEFAULT 40 #define ARG_INTRA_REFRESH_DEFAULT FALSE #define ARG_PROFILE_DEFAULT 2 /* 'Main Profile' - matches profile of property defaults */ #define ARG_OPTION_STRING_DEFAULT "" static GString *x264enc_defaults; #define ARG_SPEED_PRESET_DEFAULT 6 /* 'medium' preset - matches x264 CLI default */ #define ARG_PSY_TUNE_DEFAULT 0 /* no psy tuning */ #define ARG_TUNE_DEFAULT 0 /* no tuning */ enum { GST_X264_ENC_STREAM_FORMAT_FROM_PROPERTY, GST_X264_ENC_STREAM_FORMAT_AVC, GST_X264_ENC_STREAM_FORMAT_BYTE_STREAM }; enum { GST_X264_ENC_PASS_CBR = 0, GST_X264_ENC_PASS_QUANT = 0x04, GST_X264_ENC_PASS_QUAL, GST_X264_ENC_PASS_PASS1 = 0x11, GST_X264_ENC_PASS_PASS2, GST_X264_ENC_PASS_PASS3 }; #define GST_X264_ENC_PASS_TYPE (gst_x264_enc_pass_get_type()) static GType gst_x264_enc_pass_get_type (void) { static GType pass_type = 0; static const GEnumValue pass_types[] = { {GST_X264_ENC_PASS_CBR, "Constant Bitrate Encoding", "cbr"}, {GST_X264_ENC_PASS_QUANT, "Constant Quantizer (debugging only)", "quant"}, {GST_X264_ENC_PASS_QUAL, "Constant Quality", "qual"}, {GST_X264_ENC_PASS_PASS1, "VBR Encoding - Pass 1", "pass1"}, {GST_X264_ENC_PASS_PASS2, "VBR Encoding - Pass 2", "pass2"}, {GST_X264_ENC_PASS_PASS3, "VBR Encoding - Pass 3", "pass3"}, {0, NULL, NULL} }; if (!pass_type) { pass_type = g_enum_register_static ("GstX264EncPass", pass_types); } return pass_type; } #define GST_X264_ENC_ME_TYPE (gst_x264_enc_me_get_type()) static GType gst_x264_enc_me_get_type (void) { static GType me_type = 0; static GEnumValue *me_types; int n, i; if (me_type != 0) return me_type; n = 0; while (x264_motion_est_names[n] != NULL) n++; me_types = g_new0 (GEnumValue, n + 1); for (i = 0; i < n; i++) { me_types[i].value = i; me_types[i].value_name = x264_motion_est_names[i]; me_types[i].value_nick = x264_motion_est_names[i]; } me_type = g_enum_register_static ("GstX264EncMe", me_types); return me_type; } #define GST_X264_ENC_ANALYSE_TYPE (gst_x264_enc_analyse_get_type()) static GType gst_x264_enc_analyse_get_type (void) { static GType analyse_type = 0; static const GFlagsValue analyse_types[] = { {X264_ANALYSE_I4x4, "i4x4", "i4x4"}, {X264_ANALYSE_I8x8, "i8x8", "i8x8"}, {X264_ANALYSE_PSUB16x16, "p8x8", "p8x8"}, {X264_ANALYSE_PSUB8x8, "p4x4", "p4x4"}, {X264_ANALYSE_BSUB16x16, "b8x8", "b8x8"}, {0, NULL, NULL}, }; if (!analyse_type) { analyse_type = g_flags_register_static ("GstX264EncAnalyse", analyse_types); } return analyse_type; } #ifdef X264_PRESETS #define GST_X264_ENC_PROFILE_TYPE (gst_x264_enc_profile_get_type()) static GType gst_x264_enc_profile_get_type (void) { static GType profile_type = 0; static GEnumValue *profile_types; int n, i; if (profile_type != 0) return profile_type; n = 0; while (x264_profile_names[n] != NULL) n++; profile_types = g_new0 (GEnumValue, n + 2); i = 0; profile_types[i].value = i; profile_types[i].value_name = "No profile"; profile_types[i].value_nick = "None"; for (i = 1; i <= n; i++) { profile_types[i].value = i; profile_types[i].value_name = x264_profile_names[i - 1]; profile_types[i].value_nick = x264_profile_names[i - 1]; } profile_type = g_enum_register_static ("GstX264EncProfile", profile_types); return profile_type; } #define GST_X264_ENC_SPEED_PRESET_TYPE (gst_x264_enc_speed_preset_get_type()) static GType gst_x264_enc_speed_preset_get_type (void) { static GType speed_preset_type = 0; static GEnumValue *speed_preset_types; int n, i; if (speed_preset_type != 0) return speed_preset_type; n = 0; while (x264_preset_names[n] != NULL) n++; speed_preset_types = g_new0 (GEnumValue, n + 2); speed_preset_types[0].value = 0; speed_preset_types[0].value_name = "No preset"; speed_preset_types[0].value_nick = "None"; for (i = 1; i <= n; i++) { speed_preset_types[i].value = i; speed_preset_types[i].value_name = x264_preset_names[i - 1]; speed_preset_types[i].value_nick = x264_preset_names[i - 1]; } speed_preset_type = g_enum_register_static ("GstX264EncPreset", speed_preset_types); return speed_preset_type; } static const GFlagsValue tune_types[] = { {0x0, "No tuning", "none"}, {0x1, "Still image", "stillimage"}, {0x2, "Fast decode", "fastdecode"}, {0x4, "Zero latency (requires constant framerate)", "zerolatency"}, {0, NULL, NULL}, }; #define GST_X264_ENC_TUNE_TYPE (gst_x264_enc_tune_get_type()) static GType gst_x264_enc_tune_get_type (void) { static GType tune_type = 0; if (!tune_type) { tune_type = g_flags_register_static ("GstX264EncTune", tune_types + 1); } return tune_type; } enum { GST_X264_ENC_TUNE_NONE, GST_X264_ENC_TUNE_FILM, GST_X264_ENC_TUNE_ANIMATION, GST_X264_ENC_TUNE_GRAIN, GST_X264_ENC_TUNE_PSNR, GST_X264_ENC_TUNE_SSIM, GST_X264_ENC_TUNE_LAST }; static const GEnumValue psy_tune_types[] = { {GST_X264_ENC_TUNE_NONE, "No tuning", "none"}, {GST_X264_ENC_TUNE_FILM, "Film", "film"}, {GST_X264_ENC_TUNE_ANIMATION, "Animation", "animation"}, {GST_X264_ENC_TUNE_GRAIN, "Grain", "grain"}, {GST_X264_ENC_TUNE_PSNR, "PSNR", "psnr"}, {GST_X264_ENC_TUNE_SSIM, "SSIM", "ssim"}, {0, NULL, NULL}, }; #define GST_X264_ENC_PSY_TUNE_TYPE (gst_x264_enc_psy_tune_get_type()) static GType gst_x264_enc_psy_tune_get_type (void) { static GType psy_tune_type = 0; if (!psy_tune_type) { psy_tune_type = g_enum_register_static ("GstX264EncPsyTune", psy_tune_types); } return psy_tune_type; } static void gst_x264_enc_build_tunings_string (GstX264Enc * x264enc) { int i = 1; if (x264enc->tunings) g_string_free (x264enc->tunings, TRUE); if (x264enc->psy_tune) { x264enc->tunings = g_string_new (psy_tune_types[x264enc->psy_tune].value_nick); } else { x264enc->tunings = g_string_new (NULL); } while (tune_types[i].value_name) { if (x264enc->tune & (1 << (i - 1))) g_string_append_printf (x264enc->tunings, "%s%s", x264enc->tunings->len ? "," : "", tune_types[i].value_nick); i++; } if (x264enc->tunings->len) GST_DEBUG_OBJECT (x264enc, "Constructed tunings string: %s", x264enc->tunings->str); } #endif static GstStaticPadTemplate sink_factory = GST_STATIC_PAD_TEMPLATE ("sink", GST_PAD_SINK, GST_PAD_ALWAYS, GST_STATIC_CAPS ("video/x-raw, " "format = (string) { I420, YV12 }, " "framerate = (fraction) [0, MAX], " "width = (int) [ 16, MAX ], " "height = (int) [ 16, MAX ]") ); static GstStaticPadTemplate src_factory = GST_STATIC_PAD_TEMPLATE ("src", GST_PAD_SRC, GST_PAD_ALWAYS, GST_STATIC_CAPS ("video/x-h264, " "framerate = (fraction) [0/1, MAX], " "width = (int) [ 1, MAX ], " "height = (int) [ 1, MAX ], " "stream-format = (string) { byte-stream, avc }, " "alignment = (string) { au }, " "profile = (string) { high-10, high, main, baseline, " "constrained-baseline, high-10-intra }") ); static void gst_x264_enc_finalize (GObject * object); static void gst_x264_enc_reset (GstX264Enc * encoder); static gboolean gst_x264_enc_init_encoder (GstX264Enc * encoder); static void gst_x264_enc_close_encoder (GstX264Enc * encoder); static gboolean gst_x264_enc_sink_set_caps (GstPad * pad, GstCaps * caps); static GstCaps *gst_x264_enc_sink_get_caps (GstPad * pad, GstCaps * filter); static gboolean gst_x264_enc_sink_event (GstPad * pad, GstObject * parent, GstEvent * event); static gboolean gst_x264_enc_sink_query (GstPad * pad, GstObject * parent, GstQuery * query); static gboolean gst_x264_enc_src_event (GstPad * pad, GstObject * parent, GstEvent * event); static GstFlowReturn gst_x264_enc_chain (GstPad * pad, GstObject * parent, GstBuffer * buf); static void gst_x264_enc_flush_frames (GstX264Enc * encoder, gboolean send); static GstFlowReturn gst_x264_enc_encode_frame (GstX264Enc * encoder, x264_picture_t * pic_in, int *i_nal, gboolean send); static GstStateChangeReturn gst_x264_enc_change_state (GstElement * element, GstStateChange transition); static void gst_x264_enc_set_property (GObject * object, guint prop_id, const GValue * value, GParamSpec * pspec); static void gst_x264_enc_get_property (GObject * object, guint prop_id, GValue * value, GParamSpec * pspec); #define gst_x264_enc_parent_class parent_class G_DEFINE_TYPE_WITH_CODE (GstX264Enc, gst_x264_enc, GST_TYPE_ELEMENT, G_IMPLEMENT_INTERFACE (GST_TYPE_PRESET, NULL)); /* don't forget to free the string after use */ static const gchar * gst_x264_enc_build_partitions (gint analyse) { GString *string; if (!analyse) return NULL; string = g_string_new (NULL); if (analyse & X264_ANALYSE_I4x4) g_string_append (string, "i4x4"); if (analyse & X264_ANALYSE_I8x8) g_string_append (string, ",i8x8"); if (analyse & X264_ANALYSE_PSUB16x16) g_string_append (string, ",p8x8"); if (analyse & X264_ANALYSE_PSUB8x8) g_string_append (string, ",p4x4"); if (analyse & X264_ANALYSE_BSUB16x16) g_string_append (string, ",b8x8"); return (const gchar *) g_string_free (string, FALSE); } static void gst_x264_enc_class_init (GstX264EncClass * klass) { GObjectClass *gobject_class; GstElementClass *gstelement_class; const gchar *partitions = NULL; x264enc_defaults = g_string_new (""); gobject_class = (GObjectClass *) klass; gstelement_class = (GstElementClass *) klass; gobject_class->set_property = gst_x264_enc_set_property; gobject_class->get_property = gst_x264_enc_get_property; gobject_class->finalize = gst_x264_enc_finalize; /* options for which we don't use string equivalents */ g_object_class_install_property (gobject_class, ARG_PASS, g_param_spec_enum ("pass", "Encoding pass/type", "Encoding pass/type", GST_X264_ENC_PASS_TYPE, ARG_PASS_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_object_class_install_property (gobject_class, ARG_QUANTIZER, g_param_spec_uint ("quantizer", "Constant Quantizer", "Constant quantizer or quality to apply", 1, 50, ARG_QUANTIZER_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_object_class_install_property (gobject_class, ARG_BITRATE, g_param_spec_uint ("bitrate", "Bitrate", "Bitrate in kbit/sec", 1, 100 * 1024, ARG_BITRATE_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS | GST_PARAM_MUTABLE_PLAYING)); g_object_class_install_property (gobject_class, ARG_VBV_BUF_CAPACITY, g_param_spec_uint ("vbv-buf-capacity", "VBV buffer capacity", "Size of the VBV buffer in milliseconds", 0, 10000, ARG_VBV_BUF_CAPACITY_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS | GST_PARAM_MUTABLE_PLAYING)); #ifdef X264_PRESETS g_object_class_install_property (gobject_class, ARG_SPEED_PRESET, g_param_spec_enum ("speed-preset", "Speed/quality preset", "Preset name for speed/quality tradeoff options (can affect decode " "compatibility - impose restrictions separately for your target decoder)", GST_X264_ENC_SPEED_PRESET_TYPE, ARG_SPEED_PRESET_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_object_class_install_property (gobject_class, ARG_PSY_TUNE, g_param_spec_enum ("psy-tune", "Psychovisual tuning preset", "Preset name for psychovisual tuning options", GST_X264_ENC_PSY_TUNE_TYPE, ARG_PSY_TUNE_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_object_class_install_property (gobject_class, ARG_TUNE, g_param_spec_flags ("tune", "Content tuning preset", "Preset name for non-psychovisual tuning options", GST_X264_ENC_TUNE_TYPE, ARG_TUNE_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_object_class_install_property (gobject_class, ARG_PROFILE, g_param_spec_enum ("profile", "H.264 profile", "Apply restrictions to meet H.264 Profile constraints. This will " "override other properties if necessary. This will only be used " "if downstream elements do not specify a profile in their caps (DEPRECATED)", GST_X264_ENC_PROFILE_TYPE, ARG_PROFILE_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); #endif /* X264_PRESETS */ g_object_class_install_property (gobject_class, ARG_OPTION_STRING, g_param_spec_string ("option-string", "Option string", "String of x264 options (overridden by element properties)", ARG_OPTION_STRING_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); /* options for which we _do_ use string equivalents */ g_object_class_install_property (gobject_class, ARG_THREADS, g_param_spec_uint ("threads", "Threads", "Number of threads used by the codec (0 for automatic)", 0, 4, ARG_THREADS_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); /* NOTE: this first string append doesn't require the ':' delimiter but the * rest do */ g_string_append_printf (x264enc_defaults, "threads=%d", ARG_THREADS_DEFAULT); #ifdef X264_ENH_THREADING g_object_class_install_property (gobject_class, ARG_SLICED_THREADS, g_param_spec_boolean ("sliced-threads", "Sliced Threads", "Low latency but lower efficiency threading", ARG_SLICED_THREADS_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_string_append_printf (x264enc_defaults, ":sliced-threads=%d", ARG_SLICED_THREADS_DEFAULT); g_object_class_install_property (gobject_class, ARG_SYNC_LOOKAHEAD, g_param_spec_int ("sync-lookahead", "Sync Lookahead", "Number of buffer frames for threaded lookahead (-1 for automatic)", -1, 250, ARG_SYNC_LOOKAHEAD_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_string_append_printf (x264enc_defaults, ":sync-lookahead=%d", ARG_SYNC_LOOKAHEAD_DEFAULT); #endif g_object_class_install_property (gobject_class, ARG_STATS_FILE, g_param_spec_string ("stats-file", "Stats File", "Filename for multipass statistics (deprecated, use multipass-cache-file)", ARG_STATS_FILE_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_object_class_install_property (gobject_class, ARG_MULTIPASS_CACHE_FILE, g_param_spec_string ("multipass-cache-file", "Multipass Cache File", "Filename for multipass cache file", ARG_MULTIPASS_CACHE_FILE_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_string_append_printf (x264enc_defaults, ":stats=%s", ARG_MULTIPASS_CACHE_FILE_DEFAULT); g_object_class_install_property (gobject_class, ARG_BYTE_STREAM, g_param_spec_boolean ("byte-stream", "Byte Stream", "Generate byte stream format of NALU", ARG_BYTE_STREAM_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_string_append_printf (x264enc_defaults, ":annexb=%d", ARG_BYTE_STREAM_DEFAULT); #ifdef X264_INTRA_REFRESH g_object_class_install_property (gobject_class, ARG_INTRA_REFRESH, g_param_spec_boolean ("intra-refresh", "Intra Refresh", "Use Periodic Intra Refresh instead of IDR frames", ARG_INTRA_REFRESH_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_string_append_printf (x264enc_defaults, ":intra-refresh=%d", ARG_INTRA_REFRESH_DEFAULT); #endif g_object_class_install_property (gobject_class, ARG_ME, g_param_spec_enum ("me", "Motion Estimation", "Integer pixel motion estimation method", GST_X264_ENC_ME_TYPE, ARG_ME_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_string_append_printf (x264enc_defaults, ":me=%s", x264_motion_est_names[ARG_ME_DEFAULT]); g_object_class_install_property (gobject_class, ARG_SUBME, g_param_spec_uint ("subme", "Subpixel Motion Estimation", "Subpixel motion estimation and partition decision quality: 1=fast, 10=best", 1, 10, ARG_SUBME_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_string_append_printf (x264enc_defaults, ":subme=%d", ARG_SUBME_DEFAULT); g_object_class_install_property (gobject_class, ARG_ANALYSE, g_param_spec_flags ("analyse", "Analyse", "Partitions to consider", GST_X264_ENC_ANALYSE_TYPE, ARG_ANALYSE_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); partitions = gst_x264_enc_build_partitions (ARG_ANALYSE_DEFAULT); if (partitions) { g_string_append_printf (x264enc_defaults, ":partitions=%s", partitions); g_free ((gpointer) partitions); } g_object_class_install_property (gobject_class, ARG_DCT8x8, g_param_spec_boolean ("dct8x8", "DCT8x8", "Adaptive spatial transform size", ARG_DCT8x8_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_string_append_printf (x264enc_defaults, ":8x8dct=%d", ARG_DCT8x8_DEFAULT); g_object_class_install_property (gobject_class, ARG_REF, g_param_spec_uint ("ref", "Reference Frames", "Number of reference frames", 1, 12, ARG_REF_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_string_append_printf (x264enc_defaults, ":ref=%d", ARG_REF_DEFAULT); g_object_class_install_property (gobject_class, ARG_BFRAMES, g_param_spec_uint ("bframes", "B-Frames", "Number of B-frames between I and P", 0, 4, ARG_BFRAMES_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_string_append_printf (x264enc_defaults, ":bframes=%d", ARG_BFRAMES_DEFAULT); g_object_class_install_property (gobject_class, ARG_B_ADAPT, g_param_spec_boolean ("b-adapt", "B-Adapt", "Automatically decide how many B-frames to use", ARG_B_ADAPT_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_string_append_printf (x264enc_defaults, ":b-adapt=%d", ARG_B_ADAPT_DEFAULT); g_object_class_install_property (gobject_class, ARG_B_PYRAMID, g_param_spec_boolean ("b-pyramid", "B-Pyramid", "Keep some B-frames as references", ARG_B_PYRAMID_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); #ifdef X264_B_PYRAMID g_string_append_printf (x264enc_defaults, ":b-pyramid=%s", x264_b_pyramid_names[ARG_B_PYRAMID_DEFAULT]); #else g_string_append_printf (x264enc_defaults, ":b-pyramid=%d", ARG_B_PYRAMID_DEFAULT); #endif /* X264_B_PYRAMID */ g_object_class_install_property (gobject_class, ARG_WEIGHTB, g_param_spec_boolean ("weightb", "Weighted B-Frames", "Weighted prediction for B-frames", ARG_WEIGHTB_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_string_append_printf (x264enc_defaults, ":weightb=%d", ARG_WEIGHTB_DEFAULT); g_object_class_install_property (gobject_class, ARG_SPS_ID, g_param_spec_uint ("sps-id", "SPS ID", "SPS and PPS ID number", 0, 31, ARG_SPS_ID_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_string_append_printf (x264enc_defaults, ":sps-id=%d", ARG_SPS_ID_DEFAULT); g_object_class_install_property (gobject_class, ARG_AU_NALU, g_param_spec_boolean ("aud", "AUD", "Use AU (Access Unit) delimiter", ARG_AU_NALU_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_string_append_printf (x264enc_defaults, ":aud=%d", ARG_AU_NALU_DEFAULT); g_object_class_install_property (gobject_class, ARG_TRELLIS, g_param_spec_boolean ("trellis", "Trellis quantization", "Enable trellis searched quantization", ARG_TRELLIS_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_string_append_printf (x264enc_defaults, ":trellis=%d", ARG_TRELLIS_DEFAULT); g_object_class_install_property (gobject_class, ARG_KEYINT_MAX, g_param_spec_uint ("key-int-max", "Key-frame maximal interval", "Maximal distance between two key-frames (0 for automatic)", 0, G_MAXINT, ARG_KEYINT_MAX_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_string_append_printf (x264enc_defaults, ":keyint=%d", ARG_KEYINT_MAX_DEFAULT); g_object_class_install_property (gobject_class, ARG_CABAC, g_param_spec_boolean ("cabac", "Use CABAC", "Enable CABAC entropy coding", ARG_CABAC_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_string_append_printf (x264enc_defaults, ":cabac=%d", ARG_CABAC_DEFAULT); g_object_class_install_property (gobject_class, ARG_QP_MIN, g_param_spec_uint ("qp-min", "Minimum Quantizer", "Minimum quantizer", 1, 51, ARG_QP_MIN_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_string_append_printf (x264enc_defaults, ":qpmin=%d", ARG_QP_MIN_DEFAULT); g_object_class_install_property (gobject_class, ARG_QP_MAX, g_param_spec_uint ("qp-max", "Maximum Quantizer", "Maximum quantizer", 1, 51, ARG_QP_MAX_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_string_append_printf (x264enc_defaults, ":qpmax=%d", ARG_QP_MAX_DEFAULT); g_object_class_install_property (gobject_class, ARG_QP_STEP, g_param_spec_uint ("qp-step", "Maximum Quantizer Difference", "Maximum quantizer difference between frames", 1, 50, ARG_QP_STEP_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_string_append_printf (x264enc_defaults, ":qpstep=%d", ARG_QP_STEP_DEFAULT); g_object_class_install_property (gobject_class, ARG_IP_FACTOR, g_param_spec_float ("ip-factor", "IP-Factor", "Quantizer factor between I- and P-frames", 0, 2, ARG_IP_FACTOR_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_string_append_printf (x264enc_defaults, ":ip-factor=%f", ARG_IP_FACTOR_DEFAULT); g_object_class_install_property (gobject_class, ARG_PB_FACTOR, g_param_spec_float ("pb-factor", "PB-Factor", "Quantizer factor between P- and B-frames", 0, 2, ARG_PB_FACTOR_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_string_append_printf (x264enc_defaults, ":pb-factor=%f", ARG_PB_FACTOR_DEFAULT); #ifdef X264_MB_RC g_object_class_install_property (gobject_class, ARG_RC_MB_TREE, g_param_spec_boolean ("mb-tree", "Macroblock Tree", "Macroblock-Tree ratecontrol", ARG_RC_MB_TREE_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_string_append_printf (x264enc_defaults, ":mbtree=%d", ARG_RC_MB_TREE_DEFAULT); g_object_class_install_property (gobject_class, ARG_RC_LOOKAHEAD, g_param_spec_int ("rc-lookahead", "Rate Control Lookahead", "Number of frames for frametype lookahead", 0, 250, ARG_RC_LOOKAHEAD_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_string_append_printf (x264enc_defaults, ":rc-lookahead=%d", ARG_RC_LOOKAHEAD_DEFAULT); #endif g_object_class_install_property (gobject_class, ARG_NR, g_param_spec_uint ("noise-reduction", "Noise Reduction", "Noise reduction strength", 0, 100000, ARG_NR_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_string_append_printf (x264enc_defaults, ":nr=%d", ARG_NR_DEFAULT); g_object_class_install_property (gobject_class, ARG_INTERLACED, g_param_spec_boolean ("interlaced", "Interlaced", "Interlaced material", ARG_INTERLACED_DEFAULT, G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS)); g_string_append_printf (x264enc_defaults, ":interlaced=%d", ARG_INTERLACED_DEFAULT); /* append deblock parameters */ g_string_append_printf (x264enc_defaults, ":deblock=0,0"); /* append weighted prediction parameter */ g_string_append_printf (x264enc_defaults, ":weightp=0"); gst_element_class_set_details_simple (gstelement_class, "x264enc", "Codec/Encoder/Video", "H264 Encoder", "Josef Zlomek , " "Mark Nauwelaerts "); gst_element_class_add_pad_template (gstelement_class, gst_static_pad_template_get (&src_factory)); gst_element_class_add_pad_template (gstelement_class, gst_static_pad_template_get (&sink_factory)); gstelement_class->change_state = GST_DEBUG_FUNCPTR (gst_x264_enc_change_state); } static void gst_x264_enc_log_callback (gpointer private, gint level, const char *format, va_list args) { #ifndef GST_DISABLE_GST_DEBUG GstDebugLevel gst_level; GObject *object = (GObject *) private; switch (level) { case X264_LOG_NONE: gst_level = GST_LEVEL_NONE; break; case X264_LOG_ERROR: gst_level = GST_LEVEL_ERROR; break; case X264_LOG_WARNING: gst_level = GST_LEVEL_WARNING; break; case X264_LOG_INFO: gst_level = GST_LEVEL_INFO; break; default: /* push x264enc debug down to our lower levels to avoid some clutter */ gst_level = GST_LEVEL_LOG; break; } gst_debug_log_valist (x264_enc_debug, gst_level, "", "", 0, object, format, args); #endif /* GST_DISABLE_GST_DEBUG */ } /* initialize the new element * instantiate pads and add them to element * set functions * initialize structure */ static void gst_x264_enc_init (GstX264Enc * encoder) { encoder->sinkpad = gst_pad_new_from_static_template (&sink_factory, "sink"); gst_pad_set_event_function (encoder->sinkpad, GST_DEBUG_FUNCPTR (gst_x264_enc_sink_event)); gst_pad_set_chain_function (encoder->sinkpad, GST_DEBUG_FUNCPTR (gst_x264_enc_chain)); gst_pad_set_query_function (encoder->sinkpad, GST_DEBUG_FUNCPTR (gst_x264_enc_sink_query)); gst_element_add_pad (GST_ELEMENT (encoder), encoder->sinkpad); encoder->srcpad = gst_pad_new_from_static_template (&src_factory, "src"); gst_pad_use_fixed_caps (encoder->srcpad); gst_element_add_pad (GST_ELEMENT (encoder), encoder->srcpad); gst_pad_set_event_function (encoder->srcpad, GST_DEBUG_FUNCPTR (gst_x264_enc_src_event)); /* properties */ encoder->threads = ARG_THREADS_DEFAULT; encoder->sliced_threads = ARG_SLICED_THREADS_DEFAULT; encoder->sync_lookahead = ARG_SYNC_LOOKAHEAD_DEFAULT; encoder->pass = ARG_PASS_DEFAULT; encoder->quantizer = ARG_QUANTIZER_DEFAULT; encoder->mp_cache_file = g_strdup (ARG_MULTIPASS_CACHE_FILE_DEFAULT); encoder->byte_stream = ARG_BYTE_STREAM_DEFAULT; encoder->bitrate = ARG_BITRATE_DEFAULT; encoder->intra_refresh = ARG_INTRA_REFRESH_DEFAULT; encoder->vbv_buf_capacity = ARG_VBV_BUF_CAPACITY_DEFAULT; encoder->me = ARG_ME_DEFAULT; encoder->subme = ARG_SUBME_DEFAULT; encoder->analyse = ARG_ANALYSE_DEFAULT; encoder->dct8x8 = ARG_DCT8x8_DEFAULT; encoder->ref = ARG_REF_DEFAULT; encoder->bframes = ARG_BFRAMES_DEFAULT; encoder->b_adapt = ARG_B_ADAPT_DEFAULT; encoder->b_pyramid = ARG_B_PYRAMID_DEFAULT; encoder->weightb = ARG_WEIGHTB_DEFAULT; encoder->sps_id = ARG_SPS_ID_DEFAULT; encoder->au_nalu = ARG_AU_NALU_DEFAULT; encoder->trellis = ARG_TRELLIS_DEFAULT; encoder->keyint_max = ARG_KEYINT_MAX_DEFAULT; encoder->cabac = ARG_CABAC_DEFAULT; encoder->qp_min = ARG_QP_MIN_DEFAULT; encoder->qp_max = ARG_QP_MAX_DEFAULT; encoder->qp_step = ARG_QP_STEP_DEFAULT; encoder->ip_factor = ARG_IP_FACTOR_DEFAULT; encoder->pb_factor = ARG_PB_FACTOR_DEFAULT; encoder->mb_tree = ARG_RC_MB_TREE_DEFAULT; encoder->rc_lookahead = ARG_RC_LOOKAHEAD_DEFAULT; encoder->noise_reduction = ARG_NR_DEFAULT; encoder->interlaced = ARG_INTERLACED_DEFAULT; encoder->profile = ARG_PROFILE_DEFAULT; encoder->option_string = g_string_new (NULL); encoder->option_string_prop = g_string_new (ARG_OPTION_STRING_DEFAULT); encoder->speed_preset = ARG_SPEED_PRESET_DEFAULT; encoder->psy_tune = ARG_PSY_TUNE_DEFAULT; encoder->tune = ARG_TUNE_DEFAULT; /* resources */ encoder->delay = g_queue_new (); encoder->buffer_size = 100000; encoder->buffer = g_malloc (encoder->buffer_size); x264_param_default (&encoder->x264param); /* log callback setup; part of parameters */ encoder->x264param.pf_log = gst_x264_enc_log_callback; encoder->x264param.p_log_private = encoder; encoder->x264param.i_log_level = X264_LOG_DEBUG; gst_segment_init (&encoder->segment, GST_FORMAT_TIME); encoder->force_key_unit_event = NULL; gst_x264_enc_reset (encoder); } static void gst_x264_enc_reset (GstX264Enc * encoder) { encoder->x264enc = NULL; gst_video_info_init (&encoder->info); encoder->current_byte_stream = GST_X264_ENC_STREAM_FORMAT_FROM_PROPERTY; gst_segment_init (&encoder->segment, GST_FORMAT_UNDEFINED); GST_OBJECT_LOCK (encoder); gst_event_replace (&encoder->force_key_unit_event, NULL); encoder->pending_key_unit_ts = GST_CLOCK_TIME_NONE; GST_OBJECT_UNLOCK (encoder); } static void gst_x264_enc_finalize (GObject * object) { GstX264Enc *encoder = GST_X264_ENC (object); #define FREE_STRING(ptr) \ if (ptr) \ g_string_free (ptr, TRUE); FREE_STRING (encoder->tunings); FREE_STRING (encoder->option_string); FREE_STRING (encoder->option_string_prop); #undef FREE_STRING g_free (encoder->mp_cache_file); encoder->mp_cache_file = NULL; g_free (encoder->buffer); encoder->buffer = NULL; g_queue_free (encoder->delay); encoder->delay = NULL; gst_x264_enc_close_encoder (encoder); G_OBJECT_CLASS (parent_class)->finalize (object); } /* * gst_x264_enc_parse_options * @encoder: Encoder to which options are assigned * @str: Option string * * Parse option string and assign to x264 parameters * */ static gboolean gst_x264_enc_parse_options (GstX264Enc * encoder, const gchar * str) { GStrv kvpairs; guint npairs, i; gint parse_result = 0, ret = 0; gchar *options = (gchar *) str; while (*options == ':') options++; kvpairs = g_strsplit (options, ":", 0); npairs = g_strv_length (kvpairs); for (i = 0; i < npairs; i++) { GStrv key_val = g_strsplit (kvpairs[i], "=", 2); parse_result = x264_param_parse (&encoder->x264param, key_val[0], key_val[1]); if (parse_result == X264_PARAM_BAD_NAME) { GST_ERROR_OBJECT (encoder, "Bad name for option %s=%s", key_val[0] ? key_val[0] : "", key_val[1] ? key_val[1] : ""); } if (parse_result == X264_PARAM_BAD_VALUE) { GST_ERROR_OBJECT (encoder, "Bad value for option %s=%s (Note: a NULL value for a non-boolean triggers this)", key_val[0] ? key_val[0] : "", key_val[1] ? key_val[1] : ""); } g_strfreev (key_val); if (parse_result) ret++; } g_strfreev (kvpairs); return !ret; } /* * gst_x264_enc_init_encoder * @encoder: Encoder which should be initialized. * * Initialize x264 encoder. * */ static gboolean gst_x264_enc_init_encoder (GstX264Enc * encoder) { guint pass = 0; gint width, height, fps_n, fps_d; /* make sure that the encoder is closed */ gst_x264_enc_close_encoder (encoder); GST_OBJECT_LOCK (encoder); #ifdef X264_PRESETS gst_x264_enc_build_tunings_string (encoder); /* set x264 parameters and use preset/tuning if present */ GST_DEBUG_OBJECT (encoder, "Applying defaults with preset %s, tunings %s", encoder->speed_preset ? x264_preset_names[encoder->speed_preset - 1] : "", encoder->tunings && encoder->tunings->len ? encoder->tunings->str : ""); x264_param_default_preset (&encoder->x264param, encoder->speed_preset ? x264_preset_names[encoder->speed_preset - 1] : NULL, encoder->tunings && encoder->tunings->len ? encoder->tunings->str : NULL); /* log callback setup; part of parameters * this needs to be done again after every *param_default* () call */ encoder->x264param.pf_log = gst_x264_enc_log_callback; encoder->x264param.p_log_private = encoder; encoder->x264param.i_log_level = X264_LOG_DEBUG; /* if no preset nor tuning, use property defaults */ if (!encoder->speed_preset && !encoder->tunings->len) { #endif /* X264_PRESETS */ GST_DEBUG_OBJECT (encoder, "Applying x264enc_defaults"); if (x264enc_defaults->len && gst_x264_enc_parse_options (encoder, x264enc_defaults->str) == FALSE) { GST_DEBUG_OBJECT (encoder, "x264enc_defaults string contains errors. This is a bug."); goto unlock_and_return; } #ifdef X264_PRESETS } else { /* When using presets we need to respect the default output format */ encoder->x264param.b_aud = encoder->au_nalu; encoder->x264param.b_annexb = encoder->byte_stream; } #endif /* X264_PRESETS */ #if X264_BUILD >= 81 /* setup appropriate timebase for gstreamer */ encoder->x264param.i_timebase_num = 1; encoder->x264param.i_timebase_den = 1000000000; #endif /* apply option-string property */ if (encoder->option_string_prop && encoder->option_string_prop->len) { GST_DEBUG_OBJECT (encoder, "Applying option-string: %s", encoder->option_string_prop->str); if (gst_x264_enc_parse_options (encoder, encoder->option_string_prop->str) == FALSE) { GST_DEBUG_OBJECT (encoder, "Your option-string contains errors."); goto unlock_and_return; } } /* apply user-set options */ if (encoder->option_string && encoder->option_string->len) { GST_DEBUG_OBJECT (encoder, "Applying user-set options: %s", encoder->option_string->str); if (gst_x264_enc_parse_options (encoder, encoder->option_string->str) == FALSE) { GST_DEBUG_OBJECT (encoder, "Failed to parse internal option string. " "This could be due to use of an old libx264 version. Option string " "was: %s", encoder->option_string->str); } } width = GST_VIDEO_INFO_WIDTH (&encoder->info); height = GST_VIDEO_INFO_HEIGHT (&encoder->info); fps_n = GST_VIDEO_INFO_FPS_N (&encoder->info); fps_d = GST_VIDEO_INFO_FPS_D (&encoder->info); /* set up encoder parameters */ encoder->x264param.i_fps_num = fps_n; encoder->x264param.i_fps_den = fps_d; encoder->x264param.i_width = width; encoder->x264param.i_height = height; if (GST_VIDEO_INFO_PAR_D (&encoder->info) > 0) { encoder->x264param.vui.i_sar_width = GST_VIDEO_INFO_PAR_N (&encoder->info); encoder->x264param.vui.i_sar_height = GST_VIDEO_INFO_PAR_D (&encoder->info); } /* FIXME 0.11 : 2s default keyframe interval seems excessive * (10s is x264 default) */ encoder->x264param.i_keyint_max = encoder->keyint_max ? encoder->keyint_max : (2 * fps_n / fps_d); if ((((height == 576) && ((width == 720) || (width == 704) || (width == 352))) || ((height == 288) && (width == 352))) && (fps_d == 1) && (fps_n == 25)) { encoder->x264param.vui.i_vidformat = 1; /* PAL */ } else if ((((height == 480) && ((width == 720) || (width == 704) || (width == 352))) || ((height == 240) && (width == 352))) && (fps_d == 1001) && ((fps_n == 30000) || (fps_n == 24000))) { encoder->x264param.vui.i_vidformat = 2; /* NTSC */ } else encoder->x264param.vui.i_vidformat = 5; /* unspecified */ encoder->x264param.analyse.b_psnr = 0; switch (encoder->pass) { case GST_X264_ENC_PASS_QUANT: encoder->x264param.rc.i_rc_method = X264_RC_CQP; encoder->x264param.rc.i_qp_constant = encoder->quantizer; break; case GST_X264_ENC_PASS_QUAL: encoder->x264param.rc.i_rc_method = X264_RC_CRF; encoder->x264param.rc.f_rf_constant = encoder->quantizer; encoder->x264param.rc.i_vbv_max_bitrate = encoder->bitrate; encoder->x264param.rc.i_vbv_buffer_size = encoder->x264param.rc.i_vbv_max_bitrate * encoder->vbv_buf_capacity / 1000; break; case GST_X264_ENC_PASS_CBR: case GST_X264_ENC_PASS_PASS1: case GST_X264_ENC_PASS_PASS2: case GST_X264_ENC_PASS_PASS3: default: encoder->x264param.rc.i_rc_method = X264_RC_ABR; encoder->x264param.rc.i_bitrate = encoder->bitrate; encoder->x264param.rc.i_vbv_max_bitrate = encoder->bitrate; encoder->x264param.rc.i_vbv_buffer_size = encoder->x264param.rc.i_vbv_max_bitrate * encoder->vbv_buf_capacity / 1000; pass = encoder->pass & 0xF; break; } switch (pass) { case 0: encoder->x264param.rc.b_stat_read = 0; encoder->x264param.rc.b_stat_write = 0; break; case 1: encoder->x264param.rc.b_stat_read = 0; encoder->x264param.rc.b_stat_write = 1; #ifdef X264_PRESETS x264_param_apply_fastfirstpass (&encoder->x264param); #else encoder->x264param.i_frame_reference = 1; encoder->x264param.analyse.b_transform_8x8 = 0; encoder->x264param.analyse.inter = 0; encoder->x264param.analyse.i_me_method = X264_ME_DIA; encoder->x264param.analyse.i_subpel_refine = MIN (2, encoder->x264param.analyse.i_subpel_refine); encoder->x264param.analyse.i_trellis = 0; encoder->x264param.analyse.b_fast_pskip = 1; #endif /* X264_PRESETS */ break; case 2: encoder->x264param.rc.b_stat_read = 1; encoder->x264param.rc.b_stat_write = 0; break; case 3: encoder->x264param.rc.b_stat_read = 1; encoder->x264param.rc.b_stat_write = 1; break; } #if X264_BUILD >= 81 && X264_BUILD < 106 /* When vfr is disabled, libx264 ignores buffer timestamps. This causes * issues with rate control in libx264 with our nanosecond timebase. This * has been fixed upstream in libx264 but this workaround is required for * pre-fix versions. */ if (!encoder->x264param.b_vfr_input) { if (encoder->x264param.i_fps_num == 0) { GST_ELEMENT_ERROR (encoder, STREAM, ENCODE, ("Constant framerate is required."), ("The framerate caps (%d/%d) indicate VFR but VFR is disabled in libx264. (Is the zerolatency tuning in use?)", encoder->x264param.i_fps_num, encoder->x264param.i_fps_den)); return FALSE; } encoder->x264param.i_timebase_num = encoder->x264param.i_fps_den; encoder->x264param.i_timebase_den = encoder->x264param.i_fps_num; } #endif #ifdef X264_PRESETS if (encoder->peer_profile) { if (x264_param_apply_profile (&encoder->x264param, encoder->peer_profile)) GST_WARNING_OBJECT (encoder, "Bad downstream profile name: %s", encoder->peer_profile); } else if (encoder->profile) { if (x264_param_apply_profile (&encoder->x264param, x264_profile_names[encoder->profile - 1])) GST_WARNING_OBJECT (encoder, "Bad profile name: %s", x264_profile_names[encoder->profile - 1]); } #endif /* X264_PRESETS */ /* If using an intra profile, all frames are intra frames */ if (encoder->peer_intra_profile) encoder->x264param.i_keyint_max = encoder->x264param.i_keyint_min = 1; /* Enforce level limits if they were in the caps */ if (encoder->peer_level) { encoder->x264param.i_level_idc = encoder->peer_level->level_idc; encoder->x264param.rc.i_bitrate = MIN (encoder->x264param.rc.i_bitrate, encoder->peer_level->bitrate); encoder->x264param.rc.i_vbv_max_bitrate = MIN (encoder->x264param.rc.i_vbv_max_bitrate, encoder->peer_level->bitrate); encoder->x264param.rc.i_vbv_buffer_size = MIN (encoder->x264param.rc.i_vbv_buffer_size, encoder->peer_level->cpb); encoder->x264param.analyse.i_mv_range = MIN (encoder->x264param.analyse.i_mv_range, encoder->peer_level->mv_range); if (encoder->peer_level->frame_only) { encoder->x264param.b_interlaced = FALSE; #if X264_BUILD >= 95 encoder->x264param.b_fake_interlaced = FALSE; #endif } } encoder->reconfig = FALSE; GST_OBJECT_UNLOCK (encoder); encoder->x264enc = x264_encoder_open (&encoder->x264param); if (!encoder->x264enc) { GST_ELEMENT_ERROR (encoder, STREAM, ENCODE, ("Can not initialize x264 encoder."), (NULL)); return FALSE; } return TRUE; unlock_and_return: GST_OBJECT_UNLOCK (encoder); return FALSE; } /* gst_x264_enc_close_encoder * @encoder: Encoder which should close. * * Close x264 encoder. */ static void gst_x264_enc_close_encoder (GstX264Enc * encoder) { if (encoder->x264enc != NULL) { x264_encoder_close (encoder->x264enc); encoder->x264enc = NULL; } } static gboolean gst_x264_enc_set_profile_and_level (GstX264Enc * encoder, GstCaps * caps) { x264_nal_t *nal; int i_nal; int header_return; gint sps_ni = 0; guint8 *sps; header_return = x264_encoder_headers (encoder->x264enc, &nal, &i_nal); if (header_return < 0) { GST_ELEMENT_ERROR (encoder, STREAM, ENCODE, ("Encode x264 header failed."), ("x264_encoder_headers return code=%d", header_return)); return FALSE; } /* old x264 returns SEI, SPS and PPS, newer one has SEI last */ if (i_nal == 3 && nal[sps_ni].i_type != 7) sps_ni = 1; /* old style API: nal's are not encapsulated, and have no sync/size prefix, * new style API: nal's are encapsulated, and have 4-byte size prefix */ #ifndef X264_ENC_NALS sps = nal[sps_ni].p_payload; #else sps = nal[sps_ni].p_payload + 4; /* skip NAL unit type */ sps++; #endif gst_codec_utils_h264_caps_set_level_and_profile (caps, sps, 3); return TRUE; } /* * Returns: Buffer with the stream headers. */ static GstBuffer * gst_x264_enc_header_buf (GstX264Enc * encoder) { GstBuffer *buf; x264_nal_t *nal; int i_nal; int header_return; int i_size; int nal_size; #ifndef X264_ENC_NALS int i_data; #endif guint8 *buffer, *sps; gulong buffer_size; gint sei_ni = 2, sps_ni = 0, pps_ni = 1; if (G_UNLIKELY (encoder->x264enc == NULL)) return NULL; /* Create avcC header. */ header_return = x264_encoder_headers (encoder->x264enc, &nal, &i_nal); if (header_return < 0) { GST_ELEMENT_ERROR (encoder, STREAM, ENCODE, ("Encode x264 header failed."), ("x264_encoder_headers return code=%d", header_return)); return NULL; } /* old x264 returns SEI, SPS and PPS, newer one has SEI last */ if (i_nal == 3 && nal[sps_ni].i_type != 7) { sei_ni = 0; sps_ni = 1; pps_ni = 2; } /* x264 is expected to return an SEI (some identification info), * and SPS and PPS */ if (i_nal != 3 || nal[sps_ni].i_type != 7 || nal[pps_ni].i_type != 8 || nal[sps_ni].i_payload < 4 || nal[pps_ni].i_payload < 1) { GST_ELEMENT_ERROR (encoder, STREAM, ENCODE, (NULL), ("Unexpected x264 header.")); return NULL; } GST_MEMDUMP ("SEI", nal[sei_ni].p_payload, nal[sei_ni].i_payload); GST_MEMDUMP ("SPS", nal[sps_ni].p_payload, nal[sps_ni].i_payload); GST_MEMDUMP ("PPS", nal[pps_ni].p_payload, nal[pps_ni].i_payload); /* nal payloads with emulation_prevention_three_byte, and some header data */ buffer_size = (nal[sps_ni].i_payload + nal[pps_ni].i_payload) * 4 + 100; buffer = g_malloc (buffer_size); /* old style API: nal's are not encapsulated, and have no sync/size prefix, * new style API: nal's are encapsulated, and have 4-byte size prefix */ #ifndef X264_ENC_NALS sps = nal[sps_ni].p_payload; #else sps = nal[sps_ni].p_payload + 4; /* skip NAL unit type */ sps++; #endif buffer[0] = 1; /* AVC Decoder Configuration Record ver. 1 */ buffer[1] = sps[0]; /* profile_idc */ buffer[2] = sps[1]; /* profile_compability */ buffer[3] = sps[2]; /* level_idc */ buffer[4] = 0xfc | (4 - 1); /* nal_length_size_minus1 */ i_size = 5; buffer[i_size++] = 0xe0 | 1; /* number of SPSs */ #ifndef X264_ENC_NALS i_data = buffer_size - i_size - 2; nal_size = x264_nal_encode (buffer + i_size + 2, &i_data, 0, &nal[sps_ni]); #else nal_size = nal[sps_ni].i_payload - 4; memcpy (buffer + i_size + 2, nal[sps_ni].p_payload + 4, nal_size); #endif GST_WRITE_UINT16_BE (buffer + i_size, nal_size); i_size += nal_size + 2; buffer[i_size++] = 1; /* number of PPSs */ #ifndef X264_ENC_NALS i_data = buffer_size - i_size - 2; nal_size = x264_nal_encode (buffer + i_size + 2, &i_data, 0, &nal[pps_ni]); #else nal_size = nal[pps_ni].i_payload - 4; memcpy (buffer + i_size + 2, nal[pps_ni].p_payload + 4, nal_size); #endif GST_WRITE_UINT16_BE (buffer + i_size, nal_size); i_size += nal_size + 2; buf = gst_buffer_new_and_alloc (i_size); gst_buffer_fill (buf, 0, buffer, i_size); GST_MEMDUMP ("header", buffer, i_size); g_free (buffer); return buf; } /* gst_x264_enc_set_src_caps * Returns: TRUE on success. */ static gboolean gst_x264_enc_set_src_caps (GstX264Enc * encoder, GstPad * pad, GstCaps * caps) { GstBuffer *buf; GstCaps *outcaps; GstStructure *structure; gboolean res; outcaps = gst_caps_new_simple ("video/x-h264", "width", G_TYPE_INT, GST_VIDEO_INFO_WIDTH (&encoder->info), "height", G_TYPE_INT, GST_VIDEO_INFO_HEIGHT (&encoder->info), "framerate", GST_TYPE_FRACTION, GST_VIDEO_INFO_FPS_N (&encoder->info), GST_VIDEO_INFO_FPS_D (&encoder->info), "pixel-aspect-ratio", GST_TYPE_FRACTION, GST_VIDEO_INFO_PAR_N (&encoder->info), GST_VIDEO_INFO_PAR_D (&encoder->info), NULL); structure = gst_caps_get_structure (outcaps, 0); if (encoder->current_byte_stream == GST_X264_ENC_STREAM_FORMAT_FROM_PROPERTY) { if (encoder->byte_stream) { encoder->current_byte_stream = GST_X264_ENC_STREAM_FORMAT_BYTE_STREAM; } else { encoder->current_byte_stream = GST_X264_ENC_STREAM_FORMAT_AVC; } } if (encoder->current_byte_stream == GST_X264_ENC_STREAM_FORMAT_AVC) { buf = gst_x264_enc_header_buf (encoder); if (buf != NULL) { gst_caps_set_simple (outcaps, "codec_data", GST_TYPE_BUFFER, buf, NULL); gst_buffer_unref (buf); } gst_structure_set (structure, "stream-format", G_TYPE_STRING, "avc", NULL); } else { gst_structure_set (structure, "stream-format", G_TYPE_STRING, "byte-stream", NULL); } gst_structure_set (structure, "alignment", G_TYPE_STRING, "au", NULL); if (!gst_x264_enc_set_profile_and_level (encoder, outcaps)) { gst_caps_unref (outcaps); return FALSE; } res = gst_pad_set_caps (pad, outcaps); gst_caps_unref (outcaps); return res; } static gboolean gst_x264_enc_sink_set_caps (GstPad * pad, GstCaps * caps) { GstX264Enc *encoder = GST_X264_ENC (GST_OBJECT_PARENT (pad)); GstVideoInfo info; gint width, height; gint fps_n, fps_d; gint par_n, par_d; GstCaps *peer_caps; GstCaps *allowed_caps = NULL; gboolean level_ok = TRUE; /* get info from caps */ if (!gst_video_info_from_caps (&info, caps)) goto invalid_caps; width = GST_VIDEO_INFO_WIDTH (&info); height = GST_VIDEO_INFO_HEIGHT (&info); fps_n = GST_VIDEO_INFO_FPS_N (&info); fps_d = GST_VIDEO_INFO_FPS_D (&info); par_n = GST_VIDEO_INFO_PAR_N (&info); par_d = GST_VIDEO_INFO_PAR_D (&info); /* If the encoder is initialized, do not reinitialize it again if not * necessary */ if (encoder->x264enc) { if (width == GST_VIDEO_INFO_WIDTH (&encoder->info) && height == GST_VIDEO_INFO_HEIGHT (&encoder->info) && fps_n == GST_VIDEO_INFO_FPS_N (&encoder->info) && fps_d == GST_VIDEO_INFO_FPS_D (&encoder->info) && par_n == GST_VIDEO_INFO_PAR_N (&encoder->info) && par_d == GST_VIDEO_INFO_PAR_D (&encoder->info)) return TRUE; /* clear out pending frames */ gst_x264_enc_flush_frames (encoder, TRUE); encoder->sps_id++; } /* store input description */ encoder->info = info; encoder->peer_profile = NULL; encoder->peer_intra_profile = FALSE; encoder->peer_level = NULL; /* FIXME: Remove THIS bit in 0.11 when the profile property is removed */ peer_caps = gst_pad_peer_query_caps (encoder->srcpad, NULL); if (peer_caps) { gint i; gboolean has_profile_or_level_or_format = FALSE; for (i = 0; i < gst_caps_get_size (peer_caps); i++) { GstStructure *s = gst_caps_get_structure (peer_caps, i); if (gst_structure_has_name (s, "video/x-h264") && (gst_structure_has_field (s, "profile") || gst_structure_has_field (s, "level") || gst_structure_has_field (s, "stream-format"))) { has_profile_or_level_or_format = TRUE; break; } } if (has_profile_or_level_or_format) { GstCaps *template_caps; template_caps = gst_pad_get_pad_template_caps (encoder->srcpad); allowed_caps = gst_caps_intersect (peer_caps, template_caps); gst_caps_unref (template_caps); } gst_caps_unref (peer_caps); } /* Replace the bit since FIXME with this * allowed_caps = gst_pad_get_allowed_caps (encoder->srcpad); */ if (allowed_caps) { GstStructure *s; const gchar *profile; const gchar *level; const gchar *stream_format; if (gst_caps_is_empty (allowed_caps)) { gst_caps_unref (allowed_caps); return FALSE; } allowed_caps = gst_caps_fixate (allowed_caps); allowed_caps = gst_caps_make_writable (allowed_caps); s = gst_caps_get_structure (allowed_caps, 0); profile = gst_structure_get_string (s, "profile"); if (profile) { /* FIXME - if libx264 ever adds support for FMO, ASO or redundant slices * make sure constrained profile has a separate case which disables * those */ if (!strcmp (profile, "constrained-baseline") || !strcmp (profile, "baseline")) { encoder->peer_profile = "baseline"; } else if (!strcmp (profile, "high-10-intra")) { encoder->peer_intra_profile = TRUE; encoder->peer_profile = "high10"; } else if (!strcmp (profile, "high-10")) { encoder->peer_profile = "high10"; } else if (!strcmp (profile, "high")) { encoder->peer_profile = "high"; } else if (!strcmp (profile, "main")) { encoder->peer_profile = "main"; } else { g_assert_not_reached (); } } level = gst_structure_get_string (s, "level"); if (level) { int level_idc = gst_codec_utils_h264_get_level_idc (level); if (level_idc) { gint i; for (i = 0; x264_levels[i].level_idc; i++) { if (level_idc == x264_levels[i].level_idc) { int mb_width = (width + 15) / 16; int mb_height = (height + 15) / 16; int mbs = mb_width * mb_height; if (x264_levels[i].frame_size < mbs || x264_levels[i].frame_size * 8 < mb_width * mb_width || x264_levels[i].frame_size * 8 < mb_height * mb_height) { GST_WARNING_OBJECT (encoder, "Frame size larger than level %s allows", level); level_ok = FALSE; break; } if (fps_d && x264_levels[i].mbps < (gint64) mbs * fps_n / fps_d) { GST_WARNING_OBJECT (encoder, "Macroblock rate higher than level %s allows", level); level_ok = FALSE; break; } encoder->peer_level = &x264_levels[i]; break; } } } } stream_format = gst_structure_get_string (s, "stream-format"); encoder->current_byte_stream = GST_X264_ENC_STREAM_FORMAT_FROM_PROPERTY; if (stream_format) { if (!strcmp (stream_format, "avc")) { encoder->current_byte_stream = GST_X264_ENC_STREAM_FORMAT_AVC; g_string_append_printf (encoder->option_string, ":annexb=0"); } else if (!strcmp (stream_format, "byte-stream")) { encoder->current_byte_stream = GST_X264_ENC_STREAM_FORMAT_BYTE_STREAM; g_string_append_printf (encoder->option_string, ":annexb=1"); } else { /* means we have both in caps and _FROM_PROPERTY should be the option */ } } gst_caps_unref (allowed_caps); } if (!level_ok) return FALSE; if (!gst_x264_enc_init_encoder (encoder)) return FALSE; if (!gst_x264_enc_set_src_caps (encoder, encoder->srcpad, caps)) { gst_x264_enc_close_encoder (encoder); return FALSE; } return TRUE; /* ERRORS */ invalid_caps: { GST_ERROR_OBJECT (encoder, "invalid caps"); return FALSE; } } static GstCaps * gst_x264_enc_sink_get_caps (GstPad * pad, GstCaps * filter) { GstX264Enc *encoder; GstPad *peer; GstCaps *caps, *current; GstCaps *templcaps; encoder = GST_X264_ENC (gst_pad_get_parent (pad)); if (!encoder) return gst_caps_new_empty (); templcaps = gst_pad_get_pad_template_caps (pad); peer = gst_pad_get_peer (encoder->srcpad); if (peer) { GstCaps *peercaps; guint i, n; peercaps = gst_pad_query_caps (peer, NULL); /* Translate peercaps to YUV */ peercaps = gst_caps_make_writable (peercaps); n = gst_caps_get_size (peercaps); for (i = 0; i < n; i++) { GstStructure *s = gst_caps_get_structure (peercaps, i); gst_structure_set_name (s, "video/x-raw"); gst_structure_remove_field (s, "stream-format"); gst_structure_remove_field (s, "alignment"); } caps = gst_caps_intersect (peercaps, templcaps); gst_caps_unref (peercaps); gst_caps_unref (templcaps); gst_object_unref (peer); peer = NULL; } else { caps = templcaps; } /* If we already have caps return them */ current = gst_pad_get_current_caps (pad); if (current) { if (gst_caps_can_intersect (current, caps)) { caps = gst_caps_merge (current, caps); } else { gst_caps_unref (current); } } gst_object_unref (encoder); return caps; } static gboolean gst_x264_enc_src_event (GstPad * pad, GstObject * parent, GstEvent * event) { gboolean ret = TRUE; GstX264Enc *encoder; gboolean forward = TRUE; encoder = GST_X264_ENC (parent); switch (GST_EVENT_TYPE (event)) { case GST_EVENT_CUSTOM_UPSTREAM:{ guint count; gboolean all_headers; if (!gst_video_event_is_force_key_unit (event)) goto out; GST_OBJECT_LOCK (encoder); gst_video_event_parse_upstream_force_key_unit (event, &encoder->pending_key_unit_ts, &all_headers, &count); GST_INFO_OBJECT (encoder, "received upstream force-key-unit event, " "seqnum %d running_time %" GST_TIME_FORMAT " all_headers %d count %d", gst_event_get_seqnum (event), GST_TIME_ARGS (encoder->pending_key_unit_ts), all_headers, count); gst_event_replace (&encoder->force_key_unit_event, event); gst_event_unref (event); GST_OBJECT_UNLOCK (encoder); forward = FALSE; break; } default: break; } out: if (forward) ret = gst_pad_push_event (encoder->sinkpad, event); return ret; } static gboolean gst_x264_enc_sink_event (GstPad * pad, GstObject * parent, GstEvent * event) { gboolean ret = FALSE, forward = TRUE; GstX264Enc *encoder; encoder = GST_X264_ENC (parent); switch (GST_EVENT_TYPE (event)) { case GST_EVENT_CAPS: { GstCaps *caps; gst_event_parse_caps (event, &caps); ret = gst_x264_enc_sink_set_caps (pad, caps); forward = FALSE; break; } case GST_EVENT_SEGMENT: gst_event_copy_segment (event, &encoder->segment); break; case GST_EVENT_FLUSH_STOP: gst_segment_init (&encoder->segment, GST_FORMAT_UNDEFINED); break; case GST_EVENT_EOS: gst_x264_enc_flush_frames (encoder, TRUE); break; case GST_EVENT_TAG:{ GstTagList *tags = NULL; event = GST_EVENT (gst_mini_object_make_writable (GST_MINI_OBJECT (event))); gst_event_parse_tag (event, &tags); /* drop codec/video-codec and replace encoder/encoder-version */ gst_tag_list_remove_tag (tags, GST_TAG_VIDEO_CODEC); gst_tag_list_remove_tag (tags, GST_TAG_CODEC); gst_tag_list_add (tags, GST_TAG_MERGE_REPLACE, GST_TAG_ENCODER, "x264", GST_TAG_ENCODER_VERSION, X264_BUILD, NULL); /* push is done below */ break; /* no flushing if flush received, * buffers in encoder are considered (in the) past */ } case GST_EVENT_CUSTOM_DOWNSTREAM:{ guint count; gboolean all_headers; if (!gst_video_event_is_force_key_unit (event)) break; GST_OBJECT_LOCK (encoder); gst_video_event_parse_downstream_force_key_unit (event, NULL, NULL, &encoder->pending_key_unit_ts, &all_headers, &count); GST_INFO_OBJECT (encoder, "received downstream force-key-unit event, " "seqnum %d running_time %" GST_TIME_FORMAT " all_headers %d count %d", gst_event_get_seqnum (event), GST_TIME_ARGS (encoder->pending_key_unit_ts), all_headers, count); gst_event_replace (&encoder->force_key_unit_event, event); gst_event_unref (event); GST_OBJECT_UNLOCK (encoder); break; } default: break; } if (forward) ret = gst_pad_push_event (encoder->srcpad, event); else gst_event_unref (event); return ret; } static gboolean gst_x264_enc_sink_query (GstPad * pad, GstObject * parent, GstQuery * query) { gboolean ret = FALSE; switch (GST_QUERY_TYPE (query)) { case GST_QUERY_CAPS: { GstCaps *filter, *caps; gst_query_parse_caps (query, &filter); caps = gst_x264_enc_sink_get_caps (pad, filter); gst_query_set_caps_result (query, caps); gst_caps_unref (caps); ret = TRUE; break; } default: ret = gst_pad_query_default (pad, parent, query); break; } return ret; } /* chain function * this function does the actual processing */ static GstFlowReturn gst_x264_enc_chain (GstPad * pad, GstObject * parent, GstBuffer * buf) { GstX264Enc *encoder = GST_X264_ENC (parent); GstFlowReturn ret; x264_picture_t pic_in; gint i_nal, i; GstVideoFrame frame; if (G_UNLIKELY (encoder->x264enc == NULL)) goto not_inited; /* create x264_picture_t from the buffer */ /* mostly taken from mplayer (file ve_x264.c) */ if (!gst_video_frame_map (&frame, &encoder->info, buf, GST_MAP_READ)) goto wrong_video_frame; /* remember the timestamp and duration */ g_queue_push_tail (encoder->delay, buf); /* set up input picture */ memset (&pic_in, 0, sizeof (pic_in)); pic_in.img.i_csp = X264_CSP_I420; pic_in.img.i_plane = 3; for (i = 0; i < 3; i++) { pic_in.img.plane[i] = GST_VIDEO_FRAME_COMP_DATA (&frame, i); pic_in.img.i_stride[i] = GST_VIDEO_FRAME_COMP_STRIDE (&frame, i); } pic_in.i_type = X264_TYPE_AUTO; pic_in.i_dts = GST_BUFFER_DTS (buf); pic_in.i_pts = GST_BUFFER_PTS (buf); ret = gst_x264_enc_encode_frame (encoder, &pic_in, &i_nal, TRUE); gst_video_frame_unmap (&frame); /* input buffer is released later on */ return ret; /* ERRORS */ not_inited: { GST_WARNING_OBJECT (encoder, "Got buffer before set_caps was called"); gst_buffer_unref (buf); return GST_FLOW_NOT_NEGOTIATED; } wrong_video_frame: { GST_ELEMENT_ERROR (encoder, STREAM, ENCODE, ("Encode x264 frame failed."), ("Could not map video frame")); gst_buffer_unref (buf); return GST_FLOW_ERROR; } } static GstEvent * check_pending_key_unit_event (GstEvent * pending_event, GstSegment * segment, GstClockTime timestamp, GstClockTime pending_key_unit_ts) { GstClockTime running_time, stream_time; gboolean all_headers; guint count; GstEvent *event = NULL; g_return_val_if_fail (pending_event != NULL, NULL); g_return_val_if_fail (segment != NULL, NULL); if (pending_event == NULL || timestamp == GST_CLOCK_TIME_NONE) goto out; running_time = gst_segment_to_running_time (segment, GST_FORMAT_TIME, timestamp); GST_INFO ("now %" GST_TIME_FORMAT " wanted %" GST_TIME_FORMAT, GST_TIME_ARGS (running_time), GST_TIME_ARGS (pending_key_unit_ts)); if (running_time < pending_key_unit_ts) goto out; stream_time = gst_segment_to_stream_time (segment, GST_FORMAT_TIME, timestamp); gst_video_event_parse_upstream_force_key_unit (pending_event, NULL, &all_headers, &count); event = gst_video_event_new_downstream_force_key_unit (timestamp, stream_time, running_time, all_headers, count); gst_event_set_seqnum (event, gst_event_get_seqnum (pending_event)); out: return event; } static GstFlowReturn gst_x264_enc_encode_frame (GstX264Enc * encoder, x264_picture_t * pic_in, int *i_nal, gboolean send) { GstFlowReturn ret; GstBuffer *out_buf = NULL, *in_buf = NULL; x264_picture_t pic_out; x264_nal_t *nal; int i_size; #ifndef X264_ENC_NALS int nal_size; gint i; #endif int encoder_return; GstClockTime duration; guint8 *data; GstEvent *event = NULL; if (G_UNLIKELY (encoder->x264enc == NULL)) return GST_FLOW_NOT_NEGOTIATED; GST_OBJECT_LOCK (encoder); if (encoder->reconfig) { encoder->reconfig = FALSE; if (x264_encoder_reconfig (encoder->x264enc, &encoder->x264param) < 0) GST_WARNING_OBJECT (encoder, "Could not reconfigure"); } if (encoder->pending_key_unit_ts != GST_CLOCK_TIME_NONE && pic_in != NULL) { event = check_pending_key_unit_event (encoder->force_key_unit_event, &encoder->segment, pic_in->i_pts, encoder->pending_key_unit_ts); if (event) { encoder->pending_key_unit_ts = GST_CLOCK_TIME_NONE; gst_event_replace (&encoder->force_key_unit_event, NULL); #ifdef FORCE_INTRA_API if (encoder->intra_refresh) x264_encoder_intra_refresh (encoder->x264enc); else pic_in->i_type = X264_TYPE_IDR; #else pic_in->i_type = X264_TYPE_IDR; #endif } } GST_OBJECT_UNLOCK (encoder); encoder_return = x264_encoder_encode (encoder->x264enc, &nal, i_nal, pic_in, &pic_out); if (encoder_return < 0) goto encode_failed; if (!*i_nal) { ret = GST_FLOW_OK; goto out; } #ifndef X264_ENC_NALS i_size = 0; for (i = 0; i < *i_nal; i++) { gint i_data = encoder->buffer_size - i_size - 4; if (i_data < nal[i].i_payload * 2) { encoder->buffer_size += 2 * nal[i].i_payload; encoder->buffer = g_realloc (encoder->buffer, encoder->buffer_size); i_data = encoder->buffer_size - i_size - 4; } nal_size = x264_nal_encode (encoder->buffer + i_size + 4, &i_data, 0, &nal[i]); g_assert (encoder->current_byte_stream != GST_X264_ENC_STREAM_FORMAT_FROM_PROPERTY); if (encoder->current_byte_stream == GST_X264_ENC_STREAM_FORMAT_BYTE_STREAM) GST_WRITE_UINT32_BE (encoder->buffer + i_size, 1); else GST_WRITE_UINT32_BE (encoder->buffer + i_size, nal_size); i_size += nal_size + 4; } data = encoder->buffer; #else i_size = encoder_return; data = nal[0].p_payload; #endif in_buf = g_queue_pop_head (encoder->delay); if (in_buf) { duration = GST_BUFFER_DURATION (in_buf); gst_buffer_unref (in_buf); } else { GST_ELEMENT_ERROR (encoder, STREAM, ENCODE, (NULL), ("Timestamp queue empty.")); ret = GST_FLOW_ERROR; goto out; } if (!send) { ret = GST_FLOW_OK; goto out; } out_buf = gst_buffer_new_allocate (NULL, i_size, NULL); gst_buffer_fill (out_buf, 0, data, i_size); GST_LOG_OBJECT (encoder, "output: dts %" G_GINT64_FORMAT " pts %" G_GINT64_FORMAT, (gint64) pic_out.i_dts, (gint64) pic_out.i_pts); if (pic_out.i_dts < 0) GST_BUFFER_DTS (out_buf) = GST_CLOCK_TIME_NONE; else GST_BUFFER_DTS (out_buf) = pic_out.i_dts; GST_BUFFER_PTS (out_buf) = pic_out.i_pts; GST_BUFFER_DURATION (out_buf) = duration; #ifdef X264_INTRA_REFRESH if (pic_out.b_keyframe) { #else if (pic_out.i_type == X264_TYPE_IDR) { #endif GST_BUFFER_FLAG_UNSET (out_buf, GST_BUFFER_FLAG_DELTA_UNIT); } else { GST_BUFFER_FLAG_SET (out_buf, GST_BUFFER_FLAG_DELTA_UNIT); } if (event) gst_pad_push_event (encoder->srcpad, gst_event_ref (event)); ret = gst_pad_push (encoder->srcpad, out_buf); out: if (event) gst_event_unref (event); return ret; /* ERRORS */ encode_failed: { GST_ELEMENT_ERROR (encoder, STREAM, ENCODE, ("Encode x264 frame failed."), ("x264_encoder_encode return code=%d", encoder_return)); ret = GST_FLOW_ERROR; goto out; } } static void gst_x264_enc_flush_frames (GstX264Enc * encoder, gboolean send) { GstFlowReturn flow_ret; gint i_nal; /* first send the remaining frames */ if (encoder->x264enc) do { flow_ret = gst_x264_enc_encode_frame (encoder, NULL, &i_nal, send); #ifdef X264_DELAYED_FRAMES_API } while (flow_ret == GST_FLOW_OK && x264_encoder_delayed_frames (encoder->x264enc) > 0); #else /* note that this doesn't flush all frames for > 1 delayed frame */ } while (flow_ret == GST_FLOW_OK && i_nal > 0); #endif /* in any case, make sure the delay queue is emptied */ while (!g_queue_is_empty (encoder->delay)) gst_buffer_unref (g_queue_pop_head (encoder->delay)); } static GstStateChangeReturn gst_x264_enc_change_state (GstElement * element, GstStateChange transition) { GstX264Enc *encoder = GST_X264_ENC (element); GstStateChangeReturn ret = GST_STATE_CHANGE_SUCCESS; ret = GST_ELEMENT_CLASS (parent_class)->change_state (element, transition); if (ret == GST_STATE_CHANGE_FAILURE) goto out; switch (transition) { case GST_STATE_CHANGE_PAUSED_TO_READY: gst_x264_enc_flush_frames (encoder, FALSE); gst_x264_enc_close_encoder (encoder); gst_x264_enc_reset (encoder); break; default: break; } out: return ret; } static void gst_x264_enc_reconfig (GstX264Enc * encoder) { switch (encoder->pass) { case GST_X264_ENC_PASS_QUAL: encoder->x264param.rc.f_rf_constant = encoder->quantizer; encoder->x264param.rc.i_vbv_max_bitrate = encoder->bitrate; encoder->x264param.rc.i_vbv_buffer_size = encoder->x264param.rc.i_vbv_max_bitrate * encoder->vbv_buf_capacity / 1000; break; case GST_X264_ENC_PASS_CBR: case GST_X264_ENC_PASS_PASS1: case GST_X264_ENC_PASS_PASS2: case GST_X264_ENC_PASS_PASS3: default: encoder->x264param.rc.i_bitrate = encoder->bitrate; encoder->x264param.rc.i_vbv_max_bitrate = encoder->bitrate; encoder->x264param.rc.i_vbv_buffer_size = encoder->x264param.rc.i_vbv_max_bitrate * encoder->vbv_buf_capacity / 1000; break; } encoder->reconfig = TRUE; } static void gst_x264_enc_set_property (GObject * object, guint prop_id, const GValue * value, GParamSpec * pspec) { GstX264Enc *encoder; GstState state; const gchar *partitions = NULL; encoder = GST_X264_ENC (object); GST_OBJECT_LOCK (encoder); /* state at least matters for sps, bytestream, pass, * and so by extension ... */ state = GST_STATE (encoder); if ((state != GST_STATE_READY && state != GST_STATE_NULL) && !(pspec->flags & GST_PARAM_MUTABLE_PLAYING)) goto wrong_state; switch (prop_id) { case ARG_PASS: encoder->pass = g_value_get_enum (value); break; case ARG_QUANTIZER: encoder->quantizer = g_value_get_uint (value); gst_x264_enc_reconfig (encoder); break; case ARG_BITRATE: encoder->bitrate = g_value_get_uint (value); gst_x264_enc_reconfig (encoder); break; case ARG_VBV_BUF_CAPACITY: encoder->vbv_buf_capacity = g_value_get_uint (value); gst_x264_enc_reconfig (encoder); break; case ARG_SPEED_PRESET: encoder->speed_preset = g_value_get_enum (value); break; case ARG_PSY_TUNE: encoder->psy_tune = g_value_get_enum (value); break; case ARG_TUNE: encoder->tune = g_value_get_flags (value); break; case ARG_PROFILE: encoder->profile = g_value_get_enum (value); break; case ARG_OPTION_STRING: g_string_assign (encoder->option_string_prop, g_value_get_string (value)); break; case ARG_THREADS: encoder->threads = g_value_get_uint (value); g_string_append_printf (encoder->option_string, ":threads=%d", encoder->threads); break; case ARG_SLICED_THREADS: encoder->sliced_threads = g_value_get_boolean (value); g_string_append_printf (encoder->option_string, ":sliced-threads=%d", encoder->sliced_threads); break; case ARG_SYNC_LOOKAHEAD: encoder->sync_lookahead = g_value_get_int (value); g_string_append_printf (encoder->option_string, ":sync-lookahead=%d", encoder->sync_lookahead); break; case ARG_STATS_FILE: case ARG_MULTIPASS_CACHE_FILE: if (encoder->mp_cache_file) g_free (encoder->mp_cache_file); encoder->mp_cache_file = g_value_dup_string (value); g_string_append_printf (encoder->option_string, ":stats=%s", encoder->mp_cache_file); break; case ARG_BYTE_STREAM: encoder->byte_stream = g_value_get_boolean (value); g_string_append_printf (encoder->option_string, ":annexb=%d", encoder->byte_stream); break; case ARG_INTRA_REFRESH: encoder->intra_refresh = g_value_get_boolean (value); g_string_append_printf (encoder->option_string, ":intra-refresh=%d", encoder->intra_refresh); break; case ARG_ME: encoder->me = g_value_get_enum (value); g_string_append_printf (encoder->option_string, ":me=%s", x264_motion_est_names[encoder->me]); break; case ARG_SUBME: encoder->subme = g_value_get_uint (value); g_string_append_printf (encoder->option_string, ":subme=%d", encoder->subme); break; case ARG_ANALYSE: encoder->analyse = g_value_get_flags (value); partitions = gst_x264_enc_build_partitions (encoder->analyse); if (partitions) { g_string_append_printf (encoder->option_string, ":partitions=%s", partitions); g_free ((gpointer) partitions); } break; case ARG_DCT8x8: encoder->dct8x8 = g_value_get_boolean (value); g_string_append_printf (encoder->option_string, ":8x8dct=%d", encoder->dct8x8); break; case ARG_REF: encoder->ref = g_value_get_uint (value); g_string_append_printf (encoder->option_string, ":ref=%d", encoder->ref); break; case ARG_BFRAMES: encoder->bframes = g_value_get_uint (value); g_string_append_printf (encoder->option_string, ":bframes=%d", encoder->bframes); break; case ARG_B_ADAPT: encoder->b_adapt = g_value_get_boolean (value); g_string_append_printf (encoder->option_string, ":b-adapt=%d", encoder->b_adapt); break; case ARG_B_PYRAMID: encoder->b_pyramid = g_value_get_boolean (value); #ifdef X264_B_PYRAMID g_string_append_printf (encoder->option_string, ":b-pyramid=%s", x264_b_pyramid_names[encoder->b_pyramid]); #else g_string_append_printf (encoder->option_string, ":b-pyramid=%d", encoder->b_pyramid); #endif /* X264_B_PYRAMID */ break; case ARG_WEIGHTB: encoder->weightb = g_value_get_boolean (value); g_string_append_printf (encoder->option_string, ":weightb=%d", encoder->weightb); break; case ARG_SPS_ID: encoder->sps_id = g_value_get_uint (value); g_string_append_printf (encoder->option_string, ":sps-id=%d", encoder->sps_id); break; case ARG_AU_NALU: encoder->au_nalu = g_value_get_boolean (value); g_string_append_printf (encoder->option_string, ":aud=%d", encoder->au_nalu); break; case ARG_TRELLIS: encoder->trellis = g_value_get_boolean (value); g_string_append_printf (encoder->option_string, ":trellis=%d", encoder->trellis); break; case ARG_KEYINT_MAX: encoder->keyint_max = g_value_get_uint (value); g_string_append_printf (encoder->option_string, ":keyint=%d", encoder->keyint_max); break; case ARG_CABAC: encoder->cabac = g_value_get_boolean (value); g_string_append_printf (encoder->option_string, ":cabac=%d", encoder->cabac); break; case ARG_QP_MIN: encoder->qp_min = g_value_get_uint (value); g_string_append_printf (encoder->option_string, ":qpmin=%d", encoder->qp_min); break; case ARG_QP_MAX: encoder->qp_max = g_value_get_uint (value); g_string_append_printf (encoder->option_string, ":qpmax=%d", encoder->qp_max); break; case ARG_QP_STEP: encoder->qp_step = g_value_get_uint (value); g_string_append_printf (encoder->option_string, ":qpstep=%d", encoder->qp_step); break; case ARG_IP_FACTOR: encoder->ip_factor = g_value_get_float (value); g_string_append_printf (encoder->option_string, ":ip-factor=%f", encoder->ip_factor); break; case ARG_PB_FACTOR: encoder->pb_factor = g_value_get_float (value); g_string_append_printf (encoder->option_string, ":pb-factor=%f", encoder->pb_factor); break; case ARG_RC_MB_TREE: encoder->mb_tree = g_value_get_boolean (value); g_string_append_printf (encoder->option_string, ":mbtree=%d", encoder->mb_tree); break; case ARG_RC_LOOKAHEAD: encoder->rc_lookahead = g_value_get_int (value); g_string_append_printf (encoder->option_string, ":rc-lookahead=%d", encoder->rc_lookahead); break; case ARG_NR: encoder->noise_reduction = g_value_get_uint (value); g_string_append_printf (encoder->option_string, ":nr=%d", encoder->noise_reduction); break; case ARG_INTERLACED: encoder->interlaced = g_value_get_boolean (value); g_string_append_printf (encoder->option_string, ":interlaced=%d", encoder->interlaced); break; default: G_OBJECT_WARN_INVALID_PROPERTY_ID (object, prop_id, pspec); break; } GST_OBJECT_UNLOCK (encoder); return; /* ERROR */ wrong_state: { GST_WARNING_OBJECT (encoder, "setting property in wrong state"); GST_OBJECT_UNLOCK (encoder); } } static void gst_x264_enc_get_property (GObject * object, guint prop_id, GValue * value, GParamSpec * pspec) { GstX264Enc *encoder; encoder = GST_X264_ENC (object); GST_OBJECT_LOCK (encoder); switch (prop_id) { case ARG_THREADS: g_value_set_uint (value, encoder->threads); break; case ARG_SLICED_THREADS: g_value_set_boolean (value, encoder->sliced_threads); break; case ARG_SYNC_LOOKAHEAD: g_value_set_int (value, encoder->sync_lookahead); break; case ARG_PASS: g_value_set_enum (value, encoder->pass); break; case ARG_QUANTIZER: g_value_set_uint (value, encoder->quantizer); break; case ARG_STATS_FILE: case ARG_MULTIPASS_CACHE_FILE: g_value_set_string (value, encoder->mp_cache_file); break; case ARG_BYTE_STREAM: g_value_set_boolean (value, encoder->byte_stream); break; case ARG_BITRATE: g_value_set_uint (value, encoder->bitrate); break; case ARG_INTRA_REFRESH: g_value_set_boolean (value, encoder->intra_refresh); break; case ARG_VBV_BUF_CAPACITY: g_value_set_uint (value, encoder->vbv_buf_capacity); break; case ARG_ME: g_value_set_enum (value, encoder->me); break; case ARG_SUBME: g_value_set_uint (value, encoder->subme); break; case ARG_ANALYSE: g_value_set_flags (value, encoder->analyse); break; case ARG_DCT8x8: g_value_set_boolean (value, encoder->dct8x8); break; case ARG_REF: g_value_set_uint (value, encoder->ref); break; case ARG_BFRAMES: g_value_set_uint (value, encoder->bframes); break; case ARG_B_ADAPT: g_value_set_boolean (value, encoder->b_adapt); break; case ARG_B_PYRAMID: g_value_set_boolean (value, encoder->b_pyramid); break; case ARG_WEIGHTB: g_value_set_boolean (value, encoder->weightb); break; case ARG_SPS_ID: g_value_set_uint (value, encoder->sps_id); break; case ARG_AU_NALU: g_value_set_boolean (value, encoder->au_nalu); break; case ARG_TRELLIS: g_value_set_boolean (value, encoder->trellis); break; case ARG_KEYINT_MAX: g_value_set_uint (value, encoder->keyint_max); break; case ARG_QP_MIN: g_value_set_uint (value, encoder->qp_min); break; case ARG_QP_MAX: g_value_set_uint (value, encoder->qp_max); break; case ARG_QP_STEP: g_value_set_uint (value, encoder->qp_step); break; case ARG_CABAC: g_value_set_boolean (value, encoder->cabac); break; case ARG_IP_FACTOR: g_value_set_float (value, encoder->ip_factor); break; case ARG_PB_FACTOR: g_value_set_float (value, encoder->pb_factor); break; case ARG_RC_MB_TREE: g_value_set_boolean (value, encoder->mb_tree); break; case ARG_RC_LOOKAHEAD: g_value_set_int (value, encoder->rc_lookahead); break; case ARG_NR: g_value_set_uint (value, encoder->noise_reduction); break; case ARG_INTERLACED: g_value_set_boolean (value, encoder->interlaced); break; case ARG_SPEED_PRESET: g_value_set_enum (value, encoder->speed_preset); break; case ARG_PSY_TUNE: g_value_set_enum (value, encoder->psy_tune); break; case ARG_TUNE: g_value_set_flags (value, encoder->tune); break; case ARG_PROFILE: g_value_set_enum (value, encoder->profile); break; case ARG_OPTION_STRING: g_value_set_string (value, encoder->option_string_prop->str); break; default: G_OBJECT_WARN_INVALID_PROPERTY_ID (object, prop_id, pspec); break; } GST_OBJECT_UNLOCK (encoder); } static gboolean plugin_init (GstPlugin * plugin) { GST_DEBUG_CATEGORY_INIT (x264_enc_debug, "x264enc", 0, "h264 encoding element"); return gst_element_register (plugin, "x264enc", GST_RANK_PRIMARY, GST_TYPE_X264_ENC); } GST_PLUGIN_DEFINE (GST_VERSION_MAJOR, GST_VERSION_MINOR, "x264", "libx264-based H264 plugins", plugin_init, VERSION, "GPL", GST_PACKAGE_NAME, GST_PACKAGE_ORIGIN)