/* * This copyright notice applies to this header file only: * * Copyright (c) 2010-2021 NVIDIA Corporation * * Permission is hereby granted, free of charge, to any person * obtaining a copy of this software and associated documentation * files (the "Software"), to deal in the Software without * restriction, including without limitation the rights to use, * copy, modify, merge, publish, distribute, sublicense, and/or sell * copies of the software, and to permit persons to whom the * software is furnished to do so, subject to the following * conditions: * * The above copyright notice and this permission notice shall be * included in all copies or substantial portions of the Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR * OTHER DEALINGS IN THE SOFTWARE. */ /*****************************************************************************************************/ //! \file cuviddec.h //! NVDECODE API provides video decoding interface to NVIDIA GPU devices. //! This file contains constants, structure definitions and function prototypes used for decoding. /*****************************************************************************************************/ #if !defined(__CUDA_VIDEO_H__) #define __CUDA_VIDEO_H__ #ifndef __cuda_cuda_h__ #include #endif // __cuda_cuda_h__ #if defined(_WIN64) || defined(__LP64__) || defined(__x86_64) || defined(AMD64) || defined(_M_AMD64) #if (CUDA_VERSION >= 3020) && (!defined(CUDA_FORCE_API_VERSION) || (CUDA_FORCE_API_VERSION >= 3020)) #define __CUVID_DEVPTR64 #endif #endif #if defined(__cplusplus) extern "C" { #endif /* __cplusplus */ typedef void *CUvideodecoder; typedef struct _CUcontextlock_st *CUvideoctxlock; /*********************************************************************************/ //! \enum cudaVideoCodec //! Video codec enums //! These enums are used in CUVIDDECODECREATEINFO and CUVIDDECODECAPS structures /*********************************************************************************/ typedef enum cudaVideoCodec_enum { cudaVideoCodec_MPEG1=0, /**< MPEG1 */ cudaVideoCodec_MPEG2, /**< MPEG2 */ cudaVideoCodec_MPEG4, /**< MPEG4 */ cudaVideoCodec_VC1, /**< VC1 */ cudaVideoCodec_H264, /**< H264 */ cudaVideoCodec_JPEG, /**< JPEG */ cudaVideoCodec_H264_SVC, /**< H264-SVC */ cudaVideoCodec_H264_MVC, /**< H264-MVC */ cudaVideoCodec_HEVC, /**< HEVC */ cudaVideoCodec_VP8, /**< VP8 */ cudaVideoCodec_VP9, /**< VP9 */ cudaVideoCodec_AV1, /**< AV1 */ cudaVideoCodec_NumCodecs, /**< Max codecs */ // Uncompressed YUV cudaVideoCodec_YUV420 = (('I'<<24)|('Y'<<16)|('U'<<8)|('V')), /**< Y,U,V (4:2:0) */ cudaVideoCodec_YV12 = (('Y'<<24)|('V'<<16)|('1'<<8)|('2')), /**< Y,V,U (4:2:0) */ cudaVideoCodec_NV12 = (('N'<<24)|('V'<<16)|('1'<<8)|('2')), /**< Y,UV (4:2:0) */ cudaVideoCodec_YUYV = (('Y'<<24)|('U'<<16)|('Y'<<8)|('V')), /**< YUYV/YUY2 (4:2:2) */ cudaVideoCodec_UYVY = (('U'<<24)|('Y'<<16)|('V'<<8)|('Y')) /**< UYVY (4:2:2) */ } cudaVideoCodec; /*********************************************************************************/ //! \enum cudaVideoSurfaceFormat //! Video surface format enums used for output format of decoded output //! These enums are used in CUVIDDECODECREATEINFO structure /*********************************************************************************/ typedef enum cudaVideoSurfaceFormat_enum { cudaVideoSurfaceFormat_NV12=0, /**< Semi-Planar YUV [Y plane followed by interleaved UV plane] */ cudaVideoSurfaceFormat_P016=1, /**< 16 bit Semi-Planar YUV [Y plane followed by interleaved UV plane]. Can be used for 10 bit(6LSB bits 0), 12 bit (4LSB bits 0) */ cudaVideoSurfaceFormat_YUV444=2, /**< Planar YUV [Y plane followed by U and V planes] */ cudaVideoSurfaceFormat_YUV444_16Bit=3, /**< 16 bit Planar YUV [Y plane followed by U and V planes]. Can be used for 10 bit(6LSB bits 0), 12 bit (4LSB bits 0) */ } cudaVideoSurfaceFormat; /******************************************************************************************************************/ //! \enum cudaVideoDeinterlaceMode //! Deinterlacing mode enums //! These enums are used in CUVIDDECODECREATEINFO structure //! Use cudaVideoDeinterlaceMode_Weave for progressive content and for content that doesn't need deinterlacing //! cudaVideoDeinterlaceMode_Adaptive needs more video memory than other DImodes /******************************************************************************************************************/ typedef enum cudaVideoDeinterlaceMode_enum { cudaVideoDeinterlaceMode_Weave=0, /**< Weave both fields (no deinterlacing) */ cudaVideoDeinterlaceMode_Bob, /**< Drop one field */ cudaVideoDeinterlaceMode_Adaptive /**< Adaptive deinterlacing */ } cudaVideoDeinterlaceMode; /**************************************************************************************************************/ //! \enum cudaVideoChromaFormat //! Chroma format enums //! These enums are used in CUVIDDECODECREATEINFO and CUVIDDECODECAPS structures /**************************************************************************************************************/ typedef enum cudaVideoChromaFormat_enum { cudaVideoChromaFormat_Monochrome=0, /**< MonoChrome */ cudaVideoChromaFormat_420, /**< YUV 4:2:0 */ cudaVideoChromaFormat_422, /**< YUV 4:2:2 */ cudaVideoChromaFormat_444 /**< YUV 4:4:4 */ } cudaVideoChromaFormat; /*************************************************************************************************************/ //! \enum cudaVideoCreateFlags //! Decoder flag enums to select preferred decode path //! cudaVideoCreate_Default and cudaVideoCreate_PreferCUVID are most optimized, use these whenever possible /*************************************************************************************************************/ typedef enum cudaVideoCreateFlags_enum { cudaVideoCreate_Default = 0x00, /**< Default operation mode: use dedicated video engines */ cudaVideoCreate_PreferCUDA = 0x01, /**< Use CUDA-based decoder (requires valid vidLock object for multi-threading) */ cudaVideoCreate_PreferDXVA = 0x02, /**< Go through DXVA internally if possible (requires D3D9 interop) */ cudaVideoCreate_PreferCUVID = 0x04 /**< Use dedicated video engines directly */ } cudaVideoCreateFlags; /*************************************************************************/ //! \enum cuvidDecodeStatus //! Decode status enums //! These enums are used in CUVIDGETDECODESTATUS structure /*************************************************************************/ typedef enum cuvidDecodeStatus_enum { cuvidDecodeStatus_Invalid = 0, // Decode status is not valid cuvidDecodeStatus_InProgress = 1, // Decode is in progress cuvidDecodeStatus_Success = 2, // Decode is completed without any errors // 3 to 7 enums are reserved for future use cuvidDecodeStatus_Error = 8, // Decode is completed with an error (error is not concealed) cuvidDecodeStatus_Error_Concealed = 9, // Decode is completed with an error and error is concealed } cuvidDecodeStatus; /**************************************************************************************************************/ //! \struct CUVIDDECODECAPS; //! This structure is used in cuvidGetDecoderCaps API /**************************************************************************************************************/ typedef struct _CUVIDDECODECAPS { cudaVideoCodec eCodecType; /**< IN: cudaVideoCodec_XXX */ cudaVideoChromaFormat eChromaFormat; /**< IN: cudaVideoChromaFormat_XXX */ unsigned int nBitDepthMinus8; /**< IN: The Value "BitDepth minus 8" */ unsigned int reserved1[3]; /**< Reserved for future use - set to zero */ unsigned char bIsSupported; /**< OUT: 1 if codec supported, 0 if not supported */ unsigned char nNumNVDECs; /**< OUT: Number of NVDECs that can support IN params */ unsigned short nOutputFormatMask; /**< OUT: each bit represents corresponding cudaVideoSurfaceFormat enum */ unsigned int nMaxWidth; /**< OUT: Max supported coded width in pixels */ unsigned int nMaxHeight; /**< OUT: Max supported coded height in pixels */ unsigned int nMaxMBCount; /**< OUT: Max supported macroblock count CodedWidth*CodedHeight/256 must be <= nMaxMBCount */ unsigned short nMinWidth; /**< OUT: Min supported coded width in pixels */ unsigned short nMinHeight; /**< OUT: Min supported coded height in pixels */ unsigned char bIsHistogramSupported; /**< OUT: 1 if Y component histogram output is supported, 0 if not Note: histogram is computed on original picture data before any post-processing like scaling, cropping, etc. is applied */ unsigned char nCounterBitDepth; /**< OUT: histogram counter bit depth */ unsigned short nMaxHistogramBins; /**< OUT: Max number of histogram bins */ unsigned int reserved3[10]; /**< Reserved for future use - set to zero */ } CUVIDDECODECAPS; /**************************************************************************************************************/ //! \struct CUVIDDECODECREATEINFO //! This structure is used in cuvidCreateDecoder API /**************************************************************************************************************/ typedef struct _CUVIDDECODECREATEINFO { unsigned long ulWidth; /**< IN: Coded sequence width in pixels */ unsigned long ulHeight; /**< IN: Coded sequence height in pixels */ unsigned long ulNumDecodeSurfaces; /**< IN: Maximum number of internal decode surfaces */ cudaVideoCodec CodecType; /**< IN: cudaVideoCodec_XXX */ cudaVideoChromaFormat ChromaFormat; /**< IN: cudaVideoChromaFormat_XXX */ unsigned long ulCreationFlags; /**< IN: Decoder creation flags (cudaVideoCreateFlags_XXX) */ unsigned long bitDepthMinus8; /**< IN: The value "BitDepth minus 8" */ unsigned long ulIntraDecodeOnly; /**< IN: Set 1 only if video has all intra frames (default value is 0). This will optimize video memory for Intra frames only decoding. The support is limited to specific codecs - H264, HEVC, VP9, the flag will be ignored for codecs which are not supported. However decoding might fail if the flag is enabled in case of supported codecs for regular bit streams having P and/or B frames. */ unsigned long ulMaxWidth; /**< IN: Coded sequence max width in pixels used with reconfigure Decoder */ unsigned long ulMaxHeight; /**< IN: Coded sequence max height in pixels used with reconfigure Decoder */ unsigned long Reserved1; /**< Reserved for future use - set to zero */ /** * IN: area of the frame that should be displayed */ struct { short left; short top; short right; short bottom; } display_area; cudaVideoSurfaceFormat OutputFormat; /**< IN: cudaVideoSurfaceFormat_XXX */ cudaVideoDeinterlaceMode DeinterlaceMode; /**< IN: cudaVideoDeinterlaceMode_XXX */ unsigned long ulTargetWidth; /**< IN: Post-processed output width (Should be aligned to 2) */ unsigned long ulTargetHeight; /**< IN: Post-processed output height (Should be aligned to 2) */ unsigned long ulNumOutputSurfaces; /**< IN: Maximum number of output surfaces simultaneously mapped */ CUvideoctxlock vidLock; /**< IN: If non-NULL, context lock used for synchronizing ownership of the cuda context. Needed for cudaVideoCreate_PreferCUDA decode */ /** * IN: target rectangle in the output frame (for aspect ratio conversion) * if a null rectangle is specified, {0,0,ulTargetWidth,ulTargetHeight} will be used */ struct { short left; short top; short right; short bottom; } target_rect; unsigned long enableHistogram; /**< IN: enable histogram output, if supported */ unsigned long Reserved2[4]; /**< Reserved for future use - set to zero */ } CUVIDDECODECREATEINFO; /*********************************************************/ //! \struct CUVIDH264DPBENTRY //! H.264 DPB entry //! This structure is used in CUVIDH264PICPARAMS structure /*********************************************************/ typedef struct _CUVIDH264DPBENTRY { int PicIdx; /**< picture index of reference frame */ int FrameIdx; /**< frame_num(short-term) or LongTermFrameIdx(long-term) */ int is_long_term; /**< 0=short term reference, 1=long term reference */ int not_existing; /**< non-existing reference frame (corresponding PicIdx should be set to -1) */ int used_for_reference; /**< 0=unused, 1=top_field, 2=bottom_field, 3=both_fields */ int FieldOrderCnt[2]; /**< field order count of top and bottom fields */ } CUVIDH264DPBENTRY; /************************************************************/ //! \struct CUVIDH264MVCEXT //! H.264 MVC picture parameters ext //! This structure is used in CUVIDH264PICPARAMS structure /************************************************************/ typedef struct _CUVIDH264MVCEXT { int num_views_minus1; /**< Max number of coded views minus 1 in video : Range - 0 to 1023 */ int view_id; /**< view identifier */ unsigned char inter_view_flag; /**< 1 if used for inter-view prediction, 0 if not */ unsigned char num_inter_view_refs_l0; /**< number of inter-view ref pics in RefPicList0 */ unsigned char num_inter_view_refs_l1; /**< number of inter-view ref pics in RefPicList1 */ unsigned char MVCReserved8Bits; /**< Reserved bits */ int InterViewRefsL0[16]; /**< view id of the i-th view component for inter-view prediction in RefPicList0 */ int InterViewRefsL1[16]; /**< view id of the i-th view component for inter-view prediction in RefPicList1 */ } CUVIDH264MVCEXT; /*********************************************************/ //! \struct CUVIDH264SVCEXT //! H.264 SVC picture parameters ext //! This structure is used in CUVIDH264PICPARAMS structure /*********************************************************/ typedef struct _CUVIDH264SVCEXT { unsigned char profile_idc; unsigned char level_idc; unsigned char DQId; unsigned char DQIdMax; unsigned char disable_inter_layer_deblocking_filter_idc; unsigned char ref_layer_chroma_phase_y_plus1; signed char inter_layer_slice_alpha_c0_offset_div2; signed char inter_layer_slice_beta_offset_div2; unsigned short DPBEntryValidFlag; unsigned char inter_layer_deblocking_filter_control_present_flag; unsigned char extended_spatial_scalability_idc; unsigned char adaptive_tcoeff_level_prediction_flag; unsigned char slice_header_restriction_flag; unsigned char chroma_phase_x_plus1_flag; unsigned char chroma_phase_y_plus1; unsigned char tcoeff_level_prediction_flag; unsigned char constrained_intra_resampling_flag; unsigned char ref_layer_chroma_phase_x_plus1_flag; unsigned char store_ref_base_pic_flag; unsigned char Reserved8BitsA; unsigned char Reserved8BitsB; short scaled_ref_layer_left_offset; short scaled_ref_layer_top_offset; short scaled_ref_layer_right_offset; short scaled_ref_layer_bottom_offset; unsigned short Reserved16Bits; struct _CUVIDPICPARAMS *pNextLayer; /**< Points to the picparams for the next layer to be decoded. Linked list ends at the target layer. */ int bRefBaseLayer; /**< whether to store ref base pic */ } CUVIDH264SVCEXT; /******************************************************/ //! \struct CUVIDH264PICPARAMS //! H.264 picture parameters //! This structure is used in CUVIDPICPARAMS structure /******************************************************/ typedef struct _CUVIDH264PICPARAMS { // SPS int log2_max_frame_num_minus4; int pic_order_cnt_type; int log2_max_pic_order_cnt_lsb_minus4; int delta_pic_order_always_zero_flag; int frame_mbs_only_flag; int direct_8x8_inference_flag; int num_ref_frames; // NOTE: shall meet level 4.1 restrictions unsigned char residual_colour_transform_flag; unsigned char bit_depth_luma_minus8; // Must be 0 (only 8-bit supported) unsigned char bit_depth_chroma_minus8; // Must be 0 (only 8-bit supported) unsigned char qpprime_y_zero_transform_bypass_flag; // PPS int entropy_coding_mode_flag; int pic_order_present_flag; int num_ref_idx_l0_active_minus1; int num_ref_idx_l1_active_minus1; int weighted_pred_flag; int weighted_bipred_idc; int pic_init_qp_minus26; int deblocking_filter_control_present_flag; int redundant_pic_cnt_present_flag; int transform_8x8_mode_flag; int MbaffFrameFlag; int constrained_intra_pred_flag; int chroma_qp_index_offset; int second_chroma_qp_index_offset; int ref_pic_flag; int frame_num; int CurrFieldOrderCnt[2]; // DPB CUVIDH264DPBENTRY dpb[16]; // List of reference frames within the DPB // Quantization Matrices (raster-order) unsigned char WeightScale4x4[6][16]; unsigned char WeightScale8x8[2][64]; // FMO/ASO unsigned char fmo_aso_enable; unsigned char num_slice_groups_minus1; unsigned char slice_group_map_type; signed char pic_init_qs_minus26; unsigned int slice_group_change_rate_minus1; union { unsigned long long slice_group_map_addr; const unsigned char *pMb2SliceGroupMap; } fmo; unsigned int Reserved[12]; // SVC/MVC union { CUVIDH264MVCEXT mvcext; CUVIDH264SVCEXT svcext; }; } CUVIDH264PICPARAMS; /********************************************************/ //! \struct CUVIDMPEG2PICPARAMS //! MPEG-2 picture parameters //! This structure is used in CUVIDPICPARAMS structure /********************************************************/ typedef struct _CUVIDMPEG2PICPARAMS { int ForwardRefIdx; // Picture index of forward reference (P/B-frames) int BackwardRefIdx; // Picture index of backward reference (B-frames) int picture_coding_type; int full_pel_forward_vector; int full_pel_backward_vector; int f_code[2][2]; int intra_dc_precision; int frame_pred_frame_dct; int concealment_motion_vectors; int q_scale_type; int intra_vlc_format; int alternate_scan; int top_field_first; // Quantization matrices (raster order) unsigned char QuantMatrixIntra[64]; unsigned char QuantMatrixInter[64]; } CUVIDMPEG2PICPARAMS; // MPEG-4 has VOP types instead of Picture types #define I_VOP 0 #define P_VOP 1 #define B_VOP 2 #define S_VOP 3 /*******************************************************/ //! \struct CUVIDMPEG4PICPARAMS //! MPEG-4 picture parameters //! This structure is used in CUVIDPICPARAMS structure /*******************************************************/ typedef struct _CUVIDMPEG4PICPARAMS { int ForwardRefIdx; // Picture index of forward reference (P/B-frames) int BackwardRefIdx; // Picture index of backward reference (B-frames) // VOL int video_object_layer_width; int video_object_layer_height; int vop_time_increment_bitcount; int top_field_first; int resync_marker_disable; int quant_type; int quarter_sample; int short_video_header; int divx_flags; // VOP int vop_coding_type; int vop_coded; int vop_rounding_type; int alternate_vertical_scan_flag; int interlaced; int vop_fcode_forward; int vop_fcode_backward; int trd[2]; int trb[2]; // Quantization matrices (raster order) unsigned char QuantMatrixIntra[64]; unsigned char QuantMatrixInter[64]; int gmc_enabled; } CUVIDMPEG4PICPARAMS; /********************************************************/ //! \struct CUVIDVC1PICPARAMS //! VC1 picture parameters //! This structure is used in CUVIDPICPARAMS structure /********************************************************/ typedef struct _CUVIDVC1PICPARAMS { int ForwardRefIdx; /**< Picture index of forward reference (P/B-frames) */ int BackwardRefIdx; /**< Picture index of backward reference (B-frames) */ int FrameWidth; /**< Actual frame width */ int FrameHeight; /**< Actual frame height */ // PICTURE int intra_pic_flag; /**< Set to 1 for I,BI frames */ int ref_pic_flag; /**< Set to 1 for I,P frames */ int progressive_fcm; /**< Progressive frame */ // SEQUENCE int profile; int postprocflag; int pulldown; int interlace; int tfcntrflag; int finterpflag; int psf; int multires; int syncmarker; int rangered; int maxbframes; // ENTRYPOINT int panscan_flag; int refdist_flag; int extended_mv; int dquant; int vstransform; int loopfilter; int fastuvmc; int overlap; int quantizer; int extended_dmv; int range_mapy_flag; int range_mapy; int range_mapuv_flag; int range_mapuv; int rangeredfrm; // range reduction state } CUVIDVC1PICPARAMS; /***********************************************************/ //! \struct CUVIDJPEGPICPARAMS //! JPEG picture parameters //! This structure is used in CUVIDPICPARAMS structure /***********************************************************/ typedef struct _CUVIDJPEGPICPARAMS { int Reserved; } CUVIDJPEGPICPARAMS; /*******************************************************/ //! \struct CUVIDHEVCPICPARAMS //! HEVC picture parameters //! This structure is used in CUVIDPICPARAMS structure /*******************************************************/ typedef struct _CUVIDHEVCPICPARAMS { // sps int pic_width_in_luma_samples; int pic_height_in_luma_samples; unsigned char log2_min_luma_coding_block_size_minus3; unsigned char log2_diff_max_min_luma_coding_block_size; unsigned char log2_min_transform_block_size_minus2; unsigned char log2_diff_max_min_transform_block_size; unsigned char pcm_enabled_flag; unsigned char log2_min_pcm_luma_coding_block_size_minus3; unsigned char log2_diff_max_min_pcm_luma_coding_block_size; unsigned char pcm_sample_bit_depth_luma_minus1; unsigned char pcm_sample_bit_depth_chroma_minus1; unsigned char pcm_loop_filter_disabled_flag; unsigned char strong_intra_smoothing_enabled_flag; unsigned char max_transform_hierarchy_depth_intra; unsigned char max_transform_hierarchy_depth_inter; unsigned char amp_enabled_flag; unsigned char separate_colour_plane_flag; unsigned char log2_max_pic_order_cnt_lsb_minus4; unsigned char num_short_term_ref_pic_sets; unsigned char long_term_ref_pics_present_flag; unsigned char num_long_term_ref_pics_sps; unsigned char sps_temporal_mvp_enabled_flag; unsigned char sample_adaptive_offset_enabled_flag; unsigned char scaling_list_enable_flag; unsigned char IrapPicFlag; unsigned char IdrPicFlag; unsigned char bit_depth_luma_minus8; unsigned char bit_depth_chroma_minus8; //sps/pps extension fields unsigned char log2_max_transform_skip_block_size_minus2; unsigned char log2_sao_offset_scale_luma; unsigned char log2_sao_offset_scale_chroma; unsigned char high_precision_offsets_enabled_flag; unsigned char reserved1[10]; // pps unsigned char dependent_slice_segments_enabled_flag; unsigned char slice_segment_header_extension_present_flag; unsigned char sign_data_hiding_enabled_flag; unsigned char cu_qp_delta_enabled_flag; unsigned char diff_cu_qp_delta_depth; signed char init_qp_minus26; signed char pps_cb_qp_offset; signed char pps_cr_qp_offset; unsigned char constrained_intra_pred_flag; unsigned char weighted_pred_flag; unsigned char weighted_bipred_flag; unsigned char transform_skip_enabled_flag; unsigned char transquant_bypass_enabled_flag; unsigned char entropy_coding_sync_enabled_flag; unsigned char log2_parallel_merge_level_minus2; unsigned char num_extra_slice_header_bits; unsigned char loop_filter_across_tiles_enabled_flag; unsigned char loop_filter_across_slices_enabled_flag; unsigned char output_flag_present_flag; unsigned char num_ref_idx_l0_default_active_minus1; unsigned char num_ref_idx_l1_default_active_minus1; unsigned char lists_modification_present_flag; unsigned char cabac_init_present_flag; unsigned char pps_slice_chroma_qp_offsets_present_flag; unsigned char deblocking_filter_override_enabled_flag; unsigned char pps_deblocking_filter_disabled_flag; signed char pps_beta_offset_div2; signed char pps_tc_offset_div2; unsigned char tiles_enabled_flag; unsigned char uniform_spacing_flag; unsigned char num_tile_columns_minus1; unsigned char num_tile_rows_minus1; unsigned short column_width_minus1[21]; unsigned short row_height_minus1[21]; // sps and pps extension HEVC-main 444 unsigned char sps_range_extension_flag; unsigned char transform_skip_rotation_enabled_flag; unsigned char transform_skip_context_enabled_flag; unsigned char implicit_rdpcm_enabled_flag; unsigned char explicit_rdpcm_enabled_flag; unsigned char extended_precision_processing_flag; unsigned char intra_smoothing_disabled_flag; unsigned char persistent_rice_adaptation_enabled_flag; unsigned char cabac_bypass_alignment_enabled_flag; unsigned char pps_range_extension_flag; unsigned char cross_component_prediction_enabled_flag; unsigned char chroma_qp_offset_list_enabled_flag; unsigned char diff_cu_chroma_qp_offset_depth; unsigned char chroma_qp_offset_list_len_minus1; signed char cb_qp_offset_list[6]; signed char cr_qp_offset_list[6]; unsigned char reserved2[2]; unsigned int reserved3[8]; // RefPicSets int NumBitsForShortTermRPSInSlice; int NumDeltaPocsOfRefRpsIdx; int NumPocTotalCurr; int NumPocStCurrBefore; int NumPocStCurrAfter; int NumPocLtCurr; int CurrPicOrderCntVal; int RefPicIdx[16]; // [refpic] Indices of valid reference pictures (-1 if unused for reference) int PicOrderCntVal[16]; // [refpic] unsigned char IsLongTerm[16]; // [refpic] 0=not a long-term reference, 1=long-term reference unsigned char RefPicSetStCurrBefore[8]; // [0..NumPocStCurrBefore-1] -> refpic (0..15) unsigned char RefPicSetStCurrAfter[8]; // [0..NumPocStCurrAfter-1] -> refpic (0..15) unsigned char RefPicSetLtCurr[8]; // [0..NumPocLtCurr-1] -> refpic (0..15) unsigned char RefPicSetInterLayer0[8]; unsigned char RefPicSetInterLayer1[8]; unsigned int reserved4[12]; // scaling lists (diag order) unsigned char ScalingList4x4[6][16]; // [matrixId][i] unsigned char ScalingList8x8[6][64]; // [matrixId][i] unsigned char ScalingList16x16[6][64]; // [matrixId][i] unsigned char ScalingList32x32[2][64]; // [matrixId][i] unsigned char ScalingListDCCoeff16x16[6]; // [matrixId] unsigned char ScalingListDCCoeff32x32[2]; // [matrixId] } CUVIDHEVCPICPARAMS; /***********************************************************/ //! \struct CUVIDVP8PICPARAMS //! VP8 picture parameters //! This structure is used in CUVIDPICPARAMS structure /***********************************************************/ typedef struct _CUVIDVP8PICPARAMS { int width; int height; unsigned int first_partition_size; //Frame Indexes unsigned char LastRefIdx; unsigned char GoldenRefIdx; unsigned char AltRefIdx; union { struct { unsigned char frame_type : 1; /**< 0 = KEYFRAME, 1 = INTERFRAME */ unsigned char version : 3; unsigned char show_frame : 1; unsigned char update_mb_segmentation_data : 1; /**< Must be 0 if segmentation is not enabled */ unsigned char Reserved2Bits : 2; }vp8_frame_tag; unsigned char wFrameTagFlags; }; unsigned char Reserved1[4]; unsigned int Reserved2[3]; } CUVIDVP8PICPARAMS; /***********************************************************/ //! \struct CUVIDVP9PICPARAMS //! VP9 picture parameters //! This structure is used in CUVIDPICPARAMS structure /***********************************************************/ typedef struct _CUVIDVP9PICPARAMS { unsigned int width; unsigned int height; //Frame Indices unsigned char LastRefIdx; unsigned char GoldenRefIdx; unsigned char AltRefIdx; unsigned char colorSpace; unsigned short profile : 3; unsigned short frameContextIdx : 2; unsigned short frameType : 1; unsigned short showFrame : 1; unsigned short errorResilient : 1; unsigned short frameParallelDecoding : 1; unsigned short subSamplingX : 1; unsigned short subSamplingY : 1; unsigned short intraOnly : 1; unsigned short allow_high_precision_mv : 1; unsigned short refreshEntropyProbs : 1; unsigned short reserved2Bits : 2; unsigned short reserved16Bits; unsigned char refFrameSignBias[4]; unsigned char bitDepthMinus8Luma; unsigned char bitDepthMinus8Chroma; unsigned char loopFilterLevel; unsigned char loopFilterSharpness; unsigned char modeRefLfEnabled; unsigned char log2_tile_columns; unsigned char log2_tile_rows; unsigned char segmentEnabled : 1; unsigned char segmentMapUpdate : 1; unsigned char segmentMapTemporalUpdate : 1; unsigned char segmentFeatureMode : 1; unsigned char reserved4Bits : 4; unsigned char segmentFeatureEnable[8][4]; short segmentFeatureData[8][4]; unsigned char mb_segment_tree_probs[7]; unsigned char segment_pred_probs[3]; unsigned char reservedSegment16Bits[2]; int qpYAc; int qpYDc; int qpChDc; int qpChAc; unsigned int activeRefIdx[3]; unsigned int resetFrameContext; unsigned int mcomp_filter_type; unsigned int mbRefLfDelta[4]; unsigned int mbModeLfDelta[2]; unsigned int frameTagSize; unsigned int offsetToDctParts; unsigned int reserved128Bits[4]; } CUVIDVP9PICPARAMS; /***********************************************************/ //! \struct CUVIDAV1PICPARAMS //! AV1 picture parameters //! This structure is used in CUVIDPICPARAMS structure /***********************************************************/ typedef struct _CUVIDAV1PICPARAMS { unsigned int width; // coded width, if superres enabled then it is upscaled width unsigned int height; // coded height unsigned int frame_offset; // defined as order_hint in AV1 specification int decodePicIdx; // decoded output pic index, if film grain enabled, it will keep decoded (without film grain) output // It can be used as reference frame for future frames // sequence header unsigned int profile : 3; // 0 = profile0, 1 = profile1, 2 = profile2 unsigned int use_128x128_superblock : 1; // superblock size 0:64x64, 1: 128x128 unsigned int subsampling_x : 1; // (subsampling_x, _y) 1,1 = 420, 1,0 = 422, 0,0 = 444 unsigned int subsampling_y : 1; unsigned int mono_chrome : 1; // for monochrome content, mono_chrome = 1 and (subsampling_x, _y) should be 1,1 unsigned int bit_depth_minus8 : 4; // bit depth minus 8 unsigned int enable_filter_intra : 1; // tool enable in seq level, 0 : disable 1: frame header control unsigned int enable_intra_edge_filter : 1; // intra edge filtering process, 0 : disable 1: enabled unsigned int enable_interintra_compound : 1; // interintra, 0 : not present 1: present unsigned int enable_masked_compound : 1; // 1: mode info for inter blocks may contain the syntax element compound_type. // 0: syntax element compound_type will not be present unsigned int enable_dual_filter : 1; // vertical and horiz filter selection, 1: enable and 0: disable unsigned int enable_order_hint : 1; // order hint, and related tools, 1: enable and 0: disable unsigned int order_hint_bits_minus1 : 3; // is used to compute OrderHintBits unsigned int enable_jnt_comp : 1; // joint compound modes, 1: enable and 0: disable unsigned int enable_superres : 1; // superres in seq level, 0 : disable 1: frame level control unsigned int enable_cdef : 1; // cdef filtering in seq level, 0 : disable 1: frame level control unsigned int enable_restoration : 1; // loop restoration filtering in seq level, 0 : disable 1: frame level control unsigned int enable_fgs : 1; // defined as film_grain_params_present in AV1 specification unsigned int reserved0_7bits : 7; // reserved bits; must be set to 0 // frame header unsigned int frame_type : 2 ; // 0:Key frame, 1:Inter frame, 2:intra only, 3:s-frame unsigned int show_frame : 1 ; // show_frame = 1 implies that frame should be immediately output once decoded unsigned int disable_cdf_update : 1; // CDF update during symbol decoding, 1: disabled, 0: enabled unsigned int allow_screen_content_tools : 1; // 1: intra blocks may use palette encoding, 0: palette encoding is never used unsigned int force_integer_mv : 1; // 1: motion vectors will always be integers, 0: can contain fractional bits unsigned int coded_denom : 3; // coded_denom of the superres scale as specified in AV1 specification unsigned int allow_intrabc : 1; // 1: intra block copy may be used, 0: intra block copy is not allowed unsigned int allow_high_precision_mv : 1; // 1/8 precision mv enable unsigned int interp_filter : 3; // interpolation filter. Refer to section 6.8.9 of the AV1 specification Version 1.0.0 with Errata 1 unsigned int switchable_motion_mode : 1; // defined as is_motion_mode_switchable in AV1 specification unsigned int use_ref_frame_mvs : 1; // 1: current frame can use the previous frame mv information, 0: will not use. unsigned int disable_frame_end_update_cdf : 1; // 1: indicates that the end of frame CDF update is disabled unsigned int delta_q_present : 1; // quantizer index delta values are present in the block level unsigned int delta_q_res : 2; // left shift which should be applied to decoded quantizer index delta values unsigned int using_qmatrix : 1; // 1: quantizer matrix will be used to compute quantizers unsigned int coded_lossless : 1; // 1: all segments use lossless coding unsigned int use_superres : 1; // 1: superres enabled for frame unsigned int tx_mode : 2; // 0: ONLY4x4,1:LARGEST,2:SELECT unsigned int reference_mode : 1; // 0: SINGLE, 1: SELECT unsigned int allow_warped_motion : 1; // 1: allow_warped_motion may be present, 0: allow_warped_motion will not be present unsigned int reduced_tx_set : 1; // 1: frame is restricted to subset of the full set of transform types, 0: no such restriction unsigned int skip_mode : 1; // 1: most of the mode info is skipped, 0: mode info is not skipped unsigned int reserved1_3bits : 3; // reserved bits; must be set to 0 // tiling info unsigned int num_tile_cols : 8; // number of tiles across the frame., max is 64 unsigned int num_tile_rows : 8; // number of tiles down the frame., max is 64 unsigned int context_update_tile_id : 16; // specifies which tile to use for the CDF update unsigned short tile_widths[64]; // Width of each column in superblocks unsigned short tile_heights[64]; // height of each row in superblocks // CDEF - refer to section 6.10.14 of the AV1 specification Version 1.0.0 with Errata 1 unsigned char cdef_damping_minus_3 : 2; // controls the amount of damping in the deringing filter unsigned char cdef_bits : 2; // the number of bits needed to specify which CDEF filter to apply unsigned char reserved2_4bits : 4; // reserved bits; must be set to 0 unsigned char cdef_y_strength[8]; // 0-3 bits: y_pri_strength, 4-7 bits y_sec_strength unsigned char cdef_uv_strength[8]; // 0-3 bits: uv_pri_strength, 4-7 bits uv_sec_strength // SkipModeFrames unsigned char SkipModeFrame0 : 4; // specifies the frames to use for compound prediction when skip_mode is equal to 1. unsigned char SkipModeFrame1 : 4; // qp information - refer to section 6.8.11 of the AV1 specification Version 1.0.0 with Errata 1 unsigned char base_qindex; // indicates the base frame qindex. Defined as base_q_idx in AV1 specification char qp_y_dc_delta_q; // indicates the Y DC quantizer relative to base_q_idx. Defined as DeltaQYDc in AV1 specification char qp_u_dc_delta_q; // indicates the U DC quantizer relative to base_q_idx. Defined as DeltaQUDc in AV1 specification char qp_v_dc_delta_q; // indicates the V DC quantizer relative to base_q_idx. Defined as DeltaQVDc in AV1 specification char qp_u_ac_delta_q; // indicates the U AC quantizer relative to base_q_idx. Defined as DeltaQUAc in AV1 specification char qp_v_ac_delta_q; // indicates the V AC quantizer relative to base_q_idx. Defined as DeltaQVAc in AV1 specification unsigned char qm_y; // specifies the level in the quantizer matrix that should be used for luma plane decoding unsigned char qm_u; // specifies the level in the quantizer matrix that should be used for chroma U plane decoding unsigned char qm_v; // specifies the level in the quantizer matrix that should be used for chroma V plane decoding // segmentation - refer to section 6.8.13 of the AV1 specification Version 1.0.0 with Errata 1 unsigned char segmentation_enabled : 1; // 1 indicates that this frame makes use of the segmentation tool unsigned char segmentation_update_map : 1; // 1 indicates that the segmentation map are updated during the decoding of this frame unsigned char segmentation_update_data : 1; // 1 indicates that new parameters are about to be specified for each segment unsigned char segmentation_temporal_update : 1; // 1 indicates that the updates to the segmentation map are coded relative to the existing segmentation map unsigned char reserved3_4bits : 4; // reserved bits; must be set to 0 short segmentation_feature_data[8][8]; // specifies the feature data for a segment feature unsigned char segmentation_feature_mask[8]; // indicates that the corresponding feature is unused or feature value is coded // loopfilter - refer to section 6.8.10 of the AV1 specification Version 1.0.0 with Errata 1 unsigned char loop_filter_level[2]; // contains loop filter strength values unsigned char loop_filter_level_u; // loop filter strength value of U plane unsigned char loop_filter_level_v; // loop filter strength value of V plane unsigned char loop_filter_sharpness; // indicates the sharpness level char loop_filter_ref_deltas[8]; // contains the adjustment needed for the filter level based on the chosen reference frame char loop_filter_mode_deltas[2]; // contains the adjustment needed for the filter level based on the chosen mode unsigned char loop_filter_delta_enabled : 1; // indicates that the filter level depends on the mode and reference frame used to predict a block unsigned char loop_filter_delta_update : 1; // indicates that additional syntax elements are present that specify which mode and // reference frame deltas are to be updated unsigned char delta_lf_present : 1; // specifies whether loop filter delta values are present in the block level unsigned char delta_lf_res : 2; // specifies the left shift to apply to the decoded loop filter values unsigned char delta_lf_multi : 1; // separate loop filter deltas for Hy,Vy,U,V edges unsigned char reserved4_2bits : 2; // reserved bits; must be set to 0 // restoration - refer to section 6.10.15 of the AV1 specification Version 1.0.0 with Errata 1 unsigned char lr_unit_size[3]; // specifies the size of loop restoration units: 0: 32, 1: 64, 2: 128, 3: 256 unsigned char lr_type[3] ; // used to compute FrameRestorationType // reference frames unsigned char primary_ref_frame; // specifies which reference frame contains the CDF values and other state that should be // loaded at the start of the frame unsigned char ref_frame_map[8]; // frames in dpb that can be used as reference for current or future frames unsigned char temporal_layer_id : 4; // temporal layer id unsigned char spatial_layer_id : 4; // spatial layer id unsigned char reserved5_32bits[4]; // reserved bits; must be set to 0 // ref frame list struct { unsigned int width; unsigned int height; unsigned char index; unsigned char reserved24Bits[3]; // reserved bits; must be set to 0 } ref_frame[7]; // frames used as reference frame for current frame. // global motion struct { unsigned char invalid : 1; unsigned char wmtype : 2; // defined as GmType in AV1 specification unsigned char reserved5Bits : 5; // reserved bits; must be set to 0 char reserved24Bits[3]; // reserved bits; must be set to 0 int wmmat[6]; // defined as gm_params[] in AV1 specification } global_motion[7]; // global motion params for reference frames // film grain params - refer to section 6.8.20 of the AV1 specification Version 1.0.0 with Errata 1 unsigned short apply_grain : 1; unsigned short overlap_flag : 1; unsigned short scaling_shift_minus8 : 2; unsigned short chroma_scaling_from_luma : 1; unsigned short ar_coeff_lag : 2; unsigned short ar_coeff_shift_minus6 : 2; unsigned short grain_scale_shift : 2; unsigned short clip_to_restricted_range : 1; unsigned short reserved6_4bits : 4; // reserved bits; must be set to 0 unsigned char num_y_points; unsigned char scaling_points_y[14][2]; unsigned char num_cb_points; unsigned char scaling_points_cb[10][2]; unsigned char num_cr_points; unsigned char scaling_points_cr[10][2]; unsigned char reserved7_8bits; // reserved bits; must be set to 0 unsigned short random_seed; short ar_coeffs_y[24]; short ar_coeffs_cb[25]; short ar_coeffs_cr[25]; unsigned char cb_mult; unsigned char cb_luma_mult; short cb_offset; unsigned char cr_mult; unsigned char cr_luma_mult; short cr_offset; int reserved[7]; // reserved bits; must be set to 0 } CUVIDAV1PICPARAMS; /******************************************************************************************/ //! \struct CUVIDPICPARAMS //! Picture parameters for decoding //! This structure is used in cuvidDecodePicture API //! IN for cuvidDecodePicture /******************************************************************************************/ typedef struct _CUVIDPICPARAMS { int PicWidthInMbs; /**< IN: Coded frame size in macroblocks */ int FrameHeightInMbs; /**< IN: Coded frame height in macroblocks */ int CurrPicIdx; /**< IN: Output index of the current picture */ int field_pic_flag; /**< IN: 0=frame picture, 1=field picture */ int bottom_field_flag; /**< IN: 0=top field, 1=bottom field (ignored if field_pic_flag=0) */ int second_field; /**< IN: Second field of a complementary field pair */ // Bitstream data unsigned int nBitstreamDataLen; /**< IN: Number of bytes in bitstream data buffer */ const unsigned char *pBitstreamData; /**< IN: Ptr to bitstream data for this picture (slice-layer) */ unsigned int nNumSlices; /**< IN: Number of slices in this picture */ const unsigned int *pSliceDataOffsets; /**< IN: nNumSlices entries, contains offset of each slice within the bitstream data buffer */ int ref_pic_flag; /**< IN: This picture is a reference picture */ int intra_pic_flag; /**< IN: This picture is entirely intra coded */ unsigned int Reserved[30]; /**< Reserved for future use */ // IN: Codec-specific data union { CUVIDMPEG2PICPARAMS mpeg2; /**< Also used for MPEG-1 */ CUVIDH264PICPARAMS h264; CUVIDVC1PICPARAMS vc1; CUVIDMPEG4PICPARAMS mpeg4; CUVIDJPEGPICPARAMS jpeg; CUVIDHEVCPICPARAMS hevc; CUVIDVP8PICPARAMS vp8; CUVIDVP9PICPARAMS vp9; CUVIDAV1PICPARAMS av1; unsigned int CodecReserved[1024]; } CodecSpecific; } CUVIDPICPARAMS; /******************************************************/ //! \struct CUVIDPROCPARAMS //! Picture parameters for postprocessing //! This structure is used in cuvidMapVideoFrame API /******************************************************/ typedef struct _CUVIDPROCPARAMS { int progressive_frame; /**< IN: Input is progressive (deinterlace_mode will be ignored) */ int second_field; /**< IN: Output the second field (ignored if deinterlace mode is Weave) */ int top_field_first; /**< IN: Input frame is top field first (1st field is top, 2nd field is bottom) */ int unpaired_field; /**< IN: Input only contains one field (2nd field is invalid) */ // The fields below are used for raw YUV input unsigned int reserved_flags; /**< Reserved for future use (set to zero) */ unsigned int reserved_zero; /**< Reserved (set to zero) */ unsigned long long raw_input_dptr; /**< IN: Input CUdeviceptr for raw YUV extensions */ unsigned int raw_input_pitch; /**< IN: pitch in bytes of raw YUV input (should be aligned appropriately) */ unsigned int raw_input_format; /**< IN: Input YUV format (cudaVideoCodec_enum) */ unsigned long long raw_output_dptr; /**< IN: Output CUdeviceptr for raw YUV extensions */ unsigned int raw_output_pitch; /**< IN: pitch in bytes of raw YUV output (should be aligned appropriately) */ unsigned int Reserved1; /**< Reserved for future use (set to zero) */ CUstream output_stream; /**< IN: stream object used by cuvidMapVideoFrame */ unsigned int Reserved[46]; /**< Reserved for future use (set to zero) */ unsigned long long *histogram_dptr; /**< OUT: Output CUdeviceptr for histogram extensions */ void *Reserved2[1]; /**< Reserved for future use (set to zero) */ } CUVIDPROCPARAMS; /*********************************************************************************************************/ //! \struct CUVIDGETDECODESTATUS //! Struct for reporting decode status. //! This structure is used in cuvidGetDecodeStatus API. /*********************************************************************************************************/ typedef struct _CUVIDGETDECODESTATUS { cuvidDecodeStatus decodeStatus; unsigned int reserved[31]; void *pReserved[8]; } CUVIDGETDECODESTATUS; /****************************************************/ //! \struct CUVIDRECONFIGUREDECODERINFO //! Struct for decoder reset //! This structure is used in cuvidReconfigureDecoder() API /****************************************************/ typedef struct _CUVIDRECONFIGUREDECODERINFO { unsigned int ulWidth; /**< IN: Coded sequence width in pixels, MUST be < = ulMaxWidth defined at CUVIDDECODECREATEINFO */ unsigned int ulHeight; /**< IN: Coded sequence height in pixels, MUST be < = ulMaxHeight defined at CUVIDDECODECREATEINFO */ unsigned int ulTargetWidth; /**< IN: Post processed output width */ unsigned int ulTargetHeight; /**< IN: Post Processed output height */ unsigned int ulNumDecodeSurfaces; /**< IN: Maximum number of internal decode surfaces */ unsigned int reserved1[12]; /**< Reserved for future use. Set to Zero */ /** * IN: Area of frame to be displayed. Use-case : Source Cropping */ struct { short left; short top; short right; short bottom; } display_area; /** * IN: Target Rectangle in the OutputFrame. Use-case : Aspect ratio Conversion */ struct { short left; short top; short right; short bottom; } target_rect; unsigned int reserved2[11]; /**< Reserved for future use. Set to Zero */ } CUVIDRECONFIGUREDECODERINFO; /***********************************************************************************************************/ //! VIDEO_DECODER //! //! In order to minimize decode latencies, there should be always at least 2 pictures in the decode //! queue at any time, in order to make sure that all decode engines are always busy. //! //! Overall data flow: //! - cuvidGetDecoderCaps(...) //! - cuvidCreateDecoder(...) //! - For each picture: //! + cuvidDecodePicture(N) //! + cuvidMapVideoFrame(N-4) //! + do some processing in cuda //! + cuvidUnmapVideoFrame(N-4) //! + cuvidDecodePicture(N+1) //! + cuvidMapVideoFrame(N-3) //! + ... //! - cuvidDestroyDecoder(...) //! //! NOTE: //! - When the cuda context is created from a D3D device, the D3D device must also be created //! with the D3DCREATE_MULTITHREADED flag. //! - There is a limit to how many pictures can be mapped simultaneously (ulNumOutputSurfaces) //! - cuvidDecodePicture may block the calling thread if there are too many pictures pending //! in the decode queue /***********************************************************************************************************/ /**********************************************************************************************************************/ //! \fn CUresult CUDAAPI cuvidGetDecoderCaps(CUVIDDECODECAPS *pdc) //! Queries decode capabilities of NVDEC-HW based on CodecType, ChromaFormat and BitDepthMinus8 parameters. //! 1. Application fills IN parameters CodecType, ChromaFormat and BitDepthMinus8 of CUVIDDECODECAPS structure //! 2. On calling cuvidGetDecoderCaps, driver fills OUT parameters if the IN parameters are supported //! If IN parameters passed to the driver are not supported by NVDEC-HW, then all OUT params are set to 0. //! E.g. on Geforce GTX 960: //! App fills - eCodecType = cudaVideoCodec_H264; eChromaFormat = cudaVideoChromaFormat_420; nBitDepthMinus8 = 0; //! Given IN parameters are supported, hence driver fills: bIsSupported = 1; nMinWidth = 48; nMinHeight = 16; //! nMaxWidth = 4096; nMaxHeight = 4096; nMaxMBCount = 65536; //! CodedWidth*CodedHeight/256 must be less than or equal to nMaxMBCount /**********************************************************************************************************************/ extern CUresult CUDAAPI cuvidGetDecoderCaps(CUVIDDECODECAPS *pdc); /*****************************************************************************************************/ //! \fn CUresult CUDAAPI cuvidCreateDecoder(CUvideodecoder *phDecoder, CUVIDDECODECREATEINFO *pdci) //! Create the decoder object based on pdci. A handle to the created decoder is returned /*****************************************************************************************************/ extern CUresult CUDAAPI cuvidCreateDecoder(CUvideodecoder *phDecoder, CUVIDDECODECREATEINFO *pdci); /*****************************************************************************************************/ //! \fn CUresult CUDAAPI cuvidDestroyDecoder(CUvideodecoder hDecoder) //! Destroy the decoder object /*****************************************************************************************************/ extern CUresult CUDAAPI cuvidDestroyDecoder(CUvideodecoder hDecoder); /*****************************************************************************************************/ //! \fn CUresult CUDAAPI cuvidDecodePicture(CUvideodecoder hDecoder, CUVIDPICPARAMS *pPicParams) //! Decode a single picture (field or frame) //! Kicks off HW decoding /*****************************************************************************************************/ extern CUresult CUDAAPI cuvidDecodePicture(CUvideodecoder hDecoder, CUVIDPICPARAMS *pPicParams); /************************************************************************************************************/ //! \fn CUresult CUDAAPI cuvidGetDecodeStatus(CUvideodecoder hDecoder, int nPicIdx); //! Get the decode status for frame corresponding to nPicIdx //! API is supported for Maxwell and above generation GPUs. //! API is currently supported for HEVC, H264 and JPEG codecs. //! API returns CUDA_ERROR_NOT_SUPPORTED error code for unsupported GPU or codec. /************************************************************************************************************/ extern CUresult CUDAAPI cuvidGetDecodeStatus(CUvideodecoder hDecoder, int nPicIdx, CUVIDGETDECODESTATUS* pDecodeStatus); /*********************************************************************************************************/ //! \fn CUresult CUDAAPI cuvidReconfigureDecoder(CUvideodecoder hDecoder, CUVIDRECONFIGUREDECODERINFO *pDecReconfigParams) //! Used to reuse single decoder for multiple clips. Currently supports resolution change, resize params, display area //! params, target area params change for same codec. Must be called during CUVIDPARSERPARAMS::pfnSequenceCallback /*********************************************************************************************************/ extern CUresult CUDAAPI cuvidReconfigureDecoder(CUvideodecoder hDecoder, CUVIDRECONFIGUREDECODERINFO *pDecReconfigParams); #if !defined(__CUVID_DEVPTR64) || defined(__CUVID_INTERNAL) /************************************************************************************************************************/ //! \fn CUresult CUDAAPI cuvidMapVideoFrame(CUvideodecoder hDecoder, int nPicIdx, unsigned int *pDevPtr, //! unsigned int *pPitch, CUVIDPROCPARAMS *pVPP); //! Post-process and map video frame corresponding to nPicIdx for use in cuda. Returns cuda device pointer and associated //! pitch of the video frame /************************************************************************************************************************/ extern CUresult CUDAAPI cuvidMapVideoFrame(CUvideodecoder hDecoder, int nPicIdx, unsigned int *pDevPtr, unsigned int *pPitch, CUVIDPROCPARAMS *pVPP); /*****************************************************************************************************/ //! \fn CUresult CUDAAPI cuvidUnmapVideoFrame(CUvideodecoder hDecoder, unsigned int DevPtr) //! Unmap a previously mapped video frame /*****************************************************************************************************/ extern CUresult CUDAAPI cuvidUnmapVideoFrame(CUvideodecoder hDecoder, unsigned int DevPtr); #endif #if defined(_WIN64) || defined(__LP64__) || defined(__x86_64) || defined(AMD64) || defined(_M_AMD64) /****************************************************************************************************************************/ //! \fn CUresult CUDAAPI cuvidMapVideoFrame64(CUvideodecoder hDecoder, int nPicIdx, unsigned long long *pDevPtr, //! unsigned int * pPitch, CUVIDPROCPARAMS *pVPP); //! Post-process and map video frame corresponding to nPicIdx for use in cuda. Returns cuda device pointer and associated //! pitch of the video frame /****************************************************************************************************************************/ extern CUresult CUDAAPI cuvidMapVideoFrame64(CUvideodecoder hDecoder, int nPicIdx, unsigned long long *pDevPtr, unsigned int *pPitch, CUVIDPROCPARAMS *pVPP); /**************************************************************************************************/ //! \fn CUresult CUDAAPI cuvidUnmapVideoFrame64(CUvideodecoder hDecoder, unsigned long long DevPtr); //! Unmap a previously mapped video frame /**************************************************************************************************/ extern CUresult CUDAAPI cuvidUnmapVideoFrame64(CUvideodecoder hDecoder, unsigned long long DevPtr); #if defined(__CUVID_DEVPTR64) && !defined(__CUVID_INTERNAL) #define cuvidMapVideoFrame cuvidMapVideoFrame64 #define cuvidUnmapVideoFrame cuvidUnmapVideoFrame64 #endif #endif /********************************************************************************************************************/ //! //! Context-locking: to facilitate multi-threaded implementations, the following 4 functions //! provide a simple mutex-style host synchronization. If a non-NULL context is specified //! in CUVIDDECODECREATEINFO, the codec library will acquire the mutex associated with the given //! context before making any cuda calls. //! A multi-threaded application could create a lock associated with a context handle so that //! multiple threads can safely share the same cuda context: //! - use cuCtxPopCurrent immediately after context creation in order to create a 'floating' context //! that can be passed to cuvidCtxLockCreate. //! - When using a floating context, all cuda calls should only be made within a cuvidCtxLock/cuvidCtxUnlock section. //! //! NOTE: This is a safer alternative to cuCtxPushCurrent and cuCtxPopCurrent, and is not related to video //! decoder in any way (implemented as a critical section associated with cuCtx{Push|Pop}Current calls). /********************************************************************************************************************/ /********************************************************************************************************************/ //! \fn CUresult CUDAAPI cuvidCtxLockCreate(CUvideoctxlock *pLock, CUcontext ctx) //! This API is used to create CtxLock object /********************************************************************************************************************/ extern CUresult CUDAAPI cuvidCtxLockCreate(CUvideoctxlock *pLock, CUcontext ctx); /********************************************************************************************************************/ //! \fn CUresult CUDAAPI cuvidCtxLockDestroy(CUvideoctxlock lck) //! This API is used to free CtxLock object /********************************************************************************************************************/ extern CUresult CUDAAPI cuvidCtxLockDestroy(CUvideoctxlock lck); /********************************************************************************************************************/ //! \fn CUresult CUDAAPI cuvidCtxLock(CUvideoctxlock lck, unsigned int reserved_flags) //! This API is used to acquire ctxlock /********************************************************************************************************************/ extern CUresult CUDAAPI cuvidCtxLock(CUvideoctxlock lck, unsigned int reserved_flags); /********************************************************************************************************************/ //! \fn CUresult CUDAAPI cuvidCtxUnlock(CUvideoctxlock lck, unsigned int reserved_flags) //! This API is used to release ctxlock /********************************************************************************************************************/ extern CUresult CUDAAPI cuvidCtxUnlock(CUvideoctxlock lck, unsigned int reserved_flags); /**********************************************************************************************/ #if defined(__cplusplus) } // Auto-lock helper for C++ applications class CCtxAutoLock { private: CUvideoctxlock m_ctx; public: CCtxAutoLock(CUvideoctxlock ctx):m_ctx(ctx) { cuvidCtxLock(m_ctx,0); } ~CCtxAutoLock() { cuvidCtxUnlock(m_ctx,0); } }; #endif /* __cplusplus */ #endif // __CUDA_VIDEO_H__