summaryrefslogtreecommitdiff
path: root/compat/cuda/dynlink_cuviddec.h
diff options
context:
space:
mode:
Diffstat (limited to 'compat/cuda/dynlink_cuviddec.h')
-rw-r--r--compat/cuda/dynlink_cuviddec.h815
1 files changed, 815 insertions, 0 deletions
diff --git a/compat/cuda/dynlink_cuviddec.h b/compat/cuda/dynlink_cuviddec.h
new file mode 100644
index 0000000000..4d237643a1
--- /dev/null
+++ b/compat/cuda/dynlink_cuviddec.h
@@ -0,0 +1,815 @@
+/*
+ * This copyright notice applies to this header file only:
+ *
+ * Copyright (c) 2010-2016 NVIDIA Corporation
+ *
+ * Permission is hereby granted, free of charge, to any person
+ * obtaining a copy of this software and associated documentation
+ * files (the "Software"), to deal in the Software without
+ * restriction, including without limitation the rights to use,
+ * copy, modify, merge, publish, distribute, sublicense, and/or sell
+ * copies of the software, and to permit persons to whom the
+ * software is furnished to do so, subject to the following
+ * conditions:
+ *
+ * The above copyright notice and this permission notice shall be
+ * included in all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
+ * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
+ * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
+ * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
+ * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
+ * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
+ * OTHER DEALINGS IN THE SOFTWARE.
+ */
+
+/**
+ * \file cuviddec.h
+ * NvCuvid API provides Video Decoding interface to NVIDIA GPU devices.
+ * \date 2015-2016
+ * This file contains constants, structure definitions and function prototypes used for decoding.
+ */
+
+#if !defined(__CUDA_VIDEO_H__)
+#define __CUDA_VIDEO_H__
+
+#if defined(__x86_64) || defined(AMD64) || defined(_M_AMD64)
+#if (CUDA_VERSION >= 3020) && (!defined(CUDA_FORCE_API_VERSION) || (CUDA_FORCE_API_VERSION >= 3020))
+#define __CUVID_DEVPTR64
+#endif
+#endif
+
+#if defined(__cplusplus)
+extern "C" {
+#endif /* __cplusplus */
+
+#if defined(__CYGWIN__)
+typedef unsigned int tcu_ulong;
+#else
+typedef unsigned long tcu_ulong;
+#endif
+
+typedef void *CUvideodecoder;
+typedef struct _CUcontextlock_st *CUvideoctxlock;
+
+/**
+ * \addtogroup VIDEO_DECODER Video Decoder
+ * @{
+ */
+
+/*!
+ * \enum cudaVideoCodec
+ * Video Codec Enums
+ */
+typedef enum cudaVideoCodec_enum {
+ cudaVideoCodec_MPEG1=0, /**< MPEG1 */
+ cudaVideoCodec_MPEG2, /**< MPEG2 */
+ cudaVideoCodec_MPEG4, /**< MPEG4 */
+ cudaVideoCodec_VC1, /**< VC1 */
+ cudaVideoCodec_H264, /**< H264 */
+ cudaVideoCodec_JPEG, /**< JPEG */
+ cudaVideoCodec_H264_SVC, /**< H264-SVC */
+ cudaVideoCodec_H264_MVC, /**< H264-MVC */
+ cudaVideoCodec_HEVC, /**< HEVC */
+ cudaVideoCodec_VP8, /**< VP8 */
+ cudaVideoCodec_VP9, /**< VP9 */
+ cudaVideoCodec_NumCodecs, /**< Max COdecs */
+ // Uncompressed YUV
+ cudaVideoCodec_YUV420 = (('I'<<24)|('Y'<<16)|('U'<<8)|('V')), /**< Y,U,V (4:2:0) */
+ cudaVideoCodec_YV12 = (('Y'<<24)|('V'<<16)|('1'<<8)|('2')), /**< Y,V,U (4:2:0) */
+ cudaVideoCodec_NV12 = (('N'<<24)|('V'<<16)|('1'<<8)|('2')), /**< Y,UV (4:2:0) */
+ cudaVideoCodec_YUYV = (('Y'<<24)|('U'<<16)|('Y'<<8)|('V')), /**< YUYV/YUY2 (4:2:2) */
+ cudaVideoCodec_UYVY = (('U'<<24)|('Y'<<16)|('V'<<8)|('Y')) /**< UYVY (4:2:2) */
+} cudaVideoCodec;
+
+/*!
+ * \enum cudaVideoSurfaceFormat
+ * Video Surface Formats Enums
+ */
+typedef enum cudaVideoSurfaceFormat_enum {
+ cudaVideoSurfaceFormat_NV12=0, /**< NV12 */
+ cudaVideoSurfaceFormat_P016=1 /**< P016 */
+} cudaVideoSurfaceFormat;
+
+/*!
+ * \enum cudaVideoDeinterlaceMode
+ * Deinterlacing Modes Enums
+ */
+typedef enum cudaVideoDeinterlaceMode_enum {
+ cudaVideoDeinterlaceMode_Weave=0, /**< Weave both fields (no deinterlacing) */
+ cudaVideoDeinterlaceMode_Bob, /**< Drop one field */
+ cudaVideoDeinterlaceMode_Adaptive /**< Adaptive deinterlacing */
+} cudaVideoDeinterlaceMode;
+
+/*!
+ * \enum cudaVideoChromaFormat
+ * Chroma Formats Enums
+ */
+typedef enum cudaVideoChromaFormat_enum {
+ cudaVideoChromaFormat_Monochrome=0, /**< MonoChrome */
+ cudaVideoChromaFormat_420, /**< 4:2:0 */
+ cudaVideoChromaFormat_422, /**< 4:2:2 */
+ cudaVideoChromaFormat_444 /**< 4:4:4 */
+} cudaVideoChromaFormat;
+
+/*!
+ * \enum cudaVideoCreateFlags
+ * Decoder Flags Enums
+ */
+typedef enum cudaVideoCreateFlags_enum {
+ cudaVideoCreate_Default = 0x00, /**< Default operation mode: use dedicated video engines */
+ cudaVideoCreate_PreferCUDA = 0x01, /**< Use a CUDA-based decoder if faster than dedicated engines (requires a valid vidLock object for multi-threading) */
+ cudaVideoCreate_PreferDXVA = 0x02, /**< Go through DXVA internally if possible (requires D3D9 interop) */
+ cudaVideoCreate_PreferCUVID = 0x04 /**< Use dedicated video engines directly */
+} cudaVideoCreateFlags;
+
+/*!
+ * \struct CUVIDDECODECREATEINFO
+ * Struct used in create decoder
+ */
+typedef struct _CUVIDDECODECREATEINFO
+{
+ tcu_ulong ulWidth; /**< Coded Sequence Width */
+ tcu_ulong ulHeight; /**< Coded Sequence Height */
+ tcu_ulong ulNumDecodeSurfaces; /**< Maximum number of internal decode surfaces */
+ cudaVideoCodec CodecType; /**< cudaVideoCodec_XXX */
+ cudaVideoChromaFormat ChromaFormat; /**< cudaVideoChromaFormat_XXX (only 4:2:0 is currently supported) */
+ tcu_ulong ulCreationFlags; /**< Decoder creation flags (cudaVideoCreateFlags_XXX) */
+ tcu_ulong bitDepthMinus8;
+ tcu_ulong Reserved1[4]; /**< Reserved for future use - set to zero */
+ /**
+ * area of the frame that should be displayed
+ */
+ struct {
+ short left;
+ short top;
+ short right;
+ short bottom;
+ } display_area;
+
+ cudaVideoSurfaceFormat OutputFormat; /**< cudaVideoSurfaceFormat_XXX */
+ cudaVideoDeinterlaceMode DeinterlaceMode; /**< cudaVideoDeinterlaceMode_XXX */
+ tcu_ulong ulTargetWidth; /**< Post-processed Output Width (Should be aligned to 2) */
+ tcu_ulong ulTargetHeight; /**< Post-processed Output Height (Should be aligbed to 2) */
+ tcu_ulong ulNumOutputSurfaces; /**< Maximum number of output surfaces simultaneously mapped */
+ CUvideoctxlock vidLock; /**< If non-NULL, context lock used for synchronizing ownership of the cuda context */
+ /**
+ * target rectangle in the output frame (for aspect ratio conversion)
+ * if a null rectangle is specified, {0,0,ulTargetWidth,ulTargetHeight} will be used
+ */
+ struct {
+ short left;
+ short top;
+ short right;
+ short bottom;
+ } target_rect;
+ tcu_ulong Reserved2[5]; /**< Reserved for future use - set to zero */
+} CUVIDDECODECREATEINFO;
+
+/*!
+ * \struct CUVIDH264DPBENTRY
+ * H.264 DPB Entry
+ */
+typedef struct _CUVIDH264DPBENTRY
+{
+ int PicIdx; /**< picture index of reference frame */
+ int FrameIdx; /**< frame_num(short-term) or LongTermFrameIdx(long-term) */
+ int is_long_term; /**< 0=short term reference, 1=long term reference */
+ int not_existing; /**< non-existing reference frame (corresponding PicIdx should be set to -1) */
+ int used_for_reference; /**< 0=unused, 1=top_field, 2=bottom_field, 3=both_fields */
+ int FieldOrderCnt[2]; /**< field order count of top and bottom fields */
+} CUVIDH264DPBENTRY;
+
+/*!
+ * \struct CUVIDH264MVCEXT
+ * H.264 MVC Picture Parameters Ext
+ */
+typedef struct _CUVIDH264MVCEXT
+{
+ int num_views_minus1;
+ int view_id;
+ unsigned char inter_view_flag;
+ unsigned char num_inter_view_refs_l0;
+ unsigned char num_inter_view_refs_l1;
+ unsigned char MVCReserved8Bits;
+ int InterViewRefsL0[16];
+ int InterViewRefsL1[16];
+} CUVIDH264MVCEXT;
+
+/*!
+ * \struct CUVIDH264SVCEXT
+ * H.264 SVC Picture Parameters Ext
+ */
+typedef struct _CUVIDH264SVCEXT
+{
+ unsigned char profile_idc;
+ unsigned char level_idc;
+ unsigned char DQId;
+ unsigned char DQIdMax;
+ unsigned char disable_inter_layer_deblocking_filter_idc;
+ unsigned char ref_layer_chroma_phase_y_plus1;
+ signed char inter_layer_slice_alpha_c0_offset_div2;
+ signed char inter_layer_slice_beta_offset_div2;
+
+ unsigned short DPBEntryValidFlag;
+ unsigned char inter_layer_deblocking_filter_control_present_flag;
+ unsigned char extended_spatial_scalability_idc;
+ unsigned char adaptive_tcoeff_level_prediction_flag;
+ unsigned char slice_header_restriction_flag;
+ unsigned char chroma_phase_x_plus1_flag;
+ unsigned char chroma_phase_y_plus1;
+
+ unsigned char tcoeff_level_prediction_flag;
+ unsigned char constrained_intra_resampling_flag;
+ unsigned char ref_layer_chroma_phase_x_plus1_flag;
+ unsigned char store_ref_base_pic_flag;
+ unsigned char Reserved8BitsA;
+ unsigned char Reserved8BitsB;
+ // For the 4 scaled_ref_layer_XX fields below,
+ // if (extended_spatial_scalability_idc == 1), SPS field, G.7.3.2.1.4, add prefix "seq_"
+ // if (extended_spatial_scalability_idc == 2), SLH field, G.7.3.3.4,
+ short scaled_ref_layer_left_offset;
+ short scaled_ref_layer_top_offset;
+ short scaled_ref_layer_right_offset;
+ short scaled_ref_layer_bottom_offset;
+ unsigned short Reserved16Bits;
+ struct _CUVIDPICPARAMS *pNextLayer; /**< Points to the picparams for the next layer to be decoded. Linked list ends at the target layer. */
+ int bRefBaseLayer; /**< whether to store ref base pic */
+} CUVIDH264SVCEXT;
+
+/*!
+ * \struct CUVIDH264PICPARAMS
+ * H.264 Picture Parameters
+ */
+typedef struct _CUVIDH264PICPARAMS
+{
+ // SPS
+ int log2_max_frame_num_minus4;
+ int pic_order_cnt_type;
+ int log2_max_pic_order_cnt_lsb_minus4;
+ int delta_pic_order_always_zero_flag;
+ int frame_mbs_only_flag;
+ int direct_8x8_inference_flag;
+ int num_ref_frames; // NOTE: shall meet level 4.1 restrictions
+ unsigned char residual_colour_transform_flag;
+ unsigned char bit_depth_luma_minus8; // Must be 0 (only 8-bit supported)
+ unsigned char bit_depth_chroma_minus8; // Must be 0 (only 8-bit supported)
+ unsigned char qpprime_y_zero_transform_bypass_flag;
+ // PPS
+ int entropy_coding_mode_flag;
+ int pic_order_present_flag;
+ int num_ref_idx_l0_active_minus1;
+ int num_ref_idx_l1_active_minus1;
+ int weighted_pred_flag;
+ int weighted_bipred_idc;
+ int pic_init_qp_minus26;
+ int deblocking_filter_control_present_flag;
+ int redundant_pic_cnt_present_flag;
+ int transform_8x8_mode_flag;
+ int MbaffFrameFlag;
+ int constrained_intra_pred_flag;
+ int chroma_qp_index_offset;
+ int second_chroma_qp_index_offset;
+ int ref_pic_flag;
+ int frame_num;
+ int CurrFieldOrderCnt[2];
+ // DPB
+ CUVIDH264DPBENTRY dpb[16]; // List of reference frames within the DPB
+ // Quantization Matrices (raster-order)
+ unsigned char WeightScale4x4[6][16];
+ unsigned char WeightScale8x8[2][64];
+ // FMO/ASO
+ unsigned char fmo_aso_enable;
+ unsigned char num_slice_groups_minus1;
+ unsigned char slice_group_map_type;
+ signed char pic_init_qs_minus26;
+ unsigned int slice_group_change_rate_minus1;
+ union
+ {
+ unsigned long long slice_group_map_addr;
+ const unsigned char *pMb2SliceGroupMap;
+ } fmo;
+ unsigned int Reserved[12];
+ // SVC/MVC
+ union
+ {
+ CUVIDH264MVCEXT mvcext;
+ CUVIDH264SVCEXT svcext;
+ } svcmvc;
+} CUVIDH264PICPARAMS;
+
+
+/*!
+ * \struct CUVIDMPEG2PICPARAMS
+ * MPEG-2 Picture Parameters
+ */
+typedef struct _CUVIDMPEG2PICPARAMS
+{
+ int ForwardRefIdx; // Picture index of forward reference (P/B-frames)
+ int BackwardRefIdx; // Picture index of backward reference (B-frames)
+ int picture_coding_type;
+ int full_pel_forward_vector;
+ int full_pel_backward_vector;
+ int f_code[2][2];
+ int intra_dc_precision;
+ int frame_pred_frame_dct;
+ int concealment_motion_vectors;
+ int q_scale_type;
+ int intra_vlc_format;
+ int alternate_scan;
+ int top_field_first;
+ // Quantization matrices (raster order)
+ unsigned char QuantMatrixIntra[64];
+ unsigned char QuantMatrixInter[64];
+} CUVIDMPEG2PICPARAMS;
+
+////////////////////////////////////////////////////////////////////////////////////////////////
+//
+// MPEG-4 Picture Parameters
+//
+
+// MPEG-4 has VOP types instead of Picture types
+#define I_VOP 0
+#define P_VOP 1
+#define B_VOP 2
+#define S_VOP 3
+
+/*!
+ * \struct CUVIDMPEG4PICPARAMS
+ * MPEG-4 Picture Parameters
+ */
+typedef struct _CUVIDMPEG4PICPARAMS
+{
+ int ForwardRefIdx; // Picture index of forward reference (P/B-frames)
+ int BackwardRefIdx; // Picture index of backward reference (B-frames)
+ // VOL
+ int video_object_layer_width;
+ int video_object_layer_height;
+ int vop_time_increment_bitcount;
+ int top_field_first;
+ int resync_marker_disable;
+ int quant_type;
+ int quarter_sample;
+ int short_video_header;
+ int divx_flags;
+ // VOP
+ int vop_coding_type;
+ int vop_coded;
+ int vop_rounding_type;
+ int alternate_vertical_scan_flag;
+ int interlaced;
+ int vop_fcode_forward;
+ int vop_fcode_backward;
+ int trd[2];
+ int trb[2];
+ // Quantization matrices (raster order)
+ unsigned char QuantMatrixIntra[64];
+ unsigned char QuantMatrixInter[64];
+ int gmc_enabled;
+} CUVIDMPEG4PICPARAMS;
+
+/*!
+ * \struct CUVIDVC1PICPARAMS
+ * VC1 Picture Parameters
+ */
+typedef struct _CUVIDVC1PICPARAMS
+{
+ int ForwardRefIdx; /**< Picture index of forward reference (P/B-frames) */
+ int BackwardRefIdx; /**< Picture index of backward reference (B-frames) */
+ int FrameWidth; /**< Actual frame width */
+ int FrameHeight; /**< Actual frame height */
+ // PICTURE
+ int intra_pic_flag; /**< Set to 1 for I,BI frames */
+ int ref_pic_flag; /**< Set to 1 for I,P frames */
+ int progressive_fcm; /**< Progressive frame */
+ // SEQUENCE
+ int profile;
+ int postprocflag;
+ int pulldown;
+ int interlace;
+ int tfcntrflag;
+ int finterpflag;
+ int psf;
+ int multires;
+ int syncmarker;
+ int rangered;
+ int maxbframes;
+ // ENTRYPOINT
+ int panscan_flag;
+ int refdist_flag;
+ int extended_mv;
+ int dquant;
+ int vstransform;
+ int loopfilter;
+ int fastuvmc;
+ int overlap;
+ int quantizer;
+ int extended_dmv;
+ int range_mapy_flag;
+ int range_mapy;
+ int range_mapuv_flag;
+ int range_mapuv;
+ int rangeredfrm; // range reduction state
+} CUVIDVC1PICPARAMS;
+
+/*!
+ * \struct CUVIDJPEGPICPARAMS
+ * JPEG Picture Parameters
+ */
+typedef struct _CUVIDJPEGPICPARAMS
+{
+ int Reserved;
+} CUVIDJPEGPICPARAMS;
+
+
+ /*!
+ * \struct CUVIDHEVCPICPARAMS
+ * HEVC Picture Parameters
+ */
+typedef struct _CUVIDHEVCPICPARAMS
+{
+ // sps
+ int pic_width_in_luma_samples;
+ int pic_height_in_luma_samples;
+ unsigned char log2_min_luma_coding_block_size_minus3;
+ unsigned char log2_diff_max_min_luma_coding_block_size;
+ unsigned char log2_min_transform_block_size_minus2;
+ unsigned char log2_diff_max_min_transform_block_size;
+ unsigned char pcm_enabled_flag;
+ unsigned char log2_min_pcm_luma_coding_block_size_minus3;
+ unsigned char log2_diff_max_min_pcm_luma_coding_block_size;
+ unsigned char pcm_sample_bit_depth_luma_minus1;
+
+ unsigned char pcm_sample_bit_depth_chroma_minus1;
+ unsigned char pcm_loop_filter_disabled_flag;
+ unsigned char strong_intra_smoothing_enabled_flag;
+ unsigned char max_transform_hierarchy_depth_intra;
+ unsigned char max_transform_hierarchy_depth_inter;
+ unsigned char amp_enabled_flag;
+ unsigned char separate_colour_plane_flag;
+ unsigned char log2_max_pic_order_cnt_lsb_minus4;
+
+ unsigned char num_short_term_ref_pic_sets;
+ unsigned char long_term_ref_pics_present_flag;
+ unsigned char num_long_term_ref_pics_sps;
+ unsigned char sps_temporal_mvp_enabled_flag;
+ unsigned char sample_adaptive_offset_enabled_flag;
+ unsigned char scaling_list_enable_flag;
+ unsigned char IrapPicFlag;
+ unsigned char IdrPicFlag;
+
+ unsigned char bit_depth_luma_minus8;
+ unsigned char bit_depth_chroma_minus8;
+ unsigned char reserved1[14];
+
+ // pps
+ unsigned char dependent_slice_segments_enabled_flag;
+ unsigned char slice_segment_header_extension_present_flag;
+ unsigned char sign_data_hiding_enabled_flag;
+ unsigned char cu_qp_delta_enabled_flag;
+ unsigned char diff_cu_qp_delta_depth;
+ signed char init_qp_minus26;
+ signed char pps_cb_qp_offset;
+ signed char pps_cr_qp_offset;
+
+ unsigned char constrained_intra_pred_flag;
+ unsigned char weighted_pred_flag;
+ unsigned char weighted_bipred_flag;
+ unsigned char transform_skip_enabled_flag;
+ unsigned char transquant_bypass_enabled_flag;
+ unsigned char entropy_coding_sync_enabled_flag;
+ unsigned char log2_parallel_merge_level_minus2;
+ unsigned char num_extra_slice_header_bits;
+
+ unsigned char loop_filter_across_tiles_enabled_flag;
+ unsigned char loop_filter_across_slices_enabled_flag;
+ unsigned char output_flag_present_flag;
+ unsigned char num_ref_idx_l0_default_active_minus1;
+ unsigned char num_ref_idx_l1_default_active_minus1;
+ unsigned char lists_modification_present_flag;
+ unsigned char cabac_init_present_flag;
+ unsigned char pps_slice_chroma_qp_offsets_present_flag;
+
+ unsigned char deblocking_filter_override_enabled_flag;
+ unsigned char pps_deblocking_filter_disabled_flag;
+ signed char pps_beta_offset_div2;
+ signed char pps_tc_offset_div2;
+ unsigned char tiles_enabled_flag;
+ unsigned char uniform_spacing_flag;
+ unsigned char num_tile_columns_minus1;
+ unsigned char num_tile_rows_minus1;
+
+ unsigned short column_width_minus1[21];
+ unsigned short row_height_minus1[21];
+ unsigned int reserved3[15];
+
+ // RefPicSets
+ int NumBitsForShortTermRPSInSlice;
+ int NumDeltaPocsOfRefRpsIdx;
+ int NumPocTotalCurr;
+ int NumPocStCurrBefore;
+ int NumPocStCurrAfter;
+ int NumPocLtCurr;
+ int CurrPicOrderCntVal;
+ int RefPicIdx[16]; // [refpic] Indices of valid reference pictures (-1 if unused for reference)
+ int PicOrderCntVal[16]; // [refpic]
+ unsigned char IsLongTerm[16]; // [refpic] 0=not a long-term reference, 1=long-term reference
+ unsigned char RefPicSetStCurrBefore[8]; // [0..NumPocStCurrBefore-1] -> refpic (0..15)
+ unsigned char RefPicSetStCurrAfter[8]; // [0..NumPocStCurrAfter-1] -> refpic (0..15)
+ unsigned char RefPicSetLtCurr[8]; // [0..NumPocLtCurr-1] -> refpic (0..15)
+ unsigned char RefPicSetInterLayer0[8];
+ unsigned char RefPicSetInterLayer1[8];
+ unsigned int reserved4[12];
+
+ // scaling lists (diag order)
+ unsigned char ScalingList4x4[6][16]; // [matrixId][i]
+ unsigned char ScalingList8x8[6][64]; // [matrixId][i]
+ unsigned char ScalingList16x16[6][64]; // [matrixId][i]
+ unsigned char ScalingList32x32[2][64]; // [matrixId][i]
+ unsigned char ScalingListDCCoeff16x16[6]; // [matrixId]
+ unsigned char ScalingListDCCoeff32x32[2]; // [matrixId]
+} CUVIDHEVCPICPARAMS;
+
+
+/*!
+ * \struct CUVIDVP8PICPARAMS
+ * VP8 Picture Parameters
+ */
+typedef struct _CUVIDVP8PICPARAMS
+{
+ int width;
+ int height;
+ unsigned int first_partition_size;
+ //Frame Indexes
+ unsigned char LastRefIdx;
+ unsigned char GoldenRefIdx;
+ unsigned char AltRefIdx;
+ union {
+ struct {
+ unsigned char frame_type : 1; /**< 0 = KEYFRAME, 1 = INTERFRAME */
+ unsigned char version : 3;
+ unsigned char show_frame : 1;
+ unsigned char update_mb_segmentation_data : 1; /**< Must be 0 if segmentation is not enabled */
+ unsigned char Reserved2Bits : 2;
+ };
+ unsigned char wFrameTagFlags;
+ } tagflags;
+ unsigned char Reserved1[4];
+ unsigned int Reserved2[3];
+} CUVIDVP8PICPARAMS;
+
+/*!
+ * \struct CUVIDVP9PICPARAMS
+ * VP9 Picture Parameters
+ */
+typedef struct _CUVIDVP9PICPARAMS
+{
+ unsigned int width;
+ unsigned int height;
+
+ //Frame Indices
+ unsigned char LastRefIdx;
+ unsigned char GoldenRefIdx;
+ unsigned char AltRefIdx;
+ unsigned char colorSpace;
+
+ unsigned short profile : 3;
+ unsigned short frameContextIdx : 2;
+ unsigned short frameType : 1;
+ unsigned short showFrame : 1;
+ unsigned short errorResilient : 1;
+ unsigned short frameParallelDecoding : 1;
+ unsigned short subSamplingX : 1;
+ unsigned short subSamplingY : 1;
+ unsigned short intraOnly : 1;
+ unsigned short allow_high_precision_mv : 1;
+ unsigned short refreshEntropyProbs : 1;
+ unsigned short reserved2Bits : 2;
+
+ unsigned short reserved16Bits;
+
+ unsigned char refFrameSignBias[4];
+
+ unsigned char bitDepthMinus8Luma;
+ unsigned char bitDepthMinus8Chroma;
+ unsigned char loopFilterLevel;
+ unsigned char loopFilterSharpness;
+
+ unsigned char modeRefLfEnabled;
+ unsigned char log2_tile_columns;
+ unsigned char log2_tile_rows;
+
+ unsigned char segmentEnabled : 1;
+ unsigned char segmentMapUpdate : 1;
+ unsigned char segmentMapTemporalUpdate : 1;
+ unsigned char segmentFeatureMode : 1;
+ unsigned char reserved4Bits : 4;
+
+
+ unsigned char segmentFeatureEnable[8][4];
+ short segmentFeatureData[8][4];
+ unsigned char mb_segment_tree_probs[7];
+ unsigned char segment_pred_probs[3];
+ unsigned char reservedSegment16Bits[2];
+
+ int qpYAc;
+ int qpYDc;
+ int qpChDc;
+ int qpChAc;
+
+ unsigned int activeRefIdx[3];
+ unsigned int resetFrameContext;
+ unsigned int mcomp_filter_type;
+ unsigned int mbRefLfDelta[4];
+ unsigned int mbModeLfDelta[2];
+ unsigned int frameTagSize;
+ unsigned int offsetToDctParts;
+ unsigned int reserved128Bits[4];
+
+} CUVIDVP9PICPARAMS;
+
+
+/*!
+ * \struct CUVIDPICPARAMS
+ * Picture Parameters for Decoding
+ */
+typedef struct _CUVIDPICPARAMS
+{
+ int PicWidthInMbs; /**< Coded Frame Size */
+ int FrameHeightInMbs; /**< Coded Frame Height */
+ int CurrPicIdx; /**< Output index of the current picture */
+ int field_pic_flag; /**< 0=frame picture, 1=field picture */
+ int bottom_field_flag; /**< 0=top field, 1=bottom field (ignored if field_pic_flag=0) */
+ int second_field; /**< Second field of a complementary field pair */
+ // Bitstream data
+ unsigned int nBitstreamDataLen; /**< Number of bytes in bitstream data buffer */
+ const unsigned char *pBitstreamData; /**< Ptr to bitstream data for this picture (slice-layer) */
+ unsigned int nNumSlices; /**< Number of slices in this picture */
+ const unsigned int *pSliceDataOffsets; /**< nNumSlices entries, contains offset of each slice within the bitstream data buffer */
+ int ref_pic_flag; /**< This picture is a reference picture */
+ int intra_pic_flag; /**< This picture is entirely intra coded */
+ unsigned int Reserved[30]; /**< Reserved for future use */
+ // Codec-specific data
+ union {
+ CUVIDMPEG2PICPARAMS mpeg2; /**< Also used for MPEG-1 */
+ CUVIDH264PICPARAMS h264;
+ CUVIDVC1PICPARAMS vc1;
+ CUVIDMPEG4PICPARAMS mpeg4;
+ CUVIDJPEGPICPARAMS jpeg;
+ CUVIDHEVCPICPARAMS hevc;
+ CUVIDVP8PICPARAMS vp8;
+ CUVIDVP9PICPARAMS vp9;
+ unsigned int CodecReserved[1024];
+ } CodecSpecific;
+} CUVIDPICPARAMS;
+
+
+/*!
+ * \struct CUVIDPROCPARAMS
+ * Picture Parameters for Postprocessing
+ */
+typedef struct _CUVIDPROCPARAMS
+{
+ int progressive_frame; /**< Input is progressive (deinterlace_mode will be ignored) */
+ int second_field; /**< Output the second field (ignored if deinterlace mode is Weave) */
+ int top_field_first; /**< Input frame is top field first (1st field is top, 2nd field is bottom) */
+ int unpaired_field; /**< Input only contains one field (2nd field is invalid) */
+ // The fields below are used for raw YUV input
+ unsigned int reserved_flags; /**< Reserved for future use (set to zero) */
+ unsigned int reserved_zero; /**< Reserved (set to zero) */
+ unsigned long long raw_input_dptr; /**< Input CUdeviceptr for raw YUV extensions */
+ unsigned int raw_input_pitch; /**< pitch in bytes of raw YUV input (should be aligned appropriately) */
+ unsigned int raw_input_format; /**< Reserved for future use (set to zero) */
+ unsigned long long raw_output_dptr; /**< Reserved for future use (set to zero) */
+ unsigned int raw_output_pitch; /**< Reserved for future use (set to zero) */
+ unsigned int Reserved[48];
+ void *Reserved3[3];
+} CUVIDPROCPARAMS;
+
+
+/**
+ *
+ * In order to minimize decode latencies, there should be always at least 2 pictures in the decode
+ * queue at any time, in order to make sure that all decode engines are always busy.
+ *
+ * Overall data flow:
+ * - cuvidCreateDecoder(...)
+ * For each picture:
+ * - cuvidDecodePicture(N)
+ * - cuvidMapVideoFrame(N-4)
+ * - do some processing in cuda
+ * - cuvidUnmapVideoFrame(N-4)
+ * - cuvidDecodePicture(N+1)
+ * - cuvidMapVideoFrame(N-3)
+ * ...
+ * - cuvidDestroyDecoder(...)
+ *
+ * NOTE:
+ * - When the cuda context is created from a D3D device, the D3D device must also be created
+ * with the D3DCREATE_MULTITHREADED flag.
+ * - There is a limit to how many pictures can be mapped simultaneously (ulNumOutputSurfaces)
+ * - cuVidDecodePicture may block the calling thread if there are too many pictures pending
+ * in the decode queue
+ */
+
+/**
+ * \fn CUresult CUDAAPI cuvidCreateDecoder(CUvideodecoder *phDecoder, CUVIDDECODECREATEINFO *pdci)
+ * Create the decoder object
+ */
+typedef CUresult CUDAAPI tcuvidCreateDecoder(CUvideodecoder *phDecoder, CUVIDDECODECREATEINFO *pdci);
+
+/**
+ * \fn CUresult CUDAAPI cuvidDestroyDecoder(CUvideodecoder hDecoder)
+ * Destroy the decoder object
+ */
+typedef CUresult CUDAAPI tcuvidDestroyDecoder(CUvideodecoder hDecoder);
+
+/**
+ * \fn CUresult CUDAAPI cuvidDecodePicture(CUvideodecoder hDecoder, CUVIDPICPARAMS *pPicParams)
+ * Decode a single picture (field or frame)
+ */
+typedef CUresult CUDAAPI tcuvidDecodePicture(CUvideodecoder hDecoder, CUVIDPICPARAMS *pPicParams);
+
+
+#if !defined(__CUVID_DEVPTR64) || defined(__CUVID_INTERNAL)
+/**
+ * \fn CUresult CUDAAPI cuvidMapVideoFrame(CUvideodecoder hDecoder, int nPicIdx, unsigned int *pDevPtr, unsigned int *pPitch, CUVIDPROCPARAMS *pVPP);
+ * Post-process and map a video frame for use in cuda
+ */
+typedef CUresult CUDAAPI tcuvidMapVideoFrame(CUvideodecoder hDecoder, int nPicIdx,
+ unsigned int *pDevPtr, unsigned int *pPitch,
+ CUVIDPROCPARAMS *pVPP);
+
+/**
+ * \fn CUresult CUDAAPI cuvidUnmapVideoFrame(CUvideodecoder hDecoder, unsigned int DevPtr)
+ * Unmap a previously mapped video frame
+ */
+typedef CUresult CUDAAPI tcuvidUnmapVideoFrame(CUvideodecoder hDecoder, unsigned int DevPtr);
+#endif
+
+#if defined(WIN64) || defined(_WIN64) || defined(__x86_64) || defined(AMD64) || defined(_M_AMD64)
+/**
+ * \fn CUresult CUDAAPI cuvidMapVideoFrame64(CUvideodecoder hDecoder, int nPicIdx, unsigned long long *pDevPtr, unsigned int *pPitch, CUVIDPROCPARAMS *pVPP);
+ * map a video frame
+ */
+typedef CUresult CUDAAPI tcuvidMapVideoFrame64(CUvideodecoder hDecoder, int nPicIdx, unsigned long long *pDevPtr,
+ unsigned int *pPitch, CUVIDPROCPARAMS *pVPP);
+
+/**
+ * \fn CUresult CUDAAPI cuvidUnmapVideoFrame64(CUvideodecoder hDecoder, unsigned long long DevPtr);
+ * Unmap a previously mapped video frame
+ */
+typedef CUresult CUDAAPI tcuvidUnmapVideoFrame64(CUvideodecoder hDecoder, unsigned long long DevPtr);
+
+#if defined(__CUVID_DEVPTR64) && !defined(__CUVID_INTERNAL)
+#define tcuvidMapVideoFrame tcuvidMapVideoFrame64
+#define tcuvidUnmapVideoFrame tcuvidUnmapVideoFrame64
+#endif
+#endif
+
+
+/**
+ *
+ * Context-locking: to facilitate multi-threaded implementations, the following 4 functions
+ * provide a simple mutex-style host synchronization. If a non-NULL context is specified
+ * in CUVIDDECODECREATEINFO, the codec library will acquire the mutex associated with the given
+ * context before making any cuda calls.
+ * A multi-threaded application could create a lock associated with a context handle so that
+ * multiple threads can safely share the same cuda context:
+ * - use cuCtxPopCurrent immediately after context creation in order to create a 'floating' context
+ * that can be passed to cuvidCtxLockCreate.
+ * - When using a floating context, all cuda calls should only be made within a cuvidCtxLock/cuvidCtxUnlock section.
+ *
+ * NOTE: This is a safer alternative to cuCtxPushCurrent and cuCtxPopCurrent, and is not related to video
+ * decoder in any way (implemented as a critical section associated with cuCtx{Push|Pop}Current calls).
+*/
+
+/**
+ * \fn CUresult CUDAAPI cuvidCtxLockCreate(CUvideoctxlock *pLock, CUcontext ctx)
+ */
+typedef CUresult CUDAAPI tcuvidCtxLockCreate(CUvideoctxlock *pLock, CUcontext ctx);
+
+/**
+ * \fn CUresult CUDAAPI cuvidCtxLockDestroy(CUvideoctxlock lck)
+ */
+typedef CUresult CUDAAPI tcuvidCtxLockDestroy(CUvideoctxlock lck);
+
+/**
+ * \fn CUresult CUDAAPI cuvidCtxLock(CUvideoctxlock lck, unsigned int reserved_flags)
+ */
+typedef CUresult CUDAAPI tcuvidCtxLock(CUvideoctxlock lck, unsigned int reserved_flags);
+
+/**
+ * \fn CUresult CUDAAPI cuvidCtxUnlock(CUvideoctxlock lck, unsigned int reserved_flags)
+ */
+typedef CUresult CUDAAPI tcuvidCtxUnlock(CUvideoctxlock lck, unsigned int reserved_flags);
+
+/** @} */ /* End VIDEO_DECODER */
+
+#if defined(__cplusplus)
+}
+#endif /* __cplusplus */
+
+#endif // __CUDA_VIDEO_H__