summaryrefslogtreecommitdiff
path: root/libavcodec/nvdec_vp9.c
diff options
context:
space:
mode:
Diffstat (limited to 'libavcodec/nvdec_vp9.c')
-rw-r--r--libavcodec/nvdec_vp9.c184
1 files changed, 184 insertions, 0 deletions
diff --git a/libavcodec/nvdec_vp9.c b/libavcodec/nvdec_vp9.c
new file mode 100644
index 0000000000..a76bcf9943
--- /dev/null
+++ b/libavcodec/nvdec_vp9.c
@@ -0,0 +1,184 @@
+/*
+ * VP9 HW decode acceleration through NVDEC
+ *
+ * Copyright (c) 2016 Timo Rothenpieler
+ *
+ * This file is part of FFmpeg.
+ *
+ * FFmpeg is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Lesser General Public
+ * License as published by the Free Software Foundation; either
+ * version 2.1 of the License, or (at your option) any later version.
+ *
+ * FFmpeg is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ * Lesser General Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public
+ * License along with FFmpeg; if not, write to the Free Software
+ * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
+ */
+
+#include "libavutil/pixdesc.h"
+
+#include "avcodec.h"
+#include "nvdec.h"
+#include "decode.h"
+#include "internal.h"
+#include "vp9shared.h"
+
+static int nvdec_vp9_start_frame(AVCodecContext *avctx, const uint8_t *buffer, uint32_t size)
+{
+ VP9SharedContext *h = avctx->priv_data;
+ const AVPixFmtDescriptor *pixdesc = av_pix_fmt_desc_get(avctx->sw_pix_fmt);
+
+ NVDECContext *ctx = avctx->internal->hwaccel_priv_data;
+ CUVIDPICPARAMS *pp = &ctx->pic_params;
+ CUVIDVP9PICPARAMS *ppc = &pp->CodecSpecific.vp9;
+ FrameDecodeData *fdd;
+ NVDECFrame *cf;
+ AVFrame *cur_frame = h->frames[CUR_FRAME].tf.f;
+
+ int ret, i;
+
+ ret = ff_nvdec_start_frame(avctx, cur_frame);
+ if (ret < 0)
+ return ret;
+
+ fdd = (FrameDecodeData*)cur_frame->private_ref->data;
+ cf = (NVDECFrame*)fdd->hwaccel_priv;
+
+ *pp = (CUVIDPICPARAMS) {
+ .PicWidthInMbs = (cur_frame->width + 15) / 16,
+ .FrameHeightInMbs = (cur_frame->height + 15) / 16,
+ .CurrPicIdx = cf->idx,
+
+ .CodecSpecific.vp9 = {
+ .width = cur_frame->width,
+ .height = cur_frame->height,
+
+ .LastRefIdx = ff_nvdec_get_ref_idx(h->refs[h->h.refidx[0]].f),
+ .GoldenRefIdx = ff_nvdec_get_ref_idx(h->refs[h->h.refidx[1]].f),
+ .AltRefIdx = ff_nvdec_get_ref_idx(h->refs[h->h.refidx[2]].f),
+
+ .profile = h->h.profile,
+ .frameContextIdx = h->h.framectxid,
+ .frameType = !h->h.keyframe,
+ .showFrame = !h->h.invisible,
+ .errorResilient = h->h.errorres,
+ .frameParallelDecoding = h->h.parallelmode,
+ .subSamplingX = pixdesc->log2_chroma_w,
+ .subSamplingY = pixdesc->log2_chroma_h,
+ .intraOnly = h->h.intraonly,
+ .allow_high_precision_mv = h->h.keyframe ? 0 : h->h.highprecisionmvs,
+ .refreshEntropyProbs = h->h.refreshctx,
+
+ .bitDepthMinus8Luma = pixdesc->comp[0].depth - 8,
+ .bitDepthMinus8Chroma = pixdesc->comp[1].depth - 8,
+
+ .loopFilterLevel = h->h.filter.level,
+ .loopFilterSharpness = h->h.filter.sharpness,
+ .modeRefLfEnabled = h->h.lf_delta.enabled,
+
+ .log2_tile_columns = h->h.tiling.log2_tile_cols,
+ .log2_tile_rows = h->h.tiling.log2_tile_rows,
+
+ .segmentEnabled = h->h.segmentation.enabled,
+ .segmentMapUpdate = h->h.segmentation.update_map,
+ .segmentMapTemporalUpdate = h->h.segmentation.temporal,
+ .segmentFeatureMode = h->h.segmentation.absolute_vals,
+
+ .qpYAc = h->h.yac_qi,
+ .qpYDc = h->h.ydc_qdelta,
+ .qpChDc = h->h.uvdc_qdelta,
+ .qpChAc = h->h.uvac_qdelta,
+
+ .resetFrameContext = h->h.resetctx,
+ .mcomp_filter_type = h->h.filtermode ^ (h->h.filtermode <= 1),
+
+ .frameTagSize = h->h.uncompressed_header_size,
+ .offsetToDctParts = h->h.compressed_header_size,
+
+ .refFrameSignBias[0] = 0,
+ }
+ };
+
+ for (i = 0; i < 2; i++)
+ ppc->mbModeLfDelta[i] = h->h.lf_delta.mode[i];
+
+ for (i = 0; i < 4; i++)
+ ppc->mbRefLfDelta[i] = h->h.lf_delta.ref[i];
+
+ for (i = 0; i < 7; i++)
+ ppc->mb_segment_tree_probs[i] = h->h.segmentation.prob[i];
+
+ for (i = 0; i < 3; i++) {
+ ppc->activeRefIdx[i] = h->h.refidx[i];
+ ppc->segment_pred_probs[i] = h->h.segmentation.pred_prob[i];
+ ppc->refFrameSignBias[i + 1] = h->h.signbias[i];
+ }
+
+ for (i = 0; i < 8; i++) {
+ ppc->segmentFeatureEnable[i][0] = h->h.segmentation.feat[i].q_enabled;
+ ppc->segmentFeatureEnable[i][1] = h->h.segmentation.feat[i].lf_enabled;
+ ppc->segmentFeatureEnable[i][2] = h->h.segmentation.feat[i].ref_enabled;
+ ppc->segmentFeatureEnable[i][3] = h->h.segmentation.feat[i].skip_enabled;
+
+ ppc->segmentFeatureData[i][0] = h->h.segmentation.feat[i].q_val;
+ ppc->segmentFeatureData[i][1] = h->h.segmentation.feat[i].lf_val;
+ ppc->segmentFeatureData[i][2] = h->h.segmentation.feat[i].ref_val;
+ ppc->segmentFeatureData[i][3] = 0;
+ }
+
+ switch (avctx->colorspace) {
+ default:
+ case AVCOL_SPC_UNSPECIFIED:
+ ppc->colorSpace = 0;
+ break;
+ case AVCOL_SPC_BT470BG:
+ ppc->colorSpace = 1;
+ break;
+ case AVCOL_SPC_BT709:
+ ppc->colorSpace = 2;
+ break;
+ case AVCOL_SPC_SMPTE170M:
+ ppc->colorSpace = 3;
+ break;
+ case AVCOL_SPC_SMPTE240M:
+ ppc->colorSpace = 4;
+ break;
+ case AVCOL_SPC_BT2020_NCL:
+ ppc->colorSpace = 5;
+ break;
+ case AVCOL_SPC_RESERVED:
+ ppc->colorSpace = 6;
+ break;
+ case AVCOL_SPC_RGB:
+ ppc->colorSpace = 7;
+ break;
+ }
+
+ return 0;
+}
+
+static int nvdec_vp9_frame_params(AVCodecContext *avctx,
+ AVBufferRef *hw_frames_ctx)
+{
+ // VP9 uses a fixed size pool of 8 possible reference frames
+ return ff_nvdec_frame_params(avctx, hw_frames_ctx, 8, 0);
+}
+
+const AVHWAccel ff_vp9_nvdec_hwaccel = {
+ .name = "vp9_nvdec",
+ .type = AVMEDIA_TYPE_VIDEO,
+ .id = AV_CODEC_ID_VP9,
+ .pix_fmt = AV_PIX_FMT_CUDA,
+ .start_frame = nvdec_vp9_start_frame,
+ .end_frame = ff_nvdec_simple_end_frame,
+ .decode_slice = ff_nvdec_simple_decode_slice,
+ .frame_params = nvdec_vp9_frame_params,
+ .init = ff_nvdec_decode_init,
+ .uninit = ff_nvdec_decode_uninit,
+ .priv_data_size = sizeof(NVDECContext),
+};