Permalink
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Showing
with
234 additions
and 1 deletion.
- +2 −0 configure
- +1 −0 libavcodec/Makefile
- +1 −0 libavcodec/allcodecs.c
- +8 −0 libavcodec/cuviddec.c
- +212 −0 libavcodec/nvdec_vp9.c
- +10 −1 libavcodec/vp9.c
| @@ -0,0 +1,212 @@ | ||
| /* | ||
| * VP9 HW decode acceleration through NVDEC | ||
| * | ||
| * Copyright (c) 2016 Timo Rothenpieler | ||
| * | ||
| * This file is part of FFmpeg. | ||
| * | ||
| * FFmpeg is free software; you can redistribute it and/or | ||
| * modify it under the terms of the GNU Lesser General Public | ||
| * License as published by the Free Software Foundation; either | ||
| * version 2.1 of the License, or (at your option) any later version. | ||
| * | ||
| * FFmpeg is distributed in the hope that it will be useful, | ||
| * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
| * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | ||
| * Lesser General Public License for more details. | ||
| * | ||
| * You should have received a copy of the GNU Lesser General Public | ||
| * License along with FFmpeg; if not, write to the Free Software | ||
| * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA | ||
| */ | ||
|
|
||
| #include "libavutil/pixdesc.h" | ||
|
|
||
| #include "avcodec.h" | ||
| #include "nvdec.h" | ||
| #include "decode.h" | ||
| #include "internal.h" | ||
| #include "vp9shared.h" | ||
|
|
||
| static int nvdec_vp9_start_frame(AVCodecContext *avctx, const uint8_t *buffer, uint32_t size) | ||
| { | ||
| VP9SharedContext *h = avctx->priv_data; | ||
| const AVPixFmtDescriptor *pixdesc = av_pix_fmt_desc_get(avctx->sw_pix_fmt); | ||
|
|
||
| NVDECContext *ctx = avctx->internal->hwaccel_priv_data; | ||
| CUVIDPICPARAMS *pp = &ctx->pic_params; | ||
| CUVIDVP9PICPARAMS *ppc = &pp->CodecSpecific.vp9; | ||
| FrameDecodeData *fdd; | ||
| NVDECFrame *cf; | ||
| AVFrame *cur_frame = h->frames[CUR_FRAME].tf.f; | ||
|
|
||
| int ret, i; | ||
|
|
||
| ret = ff_nvdec_start_frame(avctx, cur_frame); | ||
| if (ret < 0) | ||
| return ret; | ||
|
|
||
| fdd = (FrameDecodeData*)cur_frame->private_ref->data; | ||
| cf = (NVDECFrame*)fdd->hwaccel_priv; | ||
|
|
||
| *pp = (CUVIDPICPARAMS) { | ||
| .PicWidthInMbs = cur_frame->width / 16, | ||
| .FrameHeightInMbs = cur_frame->height / 16, | ||
| .CurrPicIdx = cf->idx, | ||
|
|
||
| .CodecSpecific.vp9 = { | ||
| .width = cur_frame->width, | ||
| .height = cur_frame->height, | ||
|
|
||
| .LastRefIdx = h->h.refidx[0], | ||
| .GoldenRefIdx = h->h.refidx[1], | ||
| .AltRefIdx = h->h.refidx[2], | ||
|
|
||
| .profile = h->h.profile, | ||
| .frameContextIdx = h->h.framectxid, | ||
| .frameType = !h->h.keyframe, | ||
| .showFrame = !h->h.invisible, | ||
| .errorResilient = h->h.errorres, | ||
| .frameParallelDecoding = h->h.parallelmode, | ||
| .subSamplingX = pixdesc->log2_chroma_w, | ||
| .subSamplingY = pixdesc->log2_chroma_h, | ||
| .intraOnly = h->h.intraonly, | ||
| .allow_high_precision_mv = h->h.keyframe ? 0 : h->h.highprecisionmvs, | ||
| .refreshEntropyProbs = 0, //TODO | ||
|
|
||
| .refFrameSignBias[0] = h->h.signbias[0], | ||
| .refFrameSignBias[1] = h->h.signbias[1], | ||
| .refFrameSignBias[2] = h->h.signbias[2], | ||
| .refFrameSignBias[3] = 0, //TODO: ??? | ||
|
|
||
| .bitDepthMinus8Luma = pixdesc->comp[0].depth - 8, | ||
| .bitDepthMinus8Chroma = pixdesc->comp[1].depth - 8, | ||
|
|
||
| .loopFilterLevel = h->h.filter.level, | ||
| .loopFilterSharpness = h->h.filter.sharpness, | ||
| .modeRefLfEnabled = h->h.lf_delta.enabled, | ||
|
|
||
| .log2_tile_columns = h->h.tiling.log2_tile_cols, | ||
| .log2_tile_rows = h->h.tiling.log2_tile_rows, | ||
|
|
||
| .segmentEnabled = h->h.segmentation.enabled, | ||
| .segmentMapUpdate = h->h.segmentation.update_map, | ||
| .segmentMapTemporalUpdate = h->h.segmentation.temporal, | ||
| .segmentFeatureMode = h->h.segmentation.absolute_vals, //TODO: verify | ||
|
|
||
| // TODO: verify if needs processing | ||
| .qpYAc = h->h.yac_qi, | ||
| .qpYDc = h->h.ydc_qdelta, | ||
| .qpChDc = h->h.uvdc_qdelta, | ||
| .qpChAc = h->h.uvac_qdelta, | ||
|
|
||
| // TODO: ??? | ||
| .activeRefIdx[0] = 0, | ||
| .activeRefIdx[1] = 0, | ||
| .activeRefIdx[2] = 0, | ||
|
|
||
| .resetFrameContext = h->h.resetctx, | ||
| .mcomp_filter_type = h->h.filtermode ^ (h->h.filtermode <= 1), | ||
| .frameTagSize = 0, //TODO | ||
| .offsetToDctParts = 0, //TODO | ||
| } | ||
| }; | ||
|
|
||
| for (i = 0; i < 2; i++) | ||
| ppc->mbModeLfDelta[i] = h->h.lf_delta.mode[i]; | ||
|
|
||
| for (i = 0; i < 4; i++) | ||
| ppc->mbRefLfDelta[i] = h->h.lf_delta.ref[i]; | ||
|
|
||
| for (i = 0; i < 7; i++) | ||
| ppc->mb_segment_tree_probs[i] = h->h.segmentation.prob[i]; | ||
|
|
||
| for (i = 0; i < 3; i++) | ||
| ppc->segment_pred_probs[i] = h->h.segmentation.pred_prob[i]; | ||
|
|
||
| for (i = 0; i < 8; i++) { | ||
| ppc->segmentFeatureEnable[i][0] = h->h.segmentation.feat[i].q_enabled; | ||
| ppc->segmentFeatureEnable[i][1] = h->h.segmentation.feat[i].lf_enabled; | ||
| ppc->segmentFeatureEnable[i][2] = h->h.segmentation.feat[i].ref_enabled; | ||
| ppc->segmentFeatureEnable[i][3] = h->h.segmentation.feat[i].skip_enabled; | ||
|
|
||
| ppc->segmentFeatureData[i][0] = h->h.segmentation.feat[i].q_val; | ||
| ppc->segmentFeatureData[i][1] = h->h.segmentation.feat[i].lf_val; | ||
| ppc->segmentFeatureData[i][2] = h->h.segmentation.feat[i].ref_val; | ||
| ppc->segmentFeatureData[i][3] = 0; | ||
| } | ||
|
|
||
| switch (avctx->colorspace) { | ||
| default: | ||
| case AVCOL_SPC_UNSPECIFIED: | ||
| ppc->colorSpace = 0; | ||
| break; | ||
| case AVCOL_SPC_BT470BG: | ||
| ppc->colorSpace = 1; | ||
| break; | ||
| case AVCOL_SPC_BT709: | ||
| ppc->colorSpace = 2; | ||
| break; | ||
| case AVCOL_SPC_SMPTE170M: | ||
| ppc->colorSpace = 3; | ||
| break; | ||
| case AVCOL_SPC_SMPTE240M: | ||
| ppc->colorSpace = 4; | ||
| break; | ||
| case AVCOL_SPC_BT2020_NCL: | ||
| ppc->colorSpace = 5; | ||
| break; | ||
| case AVCOL_SPC_RESERVED: | ||
| ppc->colorSpace = 6; | ||
| break; | ||
| case AVCOL_SPC_RGB: | ||
| ppc->colorSpace = 7; | ||
| break; | ||
| } | ||
|
|
||
| return 0; | ||
| } | ||
|
|
||
| static int nvdec_vp9_decode_slice(AVCodecContext *avctx, const uint8_t *buffer, uint32_t size) | ||
| { | ||
| NVDECContext *ctx = avctx->internal->hwaccel_priv_data; | ||
| void *tmp; | ||
|
|
||
| tmp = av_fast_realloc(ctx->bitstream, &ctx->bitstream_allocated, | ||
| ctx->bitstream_len + size); | ||
| if (!tmp) | ||
| return AVERROR(ENOMEM); | ||
| ctx->bitstream = tmp; | ||
|
|
||
| tmp = av_fast_realloc(ctx->slice_offsets, &ctx->slice_offsets_allocated, | ||
| (ctx->nb_slices + 1) * sizeof(*ctx->slice_offsets)); | ||
| if (!tmp) | ||
| return AVERROR(ENOMEM); | ||
| ctx->slice_offsets = tmp; | ||
|
|
||
| memcpy(ctx->bitstream + ctx->bitstream_len, buffer, size); | ||
| ctx->slice_offsets[ctx->nb_slices] = ctx->bitstream_len; | ||
| ctx->bitstream_len += size; | ||
| ctx->nb_slices++; | ||
|
|
||
| return 0; | ||
| } | ||
|
|
||
| static int nvdec_vp9_decode_init(AVCodecContext *avctx) | ||
| { | ||
| // VP9 uses a fixed size pool of 8 possible reference frames | ||
| return ff_nvdec_decode_init(avctx, 8); | ||
| } | ||
|
|
||
| AVHWAccel ff_vp9_nvdec_hwaccel = { | ||
| .name = "vp9_nvdec", | ||
| .type = AVMEDIA_TYPE_VIDEO, | ||
| .id = AV_CODEC_ID_VP9, | ||
| .pix_fmt = AV_PIX_FMT_CUDA, | ||
| .start_frame = nvdec_vp9_start_frame, | ||
| .end_frame = ff_nvdec_end_frame, | ||
| .decode_slice = nvdec_vp9_decode_slice, | ||
| .init = nvdec_vp9_decode_init, | ||
| .uninit = ff_nvdec_decode_uninit, | ||
| .priv_data_size = sizeof(NVDECContext), | ||
| }; |