|
|
|
@@ -43,6 +43,20 @@ typedef struct CuvidContext |
|
|
|
char *cu_gpu; |
|
|
|
int nb_surfaces; |
|
|
|
int drop_second_field; |
|
|
|
char *crop_expr; |
|
|
|
char *resize_expr; |
|
|
|
|
|
|
|
struct { |
|
|
|
int left; |
|
|
|
int top; |
|
|
|
int right; |
|
|
|
int bottom; |
|
|
|
} crop; |
|
|
|
|
|
|
|
struct { |
|
|
|
int width; |
|
|
|
int height; |
|
|
|
} resize; |
|
|
|
|
|
|
|
AVBufferRef *hwdevice; |
|
|
|
AVBufferRef *hwframe; |
|
|
|
@@ -107,17 +121,46 @@ static int CUDAAPI cuvid_handle_video_sequence(void *opaque, CUVIDEOFORMAT* form |
|
|
|
CUVIDDECODECREATEINFO cuinfo; |
|
|
|
int surface_fmt; |
|
|
|
|
|
|
|
int old_width = avctx->width; |
|
|
|
int old_height = avctx->height; |
|
|
|
|
|
|
|
enum AVPixelFormat pix_fmts[3] = { AV_PIX_FMT_CUDA, |
|
|
|
AV_PIX_FMT_NONE, // Will be updated below |
|
|
|
AV_PIX_FMT_NONE }; |
|
|
|
|
|
|
|
av_log(avctx, AV_LOG_TRACE, "pfnSequenceCallback, progressive_sequence=%d\n", format->progressive_sequence); |
|
|
|
|
|
|
|
memset(&cuinfo, 0, sizeof(cuinfo)); |
|
|
|
|
|
|
|
ctx->internal_error = 0; |
|
|
|
|
|
|
|
avctx->coded_width = cuinfo.ulWidth = format->coded_width; |
|
|
|
avctx->coded_height = cuinfo.ulHeight = format->coded_height; |
|
|
|
|
|
|
|
// apply cropping |
|
|
|
cuinfo.display_area.left = format->display_area.left + ctx->crop.left; |
|
|
|
cuinfo.display_area.top = format->display_area.top + ctx->crop.top; |
|
|
|
cuinfo.display_area.right = format->display_area.right - ctx->crop.right; |
|
|
|
cuinfo.display_area.bottom = format->display_area.bottom - ctx->crop.bottom; |
|
|
|
|
|
|
|
// width and height need to be set before calling ff_get_format |
|
|
|
avctx->width = format->display_area.right; |
|
|
|
avctx->height = format->display_area.bottom; |
|
|
|
if (ctx->resize_expr) { |
|
|
|
avctx->width = ctx->resize.width; |
|
|
|
avctx->height = ctx->resize.height; |
|
|
|
} else { |
|
|
|
avctx->width = cuinfo.display_area.right - cuinfo.display_area.left; |
|
|
|
avctx->height = cuinfo.display_area.bottom - cuinfo.display_area.top; |
|
|
|
} |
|
|
|
|
|
|
|
// target width/height need to be multiples of two |
|
|
|
cuinfo.ulTargetWidth = avctx->width = (avctx->width + 1) & ~1; |
|
|
|
cuinfo.ulTargetHeight = avctx->height = (avctx->height + 1) & ~1; |
|
|
|
|
|
|
|
// aspect ratio conversion, 1:1, depends on scaled resolution |
|
|
|
cuinfo.target_rect.left = 0; |
|
|
|
cuinfo.target_rect.top = 0; |
|
|
|
cuinfo.target_rect.right = cuinfo.ulTargetWidth; |
|
|
|
cuinfo.target_rect.bottom = cuinfo.ulTargetHeight; |
|
|
|
|
|
|
|
switch (format->bit_depth_luma_minus8) { |
|
|
|
case 0: // 8-bit |
|
|
|
@@ -195,6 +238,8 @@ static int CUDAAPI cuvid_handle_video_sequence(void *opaque, CUVIDEOFORMAT* form |
|
|
|
if (ctx->cudecoder |
|
|
|
&& avctx->coded_width == format->coded_width |
|
|
|
&& avctx->coded_height == format->coded_height |
|
|
|
&& avctx->width == old_width |
|
|
|
&& avctx->height == old_height |
|
|
|
&& ctx->chroma_format == format->chroma_format |
|
|
|
&& ctx->codec_type == format->codec) |
|
|
|
return 1; |
|
|
|
@@ -228,13 +273,8 @@ static int CUDAAPI cuvid_handle_video_sequence(void *opaque, CUVIDEOFORMAT* form |
|
|
|
return 0; |
|
|
|
} |
|
|
|
|
|
|
|
avctx->coded_width = format->coded_width; |
|
|
|
avctx->coded_height = format->coded_height; |
|
|
|
|
|
|
|
ctx->chroma_format = format->chroma_format; |
|
|
|
|
|
|
|
memset(&cuinfo, 0, sizeof(cuinfo)); |
|
|
|
|
|
|
|
cuinfo.CodecType = ctx->codec_type = format->codec; |
|
|
|
cuinfo.ChromaFormat = format->chroma_format; |
|
|
|
|
|
|
|
@@ -252,16 +292,6 @@ static int CUDAAPI cuvid_handle_video_sequence(void *opaque, CUVIDEOFORMAT* form |
|
|
|
return 0; |
|
|
|
} |
|
|
|
|
|
|
|
cuinfo.ulWidth = avctx->coded_width; |
|
|
|
cuinfo.ulHeight = avctx->coded_height; |
|
|
|
cuinfo.ulTargetWidth = cuinfo.ulWidth; |
|
|
|
cuinfo.ulTargetHeight = cuinfo.ulHeight; |
|
|
|
|
|
|
|
cuinfo.target_rect.left = 0; |
|
|
|
cuinfo.target_rect.top = 0; |
|
|
|
cuinfo.target_rect.right = cuinfo.ulWidth; |
|
|
|
cuinfo.target_rect.bottom = cuinfo.ulHeight; |
|
|
|
|
|
|
|
cuinfo.ulNumDecodeSurfaces = ctx->nb_surfaces; |
|
|
|
cuinfo.ulNumOutputSurfaces = 1; |
|
|
|
cuinfo.ulCreationFlags = cudaVideoCreate_PreferCUVID; |
|
|
|
@@ -486,7 +516,7 @@ static int cuvid_output_frame(AVCodecContext *avctx, AVFrame *frame) |
|
|
|
if (ret < 0) |
|
|
|
goto error; |
|
|
|
|
|
|
|
offset += avctx->coded_height; |
|
|
|
offset += avctx->height; |
|
|
|
} |
|
|
|
} else if (avctx->pix_fmt == AV_PIX_FMT_NV12 || |
|
|
|
avctx->pix_fmt == AV_PIX_FMT_P010 || |
|
|
|
@@ -502,7 +532,7 @@ static int cuvid_output_frame(AVCodecContext *avctx, AVFrame *frame) |
|
|
|
tmp_frame->hw_frames_ctx = av_buffer_ref(ctx->hwframe); |
|
|
|
tmp_frame->data[0] = (uint8_t*)mapped_frame; |
|
|
|
tmp_frame->linesize[0] = pitch; |
|
|
|
tmp_frame->data[1] = (uint8_t*)(mapped_frame + avctx->coded_height * pitch); |
|
|
|
tmp_frame->data[1] = (uint8_t*)(mapped_frame + avctx->height * pitch); |
|
|
|
tmp_frame->linesize[1] = pitch; |
|
|
|
tmp_frame->width = avctx->width; |
|
|
|
tmp_frame->height = avctx->height; |
|
|
|
@@ -708,6 +738,21 @@ static av_cold int cuvid_decode_init(AVCodecContext *avctx) |
|
|
|
} |
|
|
|
avctx->pix_fmt = ret; |
|
|
|
|
|
|
|
if (ctx->resize_expr && sscanf(ctx->resize_expr, "%dx%d", |
|
|
|
&ctx->resize.width, &ctx->resize.height) != 2) { |
|
|
|
av_log(avctx, AV_LOG_ERROR, "Invalid resize expressions\n"); |
|
|
|
ret = AVERROR(EINVAL); |
|
|
|
goto error; |
|
|
|
} |
|
|
|
|
|
|
|
if (ctx->crop_expr && sscanf(ctx->crop_expr, "%dx%dx%dx%d", |
|
|
|
&ctx->crop.top, &ctx->crop.bottom, |
|
|
|
&ctx->crop.left, &ctx->crop.right) != 4) { |
|
|
|
av_log(avctx, AV_LOG_ERROR, "Invalid cropping expressions\n"); |
|
|
|
ret = AVERROR(EINVAL); |
|
|
|
goto error; |
|
|
|
} |
|
|
|
|
|
|
|
ret = cuvid_load_functions(&ctx->cvdl); |
|
|
|
if (ret < 0) { |
|
|
|
av_log(avctx, AV_LOG_ERROR, "Failed loading nvcuvid.\n"); |
|
|
|
@@ -953,6 +998,8 @@ static const AVOption options[] = { |
|
|
|
{ "gpu", "GPU to be used for decoding", OFFSET(cu_gpu), AV_OPT_TYPE_STRING, { .str = NULL }, 0, 0, VD }, |
|
|
|
{ "surfaces", "Maximum surfaces to be used for decoding", OFFSET(nb_surfaces), AV_OPT_TYPE_INT, { .i64 = 25 }, 0, INT_MAX, VD }, |
|
|
|
{ "drop_second_field", "Drop second field when deinterlacing", OFFSET(drop_second_field), AV_OPT_TYPE_BOOL, { .i64 = 0 }, 0, 1, VD }, |
|
|
|
{ "crop", "Crop (top)x(bottom)x(left)x(right)", OFFSET(crop_expr), AV_OPT_TYPE_STRING, { .str = NULL }, 0, 0, VD }, |
|
|
|
{ "resize", "Resize (width)x(height)", OFFSET(resize_expr), AV_OPT_TYPE_STRING, { .str = NULL }, 0, 0, VD }, |
|
|
|
{ NULL } |
|
|
|
}; |
|
|
|
|
|
|
|
|