|
|
|
@@ -18,9 +18,8 @@ |
|
|
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
|
|
|
*/ |
|
|
|
|
|
|
|
#include <cuda.h> |
|
|
|
#include "libavutil/avassert.h" |
|
|
|
#include "libavutil/hwcontext_cuda.h" |
|
|
|
#include "libavutil/hwcontext_cuda_internal.h" |
|
|
|
#include "libavutil/cuda_check.h" |
|
|
|
#include "internal.h" |
|
|
|
#include "yadif.h" |
|
|
|
@@ -49,7 +48,7 @@ typedef struct DeintCUDAContext { |
|
|
|
#define BLOCKX 32 |
|
|
|
#define BLOCKY 16 |
|
|
|
|
|
|
|
#define CHECK_CU(x) FF_CUDA_CHECK(ctx, x) |
|
|
|
#define CHECK_CU(x) FF_CUDA_CHECK_DL(ctx, s->hwctx->internal->cuda_dl, x) |
|
|
|
|
|
|
|
static CUresult call_kernel(AVFilterContext *ctx, CUfunction func, |
|
|
|
CUdeviceptr prev, CUdeviceptr cur, CUdeviceptr next, |
|
|
|
@@ -64,6 +63,7 @@ static CUresult call_kernel(AVFilterContext *ctx, CUfunction func, |
|
|
|
int parity, int tff) |
|
|
|
{ |
|
|
|
DeintCUDAContext *s = ctx->priv; |
|
|
|
CudaFunctions *cu = s->hwctx->internal->cuda_dl; |
|
|
|
CUtexObject tex_prev = 0, tex_cur = 0, tex_next = 0; |
|
|
|
int ret; |
|
|
|
int skip_spatial_check = s->yadif.mode&2; |
|
|
|
@@ -88,32 +88,32 @@ static CUresult call_kernel(AVFilterContext *ctx, CUfunction func, |
|
|
|
}; |
|
|
|
|
|
|
|
res_desc.res.pitch2D.devPtr = (CUdeviceptr)prev; |
|
|
|
ret = CHECK_CU(cuTexObjectCreate(&tex_prev, &res_desc, &tex_desc, NULL)); |
|
|
|
ret = CHECK_CU(cu->cuTexObjectCreate(&tex_prev, &res_desc, &tex_desc, NULL)); |
|
|
|
if (ret < 0) |
|
|
|
goto exit; |
|
|
|
|
|
|
|
res_desc.res.pitch2D.devPtr = (CUdeviceptr)cur; |
|
|
|
ret = CHECK_CU(cuTexObjectCreate(&tex_cur, &res_desc, &tex_desc, NULL)); |
|
|
|
ret = CHECK_CU(cu->cuTexObjectCreate(&tex_cur, &res_desc, &tex_desc, NULL)); |
|
|
|
if (ret < 0) |
|
|
|
goto exit; |
|
|
|
|
|
|
|
res_desc.res.pitch2D.devPtr = (CUdeviceptr)next; |
|
|
|
ret = CHECK_CU(cuTexObjectCreate(&tex_next, &res_desc, &tex_desc, NULL)); |
|
|
|
ret = CHECK_CU(cu->cuTexObjectCreate(&tex_next, &res_desc, &tex_desc, NULL)); |
|
|
|
if (ret < 0) |
|
|
|
goto exit; |
|
|
|
|
|
|
|
ret = CHECK_CU(cuLaunchKernel(func, |
|
|
|
DIV_UP(dst_width, BLOCKX), DIV_UP(dst_height, BLOCKY), 1, |
|
|
|
BLOCKX, BLOCKY, 1, |
|
|
|
0, s->stream, args, NULL)); |
|
|
|
ret = CHECK_CU(cu->cuLaunchKernel(func, |
|
|
|
DIV_UP(dst_width, BLOCKX), DIV_UP(dst_height, BLOCKY), 1, |
|
|
|
BLOCKX, BLOCKY, 1, |
|
|
|
0, s->stream, args, NULL)); |
|
|
|
|
|
|
|
exit: |
|
|
|
if (tex_prev) |
|
|
|
CHECK_CU(cuTexObjectDestroy(tex_prev)); |
|
|
|
CHECK_CU(cu->cuTexObjectDestroy(tex_prev)); |
|
|
|
if (tex_cur) |
|
|
|
CHECK_CU(cuTexObjectDestroy(tex_cur)); |
|
|
|
CHECK_CU(cu->cuTexObjectDestroy(tex_cur)); |
|
|
|
if (tex_next) |
|
|
|
CHECK_CU(cuTexObjectDestroy(tex_next)); |
|
|
|
CHECK_CU(cu->cuTexObjectDestroy(tex_next)); |
|
|
|
|
|
|
|
return ret; |
|
|
|
} |
|
|
|
@@ -123,10 +123,11 @@ static void filter(AVFilterContext *ctx, AVFrame *dst, |
|
|
|
{ |
|
|
|
DeintCUDAContext *s = ctx->priv; |
|
|
|
YADIFContext *y = &s->yadif; |
|
|
|
CudaFunctions *cu = s->hwctx->internal->cuda_dl; |
|
|
|
CUcontext dummy; |
|
|
|
int i, ret; |
|
|
|
|
|
|
|
ret = CHECK_CU(cuCtxPushCurrent(s->cu_ctx)); |
|
|
|
ret = CHECK_CU(cu->cuCtxPushCurrent(s->cu_ctx)); |
|
|
|
if (ret < 0) |
|
|
|
return; |
|
|
|
|
|
|
|
@@ -179,10 +180,10 @@ static void filter(AVFilterContext *ctx, AVFrame *dst, |
|
|
|
parity, tff); |
|
|
|
} |
|
|
|
|
|
|
|
CHECK_CU(cuStreamSynchronize(s->stream)); |
|
|
|
CHECK_CU(cu->cuStreamSynchronize(s->stream)); |
|
|
|
|
|
|
|
exit: |
|
|
|
CHECK_CU(cuCtxPopCurrent(&dummy)); |
|
|
|
CHECK_CU(cu->cuCtxPopCurrent(&dummy)); |
|
|
|
return; |
|
|
|
} |
|
|
|
|
|
|
|
@@ -192,10 +193,11 @@ static av_cold void deint_cuda_uninit(AVFilterContext *ctx) |
|
|
|
DeintCUDAContext *s = ctx->priv; |
|
|
|
YADIFContext *y = &s->yadif; |
|
|
|
|
|
|
|
if (s->cu_module) { |
|
|
|
CHECK_CU(cuCtxPushCurrent(s->cu_ctx)); |
|
|
|
CHECK_CU(cuModuleUnload(s->cu_module)); |
|
|
|
CHECK_CU(cuCtxPopCurrent(&dummy)); |
|
|
|
if (s->hwctx && s->cu_module) { |
|
|
|
CudaFunctions *cu = s->hwctx->internal->cuda_dl; |
|
|
|
CHECK_CU(cu->cuCtxPushCurrent(s->cu_ctx)); |
|
|
|
CHECK_CU(cu->cuModuleUnload(s->cu_module)); |
|
|
|
CHECK_CU(cu->cuCtxPopCurrent(&dummy)); |
|
|
|
} |
|
|
|
|
|
|
|
av_frame_free(&y->prev); |
|
|
|
@@ -253,6 +255,7 @@ static int config_output(AVFilterLink *link) |
|
|
|
AVFilterContext *ctx = link->src; |
|
|
|
DeintCUDAContext *s = ctx->priv; |
|
|
|
YADIFContext *y = &s->yadif; |
|
|
|
CudaFunctions *cu; |
|
|
|
int ret = 0; |
|
|
|
CUcontext dummy; |
|
|
|
|
|
|
|
@@ -266,6 +269,7 @@ static int config_output(AVFilterLink *link) |
|
|
|
s->hwctx = ((AVHWDeviceContext*)s->device_ref->data)->hwctx; |
|
|
|
s->cu_ctx = s->hwctx->cuda_ctx; |
|
|
|
s->stream = s->hwctx->stream; |
|
|
|
cu = s->hwctx->internal->cuda_dl; |
|
|
|
|
|
|
|
link->hw_frames_ctx = av_hwframe_ctx_alloc(s->device_ref); |
|
|
|
if (!link->hw_frames_ctx) { |
|
|
|
@@ -313,32 +317,32 @@ static int config_output(AVFilterLink *link) |
|
|
|
y->csp = av_pix_fmt_desc_get(output_frames->sw_format); |
|
|
|
y->filter = filter; |
|
|
|
|
|
|
|
ret = CHECK_CU(cuCtxPushCurrent(s->cu_ctx)); |
|
|
|
ret = CHECK_CU(cu->cuCtxPushCurrent(s->cu_ctx)); |
|
|
|
if (ret < 0) |
|
|
|
goto exit; |
|
|
|
|
|
|
|
ret = CHECK_CU(cuModuleLoadData(&s->cu_module, vf_yadif_cuda_ptx)); |
|
|
|
ret = CHECK_CU(cu->cuModuleLoadData(&s->cu_module, vf_yadif_cuda_ptx)); |
|
|
|
if (ret < 0) |
|
|
|
goto exit; |
|
|
|
|
|
|
|
ret = CHECK_CU(cuModuleGetFunction(&s->cu_func_uchar, s->cu_module, "yadif_uchar")); |
|
|
|
ret = CHECK_CU(cu->cuModuleGetFunction(&s->cu_func_uchar, s->cu_module, "yadif_uchar")); |
|
|
|
if (ret < 0) |
|
|
|
goto exit; |
|
|
|
|
|
|
|
ret = CHECK_CU(cuModuleGetFunction(&s->cu_func_uchar2, s->cu_module, "yadif_uchar2")); |
|
|
|
ret = CHECK_CU(cu->cuModuleGetFunction(&s->cu_func_uchar2, s->cu_module, "yadif_uchar2")); |
|
|
|
if (ret < 0) |
|
|
|
goto exit; |
|
|
|
|
|
|
|
ret = CHECK_CU(cuModuleGetFunction(&s->cu_func_ushort, s->cu_module, "yadif_ushort")); |
|
|
|
ret = CHECK_CU(cu->cuModuleGetFunction(&s->cu_func_ushort, s->cu_module, "yadif_ushort")); |
|
|
|
if (ret < 0) |
|
|
|
goto exit; |
|
|
|
|
|
|
|
ret = CHECK_CU(cuModuleGetFunction(&s->cu_func_ushort2, s->cu_module, "yadif_ushort2")); |
|
|
|
ret = CHECK_CU(cu->cuModuleGetFunction(&s->cu_func_ushort2, s->cu_module, "yadif_ushort2")); |
|
|
|
if (ret < 0) |
|
|
|
goto exit; |
|
|
|
|
|
|
|
exit: |
|
|
|
CHECK_CU(cuCtxPopCurrent(&dummy)); |
|
|
|
CHECK_CU(cu->cuCtxPopCurrent(&dummy)); |
|
|
|
|
|
|
|
return ret; |
|
|
|
} |
|
|
|
|