|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
#include "config.h" |
|
|
|
#include "libavutil/hwcontext.h" |
|
#include "libavutil/hwcontext_cuda_internal.h" |
|
#include "libavutil/cuda_check.h" |
|
|
|
#if CONFIG_PTX_COMPRESSION |
|
#include <zlib.h> |
|
/* Granularity, in bytes, by which the PTX decompression buffer is sized and grown.
 * Parenthesized so the macro expands safely inside any expression. */
#define CHUNK_SIZE (1024 * 64)
|
#endif |
|
|
|
#include "load_helper.h" |
|
|
|
/*
 * Route a CUDA driver call through FF_CUDA_CHECK_DL.
 * The expansion names `avctx` and `cu` directly, so both identifiers must be
 * in scope wherever CHECK_CU() is used.
 */
#define CHECK_CU(x) FF_CUDA_CHECK_DL(avctx, cu, x)
|
|
|
/**
 * Load a CUDA module from an in-memory image.
 *
 * With CONFIG_PTX_COMPRESSION enabled, data is first inflated with zlib into
 * a temporary NUL-terminated heap buffer, which is handed to
 * cuModuleLoadData() and then freed. Without it, data is passed to
 * cuModuleLoadData() unchanged and length is not used.
 *
 * @param avctx     logging context for av_log() and CHECK_CU()
 * @param hwctx     CUDA device context; its internal->cuda_dl function table
 *                  is used for the driver call
 * @param cu_module destination passed to cuModuleLoadData()
 * @param data      module image (compressed when CONFIG_PTX_COMPRESSION is set)
 * @param length    size of data in bytes
 * @return the value produced by CHECK_CU() for cuModuleLoadData(), or
 *         AVERROR(ENOSYS) if zlib cannot be initialised,
 *         AVERROR(ENOMEM) if the output buffer cannot be (re)allocated,
 *         AVERROR(EINVAL) if the compressed data is corrupt or truncated
 */
int ff_cuda_load_module(void *avctx, AVCUDADeviceContext *hwctx, CUmodule *cu_module,
                        const unsigned char *data, const unsigned int length)
{
    CudaFunctions *cu = hwctx->internal->cuda_dl;

#if CONFIG_PTX_COMPRESSION
    z_stream stream = { 0 };
    uint8_t *buf, *tmp;
    uint64_t buf_size;
    int ret;

    /* windowBits 32 + 15: maximum window, zlib/gzip header auto-detection. */
    if (inflateInit2(&stream, 32 + 15) != Z_OK) {
        /* stream.msg may still be NULL here; never pass NULL to %s. */
        av_log(avctx, AV_LOG_ERROR, "Error during zlib initialisation: %s\n",
               stream.msg ? stream.msg : "unknown error");
        return AVERROR(ENOSYS);
    }

    buf_size = CHUNK_SIZE * 4;
    buf = av_realloc(NULL, buf_size);
    if (!buf) {
        inflateEnd(&stream);
        return AVERROR(ENOMEM);
    }

    stream.next_in  = data;
    stream.avail_in = length;

    do {
        /* Continue writing right after what has been produced so far. */
        stream.avail_out = buf_size - stream.total_out;
        stream.next_out  = buf + stream.total_out;

        ret = inflate(&stream, Z_FINISH);
        if (ret != Z_OK && ret != Z_STREAM_END && ret != Z_BUF_ERROR) {
            av_log(avctx, AV_LOG_ERROR, "zlib inflate error(%d): %s\n", ret,
                   stream.msg ? stream.msg : "unknown error");
            inflateEnd(&stream);
            av_free(buf);
            return AVERROR(EINVAL);
        }

        /*
         * Stream not finished, all input consumed, yet output space remains:
         * no further call can make progress, so the data is truncated.
         * Without this check the loop would spin forever on Z_BUF_ERROR.
         */
        if (ret != Z_STREAM_END && stream.avail_in == 0 && stream.avail_out != 0) {
            av_log(avctx, AV_LOG_ERROR, "zlib inflate error: compressed data is truncated\n");
            inflateEnd(&stream);
            av_free(buf);
            return AVERROR(EINVAL);
        }

        /*
         * Grow whenever the buffer is exactly full, even at end of stream,
         * so that a spare byte for the terminator below always exists.
         */
        if (stream.avail_out == 0) {
            buf_size += CHUNK_SIZE;
            tmp = av_realloc(buf, buf_size);
            if (!tmp) {
                inflateEnd(&stream);
                av_free(buf);
                return AVERROR(ENOMEM);
            }
            buf = tmp;
        }
    } while (ret != Z_STREAM_END);

    /*
     * The image is handed over without a length, so NUL-terminate it.
     * Space is guaranteed by the growth step inside the loop.
     */
    buf[stream.total_out] = 0;

    inflateEnd(&stream);

    ret = CHECK_CU(cu->cuModuleLoadData(cu_module, buf));
    av_free(buf);
    return ret;
#else
    return CHECK_CU(cu->cuModuleLoadData(cu_module, data));
#endif
}
|
|