Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Contribute to GitLab
Sign in / Register
Toggle navigation
F
ffmpeg.wasm-core
Project
Project
Details
Activity
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
Linshizhi
ffmpeg.wasm-core
Commits
e6464a44
Commit
e6464a44
authored
Oct 10, 2016
by
Timo Rothenpieler
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
avutil/hwcontext_cuda: use dynamically loaded CUDA
parent
5c02d282
Show whitespace changes
Inline
Side-by-side
Showing
5 changed files
with
120 additions
and
25 deletions
+120
-25
configure
configure
+2
-0
hwcontext_cuda.c
libavutil/hwcontext_cuda.c
+75
-24
hwcontext_cuda.h
libavutil/hwcontext_cuda.h
+5
-0
hwcontext_cuda_internal.h
libavutil/hwcontext_cuda_internal.h
+37
-0
version.h
libavutil/version.h
+1
-1
No files found.
configure
View file @
e6464a44
...
@@ -2537,6 +2537,7 @@ audiotoolbox_extralibs="-framework CoreFoundation -framework AudioToolbox -frame
...
@@ -2537,6 +2537,7 @@ audiotoolbox_extralibs="-framework CoreFoundation -framework AudioToolbox -frame
# hardware accelerators
# hardware accelerators
crystalhd_deps
=
"libcrystalhd_libcrystalhd_if_h"
crystalhd_deps
=
"libcrystalhd_libcrystalhd_if_h"
cuda_deps_any
=
"dlopen LoadLibrary"
cuvid_deps
=
"cuda"
cuvid_deps
=
"cuda"
d3d11va_deps
=
"d3d11_h dxva_h ID3D11VideoDecoder ID3D11VideoContext"
d3d11va_deps
=
"d3d11_h dxva_h ID3D11VideoDecoder ID3D11VideoContext"
dxva2_deps
=
"dxva2api_h DXVA2_ConfigPictureDecode"
dxva2_deps
=
"dxva2api_h DXVA2_ConfigPictureDecode"
...
@@ -5414,6 +5415,7 @@ elif check_func dlopen -ldl && check_func dlsym -ldl; then
...
@@ -5414,6 +5415,7 @@ elif check_func dlopen -ldl && check_func dlsym -ldl; then
fi
fi
avisynth_demuxer_extralibs
=
'$ldl'
avisynth_demuxer_extralibs
=
'$ldl'
cuda_extralibs
=
'$ldl'
decklink_outdev_extralibs
=
"
$decklink_outdev_extralibs
$ldl
"
decklink_outdev_extralibs
=
"
$decklink_outdev_extralibs
$ldl
"
decklink_indev_extralibs
=
"
$decklink_indev_extralibs
$ldl
"
decklink_indev_extralibs
=
"
$decklink_indev_extralibs
$ldl
"
frei0r_filter_extralibs
=
'$ldl'
frei0r_filter_extralibs
=
'$ldl'
...
...
libavutil/hwcontext_cuda.c
View file @
e6464a44
...
@@ -20,7 +20,7 @@
...
@@ -20,7 +20,7 @@
#include "common.h"
#include "common.h"
#include "hwcontext.h"
#include "hwcontext.h"
#include "hwcontext_internal.h"
#include "hwcontext_internal.h"
#include "hwcontext_cuda.h"
#include "hwcontext_cuda
_internal
.h"
#include "mem.h"
#include "mem.h"
#include "pixdesc.h"
#include "pixdesc.h"
#include "pixfmt.h"
#include "pixfmt.h"
...
@@ -41,44 +41,46 @@ static void cuda_buffer_free(void *opaque, uint8_t *data)
...
@@ -41,44 +41,46 @@ static void cuda_buffer_free(void *opaque, uint8_t *data)
{
{
AVHWFramesContext
*
ctx
=
opaque
;
AVHWFramesContext
*
ctx
=
opaque
;
AVCUDADeviceContext
*
hwctx
=
ctx
->
device_ctx
->
hwctx
;
AVCUDADeviceContext
*
hwctx
=
ctx
->
device_ctx
->
hwctx
;
CudaFunctions
*
cu
=
hwctx
->
internal
->
cuda_dl
;
CUcontext
dummy
;
CUcontext
dummy
;
cuCtxPushCurrent
(
hwctx
->
cuda_ctx
);
cu
->
cu
CtxPushCurrent
(
hwctx
->
cuda_ctx
);
cuMemFree
((
CUdeviceptr
)
data
);
cu
->
cu
MemFree
((
CUdeviceptr
)
data
);
cuCtxPopCurrent
(
&
dummy
);
cu
->
cu
CtxPopCurrent
(
&
dummy
);
}
}
static
AVBufferRef
*
cuda_pool_alloc
(
void
*
opaque
,
int
size
)
static
AVBufferRef
*
cuda_pool_alloc
(
void
*
opaque
,
int
size
)
{
{
AVHWFramesContext
*
ctx
=
opaque
;
AVHWFramesContext
*
ctx
=
opaque
;
AVCUDADeviceContext
*
hwctx
=
ctx
->
device_ctx
->
hwctx
;
AVCUDADeviceContext
*
hwctx
=
ctx
->
device_ctx
->
hwctx
;
CudaFunctions
*
cu
=
hwctx
->
internal
->
cuda_dl
;
AVBufferRef
*
ret
=
NULL
;
AVBufferRef
*
ret
=
NULL
;
CUcontext
dummy
=
NULL
;
CUcontext
dummy
=
NULL
;
CUdeviceptr
data
;
CUdeviceptr
data
;
CUresult
err
;
CUresult
err
;
err
=
cuCtxPushCurrent
(
hwctx
->
cuda_ctx
);
err
=
cu
->
cu
CtxPushCurrent
(
hwctx
->
cuda_ctx
);
if
(
err
!=
CUDA_SUCCESS
)
{
if
(
err
!=
CUDA_SUCCESS
)
{
av_log
(
ctx
,
AV_LOG_ERROR
,
"Error setting current CUDA context
\n
"
);
av_log
(
ctx
,
AV_LOG_ERROR
,
"Error setting current CUDA context
\n
"
);
return
NULL
;
return
NULL
;
}
}
err
=
cuMemAlloc
(
&
data
,
size
);
err
=
cu
->
cu
MemAlloc
(
&
data
,
size
);
if
(
err
!=
CUDA_SUCCESS
)
if
(
err
!=
CUDA_SUCCESS
)
goto
fail
;
goto
fail
;
ret
=
av_buffer_create
((
uint8_t
*
)
data
,
size
,
cuda_buffer_free
,
ctx
,
0
);
ret
=
av_buffer_create
((
uint8_t
*
)
data
,
size
,
cuda_buffer_free
,
ctx
,
0
);
if
(
!
ret
)
{
if
(
!
ret
)
{
cuMemFree
(
data
);
cu
->
cu
MemFree
(
data
);
goto
fail
;
goto
fail
;
}
}
fail:
fail:
cuCtxPopCurrent
(
&
dummy
);
cu
->
cu
CtxPopCurrent
(
&
dummy
);
return
ret
;
return
ret
;
}
}
...
@@ -187,12 +189,13 @@ static int cuda_transfer_data_from(AVHWFramesContext *ctx, AVFrame *dst,
...
@@ -187,12 +189,13 @@ static int cuda_transfer_data_from(AVHWFramesContext *ctx, AVFrame *dst,
{
{
CUDAFramesContext
*
priv
=
ctx
->
internal
->
priv
;
CUDAFramesContext
*
priv
=
ctx
->
internal
->
priv
;
AVCUDADeviceContext
*
device_hwctx
=
ctx
->
device_ctx
->
hwctx
;
AVCUDADeviceContext
*
device_hwctx
=
ctx
->
device_ctx
->
hwctx
;
CudaFunctions
*
cu
=
device_hwctx
->
internal
->
cuda_dl
;
CUcontext
dummy
;
CUcontext
dummy
;
CUresult
err
;
CUresult
err
;
int
i
;
int
i
;
err
=
cuCtxPushCurrent
(
device_hwctx
->
cuda_ctx
);
err
=
cu
->
cu
CtxPushCurrent
(
device_hwctx
->
cuda_ctx
);
if
(
err
!=
CUDA_SUCCESS
)
if
(
err
!=
CUDA_SUCCESS
)
return
AVERROR_UNKNOWN
;
return
AVERROR_UNKNOWN
;
...
@@ -208,14 +211,14 @@ static int cuda_transfer_data_from(AVHWFramesContext *ctx, AVFrame *dst,
...
@@ -208,14 +211,14 @@ static int cuda_transfer_data_from(AVHWFramesContext *ctx, AVFrame *dst,
.
Height
=
src
->
height
>>
(
i
?
priv
->
shift_height
:
0
),
.
Height
=
src
->
height
>>
(
i
?
priv
->
shift_height
:
0
),
};
};
err
=
cuMemcpy2D
(
&
cpy
);
err
=
cu
->
cu
Memcpy2D
(
&
cpy
);
if
(
err
!=
CUDA_SUCCESS
)
{
if
(
err
!=
CUDA_SUCCESS
)
{
av_log
(
ctx
,
AV_LOG_ERROR
,
"Error transferring the data from the CUDA frame
\n
"
);
av_log
(
ctx
,
AV_LOG_ERROR
,
"Error transferring the data from the CUDA frame
\n
"
);
return
AVERROR_UNKNOWN
;
return
AVERROR_UNKNOWN
;
}
}
}
}
cuCtxPopCurrent
(
&
dummy
);
cu
->
cu
CtxPopCurrent
(
&
dummy
);
return
0
;
return
0
;
}
}
...
@@ -225,12 +228,13 @@ static int cuda_transfer_data_to(AVHWFramesContext *ctx, AVFrame *dst,
...
@@ -225,12 +228,13 @@ static int cuda_transfer_data_to(AVHWFramesContext *ctx, AVFrame *dst,
{
{
CUDAFramesContext
*
priv
=
ctx
->
internal
->
priv
;
CUDAFramesContext
*
priv
=
ctx
->
internal
->
priv
;
AVCUDADeviceContext
*
device_hwctx
=
ctx
->
device_ctx
->
hwctx
;
AVCUDADeviceContext
*
device_hwctx
=
ctx
->
device_ctx
->
hwctx
;
CudaFunctions
*
cu
=
device_hwctx
->
internal
->
cuda_dl
;
CUcontext
dummy
;
CUcontext
dummy
;
CUresult
err
;
CUresult
err
;
int
i
;
int
i
;
err
=
cuCtxPushCurrent
(
device_hwctx
->
cuda_ctx
);
err
=
cu
->
cu
CtxPushCurrent
(
device_hwctx
->
cuda_ctx
);
if
(
err
!=
CUDA_SUCCESS
)
if
(
err
!=
CUDA_SUCCESS
)
return
AVERROR_UNKNOWN
;
return
AVERROR_UNKNOWN
;
...
@@ -246,28 +250,64 @@ static int cuda_transfer_data_to(AVHWFramesContext *ctx, AVFrame *dst,
...
@@ -246,28 +250,64 @@ static int cuda_transfer_data_to(AVHWFramesContext *ctx, AVFrame *dst,
.
Height
=
src
->
height
>>
(
i
?
priv
->
shift_height
:
0
),
.
Height
=
src
->
height
>>
(
i
?
priv
->
shift_height
:
0
),
};
};
err
=
cuMemcpy2D
(
&
cpy
);
err
=
cu
->
cu
Memcpy2D
(
&
cpy
);
if
(
err
!=
CUDA_SUCCESS
)
{
if
(
err
!=
CUDA_SUCCESS
)
{
av_log
(
ctx
,
AV_LOG_ERROR
,
"Error transferring the data from the CUDA frame
\n
"
);
av_log
(
ctx
,
AV_LOG_ERROR
,
"Error transferring the data from the CUDA frame
\n
"
);
return
AVERROR_UNKNOWN
;
return
AVERROR_UNKNOWN
;
}
}
}
}
cuCtxPopCurrent
(
&
dummy
);
cu
->
cu
CtxPopCurrent
(
&
dummy
);
return
0
;
return
0
;
}
}
static
void
cuda_device_
free
(
AVHWDeviceContext
*
ctx
)
static
void
cuda_device_
uninit
(
AVHWDeviceContext
*
ctx
)
{
{
AVCUDADeviceContext
*
hwctx
=
ctx
->
hwctx
;
AVCUDADeviceContext
*
hwctx
=
ctx
->
hwctx
;
cuCtxDestroy
(
hwctx
->
cuda_ctx
);
if
(
hwctx
->
internal
)
{
if
(
hwctx
->
internal
->
is_allocated
&&
hwctx
->
cuda_ctx
)
{
hwctx
->
internal
->
cuda_dl
->
cuCtxDestroy
(
hwctx
->
cuda_ctx
);
hwctx
->
cuda_ctx
=
NULL
;
}
cuda_free_functions
(
&
hwctx
->
internal
->
cuda_dl
);
}
av_freep
(
&
hwctx
->
internal
);
}
static
int
cuda_device_init
(
AVHWDeviceContext
*
ctx
)
{
AVCUDADeviceContext
*
hwctx
=
ctx
->
hwctx
;
int
ret
;
if
(
!
hwctx
->
internal
)
{
hwctx
->
internal
=
av_mallocz
(
sizeof
(
*
hwctx
->
internal
));
if
(
!
hwctx
->
internal
)
return
AVERROR
(
ENOMEM
);
}
if
(
!
hwctx
->
internal
->
cuda_dl
)
{
ret
=
cuda_load_functions
(
&
hwctx
->
internal
->
cuda_dl
);
if
(
ret
<
0
)
{
av_log
(
ctx
,
AV_LOG_ERROR
,
"Could not dynamically load CUDA
\n
"
);
goto
error
;
}
}
return
0
;
error:
cuda_device_uninit
(
ctx
);
return
ret
;
}
}
static
int
cuda_device_create
(
AVHWDeviceContext
*
ctx
,
const
char
*
device
,
static
int
cuda_device_create
(
AVHWDeviceContext
*
ctx
,
const
char
*
device
,
AVDictionary
*
opts
,
int
flags
)
AVDictionary
*
opts
,
int
flags
)
{
{
AVCUDADeviceContext
*
hwctx
=
ctx
->
hwctx
;
AVCUDADeviceContext
*
hwctx
=
ctx
->
hwctx
;
CudaFunctions
*
cu
;
CUdevice
cu_device
;
CUdevice
cu_device
;
CUcontext
dummy
;
CUcontext
dummy
;
CUresult
err
;
CUresult
err
;
...
@@ -276,29 +316,38 @@ static int cuda_device_create(AVHWDeviceContext *ctx, const char *device,
...
@@ -276,29 +316,38 @@ static int cuda_device_create(AVHWDeviceContext *ctx, const char *device,
if
(
device
)
if
(
device
)
device_idx
=
strtol
(
device
,
NULL
,
0
);
device_idx
=
strtol
(
device
,
NULL
,
0
);
err
=
cuInit
(
0
);
if
(
cuda_device_init
(
ctx
)
<
0
)
goto
error
;
cu
=
hwctx
->
internal
->
cuda_dl
;
err
=
cu
->
cuInit
(
0
);
if
(
err
!=
CUDA_SUCCESS
)
{
if
(
err
!=
CUDA_SUCCESS
)
{
av_log
(
ctx
,
AV_LOG_ERROR
,
"Could not initialize the CUDA driver API
\n
"
);
av_log
(
ctx
,
AV_LOG_ERROR
,
"Could not initialize the CUDA driver API
\n
"
);
return
AVERROR_UNKNOWN
;
goto
error
;
}
}
err
=
cuDeviceGet
(
&
cu_device
,
device_idx
);
err
=
cu
->
cu
DeviceGet
(
&
cu_device
,
device_idx
);
if
(
err
!=
CUDA_SUCCESS
)
{
if
(
err
!=
CUDA_SUCCESS
)
{
av_log
(
ctx
,
AV_LOG_ERROR
,
"Could not get the device number %d
\n
"
,
device_idx
);
av_log
(
ctx
,
AV_LOG_ERROR
,
"Could not get the device number %d
\n
"
,
device_idx
);
return
AVERROR_UNKNOWN
;
goto
error
;
}
}
err
=
cuCtxCreate
(
&
hwctx
->
cuda_ctx
,
CU_CTX_SCHED_BLOCKING_SYNC
,
cu_device
);
err
=
cu
->
cu
CtxCreate
(
&
hwctx
->
cuda_ctx
,
CU_CTX_SCHED_BLOCKING_SYNC
,
cu_device
);
if
(
err
!=
CUDA_SUCCESS
)
{
if
(
err
!=
CUDA_SUCCESS
)
{
av_log
(
ctx
,
AV_LOG_ERROR
,
"Error creating a CUDA context
\n
"
);
av_log
(
ctx
,
AV_LOG_ERROR
,
"Error creating a CUDA context
\n
"
);
return
AVERROR_UNKNOWN
;
goto
error
;
}
}
cuCtxPopCurrent
(
&
dummy
);
cu
->
cu
CtxPopCurrent
(
&
dummy
);
ctx
->
free
=
cuda_device_free
;
hwctx
->
internal
->
is_allocated
=
1
;
return
0
;
return
0
;
error:
cuda_device_uninit
(
ctx
);
return
AVERROR_UNKNOWN
;
}
}
const
HWContextType
ff_hwcontext_type_cuda
=
{
const
HWContextType
ff_hwcontext_type_cuda
=
{
...
@@ -309,6 +358,8 @@ const HWContextType ff_hwcontext_type_cuda = {
...
@@ -309,6 +358,8 @@ const HWContextType ff_hwcontext_type_cuda = {
.
frames_priv_size
=
sizeof
(
CUDAFramesContext
),
.
frames_priv_size
=
sizeof
(
CUDAFramesContext
),
.
device_create
=
cuda_device_create
,
.
device_create
=
cuda_device_create
,
.
device_init
=
cuda_device_init
,
.
device_uninit
=
cuda_device_uninit
,
.
frames_init
=
cuda_frames_init
,
.
frames_init
=
cuda_frames_init
,
.
frames_get_buffer
=
cuda_get_buffer
,
.
frames_get_buffer
=
cuda_get_buffer
,
.
transfer_get_formats
=
cuda_transfer_get_formats
,
.
transfer_get_formats
=
cuda_transfer_get_formats
,
...
...
libavutil/hwcontext_cuda.h
View file @
e6464a44
...
@@ -20,7 +20,9 @@
...
@@ -20,7 +20,9 @@
#ifndef AVUTIL_HWCONTEXT_CUDA_H
#ifndef AVUTIL_HWCONTEXT_CUDA_H
#define AVUTIL_HWCONTEXT_CUDA_H
#define AVUTIL_HWCONTEXT_CUDA_H
#ifndef CUDA_VERSION
#include <cuda.h>
#include <cuda.h>
#endif
#include "pixfmt.h"
#include "pixfmt.h"
...
@@ -32,11 +34,14 @@
...
@@ -32,11 +34,14 @@
* AVBufferRefs whose data pointer is a CUdeviceptr.
* AVBufferRefs whose data pointer is a CUdeviceptr.
*/
*/
typedef
struct
AVCUDADeviceContextInternal
AVCUDADeviceContextInternal
;
/**
/**
* This struct is allocated as AVHWDeviceContext.hwctx
* This struct is allocated as AVHWDeviceContext.hwctx
*/
*/
typedef
struct
AVCUDADeviceContext
{
typedef
struct
AVCUDADeviceContext
{
CUcontext
cuda_ctx
;
CUcontext
cuda_ctx
;
AVCUDADeviceContextInternal
*
internal
;
}
AVCUDADeviceContext
;
}
AVCUDADeviceContext
;
/**
/**
...
...
libavutil/hwcontext_cuda_internal.h
0 → 100644
View file @
e6464a44
/*
* This file is part of FFmpeg.
*
* FFmpeg is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License as published by the Free Software Foundation; either
* version 2.1 of the License, or (at your option) any later version.
*
* FFmpeg is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with FFmpeg; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
*/
#ifndef AVUTIL_HWCONTEXT_CUDA_INTERNAL_H
#define AVUTIL_HWCONTEXT_CUDA_INTERNAL_H
#include "compat/cuda/dynlink_loader.h"
#include "hwcontext_cuda.h"
/**
* @file
* FFmpeg internal API for CUDA.
*/
struct
AVCUDADeviceContextInternal
{
CudaFunctions
*
cuda_dl
;
int
is_allocated
;
};
#endif
/* AVUTIL_HWCONTEXT_CUDA_INTERNAL_H */
libavutil/version.h
View file @
e6464a44
...
@@ -80,7 +80,7 @@
...
@@ -80,7 +80,7 @@
#define LIBAVUTIL_VERSION_MAJOR 55
#define LIBAVUTIL_VERSION_MAJOR 55
#define LIBAVUTIL_VERSION_MINOR 40
#define LIBAVUTIL_VERSION_MINOR 40
#define LIBAVUTIL_VERSION_MICRO 10
0
#define LIBAVUTIL_VERSION_MICRO 10
1
#define LIBAVUTIL_VERSION_INT AV_VERSION_INT(LIBAVUTIL_VERSION_MAJOR, \
#define LIBAVUTIL_VERSION_INT AV_VERSION_INT(LIBAVUTIL_VERSION_MAJOR, \
LIBAVUTIL_VERSION_MINOR, \
LIBAVUTIL_VERSION_MINOR, \
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment