gstreamer/subprojects/gst-plugins-bad/gst-libs/gst/cuda/gstcudanvrtc.c
Seungha Yang 75e8f80999 cuda: Hide runtime compiler related header and symbols
That's already abstracted via gst_cuda_nvrtc_compile() method
and therefore, we do not need to expose such symbols yet.

Part-of: <https://gitlab.freedesktop.org/gstreamer/gstreamer/-/merge_requests/2884>
2022-08-18 05:20:08 +09:00

315 lines
8.3 KiB
C

/* GStreamer
* Copyright (C) 2019 Seungha Yang <seungha.yang@navercorp.com>
*
* This library is free software; you can redistribute it and/or
* modify it under the terms of the GNU Library General Public
* License as published by the Free Software Foundation; either
* version 2 of the License, or (at your option) any later version.
*
* This library is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Library General Public License for more details.
*
* You should have received a copy of the GNU Library General Public
* License along with this library; if not, write to the
* Free Software Foundation, Inc., 51 Franklin St, Fifth Floor,
* Boston, MA 02110-1301, USA.
*/
#ifdef HAVE_CONFIG_H
#include "config.h"
#endif
#include "cuda-gst.h"
#include "gstcudanvrtc.h"
#include "gstcudaloader.h"
#include <nvrtc.h>
#include <gmodule.h>
/* Debug category used by every GST_* log call in this file; it is initialized
 * in gst_cuda_nvrtc_load_library(). */
GST_DEBUG_CATEGORY_STATIC (gst_cuda_nvrtc_debug);
#define GST_CAT_DEFAULT gst_cuda_nvrtc_debug
/* Default name of the NVRTC shared library. On Windows this is a printf-style
 * pattern: the loader fills the two %d fields with the CUDA major version and
 * a candidate minor version. */
#ifndef G_OS_WIN32
#define NVRTC_LIBNAME "libnvrtc.so"
#else
#define NVRTC_LIBNAME "nvrtc64_%d%d_0.dll"
#endif
/* LOAD_SYMBOL:
 * @name: symbol name to look up in the opened module
 * @func: member of GstCudaNvrtcVTable that receives the resolved address
 *
 * Resolves @name with g_module_symbol() and stores it in vtable->func.
 * The expansion relies on the calling function providing:
 *   - a GModule pointer named `module`,
 *   - a GstCudaNvrtcVTable pointer named `vtable`,
 *   - a string named `fname` (library name used in the error message),
 *   - a label named `error`, jumped to when the lookup fails.
 * Note that the definition itself already ends with a semicolon.
 */
#define LOAD_SYMBOL(name,func) G_STMT_START { \
if (!g_module_symbol (module, G_STRINGIFY (name), (gpointer *) &vtable->func)) { \
GST_ERROR ("Failed to load '%s' from %s, %s", G_STRINGIFY (name), fname, g_module_error()); \
goto error; \
} \
} G_STMT_END;
/* *INDENT-OFF* */
/* Table of NVRTC entry points resolved at runtime from the NVRTC shared
 * library. Each function pointer mirrors the signature of the nvrtc* function
 * whose name it carries (with a capitalized first letter). */
typedef struct _GstCudaNvrtcVTable
{
/* TRUE once the loader has resolved every entry point below */
gboolean loaded;
/* nvrtcCompileProgram */
nvrtcResult (*NvrtcCompileProgram) (nvrtcProgram prog, int numOptions,
const char **options);
/* nvrtcCreateProgram */
nvrtcResult (*NvrtcCreateProgram) (nvrtcProgram * prog, const char *src,
const char *name, int numHeaders, const char **headers,
const char **includeNames);
/* nvrtcDestroyProgram */
nvrtcResult (*NvrtcDestroyProgram) (nvrtcProgram * prog);
/* nvrtcGetPTX */
nvrtcResult (*NvrtcGetPTX) (nvrtcProgram prog, char *ptx);
/* nvrtcGetPTXSize */
nvrtcResult (*NvrtcGetPTXSize) (nvrtcProgram prog, size_t * ptxSizeRet);
/* nvrtcGetProgramLog */
nvrtcResult (*NvrtcGetProgramLog) (nvrtcProgram prog, char *log);
/* nvrtcGetProgramLogSize */
nvrtcResult (*NvrtcGetProgramLogSize) (nvrtcProgram prog,
size_t * logSizeRet);
} GstCudaNvrtcVTable;
/* *INDENT-ON* */
/* File-scope NVRTC function table, zero-initialized so that `loaded` is FALSE
 * and every entry point is NULL until the library has been loaded. */
static GstCudaNvrtcVTable gst_cuda_nvrtc_vtable = { 0, };
static gboolean
gst_cuda_nvrtc_load_library_once (void)
{
GModule *module = NULL;
gchar *filename = NULL;
const gchar *filename_env;
const gchar *fname;
gint cuda_version;
GstCudaNvrtcVTable *vtable;
CuDriverGetVersion (&cuda_version);
fname = filename_env = g_getenv ("GST_CUDA_NVRTC_LIBNAME");
if (filename_env)
module = g_module_open (filename_env, G_MODULE_BIND_LAZY);
if (!module) {
#ifndef G_OS_WIN32
filename = g_strdup (NVRTC_LIBNAME);
fname = filename;
module = g_module_open (filename, G_MODULE_BIND_LAZY);
#else
/* XXX: On Windows, minor version of nvrtc library might not be exactly
* same as CUDA library */
{
gint cuda_major_version = cuda_version / 1000;
gint cuda_minor_version = (cuda_version % 1000) / 10;
gint minor_version;
for (minor_version = cuda_minor_version; minor_version >= 0;
minor_version--) {
g_free (filename);
filename = g_strdup_printf (NVRTC_LIBNAME, cuda_major_version,
minor_version);
fname = filename;
module = g_module_open (filename, G_MODULE_BIND_LAZY);
if (module) {
GST_INFO ("%s is available", filename);
break;
}
GST_DEBUG ("Couldn't open library %s", filename);
}
}
#endif
}
if (module == NULL) {
GST_WARNING ("Could not open library %s, %s", filename, g_module_error ());
g_free (filename);
return FALSE;
}
vtable = &gst_cuda_nvrtc_vtable;
LOAD_SYMBOL (nvrtcCompileProgram, NvrtcCompileProgram);
LOAD_SYMBOL (nvrtcCreateProgram, NvrtcCreateProgram);
LOAD_SYMBOL (nvrtcDestroyProgram, NvrtcDestroyProgram);
LOAD_SYMBOL (nvrtcGetPTX, NvrtcGetPTX);
LOAD_SYMBOL (nvrtcGetPTXSize, NvrtcGetPTXSize);
LOAD_SYMBOL (nvrtcGetProgramLog, NvrtcGetProgramLog);
LOAD_SYMBOL (nvrtcGetProgramLogSize, NvrtcGetProgramLogSize);
vtable->loaded = TRUE;
g_free (filename);
return TRUE;
error:
g_module_close (module);
g_free (filename);
return FALSE;
}
/**
 * gst_cuda_nvrtc_load_library:
 *
 * Loads the nvrtc library. The actual loading work is attempted only on the
 * first call; later calls just report the recorded outcome.
 *
 * Returns: %TRUE if the library could be loaded, %FALSE otherwise
 *
 * Since: 1.22
 */
gboolean
gst_cuda_nvrtc_load_library (void)
{
  static gsize init_once = 0;

  /* Fast path: initialization already ran, just report its result */
  if (!g_once_init_enter (&init_once))
    return gst_cuda_nvrtc_vtable.loaded;

  GST_DEBUG_CATEGORY_INIT (gst_cuda_nvrtc_debug, "cudanvrtc", 0,
      "CUDA runtime compiler");

  /* NVRTC is only looked up when the CUDA library itself is usable */
  if (gst_cuda_load_library ()) {
    gst_cuda_nvrtc_load_library_once ();
  }

  g_once_init_leave (&init_once, 1);

  return gst_cuda_nvrtc_vtable.loaded;
}
/* *INDENT-OFF* */
/* Forwards to the nvrtcCompileProgram entry point stored in the vtable. */
static nvrtcResult
NvrtcCompileProgram (nvrtcProgram prog, int numOptions, const char **options)
{
  nvrtcResult status;

  g_assert (gst_cuda_nvrtc_vtable.NvrtcCompileProgram != NULL);

  status = gst_cuda_nvrtc_vtable.NvrtcCompileProgram (prog, numOptions,
      options);

  return status;
}
/* Forwards to the nvrtcCreateProgram entry point stored in the vtable. */
static nvrtcResult
NvrtcCreateProgram (nvrtcProgram * prog, const char *src, const char *name,
    int numHeaders, const char **headers, const char **includeNames)
{
  nvrtcResult status;

  g_assert (gst_cuda_nvrtc_vtable.NvrtcCreateProgram != NULL);

  status = gst_cuda_nvrtc_vtable.NvrtcCreateProgram (prog, src, name,
      numHeaders, headers, includeNames);

  return status;
}
/* Forwards to the nvrtcDestroyProgram entry point stored in the vtable. */
static nvrtcResult
NvrtcDestroyProgram (nvrtcProgram * prog)
{
  nvrtcResult status;

  g_assert (gst_cuda_nvrtc_vtable.NvrtcDestroyProgram != NULL);

  status = gst_cuda_nvrtc_vtable.NvrtcDestroyProgram (prog);

  return status;
}
/* Forwards to the nvrtcGetPTX entry point stored in the vtable. */
static nvrtcResult
NvrtcGetPTX (nvrtcProgram prog, char *ptx)
{
  nvrtcResult status;

  g_assert (gst_cuda_nvrtc_vtable.NvrtcGetPTX != NULL);

  status = gst_cuda_nvrtc_vtable.NvrtcGetPTX (prog, ptx);

  return status;
}
/* Forwards to the nvrtcGetPTXSize entry point stored in the vtable. */
static nvrtcResult
NvrtcGetPTXSize (nvrtcProgram prog, size_t *ptxSizeRet)
{
  nvrtcResult status;

  g_assert (gst_cuda_nvrtc_vtable.NvrtcGetPTXSize != NULL);

  status = gst_cuda_nvrtc_vtable.NvrtcGetPTXSize (prog, ptxSizeRet);

  return status;
}
/* Forwards to the nvrtcGetProgramLog entry point stored in the vtable. */
static nvrtcResult
NvrtcGetProgramLog (nvrtcProgram prog, char *log)
{
  nvrtcResult status;

  g_assert (gst_cuda_nvrtc_vtable.NvrtcGetProgramLog != NULL);

  status = gst_cuda_nvrtc_vtable.NvrtcGetProgramLog (prog, log);

  return status;
}
/* Forwards to the nvrtcGetProgramLogSize entry point stored in the vtable. */
static nvrtcResult
NvrtcGetProgramLogSize (nvrtcProgram prog, size_t *logSizeRet)
{
  nvrtcResult status;

  g_assert (gst_cuda_nvrtc_vtable.NvrtcGetProgramLogSize != NULL);

  status = gst_cuda_nvrtc_vtable.NvrtcGetProgramLogSize (prog, logSizeRet);

  return status;
}
/* *INDENT-ON* */
/**
 * gst_cuda_nvrtc_compile:
 * @source: Source code to compile
 *
 * Compiles @source to PTX using the runtime-loaded NVRTC library. The NVRTC
 * library is loaded on demand via gst_cuda_nvrtc_load_library(). The target
 * architecture option is "compute_30", or "compute_52" when the reported
 * CUDA driver version is 11000 or higher.
 *
 * Returns: (transfer full) (nullable): the compiled PTX as a newly allocated
 * buffer which must be released with g_free(), or %NULL if the library could
 * not be loaded or any NVRTC step failed
 *
 * Since: 1.22
 */
gchar *
gst_cuda_nvrtc_compile (const gchar * source)
{
  nvrtcProgram prog;
  nvrtcResult ret;
  CUresult curet;
  const gchar *opts[] = { "--gpu-architecture=compute_30" };
  gsize ptx_size = 0;
  gchar *ptx = NULL;
  int driverVersion;

  g_return_val_if_fail (source != NULL, NULL);

  if (!gst_cuda_nvrtc_load_library ()) {
    return NULL;
  }

  GST_TRACE ("CUDA kernel source \n%s", source);

  curet = CuDriverGetVersion (&driverVersion);
  if (curet != CUDA_SUCCESS) {
    GST_ERROR ("Failed to query CUDA Driver version, ret %d", curet);
    return NULL;
  }

  GST_DEBUG ("CUDA Driver Version %d.%d", driverVersion / 1000,
      (driverVersion % 1000) / 10);

  ret = NvrtcCreateProgram (&prog, source, NULL, 0, NULL, NULL);
  if (ret != NVRTC_SUCCESS) {
    GST_ERROR ("couldn't create nvrtc program, ret %d", ret);
    return NULL;
  }

  /* Starting from CUDA 11, the lowest supported architecture is 5.2 */
  if (driverVersion >= 11000)
    opts[0] = "--gpu-architecture=compute_52";

  ret = NvrtcCompileProgram (prog, 1, opts);
  if (ret != NVRTC_SUCCESS) {
    gsize log_size = 0;

    GST_ERROR ("couldn't compile nvrtc program, ret %d", ret);
    if (NvrtcGetProgramLogSize (prog, &log_size) == NVRTC_SUCCESS &&
        log_size > 0) {
      /* The log size is decided by the compiler output and is not bounded,
       * so keep it off the stack. Printing the log is best effort only,
       * hence an allocation failure here is silently tolerated. */
      gchar *compile_log = g_try_malloc0 (log_size);

      if (compile_log != NULL) {
        if (NvrtcGetProgramLog (prog, compile_log) == NVRTC_SUCCESS) {
          GST_ERROR ("nvrtc compile log %s", compile_log);
        }
        g_free (compile_log);
      }
    }

    goto error;
  }

  ret = NvrtcGetPTXSize (prog, &ptx_size);
  if (ret != NVRTC_SUCCESS) {
    GST_ERROR ("unknown ptx size, ret %d", ret);
    goto error;
  }

  /* g_malloc0 (0) yields NULL; don't hand a NULL buffer to NvrtcGetPTX */
  if (ptx_size == 0) {
    GST_ERROR ("nvrtc reported an empty ptx");
    goto error;
  }

  ptx = g_malloc0 (ptx_size);
  ret = NvrtcGetPTX (prog, ptx);
  if (ret != NVRTC_SUCCESS) {
    GST_ERROR ("couldn't get ptx, ret %d", ret);
    g_free (ptx);
    goto error;
  }

  /* The program handle is no longer needed once the PTX has been copied */
  NvrtcDestroyProgram (&prog);

  GST_TRACE ("compiled CUDA PTX %s\n", ptx);

  return ptx;

error:
  NvrtcDestroyProgram (&prog);

  return NULL;
}