2019-10-16 13:42:24 +00:00
|
|
|
/* GStreamer
|
|
|
|
* Copyright (C) 2019 Seungha Yang <seungha.yang@navercorp.com>
|
|
|
|
*
|
|
|
|
* This library is free software; you can redistribute it and/or
|
|
|
|
* modify it under the terms of the GNU Library General Public
|
|
|
|
* License as published by the Free Software Foundation; either
|
|
|
|
* version 2 of the License, or (at your option) any later version.
|
|
|
|
*
|
|
|
|
* This library is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
|
|
* Library General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU Library General Public
|
|
|
|
* License along with this library; if not, write to the
|
|
|
|
* Free Software Foundation, Inc., 51 Franklin St, Fifth Floor,
|
|
|
|
* Boston, MA 02110-1301, USA.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#ifdef HAVE_CONFIG_H
|
|
|
|
#include "config.h"
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#include "gstcudanvrtc.h"
|
|
|
|
|
|
|
|
GST_DEBUG_CATEGORY_STATIC (gst_cuda_nvrtc_debug);
|
|
|
|
#define GST_CAT_DEFAULT gst_cuda_nvrtc_debug
|
|
|
|
|
|
|
|
static void
|
|
|
|
_init_debug (void)
|
|
|
|
{
|
2021-03-22 03:34:36 +00:00
|
|
|
static gsize once_init = 0;
|
2019-10-16 13:42:24 +00:00
|
|
|
|
|
|
|
if (g_once_init_enter (&once_init)) {
|
|
|
|
|
|
|
|
GST_DEBUG_CATEGORY_INIT (gst_cuda_nvrtc_debug, "cudanvrtc", 0,
|
|
|
|
"CUDA runtime compiler");
|
|
|
|
g_once_init_leave (&once_init, 1);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
gchar *
|
|
|
|
gst_cuda_nvrtc_compile (const gchar * source)
|
|
|
|
{
|
|
|
|
nvrtcProgram prog;
|
|
|
|
nvrtcResult ret;
|
2020-11-25 16:59:54 +00:00
|
|
|
CUresult curet;
|
2019-10-16 13:42:24 +00:00
|
|
|
const gchar *opts[] = { "--gpu-architecture=compute_30" };
|
|
|
|
gsize ptx_size;
|
|
|
|
gchar *ptx = NULL;
|
2020-11-25 16:59:54 +00:00
|
|
|
int driverVersion;
|
2019-10-16 13:42:24 +00:00
|
|
|
|
|
|
|
g_return_val_if_fail (source != NULL, FALSE);
|
|
|
|
|
|
|
|
_init_debug ();
|
|
|
|
|
|
|
|
GST_TRACE ("CUDA kernel source \n%s", source);
|
|
|
|
|
2020-11-25 16:59:54 +00:00
|
|
|
curet = CuDriverGetVersion (&driverVersion);
|
|
|
|
if (curet != CUDA_SUCCESS) {
|
|
|
|
GST_ERROR ("Failed to query CUDA Driver version, ret %d", curet);
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
GST_DEBUG ("CUDA Driver Version %d.%d", driverVersion / 1000,
|
|
|
|
(driverVersion % 1000) / 10);
|
|
|
|
|
2019-10-16 13:42:24 +00:00
|
|
|
ret = NvrtcCreateProgram (&prog, source, NULL, 0, NULL, NULL);
|
|
|
|
if (ret != NVRTC_SUCCESS) {
|
|
|
|
GST_ERROR ("couldn't create nvrtc program, ret %d", ret);
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2020-11-25 16:59:54 +00:00
|
|
|
/* Starting from CUDA 11, the lowest supported architecture is 5.2 */
|
|
|
|
if (driverVersion >= 11000)
|
|
|
|
opts[0] = "--gpu-architecture=compute_52";
|
|
|
|
|
2019-10-16 13:42:24 +00:00
|
|
|
ret = NvrtcCompileProgram (prog, 1, opts);
|
|
|
|
if (ret != NVRTC_SUCCESS) {
|
|
|
|
gsize log_size;
|
|
|
|
|
|
|
|
GST_ERROR ("couldn't compile nvrtc program, ret %d", ret);
|
|
|
|
if (NvrtcGetProgramLogSize (prog, &log_size) == NVRTC_SUCCESS &&
|
|
|
|
log_size > 0) {
|
|
|
|
gchar *compile_log = g_alloca (log_size);
|
|
|
|
if (NvrtcGetProgramLog (prog, compile_log) == NVRTC_SUCCESS) {
|
|
|
|
GST_ERROR ("nvrtc compile log %s", compile_log);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
|
|
|
|
ret = NvrtcGetPTXSize (prog, &ptx_size);
|
|
|
|
if (ret != NVRTC_SUCCESS) {
|
|
|
|
GST_ERROR ("unknown ptx size, ret %d", ret);
|
|
|
|
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
|
|
|
|
ptx = g_malloc0 (ptx_size);
|
|
|
|
ret = NvrtcGetPTX (prog, ptx);
|
|
|
|
if (ret != NVRTC_SUCCESS) {
|
|
|
|
GST_ERROR ("couldn't get ptx, ret %d", ret);
|
|
|
|
g_free (ptx);
|
|
|
|
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
|
|
|
|
NvrtcDestroyProgram (&prog);
|
|
|
|
|
|
|
|
GST_TRACE ("compiled CUDA PTX %s\n", ptx);
|
|
|
|
|
|
|
|
return ptx;
|
|
|
|
|
|
|
|
error:
|
|
|
|
NvrtcDestroyProgram (&prog);
|
|
|
|
|
|
|
|
return NULL;
|
|
|
|
}
|