gstreamer/sys/nvcodec/gstcudacontext.c

/* GStreamer
 * Copyright (C) <2018-2019> Seungha Yang <seungha.yang@navercorp.com>
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Library General Public
 * License as published by the Free Software Foundation; either
 * version 2 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Library General Public License for more details.
 *
 * You should have received a copy of the GNU Library General Public
 * License along with this library; if not, write to the
 * Free Software Foundation, Inc., 51 Franklin St, Fifth Floor,
 * Boston, MA 02110-1301, USA.
 */

#ifdef HAVE_CONFIG_H
#include "config.h"
#endif

#include "gstcudaloader.h"
#include "gstcudacontext.h"
#include "gstcudautils.h"

GST_DEBUG_CATEGORY_STATIC (gst_cuda_context_debug);
#define GST_CAT_DEFAULT gst_cuda_context_debug

/* store all context object with weak ref */
static GList *context_list = NULL;
G_LOCK_DEFINE_STATIC (list_lock);

enum
{
  PROP_0,
  PROP_DEVICE_ID
};

#define DEFAULT_DEVICE_ID -1

struct _GstCudaContextPrivate
{
  CUcontext context;
  CUdevice device;
  gint device_id;

  gint tex_align;

  GHashTable *accessible_peer;
};

#define gst_cuda_context_parent_class parent_class
G_DEFINE_TYPE_WITH_PRIVATE (GstCudaContext, gst_cuda_context, GST_TYPE_OBJECT);

static void gst_cuda_context_set_property (GObject * object, guint prop_id,
    const GValue * value, GParamSpec * pspec);
static void gst_cuda_context_get_property (GObject * object, guint prop_id,
    GValue * value, GParamSpec * pspec);
static void gst_cuda_context_constructed (GObject * object);
static void gst_cuda_context_finalize (GObject * object);
static void gst_cuda_context_weak_ref_notify (gpointer data,
    GstCudaContext * context);
static void gst_cuda_context_enable_peer_access (GstCudaContext * context,
    GstCudaContext * peer);

static void
gst_cuda_context_class_init (GstCudaContextClass * klass)
{
  GObjectClass *gobject_class = G_OBJECT_CLASS (klass);

  gobject_class->set_property = gst_cuda_context_set_property;
  gobject_class->get_property = gst_cuda_context_get_property;
  gobject_class->constructed = gst_cuda_context_constructed;
  gobject_class->finalize = gst_cuda_context_finalize;

  g_object_class_install_property (gobject_class, PROP_DEVICE_ID,
      g_param_spec_int ("cuda-device-id", "Cuda Device ID",
          "Set the GPU device to use for operations (-1 = auto)",
          -1, G_MAXINT, DEFAULT_DEVICE_ID,
          G_PARAM_CONSTRUCT_ONLY | G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS));

  GST_DEBUG_CATEGORY_INIT (gst_cuda_context_debug,
      "cudacontext", 0, "CUDA Context");
}

static void
gst_cuda_context_init (GstCudaContext * context)
{
  GstCudaContextPrivate *priv = gst_cuda_context_get_instance_private (context);

  priv->context = NULL;
  priv->device_id = DEFAULT_DEVICE_ID;
  priv->accessible_peer = g_hash_table_new (g_direct_hash, g_direct_equal);

  context->priv = priv;
}

static void
gst_cuda_context_set_property (GObject * object, guint prop_id,
    const GValue * value, GParamSpec * pspec)
{
  GstCudaContext *context = GST_CUDA_CONTEXT (object);
  GstCudaContextPrivate *priv = context->priv;

  switch (prop_id) {
    case PROP_DEVICE_ID:
      priv->device_id = g_value_get_int (value);
      break;
    default:
      G_OBJECT_WARN_INVALID_PROPERTY_ID (object, prop_id, pspec);
      break;
  }
}

static void
gst_cuda_context_get_property (GObject * object, guint prop_id,
    GValue * value, GParamSpec * pspec)
{
  GstCudaContext *context = GST_CUDA_CONTEXT (object);
  GstCudaContextPrivate *priv = context->priv;

  switch (prop_id) {
    case PROP_DEVICE_ID:
      g_value_set_int (value, priv->device_id);
      break;
    default:
      G_OBJECT_WARN_INVALID_PROPERTY_ID (object, prop_id, pspec);
      break;
  }
}

static void
gst_cuda_context_constructed (GObject * object)
{
  static gsize once = 0;
  GstCudaContext *context = GST_CUDA_CONTEXT (object);
  GstCudaContextPrivate *priv = context->priv;
  CUcontext cuda_ctx, old_ctx;
  gboolean ret = TRUE;
  CUdevice cdev = 0, cuda_dev = -1;
  gint dev_count = 0;
  gchar name[256];
  gint min = 0, maj = 0;
  gint i;
  gint tex_align = 0;
  GList *iter;

  if (g_once_init_enter (&once)) {
    if (CuInit (0) != CUDA_SUCCESS) {
      GST_ERROR_OBJECT (context, "Failed to cuInit");
      ret = FALSE;
    }
    g_once_init_leave (&once, ret);

    if (!ret)
      return;
  }

  if (!gst_cuda_result (CuDeviceGetCount (&dev_count)) || dev_count == 0) {
    GST_WARNING ("No CUDA devices detected");
    return;
  }

  for (i = 0; i < dev_count; ++i) {
    if (gst_cuda_result (CuDeviceGet (&cdev, i)) &&
        gst_cuda_result (CuDeviceGetName (name, sizeof (name), cdev)) &&
        gst_cuda_result (CuDeviceGetAttribute (&maj,
                CU_DEVICE_ATTRIBUTE_COMPUTE_CAPABILITY_MAJOR, cdev)) &&
        gst_cuda_result (CuDeviceGetAttribute (&min,
                CU_DEVICE_ATTRIBUTE_COMPUTE_CAPABILITY_MINOR, cdev)) &&
        gst_cuda_result (CuDeviceGetAttribute (&tex_align,
                CU_DEVICE_ATTRIBUTE_TEXTURE_ALIGNMENT, cdev))) {
      GST_INFO ("GPU #%d supports NVENC: %s (%s) (Compute SM %d.%d)", i,
          (((maj << 4) + min) >= 0x30) ? "yes" : "no", name, maj, min);
      if (priv->device_id == -1 || priv->device_id == cdev) {
        priv->device_id = cuda_dev = cdev;
        priv->tex_align = tex_align;
        break;
      }
    }
  }

  if (cuda_dev == -1) {
    GST_WARNING ("Device with id %d does not exist", priv->device_id);
    return;
  }

  GST_DEBUG ("Creating cuda context for device index %d", cuda_dev);

  if (!gst_cuda_result (CuCtxCreate (&cuda_ctx, 0, cuda_dev))) {
    GST_WARNING ("Failed to create CUDA context for cuda device %d", cuda_dev);
    return;
  }

  if (!gst_cuda_result (CuCtxPopCurrent (&old_ctx))) {
    return;
  }

  GST_INFO ("Created CUDA context %p with device-id %d", cuda_ctx, cuda_dev);

  priv->context = cuda_ctx;
  priv->device = cuda_dev;

  G_LOCK (list_lock);
  g_object_weak_ref (G_OBJECT (object),
      (GWeakNotify) gst_cuda_context_weak_ref_notify, NULL);
  for (iter = context_list; iter; iter = g_list_next (iter)) {
    GstCudaContext *peer = (GstCudaContext *) iter->data;

    /* EnablePeerAccess is unidirectional */
    gst_cuda_context_enable_peer_access (context, peer);
    gst_cuda_context_enable_peer_access (peer, context);
  }

  context_list = g_list_append (context_list, context);
  G_UNLOCK (list_lock);
}

/* must be called with list_lock taken */
static void
gst_cuda_context_enable_peer_access (GstCudaContext * context,
    GstCudaContext * peer)
{
  GstCudaContextPrivate *priv = context->priv;
  GstCudaContextPrivate *peer_priv = peer->priv;
  CUdevice device = priv->device;
  CUdevice other_dev = peer_priv->device;
  CUresult cuda_ret;
  gint can_access = 0;

  cuda_ret = CuDeviceCanAccessPeer (&can_access, device, other_dev);

  if (!gst_cuda_result (cuda_ret) || !can_access) {
    GST_DEBUG_OBJECT (context,
        "Peer access to %" GST_PTR_FORMAT " is not allowed", peer);
    return;
  }

  gst_cuda_context_push (context);
  if (gst_cuda_result (CuCtxEnablePeerAccess (peer_priv->context, 0))) {
    GST_DEBUG_OBJECT (context, "Enable peer access to %" GST_PTR_FORMAT, peer);
    g_hash_table_add (priv->accessible_peer, peer);
  }

  gst_cuda_context_pop (NULL);
}

static void
gst_cuda_context_weak_ref_notify (gpointer data, GstCudaContext * context)
{
  GList *iter;

  G_LOCK (list_lock);
  context_list = g_list_remove (context_list, context);

  /* disable self -> peer access */
  if (context->priv->accessible_peer) {
    GHashTableIter iter;
    gpointer key;
    g_hash_table_iter_init (&iter, context->priv->accessible_peer);
    if (gst_cuda_context_push (context)) {
      while (g_hash_table_iter_next (&iter, &key, NULL)) {
        GstCudaContext *peer = GST_CUDA_CONTEXT (key);
        CUcontext peer_handle = gst_cuda_context_get_handle (peer);
        GST_DEBUG_OBJECT (context,
            "Disable peer access to %" GST_PTR_FORMAT, peer);
        gst_cuda_result (CuCtxDisablePeerAccess (peer_handle));
      }
      gst_cuda_context_pop (NULL);
    }

    g_hash_table_destroy (context->priv->accessible_peer);
    context->priv->accessible_peer = NULL;
  }

  /* disable peer -> self access */
  for (iter = context_list; iter; iter = g_list_next (iter)) {
    GstCudaContext *other = (GstCudaContext *) iter->data;
    GstCudaContextPrivate *other_priv = other->priv;
    CUcontext self_handle;

    if (!other_priv->accessible_peer)
      continue;

    if (g_hash_table_lookup (other_priv->accessible_peer, context)) {
      if (gst_cuda_context_push (other)) {
        self_handle = gst_cuda_context_get_handle (context);
        GST_DEBUG_OBJECT (other,
            "Disable peer access to %" GST_PTR_FORMAT, context);
        gst_cuda_result (CuCtxDisablePeerAccess (self_handle));
        gst_cuda_context_pop (NULL);
      }

      g_hash_table_remove (other_priv->accessible_peer, context);
    }
  }
  G_UNLOCK (list_lock);
}

static void
gst_cuda_context_finalize (GObject * object)
{
  GstCudaContext *context = GST_CUDA_CONTEXT_CAST (object);
  GstCudaContextPrivate *priv = context->priv;

  if (priv->context) {
    GST_DEBUG_OBJECT (context, "Destroying CUDA context %p", priv->context);
    gst_cuda_result (CuCtxDestroy (priv->context));
  }

  G_OBJECT_CLASS (parent_class)->finalize (object);
}

/**
 * gst_cuda_context_new:
 * @device_id: device-id for creating #GstCudaContext or -1 for auto selection
 *
 * Create #GstCudaContext with given device_id. If the @device_id was not -1
 * but was out of range (e.g., exceed the number of device),
 * #GstCudaContext will not be created.
 *
 * Returns: a new #GstCudaContext or %NULL on failure
 */
GstCudaContext *
gst_cuda_context_new (gint device_id)
{
  GstCudaContext *self =
      g_object_new (GST_TYPE_CUDA_CONTEXT, "cuda-device-id", device_id, NULL);

  gst_object_ref_sink (self);

  if (!self->priv->context) {
    GST_ERROR ("Failed to create CUDA context");
    gst_clear_object (&self);
  }

  return self;
}

/**
 * gst_cuda_context_push:
 * @ctx: a #GstCudaContext to push current thread
 *
 * Pushes the given @ctx onto the CPU thread's stack of current contexts.
 * The specified context becomes the CPU thread's current context,
 * so all CUDA functions that operate on the current context are affected.
 *
 * Returns: %TRUE if @ctx was pushed without error.
 */
gboolean
gst_cuda_context_push (GstCudaContext * ctx)
{
  g_return_val_if_fail (ctx, FALSE);
  g_return_val_if_fail (GST_IS_CUDA_CONTEXT (ctx), FALSE);

  return gst_cuda_result (CuCtxPushCurrent (ctx->priv->context));
}

/**
 * gst_cuda_context_pop:
 *
 * Pops the current CUDA context from CPU thread
 *
 * Returns: %TRUE if @ctx was pushed without error.
 */
gboolean
gst_cuda_context_pop (CUcontext * cuda_ctx)
{
  return gst_cuda_result (CuCtxPopCurrent (cuda_ctx));
}

/**
 * gst_cuda_context_get_handle:
 * @ctx: a #GstCudaContext
 *
 * Get CUDA device context. Caller must not modify and/or destroy
 * returned device context.
 *
 * Returns: the #CUcontext of @ctx
 */
gpointer
gst_cuda_context_get_handle (GstCudaContext * ctx)
{
  g_return_val_if_fail (ctx, NULL);
  g_return_val_if_fail (GST_IS_CUDA_CONTEXT (ctx), NULL);

  return ctx->priv->context;
}

/**
 * gst_cuda_context_get_texture_alignment:
 * @ctx: a #GstCudaContext
 *
 * Get required texture alignment by device
 *
 * Returns: the #CUcontext of @ctx
 */
gint
gst_cuda_context_get_texture_alignment (GstCudaContext * ctx)
{
  g_return_val_if_fail (ctx, 0);
  g_return_val_if_fail (GST_IS_CUDA_CONTEXT (ctx), 0);

  return ctx->priv->tex_align;
}

/**
 * gst_cuda_context_can_access_peer:
 * @ctx: a #GstCudaContext
 * @peer: a #GstCudaContext
 *
 * Query whether @ctx can access any memory which belongs to @peer directly.

 * Returns: %TRUE if @ctx can access @peer directly
 */
gboolean
gst_cuda_context_can_access_peer (GstCudaContext * ctx, GstCudaContext * peer)
{
  gboolean ret = FALSE;

  g_return_val_if_fail (GST_IS_CUDA_CONTEXT (ctx), FALSE);
  g_return_val_if_fail (GST_IS_CUDA_CONTEXT (peer), FALSE);

  G_LOCK (list_lock);
  if (ctx->priv->accessible_peer &&
      g_hash_table_lookup (ctx->priv->accessible_peer, peer)) {
    ret = TRUE;
  }
  G_UNLOCK (list_lock);

  return ret;
}
nvcodec: Introduce NVIDA CUDA helpers New object and helper functions can remove duplicated code from nvenc/nvdec. Also this is prework for CUDA device context sharing among nvdec(s)/nvenc(s). 2018-11-23 13:01:41 +00:00			`/* GStreamer`
			`* Copyright (C) <2018-2019> Seungha Yang <seungha.yang@navercorp.com>`
			`*`
			`* This library is free software; you can redistribute it and/or`
			`* modify it under the terms of the GNU Library General Public`
			`* License as published by the Free Software Foundation; either`
			`* version 2 of the License, or (at your option) any later version.`
			`*`
			`* This library is distributed in the hope that it will be useful,`
			`* but WITHOUT ANY WARRANTY; without even the implied warranty of`
			`* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU`
			`* Library General Public License for more details.`
			`*`
			`* You should have received a copy of the GNU Library General Public`
			`* License along with this library; if not, write to the`
			`* Free Software Foundation, Inc., 51 Franklin St, Fifth Floor,`
			`* Boston, MA 02110-1301, USA.`
			`*/`

			`#ifdef HAVE_CONFIG_H`
			`#include "config.h"`
			`#endif`

			`#include "gstcudaloader.h"`
			`#include "gstcudacontext.h"`
			`#include "gstcudautils.h"`

			`GST_DEBUG_CATEGORY_STATIC (gst_cuda_context_debug);`
			`#define GST_CAT_DEFAULT gst_cuda_context_debug`

cudacontext: Enable direct CUDA memory access over multiple GPUs If each device context can access each other, enable peer access for better interoperability. Part-of: <https://gitlab.freedesktop.org/gstreamer/gst-plugins-bad/-/merge_requests/1633> 2019-08-30 08:19:44 +00:00			`/* store all context object with weak ref */`
			`static GList *context_list = NULL;`
			`G_LOCK_DEFINE_STATIC (list_lock);`

nvcodec: Introduce NVIDA CUDA helpers New object and helper functions can remove duplicated code from nvenc/nvdec. Also this is prework for CUDA device context sharing among nvdec(s)/nvenc(s). 2018-11-23 13:01:41 +00:00			`enum`
			`{`
			`PROP_0,`
			`PROP_DEVICE_ID`
			`};`

			`#define DEFAULT_DEVICE_ID -1`

			`struct _GstCudaContextPrivate`
			`{`
			`CUcontext context;`
			`CUdevice device;`
			`gint device_id;`
cudacontext: Enable direct CUDA memory access over multiple GPUs If each device context can access each other, enable peer access for better interoperability. Part-of: <https://gitlab.freedesktop.org/gstreamer/gst-plugins-bad/-/merge_requests/1633> 2019-08-30 08:19:44 +00:00
nvcodec: Add generic CUDA video convert object Introducing generic video convert object similar to video-converter but using CUDA. Part-of: <https://gitlab.freedesktop.org/gstreamer/gst-plugins-bad/-/merge_requests/1633> 2019-10-16 13:42:39 +00:00			`gint tex_align;`

cudacontext: Enable direct CUDA memory access over multiple GPUs If each device context can access each other, enable peer access for better interoperability. Part-of: <https://gitlab.freedesktop.org/gstreamer/gst-plugins-bad/-/merge_requests/1633> 2019-08-30 08:19:44 +00:00			`GHashTable *accessible_peer;`
nvcodec: Introduce NVIDA CUDA helpers New object and helper functions can remove duplicated code from nvenc/nvdec. Also this is prework for CUDA device context sharing among nvdec(s)/nvenc(s). 2018-11-23 13:01:41 +00:00			`};`

			`#define gst_cuda_context_parent_class parent_class`
			`G_DEFINE_TYPE_WITH_PRIVATE (GstCudaContext, gst_cuda_context, GST_TYPE_OBJECT);`

			`static void gst_cuda_context_set_property (GObject * object, guint prop_id,`
			`const GValue * value, GParamSpec * pspec);`
			`static void gst_cuda_context_get_property (GObject * object, guint prop_id,`
			`GValue * value, GParamSpec * pspec);`
			`static void gst_cuda_context_constructed (GObject * object);`
			`static void gst_cuda_context_finalize (GObject * object);`
cudacontext: Enable direct CUDA memory access over multiple GPUs If each device context can access each other, enable peer access for better interoperability. Part-of: <https://gitlab.freedesktop.org/gstreamer/gst-plugins-bad/-/merge_requests/1633> 2019-08-30 08:19:44 +00:00			`static void gst_cuda_context_weak_ref_notify (gpointer data,`
			`GstCudaContext * context);`
			`static void gst_cuda_context_enable_peer_access (GstCudaContext * context,`
			`GstCudaContext * peer);`
nvcodec: Introduce NVIDA CUDA helpers New object and helper functions can remove duplicated code from nvenc/nvdec. Also this is prework for CUDA device context sharing among nvdec(s)/nvenc(s). 2018-11-23 13:01:41 +00:00
			`static void`
			`gst_cuda_context_class_init (GstCudaContextClass * klass)`
			`{`
			`GObjectClass *gobject_class = G_OBJECT_CLASS (klass);`

			`gobject_class->set_property = gst_cuda_context_set_property;`
			`gobject_class->get_property = gst_cuda_context_get_property;`
			`gobject_class->constructed = gst_cuda_context_constructed;`
			`gobject_class->finalize = gst_cuda_context_finalize;`

			`g_object_class_install_property (gobject_class, PROP_DEVICE_ID,`
			`g_param_spec_int ("cuda-device-id", "Cuda Device ID",`
			`"Set the GPU device to use for operations (-1 = auto)",`
			`-1, G_MAXINT, DEFAULT_DEVICE_ID,`
			`G_PARAM_CONSTRUCT_ONLY \| G_PARAM_READWRITE \| G_PARAM_STATIC_STRINGS));`

			`GST_DEBUG_CATEGORY_INIT (gst_cuda_context_debug,`
			`"cudacontext", 0, "CUDA Context");`
			`}`

			`static void`
			`gst_cuda_context_init (GstCudaContext * context)`
			`{`
			`GstCudaContextPrivate *priv = gst_cuda_context_get_instance_private (context);`

			`priv->context = NULL;`
			`priv->device_id = DEFAULT_DEVICE_ID;`
cudacontext: Enable direct CUDA memory access over multiple GPUs If each device context can access each other, enable peer access for better interoperability. Part-of: <https://gitlab.freedesktop.org/gstreamer/gst-plugins-bad/-/merge_requests/1633> 2019-08-30 08:19:44 +00:00			`priv->accessible_peer = g_hash_table_new (g_direct_hash, g_direct_equal);`
nvcodec: Introduce NVIDA CUDA helpers New object and helper functions can remove duplicated code from nvenc/nvdec. Also this is prework for CUDA device context sharing among nvdec(s)/nvenc(s). 2018-11-23 13:01:41 +00:00
			`context->priv = priv;`
			`}`

			`static void`
			`gst_cuda_context_set_property (GObject * object, guint prop_id,`
			`const GValue * value, GParamSpec * pspec)`
			`{`
			`GstCudaContext *context = GST_CUDA_CONTEXT (object);`
			`GstCudaContextPrivate *priv = context->priv;`

			`switch (prop_id) {`
			`case PROP_DEVICE_ID:`
			`priv->device_id = g_value_get_int (value);`
			`break;`
			`default:`
			`G_OBJECT_WARN_INVALID_PROPERTY_ID (object, prop_id, pspec);`
			`break;`
			`}`
			`}`

			`static void`
			`gst_cuda_context_get_property (GObject * object, guint prop_id,`
			`GValue * value, GParamSpec * pspec)`
			`{`
			`GstCudaContext *context = GST_CUDA_CONTEXT (object);`
			`GstCudaContextPrivate *priv = context->priv;`

			`switch (prop_id) {`
			`case PROP_DEVICE_ID:`
			`g_value_set_int (value, priv->device_id);`
			`break;`
			`default:`
			`G_OBJECT_WARN_INVALID_PROPERTY_ID (object, prop_id, pspec);`
			`break;`
			`}`
			`}`

			`static void`
			`gst_cuda_context_constructed (GObject * object)`
			`{`
gst: don't use volatile to mean atomic volatile is not sufficient to provide atomic guarantees and real atomics should be used instead. GCC 11 has started warning about using volatile with atomic operations. https://gitlab.gnome.org/GNOME/glib/-/merge_requests/1719 Discovered in https://gitlab.freedesktop.org/gstreamer/gst-plugins-good/-/issues/868 Part-of: <https://gitlab.freedesktop.org/gstreamer/gst-plugins-bad/-/merge_requests/2098> 2021-03-22 03:34:36 +00:00			`static gsize once = 0;`
nvcodec: Introduce NVIDA CUDA helpers New object and helper functions can remove duplicated code from nvenc/nvdec. Also this is prework for CUDA device context sharing among nvdec(s)/nvenc(s). 2018-11-23 13:01:41 +00:00			`GstCudaContext *context = GST_CUDA_CONTEXT (object);`
			`GstCudaContextPrivate *priv = context->priv;`
			`CUcontext cuda_ctx, old_ctx;`
			`gboolean ret = TRUE;`
			`CUdevice cdev = 0, cuda_dev = -1;`
			`gint dev_count = 0;`
			`gchar name[256];`
			`gint min = 0, maj = 0;`
			`gint i;`
nvcodec: Add generic CUDA video convert object Introducing generic video convert object similar to video-converter but using CUDA. Part-of: <https://gitlab.freedesktop.org/gstreamer/gst-plugins-bad/-/merge_requests/1633> 2019-10-16 13:42:39 +00:00			`gint tex_align = 0;`
cudacontext: Enable direct CUDA memory access over multiple GPUs If each device context can access each other, enable peer access for better interoperability. Part-of: <https://gitlab.freedesktop.org/gstreamer/gst-plugins-bad/-/merge_requests/1633> 2019-08-30 08:19:44 +00:00			`GList *iter;`
nvcodec: Introduce NVIDA CUDA helpers New object and helper functions can remove duplicated code from nvenc/nvdec. Also this is prework for CUDA device context sharing among nvdec(s)/nvenc(s). 2018-11-23 13:01:41 +00:00
			`if (g_once_init_enter (&once)) {`
			`if (CuInit (0) != CUDA_SUCCESS) {`
			`GST_ERROR_OBJECT (context, "Failed to cuInit");`
			`ret = FALSE;`
			`}`
			`g_once_init_leave (&once, ret);`

			`if (!ret)`
			`return;`
			`}`

			`if (!gst_cuda_result (CuDeviceGetCount (&dev_count)) \|\| dev_count == 0) {`
			`GST_WARNING ("No CUDA devices detected");`
			`return;`
			`}`

			`for (i = 0; i < dev_count; ++i) {`
			`if (gst_cuda_result (CuDeviceGet (&cdev, i)) &&`
			`gst_cuda_result (CuDeviceGetName (name, sizeof (name), cdev)) &&`
			`gst_cuda_result (CuDeviceGetAttribute (&maj,`
			`CU_DEVICE_ATTRIBUTE_COMPUTE_CAPABILITY_MAJOR, cdev)) &&`
			`gst_cuda_result (CuDeviceGetAttribute (&min,`
nvcodec: Add generic CUDA video convert object Introducing generic video convert object similar to video-converter but using CUDA. Part-of: <https://gitlab.freedesktop.org/gstreamer/gst-plugins-bad/-/merge_requests/1633> 2019-10-16 13:42:39 +00:00			`CU_DEVICE_ATTRIBUTE_COMPUTE_CAPABILITY_MINOR, cdev)) &&`
			`gst_cuda_result (CuDeviceGetAttribute (&tex_align,`
			`CU_DEVICE_ATTRIBUTE_TEXTURE_ALIGNMENT, cdev))) {`
nvcodec: Introduce NVIDA CUDA helpers New object and helper functions can remove duplicated code from nvenc/nvdec. Also this is prework for CUDA device context sharing among nvdec(s)/nvenc(s). 2018-11-23 13:01:41 +00:00			`GST_INFO ("GPU #%d supports NVENC: %s (%s) (Compute SM %d.%d)", i,`
			`(((maj << 4) + min) >= 0x30) ? "yes" : "no", name, maj, min);`
			`if (priv->device_id == -1 \|\| priv->device_id == cdev) {`
			`priv->device_id = cuda_dev = cdev;`
nvcodec: Add generic CUDA video convert object Introducing generic video convert object similar to video-converter but using CUDA. Part-of: <https://gitlab.freedesktop.org/gstreamer/gst-plugins-bad/-/merge_requests/1633> 2019-10-16 13:42:39 +00:00			`priv->tex_align = tex_align;`
			`break;`
nvcodec: Introduce NVIDA CUDA helpers New object and helper functions can remove duplicated code from nvenc/nvdec. Also this is prework for CUDA device context sharing among nvdec(s)/nvenc(s). 2018-11-23 13:01:41 +00:00			`}`
			`}`
			`}`

			`if (cuda_dev == -1) {`
			`GST_WARNING ("Device with id %d does not exist", priv->device_id);`
			`return;`
			`}`

			`GST_DEBUG ("Creating cuda context for device index %d", cuda_dev);`

			`if (!gst_cuda_result (CuCtxCreate (&cuda_ctx, 0, cuda_dev))) {`
			`GST_WARNING ("Failed to create CUDA context for cuda device %d", cuda_dev);`
			`return;`
			`}`

			`if (!gst_cuda_result (CuCtxPopCurrent (&old_ctx))) {`
			`return;`
			`}`

			`GST_INFO ("Created CUDA context %p with device-id %d", cuda_ctx, cuda_dev);`

			`priv->context = cuda_ctx;`
			`priv->device = cuda_dev;`
cudacontext: Enable direct CUDA memory access over multiple GPUs If each device context can access each other, enable peer access for better interoperability. Part-of: <https://gitlab.freedesktop.org/gstreamer/gst-plugins-bad/-/merge_requests/1633> 2019-08-30 08:19:44 +00:00
			`G_LOCK (list_lock);`
			`g_object_weak_ref (G_OBJECT (object),`
			`(GWeakNotify) gst_cuda_context_weak_ref_notify, NULL);`
			`for (iter = context_list; iter; iter = g_list_next (iter)) {`
			`GstCudaContext peer = (GstCudaContext ) iter->data;`

			`/* EnablePeerAccess is unidirectional */`
			`gst_cuda_context_enable_peer_access (context, peer);`
			`gst_cuda_context_enable_peer_access (peer, context);`
			`}`

			`context_list = g_list_append (context_list, context);`
			`G_UNLOCK (list_lock);`
			`}`

			`/* must be called with list_lock taken */`
			`static void`
			`gst_cuda_context_enable_peer_access (GstCudaContext * context,`
			`GstCudaContext * peer)`
			`{`
			`GstCudaContextPrivate *priv = context->priv;`
			`GstCudaContextPrivate *peer_priv = peer->priv;`
			`CUdevice device = priv->device;`
			`CUdevice other_dev = peer_priv->device;`
			`CUresult cuda_ret;`
			`gint can_access = 0;`

			`cuda_ret = CuDeviceCanAccessPeer (&can_access, device, other_dev);`

			`if (!gst_cuda_result (cuda_ret) \|\| !can_access) {`
			`GST_DEBUG_OBJECT (context,`
			`"Peer access to %" GST_PTR_FORMAT " is not allowed", peer);`
			`return;`
			`}`

			`gst_cuda_context_push (context);`
			`if (gst_cuda_result (CuCtxEnablePeerAccess (peer_priv->context, 0))) {`
			`GST_DEBUG_OBJECT (context, "Enable peer access to %" GST_PTR_FORMAT, peer);`
			`g_hash_table_add (priv->accessible_peer, peer);`
			`}`

			`gst_cuda_context_pop (NULL);`
			`}`

			`static void`
			`gst_cuda_context_weak_ref_notify (gpointer data, GstCudaContext * context)`
			`{`
			`GList *iter;`

			`G_LOCK (list_lock);`
			`context_list = g_list_remove (context_list, context);`

			`/* disable self -> peer access */`
			`if (context->priv->accessible_peer) {`
			`GHashTableIter iter;`
			`gpointer key;`
			`g_hash_table_iter_init (&iter, context->priv->accessible_peer);`
			`if (gst_cuda_context_push (context)) {`
			`while (g_hash_table_iter_next (&iter, &key, NULL)) {`
			`GstCudaContext *peer = GST_CUDA_CONTEXT (key);`
			`CUcontext peer_handle = gst_cuda_context_get_handle (peer);`
			`GST_DEBUG_OBJECT (context,`
			`"Disable peer access to %" GST_PTR_FORMAT, peer);`
			`gst_cuda_result (CuCtxDisablePeerAccess (peer_handle));`
			`}`
			`gst_cuda_context_pop (NULL);`
			`}`

			`g_hash_table_destroy (context->priv->accessible_peer);`
			`context->priv->accessible_peer = NULL;`
			`}`

			`/* disable peer -> self access */`
			`for (iter = context_list; iter; iter = g_list_next (iter)) {`
			`GstCudaContext other = (GstCudaContext ) iter->data;`
			`GstCudaContextPrivate *other_priv = other->priv;`
			`CUcontext self_handle;`

			`if (!other_priv->accessible_peer)`
			`continue;`

			`if (g_hash_table_lookup (other_priv->accessible_peer, context)) {`
			`if (gst_cuda_context_push (other)) {`
			`self_handle = gst_cuda_context_get_handle (context);`
			`GST_DEBUG_OBJECT (other,`
			`"Disable peer access to %" GST_PTR_FORMAT, context);`
			`gst_cuda_result (CuCtxDisablePeerAccess (self_handle));`
			`gst_cuda_context_pop (NULL);`
			`}`

			`g_hash_table_remove (other_priv->accessible_peer, context);`
			`}`
			`}`
			`G_UNLOCK (list_lock);`
nvcodec: Introduce NVIDA CUDA helpers New object and helper functions can remove duplicated code from nvenc/nvdec. Also this is prework for CUDA device context sharing among nvdec(s)/nvenc(s). 2018-11-23 13:01:41 +00:00			`}`

			`static void`
			`gst_cuda_context_finalize (GObject * object)`
			`{`
			`GstCudaContext *context = GST_CUDA_CONTEXT_CAST (object);`
			`GstCudaContextPrivate *priv = context->priv;`

			`if (priv->context) {`
			`GST_DEBUG_OBJECT (context, "Destroying CUDA context %p", priv->context);`
			`gst_cuda_result (CuCtxDestroy (priv->context));`
			`}`

			`G_OBJECT_CLASS (parent_class)->finalize (object);`
			`}`

			`/**`
			`* gst_cuda_context_new:`
			`* @device_id: device-id for creating #GstCudaContext or -1 for auto selection`
			`*`
			`* Create #GstCudaContext with given device_id. If the @device_id was not -1`
			`* but was out of range (e.g., exceed the number of device),`
			`* #GstCudaContext will not be created.`
			`*`
			`* Returns: a new #GstCudaContext or %NULL on failure`
			`*/`
			`GstCudaContext *`
			`gst_cuda_context_new (gint device_id)`
			`{`
			`GstCudaContext *self =`
			`g_object_new (GST_TYPE_CUDA_CONTEXT, "cuda-device-id", device_id, NULL);`

			`gst_object_ref_sink (self);`

			`if (!self->priv->context) {`
			`GST_ERROR ("Failed to create CUDA context");`
			`gst_clear_object (&self);`
			`}`

			`return self;`
			`}`

			`/**`
			`* gst_cuda_context_push:`
			`* @ctx: a #GstCudaContext to push current thread`
			`*`
			`* Pushes the given @ctx onto the CPU thread's stack of current contexts.`
			`* The specified context becomes the CPU thread's current context,`
			`* so all CUDA functions that operate on the current context are affected.`
			`*`
			`* Returns: %TRUE if @ctx was pushed without error.`
			`*/`
			`gboolean`
			`gst_cuda_context_push (GstCudaContext * ctx)`
			`{`
			`g_return_val_if_fail (ctx, FALSE);`
			`g_return_val_if_fail (GST_IS_CUDA_CONTEXT (ctx), FALSE);`

			`return gst_cuda_result (CuCtxPushCurrent (ctx->priv->context));`
			`}`

			`/**`
			`* gst_cuda_context_pop:`
			`*`
			`* Pops the current CUDA context from CPU thread`
			`*`
			`* Returns: %TRUE if @ctx was pushed without error.`
			`*/`
			`gboolean`
			`gst_cuda_context_pop (CUcontext * cuda_ctx)`
			`{`
			`return gst_cuda_result (CuCtxPopCurrent (cuda_ctx));`
			`}`

			`/**`
			`* gst_cuda_context_get_handle:`
			`* @ctx: a #GstCudaContext`
			`*`
			`* Get CUDA device context. Caller must not modify and/or destroy`
			`* returned device context.`
			`*`
			`* Returns: the #CUcontext of @ctx`
			`*/`
			`gpointer`
			`gst_cuda_context_get_handle (GstCudaContext * ctx)`
			`{`
			`g_return_val_if_fail (ctx, NULL);`
			`g_return_val_if_fail (GST_IS_CUDA_CONTEXT (ctx), NULL);`

			`return ctx->priv->context;`
			`}`
cudacontext: Enable direct CUDA memory access over multiple GPUs If each device context can access each other, enable peer access for better interoperability. Part-of: <https://gitlab.freedesktop.org/gstreamer/gst-plugins-bad/-/merge_requests/1633> 2019-08-30 08:19:44 +00:00
nvcodec: Add generic CUDA video convert object Introducing generic video convert object similar to video-converter but using CUDA. Part-of: <https://gitlab.freedesktop.org/gstreamer/gst-plugins-bad/-/merge_requests/1633> 2019-10-16 13:42:39 +00:00			`/**`
			`* gst_cuda_context_get_texture_alignment:`
			`* @ctx: a #GstCudaContext`
			`*`
			`* Get required texture alignment by device`
			`*`
			`* Returns: the #CUcontext of @ctx`
			`*/`
			`gint`
			`gst_cuda_context_get_texture_alignment (GstCudaContext * ctx)`
			`{`
			`g_return_val_if_fail (ctx, 0);`
			`g_return_val_if_fail (GST_IS_CUDA_CONTEXT (ctx), 0);`

			`return ctx->priv->tex_align;`
			`}`

cudacontext: Enable direct CUDA memory access over multiple GPUs If each device context can access each other, enable peer access for better interoperability. Part-of: <https://gitlab.freedesktop.org/gstreamer/gst-plugins-bad/-/merge_requests/1633> 2019-08-30 08:19:44 +00:00			`/**`
			`* gst_cuda_context_can_access_peer:`
			`* @ctx: a #GstCudaContext`
			`* @peer: a #GstCudaContext`
			`*`
			`* Query whether @ctx can access any memory which belongs to @peer directly.`

			`* Returns: %TRUE if @ctx can access @peer directly`
			`*/`
			`gboolean`
			`gst_cuda_context_can_access_peer (GstCudaContext * ctx, GstCudaContext * peer)`
			`{`
			`gboolean ret = FALSE;`

			`g_return_val_if_fail (GST_IS_CUDA_CONTEXT (ctx), FALSE);`
			`g_return_val_if_fail (GST_IS_CUDA_CONTEXT (peer), FALSE);`

			`G_LOCK (list_lock);`
			`if (ctx->priv->accessible_peer &&`
			`g_hash_table_lookup (ctx->priv->accessible_peer, peer)) {`
			`ret = TRUE;`
			`}`
			`G_UNLOCK (list_lock);`

			`return ret;`
			`}`