[vlc-commits] nvdec: add direct rendering in OpenGL
Steve Lhomme
git at videolan.org
Wed Sep 18 09:05:28 CEST 2019
vlc | branch: master | Steve Lhomme <robux4 at ycbcr.xyz> | Tue Sep 17 13:06:44 2019 +0200| [31fdbd4863f50e75135d66622b2ab1f25a54f4a6] | committer: Steve Lhomme
nvdec: add direct rendering in OpenGL
> http://git.videolan.org/gitweb.cgi/vlc.git/?a=commit;h=31fdbd4863f50e75135d66622b2ab1f25a54f4a6
---
modules/hw/nvdec/Makefile.am | 8 ++
modules/hw/nvdec/nvdec_gl.c | 231 +++++++++++++++++++++++++++++++++++++++++++
2 files changed, 239 insertions(+)
diff --git a/modules/hw/nvdec/Makefile.am b/modules/hw/nvdec/Makefile.am
index 17bddf8f18..ac52c0f511 100644
--- a/modules/hw/nvdec/Makefile.am
+++ b/modules/hw/nvdec/Makefile.am
@@ -17,3 +17,11 @@ if HAVE_NVDEC
nvdec_LTLIBRARIES = libnvdec_chroma_plugin.la
endif
+# NVDEC OpenGL converter plugin: sources and link libraries are declared
+# unconditionally, but the plugin is only appended to nvdec_LTLIBRARIES
+# (i.e. actually built) when both HAVE_GL and HAVE_NVDEC are set.
+libglconv_nvdec_plugin_la_SOURCES = hw/nvdec/nvdec_gl.c \
+ video_output/opengl/converter.h hw/nvdec/nvdec_fmt.h
+libglconv_nvdec_plugin_la_LIBADD = $(LIBDL)
+if HAVE_GL
+if HAVE_NVDEC
+nvdec_LTLIBRARIES += libglconv_nvdec_plugin.la
+endif
+endif
diff --git a/modules/hw/nvdec/nvdec_gl.c b/modules/hw/nvdec/nvdec_gl.c
new file mode 100644
index 0000000000..96fdf801e0
--- /dev/null
+++ b/modules/hw/nvdec/nvdec_gl.c
@@ -0,0 +1,231 @@
+/*****************************************************************************
+ * nvdec_gl.c: OpenGL NVDEC opaque converter
+ *****************************************************************************
+ * Copyright (C) 2019 VLC authors, VideoLAN and VideoLabs
+ *
+ * Authors: Steve Lhomme <robux4 at videolabs.io>
+ *
+ * This program is free software; you can redistribute it and/or modify it
+ * under the terms of the GNU Lesser General Public License as published by
+ * the Free Software Foundation; either version 2.1 of the License, or
+ * (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ * GNU Lesser General Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public License
+ * along with this program; if not, write to the Free Software Foundation,
+ * Inc., 51 Franklin Street, Fifth Floor, Boston MA 02110-1301, USA.
+ *****************************************************************************/
+
+#ifdef HAVE_CONFIG_H
+# include "config.h"
+#endif
+
+#include <assert.h>
+
+#include <vlc_common.h>
+#include <vlc_vout_window.h>
+#include <vlc_codec.h>
+
+#include <ffnvcodec/dynlink_loader.h>
+
+#include "../../hw/nvdec/nvdec_fmt.h"
+
+#include "../../video_output/opengl/internal.h"
+#include <GL/glext.h>
+
+/* Module entry points, defined at the end of this file. */
+static int Open(vlc_object_t *);
+static void Close(vlc_object_t *);
+
+/*
+ * Plugin descriptor: registers this file as a "glconv" module reachable
+ * through the "nvdec" shortcut, with Open()/Close() as its callbacks.
+ * NOTE(review): the second argument of set_capability() is presumably the
+ * module score used for probing order -- confirm against the VLC plugin API.
+ */
+vlc_module_begin ()
+ set_description("NVDEC OpenGL surface converter")
+ set_capability("glconv", 2)
+ set_callbacks(Open, Close)
+ set_category(CAT_VIDEO)
+ set_subcategory(SUBCAT_VIDEO_VOUT)
+ add_shortcut("nvdec")
+vlc_module_end ()
+
+/* Private state of the converter, stored in tc->priv by Open(). */
+typedef struct {
+ /* Decoder device held in Open() and released in Close(). */
+ vlc_decoder_device *device;
+ /* Context created by Open() when the device reported by cuGLGetDevices
+  * differs from the device of the decoder context; NULL otherwise, in
+  * which case the decoder context (devsys->cuCtx) is pushed instead. */
+ CUcontext cuConverterCtx;
+ /* One registered graphics resource per GL texture. */
+ CUgraphicsResource cu_res[PICTURE_PLANE_MAX]; // Y, UV for NV12/P010
+ /* CUDA array obtained from each cu_res[] entry; destination of the
+  * per-plane copies done in tc_nvdec_gl_update(). */
+ CUarray mappedArray[PICTURE_PLANE_MAX];
+} converter_sys_t;
+
+/**
+ * Translates a CUDA driver result into a VLC error code, logging failures.
+ *
+ * \param tc        converter whose decoder device provides the CUDA function
+ *                  table, and whose object is used for logging
+ * \param result    value returned by the CUDA driver call
+ * \param psz_func  name of the CUDA function, used in the log message
+ * \return VLC_SUCCESS if result is CUDA_SUCCESS, VLC_EGENERIC otherwise
+ */
+static inline int CudaCall(const opengl_tex_converter_t *tc, CUresult result, const char *psz_func)
+{
+    if (unlikely(result != CUDA_SUCCESS)) {
+        /* The lookups below may fail (e.g. unrecognized error code) and
+         * leave the pointers NULL; never hand NULL to "%s". */
+        const char *psz_err = NULL, *psz_err_str = NULL;
+        vlc_decoder_device *device = tc->dec_device;
+        decoder_device_nvdec_t *devsys = device->opaque;
+        devsys->cudaFunctions->cuGetErrorName(result, &psz_err);
+        devsys->cudaFunctions->cuGetErrorString(result, &psz_err_str);
+        if (psz_err == NULL)
+            psz_err = "unknown";
+        if (psz_err_str == NULL)
+            psz_err_str = "unknown error";
+        msg_Err((vlc_object_t *)&tc->obj, "%s failed: %s (%s)", psz_func, psz_err_str, psz_err);
+        return VLC_EGENERIC;
+    }
+    return VLC_SUCCESS;
+}
+
+/* Calls a function from the CUDA function table and converts its result with
+ * CudaCall(). Expects `tc` (the converter) and `devsys` (the NVDEC device
+ * data) to be in scope at the call site. */
+#define CALL_CUDA(func, ...) CudaCall(tc, devsys->cudaFunctions->func(__VA_ARGS__), #func)
+
+/**
+ * Allocates the storage of each GL texture and registers it with CUDA.
+ *
+ * For every plane the texture is allocated with TexImage2D, registered as a
+ * CUDA graphics resource, and briefly mapped to fetch the CUarray that
+ * tc_nvdec_gl_update() later copies into.
+ *
+ * \param tc          converter (provides GL vtable, texture config, priv)
+ * \param textures    GL texture names, tc->tex_count entries
+ * \param tex_width   width of each texture
+ * \param tex_height  height of each texture
+ * \return VLC_SUCCESS, or the first error encountered. The CUDA context
+ *         pushed on entry is popped on every path.
+ */
+static int tc_nvdec_gl_allocate_texture(const opengl_tex_converter_t *tc, GLuint *textures,
+                                        const GLsizei *tex_width, const GLsizei *tex_height)
+{
+    converter_sys_t *p_sys = tc->priv;
+    vlc_decoder_device *device = tc->dec_device;
+    decoder_device_nvdec_t *devsys = device->opaque;
+
+    int result;
+    result = CALL_CUDA(cuCtxPushCurrent, p_sys->cuConverterCtx ? p_sys->cuConverterCtx : devsys->cuCtx);
+    if (result != VLC_SUCCESS)
+        return result;
+
+    for (unsigned i = 0; i < tc->tex_count; i++)
+    {
+        tc->vt->BindTexture(tc->tex_target, textures[i]);
+        tc->vt->TexImage2D(tc->tex_target, 0, tc->texs[i].internal,
+                           tex_width[i], tex_height[i], 0, tc->texs[i].format,
+                           tc->texs[i].type, NULL);
+        if (tc->vt->GetError() != GL_NO_ERROR)
+        {
+            msg_Err(tc->gl, "could not allocate texture %u", i);
+            result = VLC_EGENERIC;
+        }
+        else
+        {
+            result = CALL_CUDA(cuGraphicsGLRegisterImage, &p_sys->cu_res[i], textures[i], tc->tex_target, CU_GRAPHICS_REGISTER_FLAGS_WRITE_DISCARD);
+            if (result == VLC_SUCCESS)
+                result = CALL_CUDA(cuGraphicsMapResources, 1, &p_sys->cu_res[i], 0);
+            if (result == VLC_SUCCESS)
+            {
+                result = CALL_CUDA(cuGraphicsSubResourceGetMappedArray, &p_sys->mappedArray[i], p_sys->cu_res[i], 0, 0);
+                /* Always unmap what was mapped, but keep the first error. */
+                int unmap_result = CALL_CUDA(cuGraphicsUnmapResources, 1, &p_sys->cu_res[i], 0);
+                if (result == VLC_SUCCESS)
+                    result = unmap_result;
+            }
+        }
+
+        tc->vt->BindTexture(tc->tex_target, 0);
+        if (result != VLC_SUCCESS)
+            break;
+    }
+
+    /* Balance the push above on success and failure alike. */
+    CALL_CUDA(cuCtxPopCurrent, NULL);
+    return result;
+}
+
+/**
+ * Copies the decoded planes of a picture into the CUDA arrays backing the
+ * GL textures.
+ *
+ * \param tc             converter
+ * \param textures       unused
+ * \param tex_widths     texture widths; only entry 0 is read (row width)
+ * \param tex_heights    texture heights, one per plane
+ * \param pic            picture whose context is a pic_context_nvdec_t
+ * \param plane_offsets  unused
+ * \return VLC_SUCCESS, or the error of the first failing CUDA call
+ */
+static int
+tc_nvdec_gl_update(opengl_tex_converter_t const *tc, GLuint textures[],
+                   GLsizei const tex_widths[], GLsizei const tex_heights[],
+                   picture_t *pic, size_t const plane_offsets[])
+{
+    VLC_UNUSED(plane_offsets);
+    VLC_UNUSED(textures);
+
+    converter_sys_t *p_sys = tc->priv;
+    decoder_device_nvdec_t *devsys = tc->dec_device->opaque;
+    pic_context_nvdec_t *srcpic = container_of(pic->context, pic_context_nvdec_t, ctx);
+
+    /* Prefer the converter's own context when Open() created one. */
+    CUcontext active_ctx = p_sys->cuConverterCtx;
+    if (!active_ctx)
+        active_ctx = devsys->cuCtx;
+
+    int status = CALL_CUDA(cuCtxPushCurrent, active_ctx);
+    if (status != VLC_SUCCESS)
+        return status;
+
+    /* Planes are stacked vertically in the source buffer, bufferHeight
+     * rows apart. */
+    size_t first_row = 0;
+    for (unsigned plane = 0; plane < tc->tex_count; plane++)
+    {
+        CUDA_MEMCPY2D copy_desc = {
+            .srcMemoryType = CU_MEMORYTYPE_DEVICE,
+            .srcDevice = srcpic->devidePtr,
+            .srcPitch = srcpic->bufferPitch,
+            .srcY = first_row,
+            .dstMemoryType = CU_MEMORYTYPE_ARRAY,
+            .dstArray = p_sys->mappedArray[plane],
+            .WidthInBytes = tex_widths[0],
+            .Height = tex_heights[plane],
+        };
+        /* Every chroma other than the plain opaque one copies rows twice
+         * as wide. */
+        if (tc->fmt.i_chroma != VLC_CODEC_NVDEC_OPAQUE)
+            copy_desc.WidthInBytes *= 2;
+
+        status = CALL_CUDA(cuMemcpy2DAsync, &copy_desc, 0);
+        if (status != VLC_SUCCESS)
+            break;
+        first_row += srcpic->bufferHeight;
+    }
+
+    CALL_CUDA(cuCtxPopCurrent, NULL);
+    return status;
+}
+
+/**
+ * Releases what Open() acquired: the converter's private CUDA context (if
+ * one was created) and the reference on the decoder device.
+ *
+ * \param obj  the opengl_tex_converter_t being closed; tc->priv must be the
+ *             converter_sys_t set by Open()
+ */
+static void Close(vlc_object_t *obj)
+{
+    opengl_tex_converter_t *tc = (void *)obj;
+    converter_sys_t *p_sys = tc->priv;
+    decoder_device_nvdec_t *devsys = p_sys->device->opaque;
+
+    /* NOTE(review): the graphics resources in cu_res[] are not unregistered
+     * here; whether the GL context is still current at this point cannot be
+     * told from this file -- confirm before adding it. */
+    if (p_sys->cuConverterCtx != NULL)
+        CALL_CUDA(cuCtxDestroy, p_sys->cuConverterCtx);
+
+    /* Release the device last: the CUDA function table lives in it. */
+    vlc_decoder_device_Release(p_sys->device);
+}
+
+/**
+ * Probes and initializes the NVDEC OpenGL converter.
+ *
+ * Accepts only NVDEC opaque chromas backed by an NVDEC decoder device.
+ * Holds the device, picks the CUDA context to use for GL interop, sets up
+ * the fragment shader for the matching software chroma and installs the
+ * texture callbacks.
+ *
+ * \param obj  the opengl_tex_converter_t to initialize
+ * \return VLC_SUCCESS on success; VLC_ENOMEM or VLC_EGENERIC otherwise, in
+ *         which case everything acquired here has been released
+ */
+static int Open(vlc_object_t *obj)
+{
+    opengl_tex_converter_t *tc = (void *) obj;
+    if (!is_nvdec_opaque(tc->fmt.i_chroma))
+        return VLC_EGENERIC;
+
+    vlc_decoder_device *device = tc->dec_device;
+    if (device == NULL || device->type != VLC_DECODER_DEVICE_NVDEC)
+        return VLC_EGENERIC;
+    device = vlc_decoder_device_Hold(device);
+
+    converter_sys_t *p_sys = vlc_obj_malloc(VLC_OBJECT(tc), sizeof(*p_sys));
+    if (unlikely(p_sys == NULL))
+    {
+        vlc_decoder_device_Release(device);
+        return VLC_ENOMEM;
+    }
+    for (size_t i=0; i < ARRAY_SIZE(p_sys->cu_res); i++)
+    {
+        p_sys->cu_res[i] = NULL;
+        p_sys->mappedArray[i] = NULL;
+    }
+    p_sys->cuConverterCtx = NULL;
+    p_sys->device = device;
+
+    decoder_device_nvdec_t *devsys = device->opaque;
+    int result;
+    CUdevice cuDecDevice = 0;
+    CUdevice cuConverterDevice = 0;
+    unsigned int device_count;
+    vlc_fourcc_t render_chroma;
+
+    /* Device associated with the current OpenGL context. */
+    result = CALL_CUDA(cuGLGetDevices, &device_count, &cuDecDevice, 1, CU_GL_DEVICE_LIST_ALL);
+    if (result != VLC_SUCCESS)
+        goto error;
+
+    /* Device of the decoder's CUDA context. Without it the comparison below
+     * would read an indeterminate value, so failures are fatal. */
+    result = CALL_CUDA(cuCtxPushCurrent, devsys->cuCtx);
+    if (result != VLC_SUCCESS)
+        goto error;
+    result = CALL_CUDA(cuCtxGetDevice, &cuConverterDevice);
+    CALL_CUDA(cuCtxPopCurrent, NULL);
+    if (result != VLC_SUCCESS)
+        goto error;
+
+    if (cuConverterDevice != cuDecDevice)
+    {
+        /* NOTE(review): the context is created on the device of the decoder
+         * context, not on the one reported by cuGLGetDevices; the variable
+         * names suggest the two may be swapped -- confirm the intent. */
+        result = CALL_CUDA(cuCtxCreate, &p_sys->cuConverterCtx, 0, cuConverterDevice);
+        if (result != VLC_SUCCESS)
+            /* Best effort: fall back to the decoder context. */
+            p_sys->cuConverterCtx = NULL;
+        else
+            /* cuCtxCreate leaves the new context current on this thread;
+             * users of the context push/pop it explicitly. */
+            CALL_CUDA(cuCtxPopCurrent, NULL);
+    }
+
+    switch (tc->fmt.i_chroma)
+    {
+        case VLC_CODEC_NVDEC_OPAQUE_10B: render_chroma = VLC_CODEC_P010; break;
+        case VLC_CODEC_NVDEC_OPAQUE_16B: render_chroma = VLC_CODEC_P016; break;
+        case VLC_CODEC_NVDEC_OPAQUE:
+        default:                         render_chroma = VLC_CODEC_NV12; break;
+    }
+
+    tc->fshader = opengl_fragment_shader_init(tc, GL_TEXTURE_2D, render_chroma, tc->fmt.space);
+    if (!tc->fshader)
+    {
+        result = VLC_EGENERIC;
+        goto error;
+    }
+
+    tc->pf_allocate_textures = tc_nvdec_gl_allocate_texture;
+    tc->pf_update            = tc_nvdec_gl_update;
+    tc->priv                 = p_sys;
+
+    return VLC_SUCCESS;
+
+error:
+    /* tc->priv is not set yet, so clean up locally instead of via Close().
+     * p_sys itself is owned by the object (vlc_obj_malloc). */
+    if (p_sys->cuConverterCtx != NULL)
+        CALL_CUDA(cuCtxDestroy, p_sys->cuConverterCtx);
+    vlc_decoder_device_Release(device);
+    return result;
+}
More information about the vlc-commits
mailing list