obs-StreamFX/source/nvidia/cuda/nvidia-cuda.cpp

/*
 * Modern effects for a modern Streamer
 * Copyright (C) 2020 Michael Fabian Dirks
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301, USA
 */

#include "nvidia-cuda.hpp"
#include "common.hpp"
#include <mutex>

#if defined(_WIN32) || defined(_WIN64)
#define CUDA_NAME "nvcuda.dll"
#else
#define CUDA_NAME "libcuda.so.1"
#endif

#define CUDA_LOAD_SYMBOL(NAME)                                                            \
	{                                                                                     \
		NAME = reinterpret_cast<decltype(NAME)>(os_dlsym(_library, #NAME));                    \
		if (!NAME)                                                                        \
			throw std::runtime_error("Failed to load '" #NAME "' from '" CUDA_NAME "'."); \
	}
#define CUDA_LOAD_SYMBOL_V2(NAME)                                                         \
	{                                                                                     \
		NAME = reinterpret_cast<decltype(NAME)>(os_dlsym(_library, #NAME "_v2"));              \
		if (!NAME)                                                                        \
			throw std::runtime_error("Failed to load '" #NAME "' from '" CUDA_NAME "'."); \
	}
#define CUDA_LOAD_SYMBOL_EX(NAME, OVERRIDE)                                               \
	{                                                                                     \
		NAME = reinterpret_cast<decltype(NAME)>(os_dlsym(_library, #OVERRIDE));                \
		if (!NAME)                                                                        \
			throw std::runtime_error("Failed to load '" #NAME "' from '" CUDA_NAME "'."); \
	}

nvidia::cuda::cuda::cuda()
{
	_library = os_dlopen(CUDA_NAME);
	if (!_library)
		throw std::runtime_error("Failed to load '" CUDA_NAME "'.");

	// Initialization
	CUDA_LOAD_SYMBOL(cuInit);

	// Version Management
	CUDA_LOAD_SYMBOL(cuDriverGetVersion);

	// Primary Context Management
	CUDA_LOAD_SYMBOL(cuDevicePrimaryCtxRetain);
	CUDA_LOAD_SYMBOL_V2(cuDevicePrimaryCtxRelease);
	CUDA_LOAD_SYMBOL_V2(cuDevicePrimaryCtxSetFlags);

	// Context Management
	CUDA_LOAD_SYMBOL_V2(cuCtxCreate);
	CUDA_LOAD_SYMBOL_V2(cuCtxDestroy);
	CUDA_LOAD_SYMBOL(cuCtxGetCurrent);
	CUDA_LOAD_SYMBOL(cuCtxGetStreamPriorityRange);
	CUDA_LOAD_SYMBOL_V2(cuCtxPopCurrent);
	CUDA_LOAD_SYMBOL_V2(cuCtxPushCurrent);
	CUDA_LOAD_SYMBOL(cuCtxSetCurrent);
	CUDA_LOAD_SYMBOL(cuCtxSynchronize);

	// Memory Management
	CUDA_LOAD_SYMBOL_V2(cuArrayGetDescriptor);
	CUDA_LOAD_SYMBOL_V2(cuMemAlloc);
	CUDA_LOAD_SYMBOL_V2(cuMemAllocPitch);
	CUDA_LOAD_SYMBOL_V2(cuMemFree);
	CUDA_LOAD_SYMBOL_V2(cuMemHostGetDevicePointer);
	CUDA_LOAD_SYMBOL(cuMemcpy);
	CUDA_LOAD_SYMBOL_V2(cuMemcpy2D);
	CUDA_LOAD_SYMBOL_V2(cuMemcpy2DAsync);
	CUDA_LOAD_SYMBOL_V2(cuMemcpyAtoA);
	CUDA_LOAD_SYMBOL_V2(cuMemcpyAtoD);
	CUDA_LOAD_SYMBOL_V2(cuMemcpyAtoH);
	CUDA_LOAD_SYMBOL_V2(cuMemcpyAtoHAsync);
	CUDA_LOAD_SYMBOL_V2(cuMemcpyDtoA);
	CUDA_LOAD_SYMBOL_V2(cuMemcpyDtoD);
	CUDA_LOAD_SYMBOL_V2(cuMemcpyDtoH);
	CUDA_LOAD_SYMBOL_V2(cuMemcpyDtoHAsync);
	CUDA_LOAD_SYMBOL_V2(cuMemcpyHtoA);
	CUDA_LOAD_SYMBOL_V2(cuMemcpyHtoAAsync);
	CUDA_LOAD_SYMBOL_V2(cuMemcpyHtoD);
	CUDA_LOAD_SYMBOL_V2(cuMemcpyHtoDAsync);

	// Stream Managment
	CUDA_LOAD_SYMBOL(cuStreamCreate);
	CUDA_LOAD_SYMBOL(cuStreamCreateWithPriority);
	CUDA_LOAD_SYMBOL_V2(cuStreamDestroy);
	CUDA_LOAD_SYMBOL(cuStreamSynchronize);

	// Graphics Interoperability
	CUDA_LOAD_SYMBOL(cuGraphicsMapResources);
	CUDA_LOAD_SYMBOL(cuGraphicsSubResourceGetMappedArray);
	CUDA_LOAD_SYMBOL(cuGraphicsUnmapResources);
	CUDA_LOAD_SYMBOL(cuGraphicsUnregisterResource);

#ifdef WIN32
	// Direct3D11 Interopability
	CUDA_LOAD_SYMBOL(cuD3D11GetDevice);
	CUDA_LOAD_SYMBOL(cuGraphicsD3D11RegisterResource);
#endif

	// Initialize CUDA
	cuInit(0);
}

nvidia::cuda::cuda::~cuda()
{
	os_dlclose(_library);
}

std::shared_ptr<nvidia::cuda::cuda> nvidia::cuda::cuda::get()
{
	static std::shared_ptr<nvidia::cuda::cuda> instance;
	static std::mutex                          lock;

	std::unique_lock<std::mutex> ul(lock);
	if (!instance) {
		instance = std::make_shared<nvidia::cuda::cuda>();
	}
	return instance;
}