mirror of
https://github.com/Xaymar/obs-StreamFX
synced 2024-11-11 06:15:05 +00:00
5fc95b48d8
The high-priority CUDA stream causes libOBS to run at a lower priority than the tracking, which is not what we want. Instead, we want tracking to be incomplete in those cases, rather than slowing down encoding and other things. Geometry updates are also now done once per frame instead of once per tracking update, which should improve the smoothness without affecting performance too much. Additionally, all tracking info is now in the 0..1 range, which drastically simplifies some math - especially with texture coordinates. To deal with tracking and updates being asynchronous, a very simple approximation of movement velocity has been added. This is mostly wrong, but it can bridge the gap where tracking updates are slower, as the values are all filtered anyway.
159 lines
5.3 KiB
C++
159 lines
5.3 KiB
C++
/*
|
|
* Modern effects for a modern Streamer
|
|
* Copyright (C) 2017 Michael Fabian Dirks
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation; either version 2 of the License, or
|
|
* (at your option) any later version.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with this program; if not, write to the Free Software
|
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA
|
|
*/
|
|
|
|
#pragma once
|
|
#include "common.hpp"
|
|
#include <atomic>
|
|
#include <vector>
|
|
#include "obs/gs/gs-effect.hpp"
|
|
#include "obs/gs/gs-rendertarget.hpp"
|
|
#include "obs/gs/gs-vertexbuffer.hpp"
|
|
#include "obs/obs-source-factory.hpp"
|
|
|
|
// Nvidia
|
|
#include "nvidia/ar/nvidia-ar.hpp"
|
|
#include "nvidia/cuda/nvidia-cuda-context.hpp"
|
|
#include "nvidia/cuda/nvidia-cuda-gs-texture.hpp"
|
|
#include "nvidia/cuda/nvidia-cuda-memory.hpp"
|
|
#include "nvidia/cuda/nvidia-cuda-stream.hpp"
|
|
#include "nvidia/cuda/nvidia-cuda.hpp"
|
|
|
|
namespace streamfx::filter::nvidia {
|
|
class face_tracking_instance : public obs::source_instance {
|
|
// Filter Cache
|
|
std::pair<std::uint32_t, std::uint32_t> _size;
|
|
bool _rt_is_fresh;
|
|
std::shared_ptr<gs::rendertarget> _rt;
|
|
|
|
std::mutex _delete_protection;
|
|
|
|
// Settings
|
|
double_t _cfg_zoom;
|
|
std::pair<double_t, double_t> _cfg_offset;
|
|
double_t _cfg_stability;
|
|
|
|
// Operational Data
|
|
std::shared_ptr<gs::vertex_buffer> _geometry;
|
|
struct {
|
|
util::math::kalman1D<double_t> center[2];
|
|
util::math::kalman1D<double_t> size[2];
|
|
} _filters;
|
|
struct {
|
|
std::mutex lock;
|
|
double_t center[2];
|
|
double_t size[2];
|
|
double_t velocity[2];
|
|
} _values;
|
|
|
|
// Nvidia CUDA interop
|
|
std::shared_ptr<::nvidia::cuda::cuda> _cuda;
|
|
std::shared_ptr<::nvidia::cuda::context> _cuda_ctx;
|
|
std::shared_ptr<::nvidia::cuda::stream> _cuda_stream;
|
|
|
|
// Nvidia AR interop
|
|
std::shared_ptr<::nvidia::ar::ar> _ar_library;
|
|
std::atomic_bool _ar_loaded;
|
|
std::shared_ptr<nvAR_Feature> _ar_feature;
|
|
std::atomic_bool _ar_is_tracking;
|
|
std::mutex _ar_lock;
|
|
std::vector<float_t> _ar_bboxes_confidence;
|
|
std::vector<NvAR_Rect> _ar_bboxes_data;
|
|
NvAR_BBoxes _ar_bboxes;
|
|
std::shared_ptr<gs::texture> _ar_texture;
|
|
bool _ar_texture_cuda_fresh;
|
|
std::shared_ptr<::nvidia::cuda::gstexture> _ar_texture_cuda;
|
|
std::shared_ptr<::nvidia::cuda::memory> _ar_texture_cuda_mem;
|
|
NvCVImage _ar_image;
|
|
NvCVImage _ar_image_bgr;
|
|
NvCVImage _ar_image_temp;
|
|
|
|
// Tasks
|
|
std::shared_ptr<::util::threadpool::task> _async_initialize;
|
|
std::shared_ptr<::util::threadpool::task> _async_track;
|
|
|
|
#ifdef ENABLE_PROFILING
|
|
// Profiling
|
|
std::shared_ptr<util::profiler> _profile_capture;
|
|
std::shared_ptr<util::profiler> _profile_capture_realloc;
|
|
std::shared_ptr<util::profiler> _profile_capture_copy;
|
|
std::shared_ptr<util::profiler> _profile_ar_realloc;
|
|
std::shared_ptr<util::profiler> _profile_ar_copy;
|
|
std::shared_ptr<util::profiler> _profile_ar_transfer;
|
|
std::shared_ptr<util::profiler> _profile_ar_run;
|
|
std::shared_ptr<util::profiler> _profile_ar_calc;
|
|
#endif
|
|
|
|
public:
|
|
face_tracking_instance(obs_data_t*, obs_source_t*);
|
|
virtual ~face_tracking_instance() override;
|
|
|
|
// Tasks
|
|
void async_initialize(std::shared_ptr<void> = nullptr);
|
|
|
|
void async_track(std::shared_ptr<void> = nullptr);
|
|
|
|
void refresh_geometry();
|
|
|
|
void refresh_region_of_interest();
|
|
|
|
virtual void load(obs_data_t* data) override;
|
|
|
|
virtual void migrate(obs_data_t* data, std::uint64_t version) override;
|
|
|
|
virtual void update(obs_data_t* data) override;
|
|
|
|
virtual void video_tick(float_t seconds) override;
|
|
|
|
virtual void video_render(gs_effect_t* effect) override;
|
|
|
|
#ifdef ENABLE_PROFILING
|
|
bool button_profile(obs_properties_t* props, obs_property_t* property);
|
|
#endif
|
|
};
|
|
|
|
class face_tracking_factory
|
|
: public obs::source_factory<filter::nvidia::face_tracking_factory, filter::nvidia::face_tracking_instance> {
|
|
std::shared_ptr<::nvidia::cuda::cuda> _cuda;
|
|
std::shared_ptr<::nvidia::cuda::context> _cuda_ctx;
|
|
std::shared_ptr<::nvidia::ar::ar> _ar;
|
|
|
|
public:
|
|
face_tracking_factory();
|
|
virtual ~face_tracking_factory() override;
|
|
|
|
virtual const char* get_name() override;
|
|
|
|
virtual void get_defaults2(obs_data_t* data) override;
|
|
|
|
virtual obs_properties_t* get_properties2(filter::nvidia::face_tracking_instance* data) override;
|
|
|
|
std::shared_ptr<::nvidia::cuda::cuda> get_cuda();
|
|
|
|
std::shared_ptr<::nvidia::cuda::context> get_cuda_context();
|
|
|
|
std::shared_ptr<::nvidia::ar::ar> get_ar();
|
|
|
|
public: // Singleton
|
|
static void initialize();
|
|
|
|
static void finalize();
|
|
|
|
static std::shared_ptr<face_tracking_factory> get();
|
|
};
|
|
} // namespace streamfx::filter::nvidia
|