diff options
author | Timo Rothenpieler <[email protected]> | 2025-08-30 00:45:22 +0200 |
---|---|---|
committer | Timo Rothenpieler <[email protected]> | 2025-09-14 11:45:11 +0000 |
commit | 36e374efb05a2ad81369980de98a0d78381ec81f (patch) | |
tree | 75f67da7ada76d2c47ac3fb87ddc019049668921 /libavfilter | |
parent | 7856f57533b14c18e888e275770a0ca26685d6e4 (diff) |
avfilter: add gfxcapture, Windows.Graphics.Capture based window/monitor capture
Diffstat (limited to 'libavfilter')
-rw-r--r-- | libavfilter/Makefile | 1 | ||||
-rw-r--r-- | libavfilter/allfilters.c | 1 | ||||
-rw-r--r-- | libavfilter/version.h | 2 | ||||
-rw-r--r-- | libavfilter/vsrc_gfxcapture.c | 102 | ||||
-rw-r--r-- | libavfilter/vsrc_gfxcapture.h | 81 | ||||
-rw-r--r-- | libavfilter/vsrc_gfxcapture_shader.h | 126 | ||||
-rw-r--r-- | libavfilter/vsrc_gfxcapture_winrt.cpp | 1551 | ||||
-rw-r--r-- | libavfilter/vsrc_gfxcapture_winrt.h | 189 |
8 files changed, 2052 insertions, 1 deletions
diff --git a/libavfilter/Makefile b/libavfilter/Makefile index bd3f6da27d..70b100aff1 100644 --- a/libavfilter/Makefile +++ b/libavfilter/Makefile @@ -609,6 +609,7 @@ OBJS-$(CONFIG_COLORSPECTRUM_FILTER) += vsrc_testsrc.o OBJS-$(CONFIG_COREIMAGESRC_FILTER) += vf_coreimage.o OBJS-$(CONFIG_DDAGRAB_FILTER) += vsrc_ddagrab.o OBJS-$(CONFIG_FREI0R_SRC_FILTER) += vf_frei0r.o +OBJS-$(CONFIG_GFXCAPTURE_FILTER) += vsrc_gfxcapture.o vsrc_gfxcapture_winrt.o OBJS-$(CONFIG_GRADIENTS_FILTER) += vsrc_gradients.o OBJS-$(CONFIG_HALDCLUTSRC_FILTER) += vsrc_testsrc.o OBJS-$(CONFIG_LIFE_FILTER) += vsrc_life.o diff --git a/libavfilter/allfilters.c b/libavfilter/allfilters.c index 3ac1502254..84f15f85c5 100644 --- a/libavfilter/allfilters.c +++ b/libavfilter/allfilters.c @@ -571,6 +571,7 @@ extern const FFFilter ff_vsrc_colorspectrum; extern const FFFilter ff_vsrc_coreimagesrc; extern const FFFilter ff_vsrc_ddagrab; extern const FFFilter ff_vsrc_frei0r_src; +extern const FFFilter ff_vsrc_gfxcapture; extern const FFFilter ff_vsrc_gradients; extern const FFFilter ff_vsrc_haldclutsrc; extern const FFFilter ff_vsrc_life; diff --git a/libavfilter/version.h b/libavfilter/version.h index ba8a6fdab2..77f38cb9b4 100644 --- a/libavfilter/version.h +++ b/libavfilter/version.h @@ -31,7 +31,7 @@ #include "version_major.h" -#define LIBAVFILTER_VERSION_MINOR 8 +#define LIBAVFILTER_VERSION_MINOR 9 #define LIBAVFILTER_VERSION_MICRO 100 diff --git a/libavfilter/vsrc_gfxcapture.c b/libavfilter/vsrc_gfxcapture.c new file mode 100644 index 0000000000..19d8a8a52c --- /dev/null +++ b/libavfilter/vsrc_gfxcapture.c @@ -0,0 +1,102 @@ +/* + * This file is part of FFmpeg. + * + * FFmpeg is free software; you can redistribute it and/or + * modify it under the terms of the GNU Lesser General Public + * License as published by the Free Software Foundation; either + * version 2.1 of the License, or (at your option) any later version. + * + * FFmpeg is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + * Lesser General Public License for more details. + * + * You should have received a copy of the GNU Lesser General Public + * License along with FFmpeg; if not, write to the Free Software + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA + */ + +#include "config.h" + +#include "libavutil/internal.h" +#include "libavutil/opt.h" +#include "avfilter.h" +#include "filters.h" + +#include "vsrc_gfxcapture.h" + +#define OFFSET(x) offsetof(GfxCaptureContext, x) +#define FLAGS AV_OPT_FLAG_VIDEO_PARAM|AV_OPT_FLAG_FILTERING_PARAM +static const AVOption gfxcapture_options[] = { + { "window_title", "ECMAScript regular expression to match against the window title. " + "Supports PCRE style (?i) prefix for case-insensitivity.", + OFFSET(window_text), AV_OPT_TYPE_STRING, { .str = NULL }, 0, INT_MAX, FLAGS }, + { "window_class", "as window_title, but against the window class", + OFFSET(window_class), AV_OPT_TYPE_STRING, { .str = NULL }, 0, INT_MAX, FLAGS }, + { "window_exe", "as window_title, but against the windows executable name", + OFFSET(window_exe), AV_OPT_TYPE_STRING, { .str = NULL }, 0, INT_MAX, FLAGS }, + { "monitor_idx", "index of the monitor to capture", OFFSET(monitor_idx), AV_OPT_TYPE_INT, { .i64 = GFX_MONITOR_IDX_DEFAULT }, GFX_MONITOR_IDX_DEFAULT, INT_MAX, FLAGS, .unit = "monitor_idx" }, + { "window", "derive from selected window", 0, AV_OPT_TYPE_CONST, { .i64 = GFX_MONITOR_IDX_WINDOW }, 0, 0, FLAGS, .unit = "monitor_idx" }, + { "capture_cursor", "capture mouse cursor", OFFSET(capture_cursor), AV_OPT_TYPE_BOOL, { .i64 = 1 }, 0, 1, FLAGS }, + { "capture_border", "capture full window border", OFFSET(capture_border), AV_OPT_TYPE_BOOL, { .i64 = 0 }, 0, 1, FLAGS }, + { "display_border", "display yellow border around captured window", + OFFSET(display_border), AV_OPT_TYPE_BOOL, { .i64 = 0 }, 0, 1, FLAGS }, + { "max_framerate", "set maximum capture frame rate", OFFSET(frame_rate), AV_OPT_TYPE_VIDEO_RATE, { .str = "60" }, 0.001, 1000, FLAGS }, + { "hwnd", "pre-existing HWND handle", OFFSET(user_hwnd), AV_OPT_TYPE_UINT64, { .i64 = 0 }, 0, UINT64_MAX, FLAGS }, + { "hmonitor", "pre-existing HMONITOR handle", OFFSET(user_hmonitor), AV_OPT_TYPE_UINT64, { .i64 = 0 }, 0, UINT64_MAX, FLAGS }, + { "width", "force width of the output frames, negative values round down the width to the nearest multiple of that number", + OFFSET(canvas_width), AV_OPT_TYPE_INT, { .i64 = 0 }, INT_MIN, INT_MAX, FLAGS }, + { "height", "force height of the output frames, negative values round down the height to the nearest multiple of that number", + OFFSET(canvas_height), AV_OPT_TYPE_INT, { .i64 = 0 }, INT_MIN, INT_MAX, FLAGS }, + { "crop_left", "number of pixels to crop from the left of the captured area", + OFFSET(crop_left), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, INT_MAX, FLAGS }, + { "crop_top", "number of pixels to crop from the top of the captured area", + OFFSET(crop_top), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, INT_MAX, FLAGS }, + { "crop_right", "number of pixels to crop from the right of the captured area", + OFFSET(crop_right), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, INT_MAX, FLAGS }, + { "crop_bottom", "number of pixels to crop from the bottom of the captured area", + OFFSET(crop_bottom), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, INT_MAX, FLAGS }, + { "premultiplied", "return premultiplied alpha frames", OFFSET(premult_alpha), AV_OPT_TYPE_BOOL, { .i64 = 0 }, 0, 1, FLAGS }, + { "resize_mode", "capture source resize behavior", OFFSET(resize_mode), AV_OPT_TYPE_INT, { .i64 = GFX_RESIZE_CROP }, 0, GFX_RESIZE_NB - 1, FLAGS, .unit = "resize_mode" }, + { "crop", "crop or add black bars into frame", 0, AV_OPT_TYPE_CONST, { .i64 = GFX_RESIZE_CROP }, 0, 0, FLAGS, .unit = "resize_mode" }, + { "scale", "scale source to fit initial size", 0, AV_OPT_TYPE_CONST, { .i64 = GFX_RESIZE_SCALE }, 0, 0, FLAGS, .unit = "resize_mode" }, + { "scale_aspect", "scale source to fit initial size while preserving aspect ratio", + 0, AV_OPT_TYPE_CONST, { .i64 = GFX_RESIZE_SCALE_ASPECT }, 0, 0, FLAGS, .unit = "resize_mode" }, + { "scale_mode", "scaling algorithm", OFFSET(scale_mode), AV_OPT_TYPE_INT, { .i64 = GFX_SCALE_BILINEAR }, 0, GFX_SCALE_NB - 1, FLAGS, .unit = "scale_mode" }, + { "point", "use point scaling", 0, AV_OPT_TYPE_CONST, { .i64 = GFX_SCALE_POINT }, 0, 0, FLAGS, .unit = "scale_mode" }, + { "bilinear", "use bilinear scaling", 0, AV_OPT_TYPE_CONST, { .i64 = GFX_SCALE_BILINEAR }, 0, 0, FLAGS, .unit = "scale_mode" }, + { "bicubic", "use bicubic scaling", 0, AV_OPT_TYPE_CONST, { .i64 = GFX_SCALE_BICUBIC }, 0, 0, FLAGS, .unit = "scale_mode" }, + { "output_fmt", "desired output format", OFFSET(out_fmt), AV_OPT_TYPE_INT, { .i64 = AV_PIX_FMT_BGRA }, 0, INT_MAX, FLAGS, .unit = "output_fmt" }, + { "8bit", "output default 8 Bit format", 0, AV_OPT_TYPE_CONST, { .i64 = AV_PIX_FMT_BGRA }, 0, 0, FLAGS, .unit = "output_fmt" }, + { "bgra", "output 8 Bit BGRA", 0, AV_OPT_TYPE_CONST, { .i64 = AV_PIX_FMT_BGRA }, 0, 0, FLAGS, .unit = "output_fmt" }, + { "10bit", "output default 10 Bit format", 0, AV_OPT_TYPE_CONST, { .i64 = AV_PIX_FMT_X2BGR10 }, 0, 0, FLAGS, .unit = "output_fmt" }, + { "x2bgr10", "output 10 Bit X2BGR10", 0, AV_OPT_TYPE_CONST, { .i64 = AV_PIX_FMT_X2BGR10 }, 0, 0, FLAGS, .unit = "output_fmt" }, + { "16bit", "output default 16 Bit format", 0, AV_OPT_TYPE_CONST, { .i64 = AV_PIX_FMT_RGBAF16 }, 0, 0, FLAGS, .unit = "output_fmt" }, + { "rgbaf16", "output 16 Bit RGBAF16", 0, AV_OPT_TYPE_CONST, { .i64 = AV_PIX_FMT_RGBAF16 }, 0, 0, FLAGS, .unit = "output_fmt" }, + { NULL } +}; + +AVFILTER_DEFINE_CLASS(gfxcapture); + +static const AVFilterPad gfxcapture_outputs[] = { + { + .name = "default", + .type = AVMEDIA_TYPE_VIDEO, + .config_props = ff_gfxcapture_config_props, + }, +}; + +const FFFilter ff_vsrc_gfxcapture = { + .p.name = "gfxcapture", + .p.description = NULL_IF_CONFIG_SMALL("Capture graphics/screen content as a video source"), + .p.priv_class = &gfxcapture_class, + .p.inputs = NULL, + .p.flags = AVFILTER_FLAG_HWDEVICE, + .priv_size = sizeof(GfxCaptureContext), + .init = ff_gfxcapture_init, + .uninit = ff_gfxcapture_uninit, + FILTER_OUTPUTS(gfxcapture_outputs), + FILTER_SINGLE_PIXFMT(AV_PIX_FMT_D3D11), + .flags_internal = FF_FILTER_FLAG_HWFRAME_AWARE, + .activate = ff_gfxcapture_activate, +}; diff --git a/libavfilter/vsrc_gfxcapture.h b/libavfilter/vsrc_gfxcapture.h new file mode 100644 index 0000000000..617f48de22 --- /dev/null +++ b/libavfilter/vsrc_gfxcapture.h @@ -0,0 +1,81 @@ +/* + * This file is part of FFmpeg. + * + * FFmpeg is free software; you can redistribute it and/or + * modify it under the terms of the GNU Lesser General Public + * License as published by the Free Software Foundation; either + * version 2.1 of the License, or (at your option) any later version. + * + * FFmpeg is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + * Lesser General Public License for more details. + * + * You should have received a copy of the GNU Lesser General Public + * License along with FFmpeg; if not, write to the Free Software + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA + */ + +#ifndef AVFILTER_VSRC_GFXCAPTURE_H +#define AVFILTER_VSRC_GFXCAPTURE_H + +typedef struct GfxCaptureContextCpp GfxCaptureContextCpp; + +enum GfxResizeMode { + GFX_RESIZE_CROP = 0, + GFX_RESIZE_SCALE, + GFX_RESIZE_SCALE_ASPECT, + GFX_RESIZE_NB +}; + +enum GfxScaleMode { + GFX_SCALE_POINT = 0, + GFX_SCALE_BILINEAR, + GFX_SCALE_BICUBIC, + GFX_SCALE_NB +}; + +enum GfxMonitorIdx { + GFX_MONITOR_IDX_WINDOW = -1, + GFX_MONITOR_IDX_DEFAULT = -2 +}; + +typedef struct GfxCaptureContext { + const AVClass *avclass; + + GfxCaptureContextCpp *ctx; + + const char *window_text; + const char *window_class; + const char *window_exe; + int monitor_idx; + + uint64_t user_hwnd; + uint64_t user_hmonitor; + + int capture_cursor; + int capture_border; + int display_border; + AVRational frame_rate; + int canvas_width, canvas_height; + int crop_left, crop_top, crop_right, crop_bottom; + int out_fmt; + int resize_mode; + int scale_mode; + int premult_alpha; +} GfxCaptureContext; + +#ifdef __cplusplus +#define NOEXCEPT noexcept +#else +#define NOEXCEPT +#endif + +av_cold int ff_gfxcapture_init(AVFilterContext *avctx) NOEXCEPT; +av_cold void ff_gfxcapture_uninit(AVFilterContext *avctx) NOEXCEPT; +int ff_gfxcapture_activate(AVFilterContext *avctx) NOEXCEPT; +int ff_gfxcapture_config_props(AVFilterLink *outlink) NOEXCEPT; + +#undef NOEXCEPT + +#endif /* AVFILTER_VSRC_GFXCAPTURE_H */ diff --git a/libavfilter/vsrc_gfxcapture_shader.h b/libavfilter/vsrc_gfxcapture_shader.h new file mode 100644 index 0000000000..3fe9d5ec0d --- /dev/null +++ b/libavfilter/vsrc_gfxcapture_shader.h @@ -0,0 +1,126 @@ +/* + * This file is part of FFmpeg. + * + * FFmpeg is free software; you can redistribute it and/or + * modify it under the terms of the GNU Lesser General Public + * License as published by the Free Software Foundation; either + * version 2.1 of the License, or (at your option) any later version. + * + * FFmpeg is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + * Lesser General Public License for more details. + * + * You should have received a copy of the GNU Lesser General Public + * License along with FFmpeg; if not, write to the Free Software + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA + */ + +#ifndef AVFILTER_VSRC_GFXCAPTURE_SHADER_H +#define AVFILTER_VSRC_GFXCAPTURE_SHADER_H + +#define HLSL_SHADER(shader) #shader + +static const char render_shader_src[] = HLSL_SHADER( + struct VSOut { + float4 pos : SV_Position; + float2 uv : TEXCOORD0; + }; + + cbuffer cb : register(b0) { + float2 tS; + float2 dS; + float2 uvMin; + float2 uvMax; + uint to_unpremult; + uint to_srgb; + uint2 pad; + }; + + Texture2D t0 : register(t0); + SamplerState s0 : register(s0); + + VSOut main_vs(uint id : SV_VertexID) { + VSOut o; + o.pos = float4(id == 2 ? 3.0 : -1.0, id == 1 ? 3.0 : -1.0, 0, 1); + o.uv = lerp(uvMin, uvMax, float2((o.pos.x + 1) * 0.5, 1 - (o.pos.y + 1) * 0.5)); + return o; + } + + float4 cubic(float v) { + float4 n = float4(1.0, 2.0, 3.0, 4.0) - v; + float4 s = n * n * n; + float x = s.x; + float y = s.y - 4.0 * s.x; + float z = s.z - 4.0 * s.y + 6.0 * s.x; + float w = 6.0 - x - y - z; + return float4(x, y, z, w) * (1.0 / 6.0); + } + + float4 texBicubic(Texture2D t, SamplerState ss, float2 uv) { + float2 itS = 1.0 / tS; + + float2 tc = uv * tS - 0.5; + float2 fxy = frac(tc); + tc -= fxy; + + float4 xc = cubic(fxy.x); + float4 yc = cubic(fxy.y); + + float4 s = float4(xc.xz + xc.yw, yc.xz + yc.yw); + float4 o = tc.xxyy + (float2(-0.5, 1.5)).xyxy + float4(xc.yw, yc.yw) / s; + o *= itS.xxyy; + + float4 s0 = t.Sample(ss, o.xz); + float4 s1 = t.Sample(ss, o.yz); + float4 s2 = t.Sample(ss, o.xw); + float4 s3 = t.Sample(ss, o.yw); + + float sx = s.x / (s.x + s.y); + float sy = s.z / (s.z + s.w); + + return lerp(lerp(s3, s2, sx), lerp(s1, s0, sx), sy); + } + + float4 unpremultiply(float4 c) { + if (c.a < 1e-6) + return float4(0.0, 0.0, 0.0, 0.0); + return float4(c.rgb / c.a, c.a); + } + + float4 premultiply(float4 c) { + return float4(c.rgb * c.a, c.a); + } + + float3 linear_to_srgb(float3 c) { + c = max(c, 0.0); + float3 lo = 12.92 * c; + float3 hi = 1.055 * pow(c, 1.0 / 2.4) - 0.055; + return saturate(lerp(hi, lo, step(c, 0.0031308))); + } + + float4 fix_color(float4 c) { + if (to_unpremult || to_srgb) + c = unpremultiply(c); + if (to_srgb) { + c.rgb = linear_to_srgb(c.rgb); + if (!to_unpremult) + c = premultiply(c); + } + return c; + } + + float4 main_ps(VSOut i) : SV_Target { + return fix_color(t0.Sample(s0, i.uv)); + } + + float4 main_ps_bicubic(VSOut i) : SV_Target { + if (all(tS == dS)) + return main_ps(i); + return fix_color(texBicubic(t0, s0, i.uv)); + } +); + +#undef HLSL_SHADER + +#endif /* AVFILTER_VSRC_GFXCAPTURE_SHADER_H */ diff --git a/libavfilter/vsrc_gfxcapture_winrt.cpp b/libavfilter/vsrc_gfxcapture_winrt.cpp new file mode 100644 index 0000000000..42977efcc5 --- /dev/null +++ b/libavfilter/vsrc_gfxcapture_winrt.cpp @@ -0,0 +1,1551 @@ +/* + * This file is part of FFmpeg. + * + * FFmpeg is free software; you can redistribute it and/or + * modify it under the terms of the GNU Lesser General Public + * License as published by the Free Software Foundation; either + * version 2.1 of the License, or (at your option) any later version. + * + * FFmpeg is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + * Lesser General Public License for more details. + * + * You should have received a copy of the GNU Lesser General Public + * License along with FFmpeg; if not, write to the Free Software + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA + */ + +extern "C" { +#include "config.h" +} + +#if !defined(_WIN32_WINNT) || _WIN32_WINNT < 0x0A00 +#undef _WIN32_WINNT +#define _WIN32_WINNT 0x0A00 +#endif + +#define WINDOWS_FOUNDATION_UNIVERSALAPICONTRACT_VERSION 0x130000 + +// work around bug in mingw double-defining IReference<unsigned char> (BYTE == boolean) +#define ____FIReference_1_boolean_INTERFACE_DEFINED__ + +#include <windows.h> +#include <initguid.h> +#include <wrl.h> +#include <roapi.h> +#include <dwmapi.h> +#include <d3d11.h> +#include <d3dcompiler.h> +#include <dispatcherqueue.h> +#include <windows.foundation.h> +#include <windows.graphics.capture.h> +#include <windows.graphics.capture.interop.h> +#include <windows.graphics.directx.direct3d11.h> +#if HAVE_IDIRECT3DDXGIINTERFACEACCESS +#include <windows.graphics.directx.direct3d11.interop.h> +#endif + +extern "C" { +#include "libavutil/avassert.h" +#include "libavutil/internal.h" +#include "libavutil/mem.h" +#include "libavutil/opt.h" +#include "libavutil/time.h" +#include "libavutil/thread.h" +#include "libavutil/pixdesc.h" +#include "libavutil/hwcontext.h" +#include "libavutil/hwcontext_d3d11va.h" +#include "avfilter.h" +#include "filters.h" +#include "video.h" + +#include "vsrc_gfxcapture.h" +} + +#include <atomic> +#include <cinttypes> +#include <condition_variable> +#include <functional> +#include <memory> +#include <mutex> +#include <regex> +#include <string> +#include <type_traits> + +#include "vsrc_gfxcapture_winrt.h" +#include "vsrc_gfxcapture_shader.h" + +using namespace ABI::Windows::System; +using namespace ABI::Windows::Foundation; +using namespace ABI::Windows::Graphics::Capture; +using namespace ABI::Windows::Graphics::DirectX::Direct3D11; +using namespace Windows::Graphics::DirectX::Direct3D11; +using Microsoft::WRL::ComPtr; +using ABI::Windows::Graphics::SizeInt32; +using ABI::Windows::Foundation::TimeSpan; +using ABI::Windows::Graphics::DirectX::DirectXPixelFormat; + +#define TIMESPAN_RES 10000000 +#define TIMESPAN_RES64 INT64_C(10000000) + +#define CAPTURE_POOL_SIZE 2 + +enum { + WM_WGC_THREAD_SHUTDOWN = WM_APP + 1 +}; + +#define CCTX(ctx) static_cast<GfxCaptureContext*>(ctx) + +typedef struct GfxCaptureFunctions { + hmodule_ptr_t graphicscapture_handle; + + hmodule_ptr_t combase_handle; + HRESULT (WINAPI *RoInitialize)(RO_INIT_TYPE initType); + void (WINAPI *RoUninitialize)(void); + HRESULT (WINAPI *RoGetActivationFactory)(HSTRING activatableClassId, REFIID iid, void **factory); + HRESULT (WINAPI *WindowsCreateStringReference)(PCWSTR sourceString, UINT32 length, HSTRING_HEADER *hstringHeader, HSTRING *string); + + hmodule_ptr_t dwmapi_handle; + HRESULT (WINAPI *DwmGetWindowAttribute)(HWND hwnd, DWORD dwAttribute, PVOID pvAttribute, DWORD cbAttribute); + + hmodule_ptr_t d3d11_handle; + HRESULT (WINAPI *CreateDirect3D11DeviceFromDXGIDevice)(IDXGIDevice *dxgiDevice, IInspectable **graphicsDevice); + + hmodule_ptr_t coremsg_handle; + HRESULT (WINAPI *CreateDispatcherQueueController)(DispatcherQueueOptions options, PDISPATCHERQUEUECONTROLLER *dispatcherQueueController); + + hmodule_ptr_t user32_handle; + DPI_AWARENESS_CONTEXT (WINAPI *SetThreadDpiAwarenessContext)(DPI_AWARENESS_CONTEXT dpiContext); + + hmodule_ptr_t d3dcompiler_handle; + HRESULT (WINAPI *D3DCompile)(LPCVOID pSrcData, SIZE_T SrcDataSize, LPCSTR pSourceName, const D3D10_SHADER_MACRO *pDefines, ID3DInclude *pInclude, + LPCSTR pEntrypoint, LPCSTR pTarget, UINT Flags1, UINT Flags2, ID3DBlob **ppCode, ID3DBlob **ppErrorMsgs); +} GfxCaptureFunctions; + +// This struct contains all data handled by the capture thread +struct GfxCaptureContextWgc { + ComPtr<IDispatcherQueueController> dispatcher_queue_controller; + ComPtr<IDispatcherQueue> dispatcher_queue; + + ComPtr<IGraphicsCaptureItem> capture_item; + ComPtr<IDirect3DDevice> d3d_device; + ComPtr<IDirect3D11CaptureFramePool> frame_pool; + ComPtr<IGraphicsCaptureSession> capture_session; + + EventRegistrationToken frame_arrived_token { 0 }; + EventRegistrationToken closed_token { 0 }; + + std::mutex frame_arrived_mutex; + std::condition_variable frame_arrived_cond; + std::atomic<bool> window_closed { false }; + std::atomic<uint64_t> frame_seq { 0 }; + + SizeInt32 cap_size { 0, 0 }; + RECT client_area_offsets { 0, 0, 0, 0 }; +}; + +struct GfxCaptureContextD3D { + ComPtr<ID3D11VertexShader> vertex_shader; + ComPtr<ID3D11PixelShader> pixel_shader; + ComPtr<ID3D11SamplerState> sampler_state; + ComPtr<ID3D11Buffer> shader_cb; + ComPtr<ID3D11DeviceContext> deferred_ctx; +}; + +struct GfxCaptureContextCpp { + GfxCaptureFunctions fn; + std::unique_ptr<GfxCaptureContextWgc> wgc; + std::unique_ptr<GfxCaptureContextD3D> d3d; + + pthread_t wgc_thread; + bool wgc_thread_created { false }; + DWORD wgc_thread_id { 0 }; + std::mutex wgc_thread_init_mutex; + std::condition_variable wgc_thread_init_cond; + volatile int wgc_thread_init_res { INT_MAX }; + std::recursive_mutex wgc_thread_uninit_mutex; + + HWND capture_hwnd { nullptr }; + HMONITOR capture_hmonitor { nullptr }; + + AVBufferRef *device_ref { nullptr }; + AVHWDeviceContext *device_ctx { nullptr }; + AVD3D11VADeviceContext *device_hwctx { nullptr }; + + AVBufferRef *frames_ref { nullptr }; + AVHWFramesContext *frames_ctx { nullptr }; + AVD3D11VAFramesContext *frames_hwctx { nullptr }; + + int64_t first_pts { 0 }; + int64_t last_pts { 0 }; +}; + +template <typename T> +static HRESULT get_activation_factory(GfxCaptureContextCpp *ctx, PCWSTR clsid, T** factory) { + HSTRING_HEADER hsheader = { 0 }; + HSTRING hs = NULL; + + HRESULT hr = ctx->fn.WindowsCreateStringReference(clsid, (UINT32)wcslen(clsid), &hsheader, &hs); + if (FAILED(hr)) + return hr; + + return ctx->fn.RoGetActivationFactory(hs, IID_PPV_ARGS(factory)); +} + +#define CHECK_HR(fcall, action) \ + do { \ + HRESULT fhr = fcall; \ + if (FAILED(fhr)) { \ + av_log(avctx, AV_LOG_ERROR, #fcall " failed: 0x%08lX\n", fhr); \ + action; \ + } \ + } while (0) +#define CHECK_HR_RET(...) CHECK_HR((__VA_ARGS__), return AVERROR_EXTERNAL) +#define CHECK_HR_FAIL(...) CHECK_HR((__VA_ARGS__), ret = AVERROR_EXTERNAL; goto fail) +#define CHECK_HR_LOG(...) CHECK_HR((__VA_ARGS__), (void)0) + +/**************************************************** + * Windows Graphics Capture Worker Thread * + * All wgc_* functions must run only on WGC thread! * + ****************************************************/ + +static void wgc_frame_arrived_handler(const std::unique_ptr<GfxCaptureContextWgc> &wgctx) { + wgctx->frame_seq.fetch_add(1, std::memory_order_release); + wgctx->frame_arrived_cond.notify_one(); +} + +static void wgc_closed_handler(const std::unique_ptr<GfxCaptureContextWgc> &wgctx) { + wgctx->window_closed.store(true, std::memory_order_release); + wgctx->frame_arrived_cond.notify_one(); +} + +static void wgc_stop_capture_session(AVFilterContext *avctx) noexcept +{ + GfxCaptureContext *cctx = CCTX(avctx->priv); + GfxCaptureContextCpp *ctx = cctx->ctx; + std::unique_ptr<GfxCaptureContextWgc> &wgctx = ctx->wgc; + + if (wgctx->closed_token.value && wgctx->capture_item) { + CHECK_HR_LOG(wgctx->capture_item->remove_Closed(wgctx->closed_token)); + wgctx->closed_token.value = 0; + } + + if (wgctx->frame_arrived_token.value && wgctx->frame_pool) { + CHECK_HR_LOG(wgctx->frame_pool->remove_FrameArrived(wgctx->frame_arrived_token)); + wgctx->frame_arrived_token.value = 0; + } + + if (wgctx->capture_session) { + ComPtr<IClosable> closable; + if (SUCCEEDED(wgctx->capture_session.As(&closable))) { + closable->Close(); + } else { + av_log(avctx, AV_LOG_ERROR, "Failed to get capture session IClosable interface\n"); + } + } + + if (wgctx->frame_pool) { + ComPtr<IClosable> closable; + if (SUCCEEDED(wgctx->frame_pool.As(&closable))) { + CHECK_HR_LOG(closable->Close()); + } else { + av_log(avctx, AV_LOG_ERROR, "Failed to get frame pool IClosable interface\n"); + } + } +} + +static int wgc_calculate_client_area(AVFilterContext *avctx) +{ + GfxCaptureContext *cctx = CCTX(avctx->priv); + GfxCaptureContextCpp *ctx = cctx->ctx; + std::unique_ptr<GfxCaptureContextWgc> &wgctx = ctx->wgc; + + if (!ctx->capture_hwnd) { + wgctx->client_area_offsets.left = 0; + wgctx->client_area_offsets.top = 0; + wgctx->client_area_offsets.right = 0; + wgctx->client_area_offsets.bottom = 0; + return 0; + } + + RECT client_rect = {}; + RECT frame_bounds = {}; + RECT window_rect = {}; + + if (IsIconic(ctx->capture_hwnd)) { + av_log(avctx, AV_LOG_VERBOSE, "Capture window is iconic, no client area\n"); + return 0; + } + + if (!GetClientRect(ctx->capture_hwnd, &client_rect)) { + av_log(avctx, AV_LOG_ERROR, "GetClientRect failed\n"); + return AVERROR_EXTERNAL; + } + + if (!MapWindowPoints(ctx->capture_hwnd, nullptr, (POINT*)&client_rect, 2)) { + av_log(avctx, AV_LOG_ERROR, "MapWindowPoints failed\n"); + return AVERROR_EXTERNAL; + } + + if (FAILED(ctx->fn.DwmGetWindowAttribute(ctx->capture_hwnd, DWMWA_EXTENDED_FRAME_BOUNDS, &frame_bounds, sizeof(window_rect)))) + av_log(avctx, AV_LOG_DEBUG, "DwmGetWindowAttribute failed\n"); + + if (!GetWindowRect(ctx->capture_hwnd, &window_rect)) + av_log(avctx, AV_LOG_DEBUG, "GetWindowRect failed\n"); + + if (wgctx->cap_size.Width == frame_bounds.right - frame_bounds.left || + wgctx->cap_size.Height == frame_bounds.bottom - frame_bounds.top) { + av_log(avctx, AV_LOG_DEBUG, "Using window rect from DWMWA_EXTENDED_FRAME_BOUNDS\n"); + } else if (wgctx->cap_size.Width == window_rect.right - window_rect.left || + wgctx->cap_size.Height == window_rect.bottom - window_rect.top) { + av_log(avctx, AV_LOG_DEBUG, "Using window rect from GetWindowRect\n"); + frame_bounds = window_rect; + } else { + if ((frame_bounds.top == frame_bounds.bottom || frame_bounds.left == frame_bounds.right) && + (window_rect.top == window_rect.bottom || window_rect.left == window_rect.right)) + { + av_log(avctx, AV_LOG_ERROR, "No valid window rect found\n"); + return AVERROR_EXTERNAL; + } + av_log(avctx, AV_LOG_VERBOSE, "Failed to get valid window rect, client area may be inaccurate\n"); + return 0; + } + + wgctx->client_area_offsets.left = FFMAX(client_rect.left - frame_bounds.left, 0); + wgctx->client_area_offsets.top = FFMAX(client_rect.top - frame_bounds.top, 0); + wgctx->client_area_offsets.right = FFMAX(frame_bounds.right - client_rect.right, 0); + wgctx->client_area_offsets.bottom = FFMAX(frame_bounds.bottom - client_rect.bottom, 0); + + av_log(avctx, AV_LOG_DEBUG, "Client area offsets: left=%ld top=%ld right=%ld bottom=%ld\n", + wgctx->client_area_offsets.left, wgctx->client_area_offsets.top, + wgctx->client_area_offsets.right, wgctx->client_area_offsets.bottom); + + return 0; +} + +static int wgc_setup_gfxcapture_session(AVFilterContext *avctx) +{ + GfxCaptureContext *cctx = CCTX(avctx->priv); + GfxCaptureContextCpp *ctx = cctx->ctx; + std::unique_ptr<GfxCaptureContextWgc> &wgctx = ctx->wgc; + int ret; + + ComPtr<IDirect3D11CaptureFramePoolStatics> frame_pool_statics; + ComPtr<ID3D11Device> d3d11_device = ctx->device_hwctx->device; + ComPtr<ID3D10Multithread> d3d10_multithread; + ComPtr<IDXGIDevice> dxgi_device; + ComPtr<IGraphicsCaptureSession2> session2; + ComPtr<IGraphicsCaptureSession3> session3; + ComPtr<IGraphicsCaptureSession5> session5; + + DirectXPixelFormat fmt = DirectXPixelFormat::DirectXPixelFormat_B8G8R8A8UIntNormalized; + if (cctx->out_fmt != AV_PIX_FMT_BGRA) + fmt = DirectXPixelFormat::DirectXPixelFormat_R16G16B16A16Float; + + CHECK_HR_RET(wgctx->capture_item->get_Size(&wgctx->cap_size)); + ret = wgc_calculate_client_area(avctx); + if (ret < 0) + return ret; + + CHECK_HR_RET(d3d11_device.As(&d3d10_multithread)); + d3d10_multithread->SetMultithreadProtected(TRUE); + + CHECK_HR_RET(d3d11_device.As(&dxgi_device)); + CHECK_HR_RET(ctx->fn.CreateDirect3D11DeviceFromDXGIDevice(dxgi_device.Get(), &wgctx->d3d_device)); + + CHECK_HR_RET(get_activation_factory<IDirect3D11CaptureFramePoolStatics>(ctx, RuntimeClass_Windows_Graphics_Capture_Direct3D11CaptureFramePool, &frame_pool_statics)); + CHECK_HR_RET(frame_pool_statics->Create(wgctx->d3d_device.Get(), fmt, CAPTURE_POOL_SIZE, wgctx->cap_size, &wgctx->frame_pool)); + CHECK_HR_RET(wgctx->frame_pool->CreateCaptureSession(wgctx->capture_item.Get(), &wgctx->capture_session)); + + if (SUCCEEDED(wgctx->capture_session.As(&session2))) { + if (FAILED(session2->put_IsCursorCaptureEnabled(cctx->capture_cursor))) { + av_log(avctx, AV_LOG_WARNING, "Failed setting cursor capture mode\n"); + } + } else { + av_log(avctx, AV_LOG_WARNING, "Cursor capture unavailable\n"); + } + + if (SUCCEEDED(wgctx->capture_session.As(&session3))) { + // this one is weird, it can return failure but still work + if (FAILED(session3->put_IsBorderRequired(cctx->display_border))) { + av_log(avctx, AV_LOG_WARNING, "Failed setting border drawing mode\n"); + } + } else { + av_log(avctx, AV_LOG_WARNING, "Disabling border drawing unavailable\n"); + } + + if (SUCCEEDED(wgctx->capture_session.As(&session5))) { + TimeSpan ivl = { av_rescale_q(1, av_inv_q(cctx->frame_rate), AVRational{1, TIMESPAN_RES}) }; + if (FAILED(session5->put_MinUpdateInterval(ivl))) { + av_log(avctx, AV_LOG_WARNING, "Failed setting minimum update interval, framerate may be limited\n"); + } + } else { + av_log(avctx, AV_LOG_WARNING, "Setting minimum update interval unavailable, framerate may be limited\n"); + } + + wgctx->window_closed = 0; + + CHECK_HR_RET(wgctx->capture_item->add_Closed( + create_cb_handler<ITypedEventHandler<GraphicsCaptureItem*,IInspectable*>, IGraphicsCaptureItem*, IInspectable*>( + [avctx, ctx](auto, auto) { + av_log(avctx, AV_LOG_INFO, "Capture item closed\n"); + wgc_closed_handler(ctx->wgc); + return S_OK; + }).Get(), &wgctx->closed_token)); + + CHECK_HR_RET(wgctx->frame_pool->add_FrameArrived( + create_cb_handler<ITypedEventHandler<Direct3D11CaptureFramePool*,IInspectable*>, IDirect3D11CaptureFramePool*, IInspectable*>( + [avctx, ctx](auto, auto) { + av_log(avctx, AV_LOG_TRACE, "Frame arrived\n"); + wgc_frame_arrived_handler(ctx->wgc); + return S_OK; + }).Get(), &wgctx->frame_arrived_token)); + + return 0; +} + +static int wgc_setup_gfxcapture_capture(AVFilterContext *avctx) +{ + GfxCaptureContext *cctx = CCTX(avctx->priv); + GfxCaptureContextCpp *ctx = cctx->ctx; + std::unique_ptr<GfxCaptureContextWgc> &wgctx = ctx->wgc; + HRESULT hr; + int ret; + + ComPtr<IGraphicsCaptureItemInterop> capture_item_interop; + CHECK_HR_RET(get_activation_factory<IGraphicsCaptureItemInterop>(ctx, RuntimeClass_Windows_Graphics_Capture_GraphicsCaptureItem, &capture_item_interop)); + + if (ctx->capture_hmonitor) { + hr = capture_item_interop->CreateForMonitor(ctx->capture_hmonitor, IID_PPV_ARGS(&wgctx->capture_item)); + if (FAILED(hr)) { + av_log(avctx, AV_LOG_ERROR, "Failed to setup graphics capture for monitor (0x%08lX)\n", hr); + return AVERROR_EXTERNAL; + } + } else if (ctx->capture_hwnd) { + hr = capture_item_interop->CreateForWindow(ctx->capture_hwnd, IID_PPV_ARGS(&wgctx->capture_item)); + if (FAILED(hr)) { + av_log(avctx, AV_LOG_ERROR, "Failed to setup graphics capture for window (0x%08lX)\n", hr); + return AVERROR_EXTERNAL; + } + } + + ret = wgc_setup_gfxcapture_session(avctx); + if (ret < 0) { + av_log(avctx, AV_LOG_ERROR, "Failed to setup graphics capture pool\n"); + return ret; + } + + hr = ctx->wgc->capture_session->StartCapture(); + if (FAILED(hr)) { + av_log(avctx, AV_LOG_ERROR, "Failed to start graphics capture session (0x%08lX)\n", hr); + return AVERROR_EXTERNAL; + } + + return 0; +} + +static int wgc_try_get_next_frame(AVFilterContext *avctx, ComPtr<IDirect3D11CaptureFrame> *capture_frame) +{ + GfxCaptureContext *cctx = CCTX(avctx->priv); + GfxCaptureContextCpp *ctx = cctx->ctx; + std::unique_ptr<GfxCaptureContextWgc> &wgctx = ctx->wgc; + + ComPtr<IDirect3DSurface> capture_surface; + ComPtr<IDirect3DDxgiInterfaceAccess> dxgi_interface_access; + ComPtr<ID3D11Texture2D> frame_texture; + SizeInt32 frame_size = { 0, 0 }; + + CHECK_HR_RET(wgctx->frame_pool->TryGetNextFrame(capture_frame->ReleaseAndGetAddressOf())); + if (!capture_frame->Get()) + return AVERROR(EAGAIN); + + CHECK_HR_RET(capture_frame->Get()->get_ContentSize(&frame_size)); + if (frame_size.Width != wgctx->cap_size.Width || frame_size.Height != wgctx->cap_size.Height) { + av_log(avctx, AV_LOG_VERBOSE, "Capture size changed to %dx%d\n", frame_size.Width, frame_size.Height); + + DirectXPixelFormat fmt = DirectXPixelFormat::DirectXPixelFormat_B8G8R8A8UIntNormalized; + if (cctx->out_fmt != AV_PIX_FMT_BGRA) + fmt = DirectXPixelFormat::DirectXPixelFormat_R16G16B16A16Float; + + CHECK_HR_RET(wgctx->frame_pool->Recreate(wgctx->d3d_device.Get(), fmt, CAPTURE_POOL_SIZE, frame_size)); + wgctx->cap_size = frame_size; + + int ret = wgc_calculate_client_area(avctx); + if (ret < 0) + return ret; + } + + return 0; +} + +static int wgc_setup_winrt(AVFilterContext *avctx) +{ + GfxCaptureContext *cctx = CCTX(avctx->priv); + GfxCaptureContextCpp *ctx = cctx->ctx; + std::unique_ptr<GfxCaptureContextWgc> &wgctx = ctx->wgc; + MSG msg; + + // pre-create the message-queue + PeekMessage(&msg, nullptr, 0, 0, PM_NOREMOVE); + + DispatcherQueueOptions options = { 0 }; + options.dwSize = sizeof(DispatcherQueueOptions); + options.threadType = DISPATCHERQUEUE_THREAD_TYPE::DQTYPE_THREAD_CURRENT; + options.apartmentType = DISPATCHERQUEUE_THREAD_APARTMENTTYPE::DQTAT_COM_NONE; + + CHECK_HR_RET(ctx->fn.CreateDispatcherQueueController(options, &wgctx->dispatcher_queue_controller)); + CHECK_HR_RET(wgctx->dispatcher_queue_controller->get_DispatcherQueue(&wgctx->dispatcher_queue)); + + return 0; +} + +static void wgc_thread_uninit(AVFilterContext *avctx) noexcept +{ + GfxCaptureContext *cctx = CCTX(avctx->priv); + GfxCaptureContextCpp *ctx = cctx->ctx; + + wgc_stop_capture_session(avctx); + + ctx->wgc.reset(); + ctx->fn.RoUninitialize(); +} + +static int wgc_thread_init(AVFilterContext *avctx) +{ + GfxCaptureContext *cctx = CCTX(avctx->priv); + GfxCaptureContextCpp *ctx = cctx->ctx; + HRESULT hr; + int ret; + + ctx->wgc = std::make_unique<GfxCaptureContextWgc>(); + + ctx->fn.SetThreadDpiAwarenessContext(DPI_AWARENESS_CONTEXT_PER_MONITOR_AWARE_V2); + + hr = ctx->fn.RoInitialize(RO_INIT_MULTITHREADED); + if (FAILED(hr)) { + av_log(avctx, AV_LOG_ERROR, "Failed to initialize WinRT\n"); + ctx->wgc.reset(); + return AVERROR_EXTERNAL; + } + + ret = wgc_setup_winrt(avctx); + if (ret < 0) { + av_log(avctx, AV_LOG_ERROR, "Failed to setup WinRT\n"); + goto fail; + } + + ret = wgc_setup_gfxcapture_capture(avctx); + if (ret < 0) { + av_log(avctx, AV_LOG_ERROR, "Failed to setup graphics capture\n"); + goto fail; + } + + return 0; + +fail: + wgc_thread_uninit(avctx); + return ret; +} + +static int wgc_thread_worker(AVFilterContext *avctx) +{ + GfxCaptureContext *cctx = CCTX(avctx->priv); + GfxCaptureContextCpp *ctx = cctx->ctx; + std::unique_ptr<GfxCaptureContextWgc> &wgctx = ctx->wgc; + ComPtr<IAsyncAction> async; + MSG msg; + + av_log(avctx, AV_LOG_DEBUG, "Starting message loop\n"); + + while (BOOL res = GetMessage(&msg, NULL, 0, 0)) { + if (res == -1) { + av_log(avctx, AV_LOG_ERROR, "Failed to get message\n"); + return AVERROR(EIO); + } + + if (!msg.hwnd && msg.message == WM_WGC_THREAD_SHUTDOWN) { + av_log(avctx, AV_LOG_DEBUG, "Initializing WGC thread shutdown\n"); + if (FAILED(wgctx->dispatcher_queue_controller->ShutdownQueueAsync(&async))) { + av_log(avctx, AV_LOG_ERROR, "Failed to shutdown dispatcher queue\n"); + return AVERROR_EXTERNAL; + } + async->put_Completed(create_cb_handler<IAsyncActionCompletedHandler, IAsyncAction*, AsyncStatus>( + [avctx, ctx](auto, auto status) { + PostThreadMessage(ctx->wgc_thread_id, WM_QUIT, 0, 0); + av_log(avctx, AV_LOG_DEBUG, "WGC thread async shutdown completed: %d\n", (int)status); + return S_OK; + }).Get()); + continue; + } + + av_log(avctx, AV_LOG_TRACE, "Got message: %u\n", msg.message); + + TranslateMessage(&msg); + DispatchMessage(&msg); + } + + if (!async) { + av_log(avctx, AV_LOG_ERROR, "WGC Thread message loop ended without proper shutdown\n"); + return AVERROR_EXTERNAL; + } + + av_log(avctx, AV_LOG_DEBUG, "Message loop ended\n"); + + return msg.wParam; +} + +static void *wgc_thread_entry(void *arg) noexcept +{ + AVFilterContext *avctx = static_cast<AVFilterContext*>(arg); + GfxCaptureContext *cctx = CCTX(avctx->priv); + GfxCaptureContextCpp *ctx = cctx->ctx; + + { + static const char name_prefix[] = "wgc_winrt@0x"; + char thread_name[sizeof(name_prefix) + sizeof(void*) * 2]; + snprintf(thread_name, sizeof(thread_name), "%s%" PRIxPTR, name_prefix, (uintptr_t)avctx); + ff_thread_setname(thread_name); + + std::lock_guard init_lock(ctx->wgc_thread_init_mutex); + ctx->wgc_thread_id = GetCurrentThreadId(); + + try { + ctx->wgc_thread_init_res = wgc_thread_init(avctx); + } catch (const std::bad_alloc &) { + ctx->wgc_thread_init_res = AVERROR(ENOMEM); + } catch (const std::exception &e) { + av_log(avctx, AV_LOG_ERROR, "unhandled exception in WGC thread init: %s\n", e.what()); + ctx->wgc_thread_init_res = AVERROR_BUG; + } catch (...) { + av_log(avctx, AV_LOG_ERROR, "Unhandled exception in WGC thread init\n"); + ctx->wgc_thread_init_res = AVERROR_BUG; + } + + ctx->wgc_thread_init_cond.notify_all(); + if (ctx->wgc_thread_init_res < 0) + return (void*)(intptr_t)AVERROR(ENOSYS); + } + + int ret; + + try { + ret = wgc_thread_worker(avctx); + } catch (const std::bad_alloc &) { + ret = AVERROR(ENOMEM); + } catch (const std::exception &e) { + av_log(avctx, AV_LOG_ERROR, "unhandled exception in WGC thread worker: %s\n", e.what()); + ret = AVERROR_BUG; + } catch (...) { + av_log(avctx, AV_LOG_ERROR, "Unhandled exception in WGC thread worker\n"); + ret = AVERROR_BUG; + } + + std::lock_guard uninit_lock(ctx->wgc_thread_uninit_mutex); + wgc_thread_uninit(avctx); + + return (void*)(intptr_t)ret; +} + +/*********************************** + * WGC Thread Management Functions * + ***********************************/ + +static int stop_wgc_thread(AVFilterContext *avctx) +{ + GfxCaptureContext *cctx = CCTX(avctx->priv); + GfxCaptureContextCpp *ctx = cctx->ctx; + int ret = 0; + + if (ctx->wgc_thread_created) { + if (ctx->wgc_thread_id && !PostThreadMessage(ctx->wgc_thread_id, WM_WGC_THREAD_SHUTDOWN, 0, 0)) + av_log(avctx, AV_LOG_ERROR, "Failed to post shutdown message to WGC thread\n"); + + void *wgc_res = nullptr; + pthread_join(ctx->wgc_thread, &wgc_res); + ret = (int)(intptr_t)wgc_res; + + ctx->wgc_thread_id = 0; + ctx->wgc_thread_created = false; + } + + return ret; +} + +static int start_wgc_thread(AVFilterContext *avctx) +{ + GfxCaptureContext *cctx = CCTX(avctx->priv); + GfxCaptureContextCpp *ctx = cctx->ctx; + + if (ctx->wgc_thread_created || ctx->wgc_thread_id) { + av_log(avctx, AV_LOG_ERROR, "Double-creation of WGC thread\n"); + return AVERROR_BUG; + } + + std::unique_lock wgc_lock(ctx->wgc_thread_init_mutex); + ctx->wgc_thread_init_res = INT_MAX; + + int ret = pthread_create(&ctx->wgc_thread, nullptr, wgc_thread_entry, avctx); + if (ret < 0) { + av_log(avctx, AV_LOG_ERROR, "Failed to create WGC thread\n"); + return ret; + } + + ctx->wgc_thread_created = true; + + if (!ctx->wgc_thread_init_cond.wait_for(wgc_lock, std::chrono::seconds(1), [&]() { + return ctx->wgc_thread_init_res != INT_MAX; + })) { + av_log(avctx, AV_LOG_ERROR, "WGC thread init timed out\n"); + return AVERROR(ETIMEDOUT); + } + + return ctx->wgc_thread_init_res; +} + +template <typename F> +static int run_on_wgc_thread(AVFilterContext *avctx, F &&cb) +{ + GfxCaptureContext *cctx = CCTX(avctx->priv); + GfxCaptureContextCpp *ctx = cctx->ctx; + std::unique_ptr<GfxCaptureContextWgc> &wgctx = ctx->wgc; + + std::lock_guard uninit_lock(ctx->wgc_thread_uninit_mutex); + if (!wgctx) { + av_log(avctx, AV_LOG_ERROR, "WGC thread not initialized\n"); + return AVERROR(ENOSYS); + } + + struct CBData { + std::mutex mutex; + std::condition_variable cond; + std::atomic<bool> done { false }; + std::atomic<bool> cancel { false }; + int ret = AVERROR_BUG; + }; + auto cbdata = std::make_shared<CBData>(); + + std::unique_lock cblock(cbdata->mutex); + + boolean res = 0; + CHECK_HR_RET(wgctx->dispatcher_queue->TryEnqueue( + create_cb_handler<IDispatcherQueueHandler>( + [cb = std::forward<F>(cb), cbdata]() { + { + std::lock_guard lock(cbdata->mutex); + if (cbdata->cancel.load(std::memory_order_acquire)) + return S_OK; + + try { + cbdata->ret = cb(); + } catch (const std::bad_alloc &) { + cbdata->ret = AVERROR(ENOMEM); + } catch (...) { + cbdata->ret = AVERROR_BUG; + } + + cbdata->done.store(true, std::memory_order_release); + } + + cbdata->cond.notify_one(); + return S_OK; + }).Get(), &res)); + if (!res) { + av_log(avctx, AV_LOG_ERROR, "Failed to enqueue WGC thread callback\n"); + return AVERROR_EXTERNAL; + } + + if (!cbdata->cond.wait_for(cblock, std::chrono::seconds(1), [&]() { return cbdata->done.load(std::memory_order_acquire); })) { + cbdata->cancel.store(true, std::memory_order_release); + av_log(avctx, AV_LOG_ERROR, "WGC thread callback timed out\n"); + return AVERROR(ETIMEDOUT); + } + + return cbdata->ret; +} + +/******************************* + * Standard AVFilter functions * + *******************************/ + +static int build_regex(AVFilterContext *avctx, const char *pattern, std::regex *out) +{ + if (!pattern) + return 0; + + std::string pat(pattern); + + auto flags = std::regex::ECMAScript | std::regex::optimize; + if (pat.rfind("(?i)", 0) == 0 || pat.rfind("(?I)", 0) == 0) { + pat.erase(0, 4); + flags |= std::regex::icase; + } else if(pat.rfind("(?c)", 0) == 0 || pat.rfind("(?C)", 0) == 0) { + pat.erase(0, 4); + } + + try { + *out = std::regex(pat, flags); + } catch (const std::regex_error &e) { + av_log(avctx, AV_LOG_ERROR, "Failed to compile regex '%s': %s\n", pat.c_str(), e.what()); + return AVERROR(EINVAL); + } + + av_log(avctx, AV_LOG_DEBUG, "Built regex: %s\n", pattern); + + return 0; +} + +static int wstring_to_utf8(const wchar_t *in, std::string *out) +{ + int utf8size = WideCharToMultiByte(CP_UTF8, 0, in, -1, nullptr, 0, nullptr, nullptr); + if (utf8size <= 0) + return AVERROR(EINVAL); + + // over-writing std::string by one is valid in C++17 according to 27.4.3.6 if and only if it's overwritten with 0 + out->resize(utf8size - 1); + + if (WideCharToMultiByte(CP_UTF8, 0, in, -1, out->data(), utf8size, nullptr, nullptr) != utf8size) + return AVERROR_EXTERNAL; + + return 0; +} + +static int get_window_exe_name(HWND hwnd, std::string *out) +{ + out->clear(); + + DWORD pid = 0; + if (!GetWindowThreadProcessId(hwnd, &pid)) + return AVERROR(ENOENT); + + handle_ptr_t proc(OpenProcess(PROCESS_QUERY_LIMITED_INFORMATION, FALSE, pid)); + if (!proc) + return AVERROR(EACCES); + + std::wstring image_name; + DWORD image_name_size = 512; + + for (;;) { + DWORD len = image_name_size; + image_name.resize(len); + if (QueryFullProcessImageNameW(proc.get(), 0, image_name.data(), &len)) { + image_name.resize(len); + break; + } + if (GetLastError() == ERROR_INSUFFICIENT_BUFFER) { + image_name_size *= 2; + continue; + } + return AVERROR_EXTERNAL; + } + + if (image_name.empty()) + return AVERROR_EXTERNAL; + + const wchar_t *base = image_name.c_str(); + size_t pos = image_name.find_last_of(L"\\/"); + if (pos != std::string::npos) + base += pos + 1; + + return wstring_to_utf8(base, out); +} + +static int find_capture_source(AVFilterContext *avctx) +{ + GfxCaptureContext *cctx = CCTX(avctx->priv); + GfxCaptureContextCpp *ctx = cctx->ctx; + int cur_idx = 0; + + ctx->capture_hwnd = NULL; + ctx->capture_hmonitor = NULL; + + if (cctx->user_hmonitor) { + ctx->capture_hmonitor = (HMONITOR)(uintptr_t)cctx->user_hmonitor; + return 0; + } else if (cctx->user_hwnd) { + ctx->capture_hwnd = (HWND)(uintptr_t)cctx->user_hwnd; + return 0; + } else if (cctx->monitor_idx >= 0) { + auto cb = make_win32_callback([&](HMONITOR hmonitor, HDC, LPRECT) { + if (cur_idx++ == cctx->monitor_idx) { + av_log(avctx, AV_LOG_DEBUG, "Found capture monitor: %d\n", cctx->monitor_idx); + ctx->capture_hmonitor = hmonitor; + return FALSE; + } + return TRUE; + }); + if (EnumDisplayMonitors(NULL, NULL, cb->proc, cb->lparam) || !ctx->capture_hmonitor) + return AVERROR(ENOENT); + return 0; + } else if (cctx->window_text || cctx->window_class || cctx->window_exe) { + std::regex text_regex; + if (build_regex(avctx, cctx->window_text, &text_regex) < 0) + return AVERROR(EINVAL); + + std::regex class_regex; + if (build_regex(avctx, cctx->window_class, &class_regex) < 0) + return AVERROR(EINVAL); + + std::regex exe_regex; + if (build_regex(avctx, cctx->window_exe, &exe_regex) < 0) + return AVERROR(EINVAL); + + std::string window_text; + std::wstring window_text_w; + std::string window_class; + std::wstring window_class_w; + std::string window_exe; + auto cb = make_win32_callback([&](HWND hwnd) { + RECT r = { 0 }; + if (!GetWindowRect(hwnd, &r) || r.right <= r.left || r.bottom <= r.top || !IsWindowVisible(hwnd)) + return TRUE; + + window_text_w.resize(GetWindowTextLengthW(hwnd) + 1); + int len = GetWindowTextW(hwnd, window_text_w.data(), (int)window_text_w.size()); + if (len >= 0) { + window_text_w.resize(len); + if (wstring_to_utf8(window_text_w.c_str(), &window_text) < 0) + window_text.clear(); + } else { + window_text.clear(); + } + + window_class_w.resize(256); + len = GetClassNameW(hwnd, window_class_w.data(), (int)window_class_w.size()); + if (len >= 0) { + window_class_w.resize(len); + if (wstring_to_utf8(window_class_w.c_str(), &window_class) < 0) + window_class.clear(); + } else { + window_class.clear(); + } + + get_window_exe_name(hwnd, &window_exe); + + av_log(avctx, AV_LOG_TRACE, "Checking window: hwnd=%p text=%s class=%s exe=%s\n", + hwnd, window_text.c_str(), window_class.c_str(), window_exe.c_str()); + + if (cctx->window_text) { + if (window_text.empty() || !std::regex_search(window_text, text_regex)) + return TRUE; + } + + if (cctx->window_class) { + if (window_class.empty() || !std::regex_search(window_class, class_regex)) + return TRUE; + } + + if (cctx->window_exe) { + if (window_exe.empty() || !std::regex_search(window_exe, exe_regex)) + return TRUE; + } + + av_log(avctx, AV_LOG_VERBOSE, "Found capture window: %s (Class: %s, Exe: %s)\n", + window_text.c_str(), window_class.c_str(), window_exe.c_str()); + ctx->capture_hwnd = hwnd; + return FALSE; + }); + if (EnumWindows(cb->proc, cb->lparam) || !ctx->capture_hwnd) + return AVERROR(ENOENT); + + if (cctx->monitor_idx == GFX_MONITOR_IDX_WINDOW) { + ctx->capture_hmonitor = MonitorFromWindow(ctx->capture_hwnd, MONITOR_DEFAULTTONEAREST); + ctx->capture_hwnd = NULL; + if (!ctx->capture_hmonitor) { + av_log(avctx, AV_LOG_ERROR, "Failed to get monitor for capture window\n"); + return AVERROR(ENOENT); + } + } + + return 0; + } + + av_log(avctx, AV_LOG_ERROR, "No capture source specified\n"); + return AVERROR(EINVAL); +} + +static av_cold void gfxcapture_uninit(AVFilterContext *avctx) +{ + GfxCaptureContext *cctx = CCTX(avctx->priv); + GfxCaptureContextCpp *ctx = cctx->ctx; + + if (!ctx) + return; + + stop_wgc_thread(avctx); + + ctx->d3d.reset(); + + av_buffer_unref(&ctx->frames_ref); + av_buffer_unref(&ctx->device_ref); + + delete ctx; + cctx->ctx = nullptr; +} + +template<typename T> +static av_cold void GetProcAddressTyped(const hmodule_ptr_t &hModule, LPCSTR lpProcName, T *out) { + *out = reinterpret_cast<T>(GetProcAddress(hModule.get(), lpProcName)); +} + +static av_cold int load_functions(AVFilterContext *avctx) +{ + GfxCaptureContext *cctx = CCTX(avctx->priv); + GfxCaptureContextCpp *ctx = cctx->ctx; + +#define LOAD_DLL(handle, name) \ + handle = hmodule_ptr_t(LoadLibraryExW(L##name, NULL, LOAD_LIBRARY_SEARCH_SYSTEM32)); \ + if (!handle) { \ + av_log(avctx, AV_LOG_ERROR, "Failed opening " #name "\n"); \ + return AVERROR(ENOSYS); \ + } + +#define LOAD_FUNC(handle, name) \ + GetProcAddressTyped(handle, #name, &ctx->fn.name); \ + if (!ctx->fn.name) { \ + av_log(avctx, AV_LOG_ERROR, "Failed loading " #name "\n"); \ + return AVERROR(ENOSYS); \ + } + + // this handle is not used anywhere, but letting it get auto-freed during RoUninit causes crashes + LOAD_DLL(ctx->fn.graphicscapture_handle, "graphicscapture.dll"); + + LOAD_DLL(ctx->fn.combase_handle, "combase.dll"); + LOAD_DLL(ctx->fn.dwmapi_handle, "dwmapi.dll"); + LOAD_DLL(ctx->fn.d3d11_handle, "d3d11.dll"); + LOAD_DLL(ctx->fn.coremsg_handle, "coremessaging.dll"); + LOAD_DLL(ctx->fn.user32_handle, "user32.dll"); + LOAD_DLL(ctx->fn.d3dcompiler_handle, "d3dcompiler_47.dll"); + + LOAD_FUNC(ctx->fn.combase_handle, RoInitialize); + LOAD_FUNC(ctx->fn.combase_handle, RoUninitialize); + LOAD_FUNC(ctx->fn.combase_handle, RoGetActivationFactory); + LOAD_FUNC(ctx->fn.combase_handle, WindowsCreateStringReference); + + LOAD_FUNC(ctx->fn.dwmapi_handle, DwmGetWindowAttribute); + + LOAD_FUNC(ctx->fn.d3d11_handle, CreateDirect3D11DeviceFromDXGIDevice); + + LOAD_FUNC(ctx->fn.coremsg_handle, CreateDispatcherQueueController); + + LOAD_FUNC(ctx->fn.user32_handle, SetThreadDpiAwarenessContext); + + LOAD_FUNC(ctx->fn.d3dcompiler_handle, D3DCompile); + +#undef LOAD_FUNC +#undef LOAD_DLL + return 0; +} + +static av_cold int gfxcapture_init(AVFilterContext *avctx) +{ + GfxCaptureContext *cctx = CCTX(avctx->priv); + int ret = 0; + + GfxCaptureContextCpp *ctx = cctx->ctx = new GfxCaptureContextCpp(); + ctx->d3d = std::make_unique<GfxCaptureContextD3D>(); + + ret = load_functions(avctx); + if (ret < 0) { + ctx->fn.RoUninitialize = nullptr; + goto fail; + } + + return 0; + +fail: + gfxcapture_uninit(avctx); + return ret; +} + +static int init_hwframes_ctx(AVFilterContext *avctx) +{ + GfxCaptureContext *cctx = CCTX(avctx->priv); + GfxCaptureContextCpp *ctx = cctx->ctx; + int ret = 0; + + ctx->frames_ref = av_hwframe_ctx_alloc(ctx->device_ref); + if (!ctx->frames_ref) + return AVERROR(ENOMEM); + ctx->frames_ctx = (AVHWFramesContext*)ctx->frames_ref->data; + ctx->frames_hwctx = (AVD3D11VAFramesContext*)ctx->frames_ctx->hwctx; + + ctx->frames_ctx->format = AV_PIX_FMT_D3D11; + ctx->frames_ctx->width = cctx->canvas_width; + ctx->frames_ctx->height = cctx->canvas_height; + ctx->frames_ctx->sw_format = (AVPixelFormat)cctx->out_fmt; + if (avctx->extra_hw_frames > 0) + ctx->frames_ctx->initial_pool_size = 8 + avctx->extra_hw_frames; + + ctx->frames_hwctx->BindFlags = D3D11_BIND_RENDER_TARGET; + + ret = av_hwframe_ctx_init(ctx->frames_ref); + if (ret < 0) { + av_log(avctx, AV_LOG_ERROR, "Failed to initialise hardware frames context: %d.\n", ret); + goto fail; + } + + return 0; +fail: + av_buffer_unref(&ctx->frames_ref); + return ret; +} + +static int setup_gfxcapture_capture(AVFilterContext *avctx) +{ + GfxCaptureContext *cctx = CCTX(avctx->priv); + GfxCaptureContextCpp *ctx = cctx->ctx; + std::unique_ptr<GfxCaptureContextWgc> &wgctx = ctx->wgc; + int ret = 0; + + stop_wgc_thread(avctx); + + ret = find_capture_source(avctx); + if (ret < 0) { + av_log(avctx, AV_LOG_ERROR, "Failed to find capture source\n"); + return ret; + } + + ret = start_wgc_thread(avctx); + if (ret < 0) { + av_log(avctx, AV_LOG_ERROR, "Failed to start WGC thread\n"); + return ret; + } + + int cap_w = wgctx->cap_size.Width - cctx->crop_left - cctx->crop_right; + int cap_h = wgctx->cap_size.Height - cctx->crop_top - cctx->crop_bottom; + + if (!cctx->capture_border) { + cap_w -= wgctx->client_area_offsets.left + wgctx->client_area_offsets.right; + cap_h -= wgctx->client_area_offsets.top + wgctx->client_area_offsets.bottom; + } + + if (cctx->canvas_width == 0) + cctx->canvas_width = cap_w; + else if (cctx->canvas_width < 0) + cctx->canvas_width = (cap_w / cctx->canvas_width) * cctx->canvas_width; + + if (cctx->canvas_height == 0) + cctx->canvas_height = cap_h; + else if (cctx->canvas_height < 0) + cctx->canvas_height = (cap_h / cctx->canvas_height) * cctx->canvas_height; + + return 0; +} + +static int prepare_render_resources(AVFilterContext *avctx) +{ + GfxCaptureContext *cctx = CCTX(avctx->priv); + GfxCaptureContextCpp *ctx = cctx->ctx; + std::unique_ptr<GfxCaptureContextD3D> &d3dctx = ctx->d3d; + HRESULT hr; + + ComPtr<ID3DBlob> vs_blob, ps_blob, err_blob; + CD3D11_SAMPLER_DESC sampler_desc(CD3D11_DEFAULT{}); + UINT flags = D3DCOMPILE_OPTIMIZATION_LEVEL3; + + hr = ctx->fn.D3DCompile(render_shader_src, sizeof(render_shader_src) - 1, NULL, NULL, NULL, "main_vs", "vs_4_0", flags, 0, &vs_blob, &err_blob); + if (FAILED(hr)) { + if (err_blob) { + av_log(avctx, AV_LOG_ERROR, "Failed compiling vertex shader: %.*s\n", (int)err_blob->GetBufferSize(), (char*)err_blob->GetBufferPointer()); + } else { + av_log(avctx, AV_LOG_ERROR, "Failed compiling vertex shader: 0x%08lX\n", hr); + } + return AVERROR_EXTERNAL; + } + + const char *ps_entry = "main_ps_bicubic"; + if (cctx->resize_mode == GFX_RESIZE_CROP || cctx->scale_mode == GFX_SCALE_POINT) { + ps_entry = "main_ps"; + sampler_desc.Filter = D3D11_FILTER_MIN_MAG_MIP_POINT; + } + + hr = ctx->fn.D3DCompile(render_shader_src, sizeof(render_shader_src) - 1, NULL, NULL, NULL, ps_entry, "ps_4_0", flags, 0, &ps_blob, &err_blob); + if (FAILED(hr)) { + if (err_blob) { + av_log(avctx, AV_LOG_ERROR, "Failed compiling pixel shader: %.*s\n", (int)err_blob->GetBufferSize(), (char*)err_blob->GetBufferPointer()); + } else { + av_log(avctx, AV_LOG_ERROR, "Failed compiling pixel shader: 0x%08lX\n", hr); + } + return AVERROR_EXTERNAL; + } + + CHECK_HR_RET(ctx->device_hwctx->device->CreateVertexShader(vs_blob->GetBufferPointer(), vs_blob->GetBufferSize(), NULL, &d3dctx->vertex_shader)); + CHECK_HR_RET(ctx->device_hwctx->device->CreatePixelShader(ps_blob->GetBufferPointer(), ps_blob->GetBufferSize(), NULL, &d3dctx->pixel_shader)); + + CHECK_HR_RET(ctx->device_hwctx->device->CreateSamplerState(&sampler_desc, &d3dctx->sampler_state)); + + D3D11_BUFFER_DESC cb_desc = { 0 }; + cb_desc.ByteWidth = 48; + cb_desc.Usage = D3D11_USAGE_DYNAMIC; + cb_desc.BindFlags = D3D11_BIND_CONSTANT_BUFFER; + cb_desc.CPUAccessFlags = D3D11_CPU_ACCESS_WRITE; + + CHECK_HR_RET(ctx->device_hwctx->device->CreateBuffer(&cb_desc, NULL, &d3dctx->shader_cb)); + + CHECK_HR_RET(ctx->device_hwctx->device->CreateDeferredContext(0, &d3dctx->deferred_ctx)); + + return 0; +} + +static int gfxcapture_config_props(AVFilterLink *outlink) +{ + AVFilterContext *avctx = outlink->src; + GfxCaptureContext *cctx = CCTX(avctx->priv); + GfxCaptureContextCpp *ctx = cctx->ctx; + + FilterLink *link = ff_filter_link(outlink); + int ret; + + if (avctx->hw_device_ctx) { + ctx->device_ctx = (AVHWDeviceContext*)avctx->hw_device_ctx->data; + + if (ctx->device_ctx->type != AV_HWDEVICE_TYPE_D3D11VA) { + av_log(avctx, AV_LOG_ERROR, "Non-D3D11VA input hw_device_ctx\n"); + return AVERROR(EINVAL); + } + + ctx->device_ref = av_buffer_ref(avctx->hw_device_ctx); + if (!ctx->device_ref) + return AVERROR(ENOMEM); + + av_log(avctx, AV_LOG_VERBOSE, "Using provided hw_device_ctx\n"); + } else { + ret = av_hwdevice_ctx_create(&ctx->device_ref, AV_HWDEVICE_TYPE_D3D11VA, NULL, NULL, 0); + if (ret < 0) { + av_log(avctx, AV_LOG_ERROR, "Failed to create D3D11VA device.\n"); + return ret; + } + + ctx->device_ctx = (AVHWDeviceContext*)ctx->device_ref->data; + + av_log(avctx, AV_LOG_VERBOSE, "Created internal hw_device_ctx\n"); + } + + ctx->device_hwctx = (AVD3D11VADeviceContext*)ctx->device_ctx->hwctx; + + ret = prepare_render_resources(avctx); + if (ret < 0) { + av_log(avctx, AV_LOG_ERROR, "Failed to prepare render resources\n"); + return ret; + } + + ret = setup_gfxcapture_capture(avctx); + if (ret < 0) { + av_log(avctx, AV_LOG_ERROR, "Failed to setup graphics capture\n"); + return ret; + } + + ret = init_hwframes_ctx(avctx); + if (ret < 0) + return ret; + + link->hw_frames_ctx = av_buffer_ref(ctx->frames_ref); + if (!link->hw_frames_ctx) + return AVERROR(ENOMEM); + + std::lock_guard wgc_lock(ctx->wgc_thread_uninit_mutex); + if (!ctx->wgc) { + av_log(avctx, AV_LOG_ERROR, "WGC thread died prematurely\n"); + return AVERROR(ENOSYS); + } + + outlink->w = ctx->frames_ctx->width; + outlink->h = ctx->frames_ctx->height; + outlink->time_base = AVRational{1, TIMESPAN_RES}; + outlink->alpha_mode = cctx->premult_alpha ? AVALPHA_MODE_PREMULTIPLIED : AVALPHA_MODE_STRAIGHT; + link->frame_rate = cctx->frame_rate; + + av_log(avctx, AV_LOG_DEBUG, "Capture setup with res %dx%d\n", outlink->w, outlink->h); + + return 0; +} + +static int render_capture_to_frame(AVFilterContext *avctx, AVFrame *frame, const ComPtr<ID3D11Texture2D> &src_tex) +{ + GfxCaptureContext *cctx = CCTX(avctx->priv); + GfxCaptureContextCpp *ctx = cctx->ctx; + std::unique_ptr<GfxCaptureContextD3D> &d3dctx = ctx->d3d; + std::unique_ptr<GfxCaptureContextWgc> &wgctx = ctx->wgc; + + ID3D11Device *dev = ctx->device_hwctx->device; + ID3D11DeviceContext *dev_ctx = ctx->device_hwctx->device_context; + ComPtr<ID3D11DeviceContext> &def_ctx = d3dctx->deferred_ctx; + + D3D11_TEXTURE2D_DESC dst_tex_desc; + reinterpret_cast<ID3D11Texture2D*>(frame->data[0])->GetDesc(&dst_tex_desc); + + D3D11_TEXTURE2D_DESC src_tex_desc; + src_tex->GetDesc(&src_tex_desc); + + D3D11_RENDER_TARGET_VIEW_DESC target_desc = {}; + target_desc.Format = dst_tex_desc.Format; + + if (dst_tex_desc.ArraySize > 1) { + target_desc.ViewDimension = D3D11_RTV_DIMENSION_TEXTURE2DARRAY; + target_desc.Texture2DArray.ArraySize = 1; + target_desc.Texture2DArray.FirstArraySlice = (uintptr_t)frame->data[1]; + target_desc.Texture2DArray.MipSlice = 0; + } else { + target_desc.ViewDimension = D3D11_RTV_DIMENSION_TEXTURE2D; + target_desc.Texture2D.MipSlice = 0; + } + + ComPtr<ID3D11RenderTargetView> rtv; + CHECK_HR_RET(dev->CreateRenderTargetView( + reinterpret_cast<ID3D11Resource*>(frame->data[0]), &target_desc, &rtv)); + + ComPtr<ID3D11ShaderResourceView> srv; + CHECK_HR_RET(dev->CreateShaderResourceView(src_tex.Get(), nullptr, &srv)); + + int crop_left = cctx->crop_left; + int crop_top = cctx->crop_top; + int crop_right = cctx->crop_right; + int crop_bottom = cctx->crop_bottom; + + if (!cctx->capture_border) { + crop_left += wgctx->client_area_offsets.left; + crop_top += wgctx->client_area_offsets.top; + crop_right += wgctx->client_area_offsets.right; + crop_bottom += wgctx->client_area_offsets.bottom; + } + + // Using the actual capture frame size here adjusts for jank that can happen during rapid + // resizing of the source window. The capture frame pool is only recreated once a frame + // of changed size came out of it, so we need to cut/pad such frames to fit. + // Just discarding such frames can lead to visible stutter if the source window is being + // resized continuously, so this code does its best to adjust them instead. With the risk + // of slight clamping artifacts when enlarging rapidly. + int cropped_w = wgctx->cap_size.Width - crop_left - crop_right; + int cropped_h = wgctx->cap_size.Height - crop_top - crop_bottom; + + D3D11_VIEWPORT viewport = { 0 }; + viewport.MinDepth = 0.f; + viewport.MaxDepth = 1.f; + + switch (cctx->resize_mode) { + case GFX_RESIZE_CROP: + viewport.Width = (float)cropped_w; + viewport.Height = (float)cropped_h; + break; + case GFX_RESIZE_SCALE: + viewport.Width = dst_tex_desc.Width; + viewport.Height = dst_tex_desc.Height; + break; + case GFX_RESIZE_SCALE_ASPECT: { + float scale = FFMIN(dst_tex_desc.Width / (float)cropped_w, + dst_tex_desc.Height / (float)cropped_h); + viewport.Width = cropped_w * scale; + viewport.Height = cropped_h * scale; + break; + } + default: + av_log(avctx, AV_LOG_ERROR, "Invalid scaling mode\n"); + return AVERROR_BUG; + }; + + def_ctx->RSSetViewports(1, &viewport); + + D3D11_MAPPED_SUBRESOURCE map; + CHECK_HR_RET(def_ctx->Map(d3dctx->shader_cb.Get(), 0, D3D11_MAP_WRITE_DISCARD, 0, &map)); + { + float *cb_f = static_cast<float*>(map.pData); + uint32_t *cb_u = static_cast<uint32_t*>(map.pData); + cb_f[0] = (float)cropped_w; + cb_f[1] = (float)cropped_h; + cb_f[2] = viewport.Width; + cb_f[3] = viewport.Height; + cb_f[4] = crop_left / (float)src_tex_desc.Width; // min_u + cb_f[5] = crop_top / (float)src_tex_desc.Height; // min_v + cb_f[6] = (crop_left + cropped_w) / (float)src_tex_desc.Width; // max_u + cb_f[7] = (crop_top + cropped_h) / (float)src_tex_desc.Height; // max_v + cb_u[8] = !cctx->premult_alpha; // to_unpremult + cb_u[9] = src_tex_desc.Format == DXGI_FORMAT_R16G16B16A16_FLOAT && + dst_tex_desc.Format != DXGI_FORMAT_R16G16B16A16_FLOAT; // to_srgb + } + def_ctx->Unmap(d3dctx->shader_cb.Get(), 0); + + def_ctx->OMSetRenderTargets(1, rtv.GetAddressOf(), nullptr); + + const float clear_color[4] = {0.f, 0.f, 0.f, 1.f}; + def_ctx->ClearRenderTargetView(rtv.Get(), clear_color); + + def_ctx->IASetPrimitiveTopology(D3D11_PRIMITIVE_TOPOLOGY_TRIANGLELIST); + def_ctx->VSSetShader(d3dctx->vertex_shader.Get(), nullptr, 0); + def_ctx->VSSetConstantBuffers(0, 1, d3dctx->shader_cb.GetAddressOf()); + def_ctx->PSSetShader(d3dctx->pixel_shader.Get(), nullptr, 0); + def_ctx->PSSetSamplers(0, 1, d3dctx->sampler_state.GetAddressOf()); + def_ctx->PSSetShaderResources(0, 1, srv.GetAddressOf()); + def_ctx->PSSetConstantBuffers(0, 1, d3dctx->shader_cb.GetAddressOf()); + + def_ctx->Draw(3, 0); + + ComPtr<ID3D11CommandList> cmd_list; + CHECK_HR_RET(def_ctx->FinishCommandList(FALSE, &cmd_list)); + dev_ctx->ExecuteCommandList(cmd_list.Get(), FALSE); + + return 0; +} + +static int process_frame_if_exists(AVFilterLink *outlink) +{ + AVFilterContext *avctx = outlink->src; + GfxCaptureContext *cctx = CCTX(avctx->priv); + GfxCaptureContextCpp *ctx = cctx->ctx; + int ret; + + AVFrame *frame = nullptr; + + ret = run_on_wgc_thread(avctx, [&]() { + ComPtr<IDirect3D11CaptureFrame> capture_frame; + ComPtr<IDirect3DSurface> capture_surface; + ComPtr<IDirect3DDxgiInterfaceAccess> dxgi_interface_access; + ComPtr<ID3D11Texture2D> frame_texture; + TimeSpan frame_time = { 0 }; + + ret = wgc_try_get_next_frame(avctx, &capture_frame); + if (ret < 0) + return ret; + + CHECK_HR_RET(capture_frame->get_SystemRelativeTime(&frame_time)); + + CHECK_HR_RET(capture_frame->get_Surface(&capture_surface)); + CHECK_HR_RET(capture_surface.As(&dxgi_interface_access)); + CHECK_HR_RET(dxgi_interface_access->GetInterface(IID_PPV_ARGS(&frame_texture))); + + if (!frame_texture) + return AVERROR(EAGAIN); + + frame = ff_get_video_buffer(outlink, cctx->canvas_width, cctx->canvas_height); + if (!frame) + return AVERROR(ENOMEM); + + frame->pts = frame_time.Duration; + + return render_capture_to_frame(avctx, frame, frame_texture); + }); + if (ret < 0) + return ret; + + frame->sample_aspect_ratio = AVRational{1, 1}; + + if (ctx->frames_ctx->sw_format == AV_PIX_FMT_RGBAF16) { + // According to MSDN, all floating point formats contain sRGB image data with linear 1.0 gamma. + frame->color_range = AVCOL_RANGE_JPEG; + frame->color_primaries = AVCOL_PRI_BT709; + frame->color_trc = AVCOL_TRC_LINEAR; + frame->colorspace = AVCOL_SPC_RGB; + } else { + // According to MSDN, all integer formats contain sRGB image data + frame->color_range = AVCOL_RANGE_JPEG; + frame->color_primaries = AVCOL_PRI_BT709; + frame->color_trc = AVCOL_TRC_IEC61966_2_1; + frame->colorspace = AVCOL_SPC_RGB; + } + + ctx->last_pts = frame->pts; + + if (!ctx->first_pts) + ctx->first_pts = frame->pts; + frame->pts -= ctx->first_pts; + + return ff_filter_frame(outlink, frame); +} + +static int gfxcapture_activate(AVFilterContext *avctx) +{ + AVFilterLink *outlink = avctx->outputs[0]; + GfxCaptureContext *cctx = CCTX(avctx->priv); + GfxCaptureContextCpp *ctx = cctx->ctx; + std::unique_ptr<GfxCaptureContextWgc> &wgctx = ctx->wgc; + + std::lock_guard wgc_lock(ctx->wgc_thread_uninit_mutex); + if (!wgctx) { + av_log(avctx, AV_LOG_ERROR, "WGC thread not initialized\n"); + return AVERROR(ENOSYS); + } + + if (!ff_outlink_frame_wanted(outlink)) + return FFERROR_NOT_READY; + + std::unique_lock frame_lock(wgctx->frame_arrived_mutex); + + for (;;) { + uint64_t last_seq = wgctx->frame_seq.load(std::memory_order_acquire); + + int ret = process_frame_if_exists(outlink); + if (ret != AVERROR(EAGAIN)) + return ret; + + if (wgctx->window_closed.load(std::memory_order_acquire)) { + ff_outlink_set_status(outlink, AVERROR_EOF, ctx->last_pts - ctx->first_pts + 1); + break; + } + + if (!wgctx->frame_arrived_cond.wait_for(frame_lock, std::chrono::seconds(1), [&]() { + return wgctx->frame_seq.load(std::memory_order_acquire) != last_seq || + wgctx->window_closed.load(std::memory_order_acquire); + })) + break; + } + + return 0; +} + +av_cold void ff_gfxcapture_uninit(AVFilterContext *avctx) noexcept +{ + try { + gfxcapture_uninit(avctx); + } catch (const std::exception &e) { + av_log(avctx, AV_LOG_ERROR, "unhandled exception during uninit: %s\n", e.what()); + } catch (...) { + av_log(avctx, AV_LOG_ERROR, "unhandled exception during uninit\n"); + } +} + +av_cold int ff_gfxcapture_init(AVFilterContext *avctx) noexcept +{ + try { + return gfxcapture_init(avctx); + } catch (const std::bad_alloc&) { + return AVERROR(ENOMEM); + } catch (const std::exception &e) { + av_log(avctx, AV_LOG_ERROR, "unhandled exception during init: %s\n", e.what()); + return AVERROR_BUG; + } catch (...) { + av_log(avctx, AV_LOG_ERROR, "unhandled exception during init\n"); + return AVERROR_BUG; + } +} + +int ff_gfxcapture_activate(AVFilterContext *avctx) noexcept +{ + try { + return gfxcapture_activate(avctx); + } catch (const std::bad_alloc&) { + return AVERROR(ENOMEM); + } catch (const std::exception &e) { + av_log(avctx, AV_LOG_ERROR, "unhandled exception during activate: %s\n", e.what()); + return AVERROR_BUG; + } catch (...) { + av_log(avctx, AV_LOG_ERROR, "unhandled exception during activate\n"); + return AVERROR_BUG; + } +} + +int ff_gfxcapture_config_props(AVFilterLink *outlink) noexcept +{ + AVFilterContext *avctx = outlink->src; + + try { + return gfxcapture_config_props(outlink); + } catch (const std::bad_alloc&) { + return AVERROR(ENOMEM); + } catch (const std::exception &e) { + av_log(avctx, AV_LOG_ERROR, "unhandled exception during config_props: %s\n", e.what()); + return AVERROR_BUG; + } catch (...) { + av_log(avctx, AV_LOG_ERROR, "unhandled exception during config_props\n"); + return AVERROR_BUG; + } +} diff --git a/libavfilter/vsrc_gfxcapture_winrt.h b/libavfilter/vsrc_gfxcapture_winrt.h new file mode 100644 index 0000000000..d6f11e4ef5 --- /dev/null +++ b/libavfilter/vsrc_gfxcapture_winrt.h @@ -0,0 +1,189 @@ +/* + * This file is part of FFmpeg. + * + * FFmpeg is free software; you can redistribute it and/or + * modify it under the terms of the GNU Lesser General Public + * License as published by the Free Software Foundation; either + * version 2.1 of the License, or (at your option) any later version. + * + * FFmpeg is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + * Lesser General Public License for more details. + * + * You should have received a copy of the GNU Lesser General Public + * License along with FFmpeg; if not, write to the Free Software + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA + */ + +#ifndef AVFILTER_VSRC_GFXCAPTURE_WINRT_H +#define AVFILTER_VSRC_GFXCAPTURE_WINRT_H + +// Forward-declare IDirect3DDxgiInterfaceAccess if headers too old +#if !HAVE_IDIRECT3DDXGIINTERFACEACCESS +namespace Windows::Graphics::DirectX::Direct3D11 { + MIDL_INTERFACE("A9B3D012-3DF2-4EE3-B8D1-8695F457D3C1") + IDirect3DDxgiInterfaceAccess : public IUnknown + { + public: + IFACEMETHOD(GetInterface)(REFIID iid, _COM_Outptr_ void** p) = 0; + }; +} +#ifdef __MINGW32__ +__CRT_UUID_DECL(Windows::Graphics::DirectX::Direct3D11::IDirect3DDxgiInterfaceAccess, + 0xa9b3d012, 0x3df2, 0x4ee3, 0xb8, 0xd1, 0x86, 0x95, 0xf4, 0x57, 0xd3, 0xc1) +#endif +#endif /* !HAVE_IDIRECT3DDXGIINTERFACEACCESS */ + +// Forward-declare IGraphicsCaptureSession5 if headers too old +#if !HAVE___X_ABI_CWINDOWS_CGRAPHICS_CCAPTURE_CIGRAPHICSCAPTURESESSION5 +namespace ABI::Windows ::Graphics::Capture { + MIDL_INTERFACE("67C0EA62-1F85-5061-925A-239BE0AC09CB") + IGraphicsCaptureSession5 : public IInspectable + { + public: + IFACEMETHOD(get_MinUpdateInterval)(ABI::Windows::Foundation::TimeSpan* value) = 0; + IFACEMETHOD(put_MinUpdateInterval)(ABI::Windows::Foundation::TimeSpan value) = 0; + }; +} +#ifdef __MINGW32__ +__CRT_UUID_DECL(ABI::Windows ::Graphics::Capture::IGraphicsCaptureSession5, + 0x67c0ea62, 0x1f85, 0x5061, 0x92, 0x5a, 0x23, 0x9b, 0xe0, 0xac, 0x09, 0xcb) +#endif +#endif /* !HAVE___X_ABI_CWINDOWS_CGRAPHICS_CCAPTURE_CIGRAPHICSCAPTURESESSION5 */ + +/**************************************************** + * Helper class to implement refcounted COM objects * + ****************************************************/ +template<typename... Interfaces> +struct FFComObject : Interfaces... +{ + virtual ~FFComObject() = default; + + HRESULT STDMETHODCALLTYPE QueryInterface(REFIID riid, void** ppvObject) override + { + if (!ppvObject) + return E_POINTER; + + if (query_all<Interfaces...>(riid, ppvObject)) + { + AddRef(); + return S_OK; + } + + *ppvObject = nullptr; + return E_NOINTERFACE; + } + + ULONG STDMETHODCALLTYPE AddRef() override + { + return ++ref_count; + } + + ULONG STDMETHODCALLTYPE Release() override + { + ULONG rc = --ref_count; + if (rc == 0) + delete this; + return rc; + } + +private: + template <typename Iface, typename... IFaces> + bool query_all(REFIID riid, void** ppvObject) + { + if (riid == __uuidof(Iface)) { + *ppvObject = static_cast<Iface*>(this); + return true; + } + if constexpr (sizeof...(IFaces)) { + return query_all<IFaces...>(riid, ppvObject); + } else if (riid == __uuidof(IUnknown)) { + *ppvObject = static_cast<IUnknown*>(static_cast<Iface*>(this)); + return true; + } + return false; + } + + std::atomic<ULONG> ref_count { 1 }; +}; + +/******************************************* + * Helper to implement COM/WinRT callbacks * + *******************************************/ +template<class Iface, typename F, typename... Args> +struct FFTypedCBHandler : FFComObject<Iface, IAgileObject> +{ + using Func = std::decay_t<F>; + + explicit FFTypedCBHandler(F&& f) : cb_func(std::forward<F>(f)) {} + + std::invoke_result_t<Func&, Args...> STDMETHODCALLTYPE Invoke(Args... args) override + { + if constexpr (std::is_same_v<std::invoke_result_t<Func&, Args...>, HRESULT>) { + return cb_func(std::forward<Args>(args)...); + } else { + cb_func(std::forward<Args>(args)...); + return S_OK; + } + } + +private: + Func cb_func; +}; + +template<class Iface, typename... Args, typename F> +static Microsoft::WRL::ComPtr<Iface> create_cb_handler(F&& cb_func) +{ + return Microsoft::WRL::ComPtr<Iface>( + new FFTypedCBHandler<Iface, F, Args...>(std::forward<F>(cb_func)) + ); +} + +/****************************************** + * Helpers to implement C style callbacks * + ******************************************/ +template <typename Ret, typename... Args> +struct Win32Callback { + std::function<Ret(Args...)> fn; + static Ret CALLBACK thunk(Args... args, LPARAM lparam) { + auto self = reinterpret_cast<Win32Callback*>(lparam); + return self->fn(std::forward<Args>(args)...); + } + decltype(&Win32Callback::thunk) proc = &Win32Callback::thunk; + LPARAM lparam = 0; +}; + +template <typename Ret, typename... Args> +auto make_win32_callback(const std::function<Ret(Args...)> &&fn) { + using T = Win32Callback<Ret, Args...>; + auto res = std::make_unique<T>(T{ std::forward<decltype(fn)>(fn) }); + res->lparam = reinterpret_cast<LPARAM>(res.get()); + return res; +} +#define make_win32_callback(...) make_win32_callback(std::function(__VA_ARGS__)) + +/***************************** + * Small convenience helpers * + *****************************/ +struct HMODULEDeleter { + typedef HMODULE pointer; + void operator()(HMODULE handle) const { + if (handle) + FreeLibrary(handle); + } +}; +typedef std::unique_ptr<HMODULE, HMODULEDeleter> hmodule_ptr_t; + +struct HANDLEDeleter { + typedef HANDLE pointer; + void operator()(HANDLE handle) const { + if (handle && handle != INVALID_HANDLE_VALUE) + CloseHandle(handle); + } +}; +typedef std::unique_ptr<HANDLE, HANDLEDeleter> handle_ptr_t; + +#define HLSL(shader) #shader + +#endif /* AVFILTER_VSRC_GFXCAPTURE_WINRT_H */ |