API/VulkanPatchMatch_8h_source.html

/*--------------------------------------------------------------------------------------------

Copyright (c) 2026, NDEVR LLC

tyler.parke@ndevr.org

  __    __   ____     _____ __     __  _______

 |  \  |  | |  __ \  |  ___|\ \   / / |   __  \

 |   \ |  | | |  \ \ | |___  \ \ / /  |  |__)  |

 |  . \|  | | |__/ / | |___   \ V /   |   _   /

 |  |\    |_|_____/__|_____|___\_/____|  | \  \

 |__| \__________________________________|  \__\


Subject to the terms of the Enterprise+ Agreement, NDEVR hereby grants

Licensee a limited, non-exclusive, non-transferable, royalty-free license

(without the right to sublicense) to use the API solely for the purpose of

Licensee's internal development efforts to develop applications for which

the API was provided.


The above copyright notice and this permission notice shall be included in all

copies or substantial portions of the Software.


THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED,

INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR

PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE

FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR

OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER

DEALINGS IN THE SOFTWARE.


Library: VulkanCompute

File: VulkanPatchMatch

Included in API: True

Author(s): Tyler Parke

 *-----------------------------------------------------------------------------------------**/

#pragma once

#include "DLLInfo.h"
#include "VulkanComputeDevice.h"
#include "VulkanComputeBuffer.h"
#include "VulkanComputePipeline.h"
#include <NDEVR/Buffer.h>
#include <NDEVR/Pointer.h>
#include <NDEVR/String.h>
#include <NDEVR/File.h>
#include <cstddef>
#include <cstdint>


#if !defined(__EMSCRIPTEN__) && NDEVR_SUPPORTS_THREADING


namespace NDEVR

{


    /**
     * Per-view camera record uploaded to the GPU.
     *
     * The field order and sizes are laid out to match a GLSL std430 struct with a
     * 128-byte array stride, so members must not be reordered, resized or removed
     * without changing the shader side as well. The static_asserts below lock the
     * layout in at compile time.
     */
    struct PatchMatchCamera
    {
        float K[12];          /**< 3x3 intrinsic (column-major, 3 columns x [3 floats + 1 pad]). */
        float R[12];          /**< 3x3 rotation (column-major, 3 columns x [3 floats + 1 pad]). */
        float C[3];           /**< Camera center (vec3). */
        int32_t camWidth;     /**< Image width (packs into vec3 C's trailing 4 bytes). */
        int32_t camHeight;    /**< Image height. */
        uint32_t pixelOffset; /**< Offset into packed image SSBO. */
        uint32_t _pad0;       /**< Padding to match GLSL std430 array stride (128 bytes). */
        uint32_t _pad1;       /**< Padding; std430 rounds struct size to 16-byte alignment for arrays. */
    };

    static_assert(sizeof(PatchMatchCamera) == 128, "PatchMatchCamera must be 128 bytes for std430 array stride");
    // A size check alone would not notice two same-sized fields being swapped,
    // so the offsets the layout depends on are pinned as well.
    static_assert(offsetof(PatchMatchCamera, K) == 0, "PatchMatchCamera::K must start the struct");
    static_assert(offsetof(PatchMatchCamera, R) == 48, "PatchMatchCamera::R must follow the 48-byte padded K matrix");
    static_assert(offsetof(PatchMatchCamera, C) == 96, "PatchMatchCamera::C must follow the 48-byte padded R matrix");
    static_assert(offsetof(PatchMatchCamera, camWidth) == 108, "PatchMatchCamera::camWidth must occupy the trailing 4 bytes of vec3 C");
    static_assert(offsetof(PatchMatchCamera, camHeight) == 112, "PatchMatchCamera::camHeight must be at byte 112");
    static_assert(offsetof(PatchMatchCamera, pixelOffset) == 116, "PatchMatchCamera::pixelOffset must be at byte 116");


    /**
     * Push constant layout for the PatchMatch shaders (must match the GLSL layout exactly).
     *
     * Every member is 4 bytes wide, giving sixteen tightly packed words. Do not
     * reorder or resize members without updating the shader side.
     */
    struct PatchMatchPushConstants
    {
        int32_t width;                  /**< Image width in pixels. */
        int32_t height;                 /**< Image height in pixels. */
        int32_t nNumViews;              /**< Number of neighbor views used for matching. */
        int32_t nInitTopK;              /**< Number of top views to select during initialization. */
        float fDepthMin;                /**< Minimum depth bound. */
        float fDepthMax;                /**< Maximum depth bound. */
        float fThresholdKeepCost;       /**< Cost threshold for filtering bad matches. */
        int32_t iteration;              /**< Current PatchMatch iteration index. */
        int32_t isRedPass;              /**< Whether this is the red (1) or black (0) checkerboard pass. */
        int32_t nEstimationIters;       /**< Total number of PatchMatch iterations to perform. */
        int32_t bLowResProcessed;       /**< Whether a low-resolution prior has been applied. */
        int32_t yOffset;                /**< Row offset for tiled dispatches. */
        float fConfidenceSkipThreshold; /**< Skip pixels with cost below this (0 = disabled). */
        int32_t _pcPad0;                /**< Padding for std430 alignment. */
        int32_t _pcPad1;                /**< Padding for std430 alignment. */
        int32_t _pcPad2;                /**< Padding for std430 alignment. */
    };

    // Lock the block size so an accidental field addition/removal is caught at
    // compile time. 64 bytes also stays inside the 128-byte push constant range
    // that every Vulkan implementation is required to support.
    static_assert(sizeof(PatchMatchPushConstants) == 64, "PatchMatchPushConstants must be 64 bytes to match the GLSL push constant block");


    /**
     * Result from a single depth estimation pass.
     */
    struct DepthEstimateResult
    {
        Buffer<float> depth_map;      /**< W*H depth values. */
        Buffer<float> normal_map;     /**< W*H*3 normal components. */
        Buffer<float> confidence_map; /**< W*H confidence values. */
        int width = 0;                /**< Image width in pixels. */
        int height = 0;               /**< Image height in pixels. */

        /**
         * Empties all three maps and resets the stored dimensions to zero.
         */
        void clear()
        {
            // The buffers and the dimensions are independent of each other,
            // so the order of these resets does not matter.
            depth_map.clear();
            normal_map.clear();
            confidence_map.clear();
            width = height = 0;
        }
    };


    /**
     * Push constants for geometric consistency shader.
     *
     * Eight tightly packed 4-byte words; the order must stay in step with the
     * shader-side block.
     */
    struct GeometricConsistencyPushConstants
    {
        int32_t width;              /**< Image width in pixels. */
        int32_t height;             /**< Image height in pixels. */
        int32_t nNumNeighbors;      /**< Number of neighbor depth maps to check. */
        int32_t nMinConsistent;     /**< Minimum consistent neighbors required to keep a pixel. */
        float fDepthDiffThreshold;  /**< Relative depth tolerance for consistency. */
        float fNormalDiffThreshold; /**< Cosine angle threshold for normal consistency. */
        int32_t yOffset;            /**< Row offset for tiled dispatches. */
        int32_t _pad0;              /**< Padding for std430 alignment. */
    };

    // Compile-time guard against accidental layout changes.
    static_assert(sizeof(GeometricConsistencyPushConstants) == 32, "GeometricConsistencyPushConstants must be 32 bytes to match the GLSL push constant block");


    /**
     * Push constants for depth consistency shader.
     *
     * Twelve tightly packed 4-byte words. The padding members keep the live
     * fields at the positions the shader expects, so they must not be removed.
     */
    struct DepthConsistencyPushConstants
    {
        int32_t width;            /**< Image width in pixels. */
        int32_t height;           /**< Image height in pixels. */
        int32_t nMinConsistent;   /**< Minimum consistent 8-neighbors to keep a pixel. */
        int32_t _pad0;            /**< Padding for std430 alignment. */
        float fDepthRelTolerance; /**< Relative depth tolerance for neighbor consistency. */
        float _pad1;              /**< Padding for std430 alignment. */
        float _pad2;              /**< Padding for std430 alignment. */
        float _pad3;              /**< Padding for std430 alignment. */
        int32_t yOffset;          /**< Row offset for tiled dispatches. */
        int32_t _pad4;            /**< Padding for std430 alignment. */
        int32_t _pad5;            /**< Padding for std430 alignment. */
        int32_t _pad6;            /**< Padding for std430 alignment. */
    };

    // Compile-time guard against accidental layout changes.
    static_assert(sizeof(DepthConsistencyPushConstants) == 48, "DepthConsistencyPushConstants must be 48 bytes to match the GLSL push constant block");


    /**
     * Push constants for median filter shader.
     *
     * Twelve tightly packed 4-byte words. The member sequence (two ints, two int
     * pads, four float pads, yOffset, three int pads) mirrors
     * DepthConsistencyPushConstants, with yOffset at the same byte position.
     */
    struct MedianFilterPushConstants
    {
        int32_t width;   /**< Image width in pixels. */
        int32_t height;  /**< Image height in pixels. */
        int32_t _pad0;   // unused filler word
        int32_t _pad1;   // unused filler word
        float _pad2;     // unused filler word
        float _pad3;     // unused filler word
        float _pad4;     // unused filler word
        float _pad5;     // unused filler word
        int32_t yOffset; // NOTE(review): presumably the row offset for tiled dispatches, as in the sibling structs - confirm against the shader
        int32_t _pad6;   // unused filler word
        int32_t _pad7;   // unused filler word
        int32_t _pad8;   // unused filler word
    };

    // Compile-time guard against accidental layout changes.
    static_assert(sizeof(MedianFilterPushConstants) == 48, "MedianFilterPushConstants must be 48 bytes to match the GLSL push constant block");


    /**
     * Push constants for SGM directional cost aggregation shader.
     *
     * Twelve tightly packed 4-byte words; the order must stay in step with the
     * shader-side block.
     */
    struct SGMPushConstants
    {
        int32_t width;     // NOTE(review): presumably image width in pixels, as in the sibling structs - confirm
        int32_t height;    // NOTE(review): presumably image height in pixels, as in the sibling structs - confirm
        int32_t maxRange;  /**< Max scanline walk distance (default 64). */
        int32_t _pad0;     // unused filler word
        float _pad1;       // unused filler word
        float _pad2;       // unused filler word
        float P1;          /**< Small depth step penalty (default 0.02). */
        float P2;          /**< Large depth step penalty (default 0.08). */
        float decay;       /**< Per-step penalty decay (default 0.92). */
        float sgmWeight;   /**< Blend weight for aggregated cost (default 0.3). */
        float threshSmall; /**< Relative depth diff threshold for small step (default 0.01). */
        int32_t yOffset;   // NOTE(review): presumably the row offset for tiled dispatches - confirm against the shader
    };

    // Compile-time guard against accidental layout changes.
    static_assert(sizeof(SGMPushConstants) == 48, "SGMPushConstants must be 48 bytes to match the GLSL push constant block");


    /**
     * GPU buffer cache for reuse across multiple estimateDepthMap calls.
     *
     * Members are declared in their original order so construction,
     * destruction and aggregate initialization order are unchanged.
     */
    struct PatchMatchGpuCache
    {
        DynamicPointer<VulkanComputeBuffer> planes_buf;
        DynamicPointer<VulkanComputeBuffer> costs_buf;
        DynamicPointer<VulkanComputeBuffer> views_buf;
        DynamicPointer<VulkanComputeBuffer> rand_buf;
        DynamicPointer<VulkanComputeBuffer> camera_buf;
        DynamicPointer<VulkanComputeBuffer> image_buf;
        DynamicPointer<VulkanComputeBuffer> low_depth_buf;

        // NOTE(review): presumably the pixel/view counts the buffers above were sized for - confirm in the .cpp
        uint04 pixel_count = 0;
        uint04 n_views = 0;

        bool allocated = false; // starts false; NOTE(review): presumably set once the buffers exist - confirm
    };


    class VULKAN_COMPUTE_API VulkanPatchMatch

    {

    public:

        static bool IsAvailable(LogPtr log);


        VulkanPatchMatch();

        ~VulkanPatchMatch();


        bool isInitialized() const { return m_initialized; }


        bool estimateDepthMap(

            uint04 ref_index,

            const Buffer<uint04>& neighbor_indices,

            const Buffer<PatchMatchCamera>& cameras,

            const Buffer<Buffer<float>>& images,

            const Buffer<int>& image_widths,

            const Buffer<int>& image_heights,

            float depth_min,

            float depth_max,

            uint04 n_estimation_iters,

            uint04 n_init_top_k,

            float threshold_keep_cost,

            const Buffer<float>& initial_planes,

            DepthEstimateResult& result,

            const Buffer<float>& geometric_prior = Buffer<float>(),

            PatchMatchGpuCache* cache = nullptr,

            float confidence_skip = 0.0f);


        static void FilterDepthMap(DepthEstimateResult& result,

            uint04 min_component_size = 16u,

            float depth_rel_tolerance = 0.02f);


        static bool WriteDmap(File file_path,

            const String& image_file_name,

            const Buffer<uint32_t>& view_ids,

            uint32_t image_width, uint32_t image_height,

            const double K[9], const double R[9], const double C[3],

            float depth_min, float depth_max,

            float threshold_keep_cost,

            const DepthEstimateResult& result);


        bool filterGeometricConsistency(

            const PatchMatchCamera& ref_camera,

            const Buffer<PatchMatchCamera>& neighbor_cameras,

            DepthEstimateResult& ref_result,

            const Buffer<DepthEstimateResult>& neighbor_results,

            float depth_diff_threshold,

            float normal_diff_threshold,

            uint04 min_consistent_views);


        void filterDepthMapGpu(DepthEstimateResult& result,

            uint04 min_consistent = 2u,

            float depth_rel_tolerance = 0.02f);


        bool refineDepthsInPlace(

            const Buffer<PatchMatchCamera>& cameras,

            const Buffer<Buffer<float>>& images,

            const Buffer<int>& image_widths,

            const Buffer<int>& image_heights,

            float depth_min, float depth_max,

            uint04 n_refinement_iters,

            float threshold_keep_cost,

            DepthEstimateResult& result,

            PatchMatchGpuCache* cache = nullptr);


        bool refineGeometric(

            uint04 ref_index,

            const Buffer<uint04>& neighbor_indices,

            const Buffer<PatchMatchCamera>& cameras,

            const Buffer<Buffer<float>>& images,

            const Buffer<int>& image_widths,

            const Buffer<int>& image_heights,

            float depth_min, float depth_max,

            uint04 n_refinement_iters,

            uint04 n_init_top_k,

            float threshold_keep_cost,

            DepthEstimateResult& result,

            const Buffer<PatchMatchCamera>& neighbor_cameras_for_geo,

            const Buffer<DepthEstimateResult>& neighbor_depth_maps,

            float depth_diff_threshold,

            float normal_diff_threshold,

            uint04 min_consistent_views,

            PatchMatchGpuCache* cache = nullptr);


    private:

        bool loadShaders();

        void createPipelines();


    private:

        ConstPointer<VulkanComputeDevice> m_compute_device;


        // Compute pipelines (one per shader)

        DynamicPointer<VulkanComputePipeline> m_initialize_pipeline;

        DynamicPointer<VulkanComputePipeline> m_propagate_pipeline;

        DynamicPointer<VulkanComputePipeline> m_filter_pipeline;

        DynamicPointer<VulkanComputePipeline> m_refine_pipeline;

        DynamicPointer<VulkanComputePipeline> m_geo_consistency_pipeline;

        DynamicPointer<VulkanComputePipeline> m_depth_consistency_pipeline;

        DynamicPointer<VulkanComputePipeline> m_median_pipeline;

        DynamicPointer<VulkanComputePipeline> m_sgm_pipeline;


        // SPIR-V shaders

        DynamicPointer<VulkanShader> m_initialize_shader;

        DynamicPointer<VulkanShader> m_propagate_shader;

        DynamicPointer<VulkanShader> m_filter_shader;

        DynamicPointer<VulkanShader> m_refine_shader;

        DynamicPointer<VulkanShader> m_geo_consistency_shader;

        DynamicPointer<VulkanShader> m_depth_consistency_shader;

        DynamicPointer<VulkanShader> m_median_shader;

        DynamicPointer<VulkanShader> m_sgm_shader;


        bool m_initialized = false;

        LogPtr m_log;

    public:

        void setLog(LogPtr log) { m_log = log; }

    };

}


#else // __EMSCRIPTEN__ or no threading


namespace NDEVR

{

    // Stub for platforms without Vulkan support
    class VULKAN_COMPUTE_API VulkanPatchMatch
    {
    public:
        /** Always reports that the Vulkan PatchMatch backend is unavailable. */
        static bool IsAvailable() { return false; }

        /**
         * Accepts (and ignores) a single argument so that calls written against
         * the full class, whose IsAvailable takes a LogPtr, still compile on
         * platforms that only get this stub. Templated so the stub does not
         * depend on the log type being declared here.
         */
        template<class t_log_type>
        static bool IsAvailable(const t_log_type&) { return false; }
    };

}


#endif // !__EMSCRIPTEN__ && NDEVR_SUPPORTS_THREADING

Buffer
The equivalent of std::vector but with a bit more control.
Definition Buffer.hpp:58

DynamicPointer
Provides a modifiable pointer that has shared ownership of a dynamically allocated object.
Definition Pointer.hpp:356

LogPtr
A light-weight wrapper that will be a no-op if there is not a valid log reference,...
Definition ProgressInfo.hpp:102

NDEVR
The primary namespace for the NDEVR SDK.
Definition ArialTileFetcherModule.h:35

uint04
uint32_t uint04
-Defines an alias representing a 4 byte, unsigned integer -Can represent exact integer values 0 throu...
Definition BaseValues.hpp:97

DepthConsistencyPushConstants
Push constants for depth consistency shader.
Definition VulkanPatchMatch.h:135

DepthConsistencyPushConstants::_pad3
float _pad3
Padding for std430 alignment.
Definition VulkanPatchMatch.h:143

DepthConsistencyPushConstants::width
int32_t width
Image width in pixels.
Definition VulkanPatchMatch.h:136

DepthConsistencyPushConstants::height
int32_t height
Image height in pixels.
Definition VulkanPatchMatch.h:137

DepthConsistencyPushConstants::_pad1
float _pad1
Padding for std430 alignment.
Definition VulkanPatchMatch.h:141

DepthConsistencyPushConstants::_pad0
int32_t _pad0
Padding for std430 alignment.
Definition VulkanPatchMatch.h:139

DepthConsistencyPushConstants::_pad6
int32_t _pad6
Padding for std430 alignment.
Definition VulkanPatchMatch.h:147

DepthConsistencyPushConstants::fDepthRelTolerance
float fDepthRelTolerance
Relative depth tolerance for neighbor consistency.
Definition VulkanPatchMatch.h:140

DepthConsistencyPushConstants::nMinConsistent
int32_t nMinConsistent
Minimum consistent 8-neighbors to keep a pixel.
Definition VulkanPatchMatch.h:138

DepthConsistencyPushConstants::_pad2
float _pad2
Padding for std430 alignment.
Definition VulkanPatchMatch.h:142

DepthConsistencyPushConstants::_pad4
int32_t _pad4
Padding for std430 alignment.
Definition VulkanPatchMatch.h:145

DepthConsistencyPushConstants::_pad5
int32_t _pad5
Padding for std430 alignment.
Definition VulkanPatchMatch.h:146

DepthConsistencyPushConstants::yOffset
int32_t yOffset
Row offset for tiled dispatches.
Definition VulkanPatchMatch.h:144

DepthEstimateResult
Result from a single depth estimation pass.
Definition VulkanPatchMatch.h:103

DepthEstimateResult::depth_map
Buffer< float > depth_map
W*H depth values.
Definition VulkanPatchMatch.h:104

DepthEstimateResult::width
int width
Image width in pixels.
Definition VulkanPatchMatch.h:107

DepthEstimateResult::normal_map
Buffer< float > normal_map
W*H*3 normal components.
Definition VulkanPatchMatch.h:105

DepthEstimateResult::height
int height
Image height in pixels.
Definition VulkanPatchMatch.h:108

DepthEstimateResult::confidence_map
Buffer< float > confidence_map
W*H confidence values.
Definition VulkanPatchMatch.h:106

GeometricConsistencyPushConstants
Push constants for geometric consistency shader.
Definition VulkanPatchMatch.h:122

GeometricConsistencyPushConstants::nMinConsistent
int32_t nMinConsistent
Minimum consistent neighbors required to keep a pixel.
Definition VulkanPatchMatch.h:126

GeometricConsistencyPushConstants::fNormalDiffThreshold
float fNormalDiffThreshold
Cosine angle threshold for normal consistency.
Definition VulkanPatchMatch.h:128

GeometricConsistencyPushConstants::height
int32_t height
Image height in pixels.
Definition VulkanPatchMatch.h:124

GeometricConsistencyPushConstants::fDepthDiffThreshold
float fDepthDiffThreshold
Relative depth tolerance for consistency.
Definition VulkanPatchMatch.h:127

GeometricConsistencyPushConstants::yOffset
int32_t yOffset
Row offset for tiled dispatches.
Definition VulkanPatchMatch.h:129

GeometricConsistencyPushConstants::_pad0
int32_t _pad0
Padding for std430 alignment.
Definition VulkanPatchMatch.h:130

GeometricConsistencyPushConstants::width
int32_t width
Image width in pixels.
Definition VulkanPatchMatch.h:123

GeometricConsistencyPushConstants::nNumNeighbors
int32_t nNumNeighbors
Number of neighbor depth maps to check.
Definition VulkanPatchMatch.h:125

MedianFilterPushConstants
Push constants for median filter shader.
Definition VulkanPatchMatch.h:152

MedianFilterPushConstants::height
int32_t height
Image height in pixels.
Definition VulkanPatchMatch.h:154

MedianFilterPushConstants::width
int32_t width
Image width in pixels.
Definition VulkanPatchMatch.h:153

PatchMatchCamera
Per-view camera parameters for GPU-accelerated PatchMatch depth estimation using Vulkan compute shaders.
Definition VulkanPatchMatch.h:68

PatchMatchCamera::R
float R[12]
3x3 rotation (column-major, 3 columns × [3 floats + 1 pad])
Definition VulkanPatchMatch.h:70

PatchMatchCamera::camHeight
int32_t camHeight
Image height.
Definition VulkanPatchMatch.h:73

PatchMatchCamera::_pad0
uint32_t _pad0
Padding to match GLSL std430 array stride (128 bytes).
Definition VulkanPatchMatch.h:75

PatchMatchCamera::pixelOffset
uint32_t pixelOffset
Offset into packed image SSBO.
Definition VulkanPatchMatch.h:74

PatchMatchCamera::K
float K[12]
3x3 intrinsic (column-major, 3 columns × [3 floats + 1 pad])
Definition VulkanPatchMatch.h:69

PatchMatchCamera::C
float C[3]
Camera center (vec3).
Definition VulkanPatchMatch.h:71

PatchMatchCamera::camWidth
int32_t camWidth
Image width (packs into vec3 C's trailing 4 bytes).
Definition VulkanPatchMatch.h:72

PatchMatchCamera::_pad1
uint32_t _pad1
(std430 rounds struct size to 16-byte alignment for arrays)
Definition VulkanPatchMatch.h:76

PatchMatchGpuCache
GPU buffer cache for reuse across multiple estimateDepthMap calls.
Definition VulkanPatchMatch.h:187

PatchMatchPushConstants
Push constant layout (must match GLSL layout exactly).
Definition VulkanPatchMatch.h:82

PatchMatchPushConstants::yOffset
int32_t yOffset
Row offset for tiled dispatches.
Definition VulkanPatchMatch.h:94

PatchMatchPushConstants::nInitTopK
int32_t nInitTopK
Number of top views to select during initialization.
Definition VulkanPatchMatch.h:86

PatchMatchPushConstants::fThresholdKeepCost
float fThresholdKeepCost
Cost threshold for filtering bad matches.
Definition VulkanPatchMatch.h:89

PatchMatchPushConstants::nNumViews
int32_t nNumViews
Number of neighbor views used for matching.
Definition VulkanPatchMatch.h:85

PatchMatchPushConstants::iteration
int32_t iteration
Current PatchMatch iteration index.
Definition VulkanPatchMatch.h:90

PatchMatchPushConstants::fConfidenceSkipThreshold
float fConfidenceSkipThreshold
Skip pixels with cost below this (0 = disabled).
Definition VulkanPatchMatch.h:95

PatchMatchPushConstants::width
int32_t width
Image width in pixels.
Definition VulkanPatchMatch.h:83

PatchMatchPushConstants::_pcPad1
int32_t _pcPad1
Padding for std430 alignment.
Definition VulkanPatchMatch.h:97

PatchMatchPushConstants::isRedPass
int32_t isRedPass
Whether this is the red (1) or black (0) checkerboard pass.
Definition VulkanPatchMatch.h:91

PatchMatchPushConstants::nEstimationIters
int32_t nEstimationIters
Total number of PatchMatch iterations to perform.
Definition VulkanPatchMatch.h:92

PatchMatchPushConstants::bLowResProcessed
int32_t bLowResProcessed
Whether a low-resolution prior has been applied.
Definition VulkanPatchMatch.h:93

PatchMatchPushConstants::fDepthMin
float fDepthMin
Minimum depth bound.
Definition VulkanPatchMatch.h:87

PatchMatchPushConstants::fDepthMax
float fDepthMax
Maximum depth bound.
Definition VulkanPatchMatch.h:88

PatchMatchPushConstants::_pcPad0
int32_t _pcPad0
Padding for std430 alignment.
Definition VulkanPatchMatch.h:96

PatchMatchPushConstants::_pcPad2
int32_t _pcPad2
Padding for std430 alignment.
Definition VulkanPatchMatch.h:98

PatchMatchPushConstants::height
int32_t height
Image height in pixels.
Definition VulkanPatchMatch.h:84

SGMPushConstants
Push constants for SGM directional cost aggregation shader.
Definition VulkanPatchMatch.h:169

SGMPushConstants::maxRange
int32_t maxRange
Max scanline walk distance (default 64).
Definition VulkanPatchMatch.h:172

SGMPushConstants::threshSmall
float threshSmall
Relative depth diff threshold for small step (default 0.01).
Definition VulkanPatchMatch.h:180

SGMPushConstants::P2
float P2
Large depth step penalty (default 0.08).
Definition VulkanPatchMatch.h:177

SGMPushConstants::sgmWeight
float sgmWeight
Blend weight for aggregated cost (default 0.3).
Definition VulkanPatchMatch.h:179

SGMPushConstants::decay
float decay
Per-step penalty decay (default 0.92).
Definition VulkanPatchMatch.h:178

SGMPushConstants::P1
float P1
Small depth step penalty (default 0.02).
Definition VulkanPatchMatch.h:176