image_framework_ymj/include/open3d/t/geometry/VoxelBlockGrid.h

// ----------------------------------------------------------------------------
// -                        Open3D: www.open3d.org                            -
// ----------------------------------------------------------------------------
// Copyright (c) 2018-2023 www.open3d.org
// SPDX-License-Identifier: MIT
// ----------------------------------------------------------------------------

#pragma once

#include "open3d/core/Tensor.h"
#include "open3d/core/hashmap/HashMap.h"
#include "open3d/t/geometry/Geometry.h"
#include "open3d/t/geometry/Image.h"
#include "open3d/t/geometry/PointCloud.h"
#include "open3d/t/geometry/TensorMap.h"
#include "open3d/t/geometry/TriangleMesh.h"

namespace open3d {
namespace t {
namespace geometry {

/// A voxel block grid is a sparse grid of voxel blocks.
/// Each voxel block is a dense 3D array, preserving local data distribution.
/// If the block_resolution is set to 1, then the VoxelBlockGrid degenerates to
/// a sparse voxel grid.
class VoxelBlockGrid {
public:
    VoxelBlockGrid() = default;

    /// \brief Default Constructor.
    /// Example:
    /// VoxelBlockGrid({"tsdf", "weight", "color"},
    ///                {core::Float32, core::UInt16, core::UInt16},
    ///                {{1}, {1}, {3}},
    ///                0.005,
    ///                16,
    ///                10000,
    ///                core::Device("CUDA:0"),
    ///                core::HashBackendType::Default);
    VoxelBlockGrid(const std::vector<std::string> &attr_names,
                   const std::vector<core::Dtype> &attr_dtypes,
                   const std::vector<core::SizeVector> &attr_channels,
                   float voxel_size = 0.0058,
                   int64_t block_resolution = 16,
                   int64_t block_count = 10000,
                   const core::Device &device = core::Device("CPU:0"),
                   const core::HashBackendType &backend =
                           core::HashBackendType::Default);

    /// Get the underlying hash map that stores values in structure of arrays
    /// (SoA).
    core::HashMap GetHashMap() { return *block_hashmap_; }

    /// Get the attribute tensor corresponding to the attribute name.
    /// A sugar for hashmap.GetValueTensor(i)
    core::Tensor GetAttribute(const std::string &attr_name) const;

    /// Get a (4, N), Int64 index tensor for active voxels, used for advanced
    /// indexing.
    /// Returned index tensor can access selected value buffers in order of
    /// (buf_index, index_voxel_x, index_voxel_y, index_voxel_z).
    ///
    /// Example:
    /// For a voxel block grid with (2, 2, 2) block resolution,
    /// if the active block coordinates are at buffer index {(2, 4)} given by
    /// GetActiveIndices() from the underlying hash map,
    /// the returned result will be a (4, 2 x 8) tensor:
    /// {
    /// (2, 0, 0, 0), (2, 1, 0, 0), (2, 0, 1, 0), (2, 1, 1, 0),
    /// (2, 0, 0, 1), (2, 1, 0, 1), (2, 0, 1, 1), (2, 1, 1, 1),
    /// (4, 0, 0, 0), (4, 1, 0, 0), (4, 0, 1, 0), (4, 1, 1, 0),
    /// (4, 0, 0, 1), (4, 1, 0, 1), (4, 0, 1, 1), (4, 1, 1, 1),
    /// }
    /// Note: the slicing order is z-y-x.
    core::Tensor GetVoxelIndices(const core::Tensor &buf_indices) const;

    /// Get all active voxel indices.
    core::Tensor GetVoxelIndices() const;

    /// Get a (3, hashmap.Size() * resolution^3) coordinate tensor of active
    /// voxels per block, used for geometry transformation jointly with
    /// indices from GetVoxelIndices.
    ///
    /// Example:
    /// For a voxel block grid with (2, 2, 2) block resolution,
    /// if the active block coordinates are {(-1, 3, 2), (0, 2, 4)},
    /// the returned result will be a (3, 2 x 8) tensor given by:
    /// {
    /// key_tensor[voxel_indices[0]] * block_resolution_ + voxel_indices[1]
    /// key_tensor[voxel_indices[0]] * block_resolution_ + voxel_indices[2]
    /// key_tensor[voxel_indices[0]] * block_resolution_ + voxel_indices[3]
    /// }
    /// Note: the coordinates are VOXEL COORDINATES in Int64. To access metric
    /// coordinates, multiply by voxel size.
    core::Tensor GetVoxelCoordinates(const core::Tensor &voxel_indices) const;

    /// Accelerated combination of GetVoxelIndices and GetVoxelCoordinates.
    /// Returns a (N, 3) coordinate in float, and a (N, ) flattened index
    /// tensor, where N is the number of active voxels located at buf_indices.
    std::pair<core::Tensor, core::Tensor>
    GetVoxelCoordinatesAndFlattenedIndices(const core::Tensor &buf_indices);

    /// Same as above, but N is the number of all the active voxels with blocks
    /// stored in the hash map.
    std::pair<core::Tensor, core::Tensor>
    GetVoxelCoordinatesAndFlattenedIndices();

    /// Get a (3, M) active block coordinates from a depth image, with potential
    /// duplicates removed.
    /// Note: these coordinates are not activated in the internal sparse voxel
    /// block. They need to be inserted in the hash map.
    core::Tensor GetUniqueBlockCoordinates(const Image &depth,
                                           const core::Tensor &intrinsic,
                                           const core::Tensor &extrinsic,
                                           float depth_scale = 1000.0f,
                                           float depth_max = 3.0f,
                                           float trunc_voxel_multiplier = 8.0);

    /// Obtain active block coordinates from a point cloud.
    core::Tensor GetUniqueBlockCoordinates(const PointCloud &pcd,
                                           float trunc_voxel_multiplier = 8.0);

    /// Specific operation for TSDF volumes.
    /// Integrate an RGB-D frame in the selected block coordinates using pinhole
    /// camera model.
    /// For built-in kernels, we support efficient hash map types for SLAM:
    /// tsdf: float, weight: uint16_t, color: uint16_t
    /// and accurate mode for differentiable rendering:
    /// tsdf/weight/color: float
    /// We assume input data are either raw:
    /// depth: uint16_t, color: uint8_t
    /// or depth/color: float.
    /// To support other types and properties, users should combine
    /// GetUniqueBlockCoordinates, GetVoxelIndices, and GetVoxelCoordinates,
    /// with self-defined operations.
    void Integrate(const core::Tensor &block_coords,
                   const Image &depth,
                   const Image &color,
                   const core::Tensor &depth_intrinsic,
                   const core::Tensor &color_intrinsic,
                   const core::Tensor &extrinsic,
                   float depth_scale = 1000.0f,
                   float depth_max = 3.0f,
                   float trunc_voxel_multiplier = 8.0f);

    /// Specific operation for TSDF volumes.
    /// Similar to RGB-D integration, but uses the same intrinsics for depth and
    /// color.
    void Integrate(const core::Tensor &block_coords,
                   const Image &depth,
                   const Image &color,
                   const core::Tensor &intrinsic,
                   const core::Tensor &extrinsic,
                   float depth_scale = 1000.0f,
                   float depth_max = 3.0f,
                   float trunc_voxel_multiplier = 8.0f);

    /// Specific operation for TSDF volumes.
    /// Similar to RGB-D integration, but only applied to depth.
    void Integrate(const core::Tensor &block_coords,
                   const Image &depth,
                   const core::Tensor &intrinsic,
                   const core::Tensor &extrinsic,
                   float depth_scale = 1000.0f,
                   float depth_max = 3.0f,
                   float trunc_voxel_multiplier = 8.0f);

    /// Specific operation for TSDF volumes.
    /// Perform volumetric ray casting in the selected block coordinates.
    /// Return selected properties from the frame.
    /// Supported attributes:
    /// Conventional rendering: vertex, depth, color, normal, range
    /// Differentiable rendering (voxel-wise): mask, index, (interpolation)
    /// ratio.
    /// The block coordinates in the frustum can be taken from
    /// GetUniqueBlockCoordinates.
    /// All the block coordinates can be taken from GetHashMap().GetKeyTensor().
    TensorMap RayCast(const core::Tensor &block_coords,
                      const core::Tensor &intrinsic,
                      const core::Tensor &extrinsic,
                      int width,
                      int height,
                      const std::vector<std::string> attrs = {"depth", "color"},
                      float depth_scale = 1000.0f,
                      float depth_min = 0.1f,
                      float depth_max = 3.0f,
                      float weight_threshold = 3.0f,
                      float trunc_voxel_multiplier = 8.0f,
                      int range_map_down_factor = 8);

    /// Specific operation for TSDF volumes.
    /// Extract point cloud at isosurface points.
    /// Weight threshold is used to filter outliers. By default we use 3.0,
    /// where we assume a reliable surface point comes from the fusion of at
    /// least 3 viewpoints. Use as low as 0.0 to accept all the possible
    /// observations.
    /// Estimated point numbers optionally speeds up the process by a one-pass
    /// extraction with pre-allocated buffers. Use -1 when no estimate is
    /// available.
    PointCloud ExtractPointCloud(float weight_threshold = 3.0f,
                                 int estimated_point_number = -1);

    /// Specific operation for TSDF volumes.
    /// Extract mesh near iso-surfaces with Marching Cubes.
    /// Weight threshold is used to filter outliers. By default we use 3.0,
    /// where we assume a reliable surface point comes from the fusion of at
    /// least 3 viewpoints. Use as low as 0.0 to accept all the possible
    /// observations.
    /// Estimated point numbers optionally speeds up the process by a one-pass
    /// extraction with pre-allocated buffers. Use -1 when no estimate is
    /// available.
    TriangleMesh ExtractTriangleMesh(float weight_threshold = 3.0f,
                                     int estimated_vertex_numer = -1);

    /// Save a voxel block grid to a .npz file.
    void Save(const std::string &file_name) const;

    /// Load a voxel block grid from a .npz file.
    static VoxelBlockGrid Load(const std::string &file_name);

    /// Convert the hash map to another device.
    VoxelBlockGrid To(const core::Device &device, bool copy = false) const;

private:
    void AssertInitialized() const;

    VoxelBlockGrid(float voxelSize,
                   int64_t blockResolution,
                   const std::shared_ptr<core::HashMap> &blockHashmap,
                   const std::unordered_map<std::string, int> &nameAttrMap)
        : voxel_size_(voxelSize),
          block_resolution_(blockResolution),
          block_hashmap_(blockHashmap),
          name_attr_map_(nameAttrMap) {}

    float voxel_size_ = -1;
    int64_t block_resolution_ = -1;

    // Global hash map: 3D coords -> voxel blocks in SoA.
    std::shared_ptr<core::HashMap> block_hashmap_;

    // Local hash map: 3D coords -> indices in block_hashmap_.
    std::shared_ptr<core::HashMap> frustum_hashmap_;

    // Map: attribute name -> index to access the attribute in SoA.
    std::unordered_map<std::string, int> name_attr_map_;

    // Allocated fragment buffer for reuse in depth estimation
    core::Tensor fragment_buffer_;
};
}  // namespace geometry
}  // namespace t
}  // namespace open3d
init 2024-12-06 16:25:16 +08:00			`// ----------------------------------------------------------------------------`
			`// - Open3D: www.open3d.org -`
			`// ----------------------------------------------------------------------------`
			`// Copyright (c) 2018-2023 www.open3d.org`
			`// SPDX-License-Identifier: MIT`
			`// ----------------------------------------------------------------------------`

			`#pragma once`

			`#include "open3d/core/Tensor.h"`
			`#include "open3d/core/hashmap/HashMap.h"`
			`#include "open3d/t/geometry/Geometry.h"`
			`#include "open3d/t/geometry/Image.h"`
			`#include "open3d/t/geometry/PointCloud.h"`
			`#include "open3d/t/geometry/TensorMap.h"`
			`#include "open3d/t/geometry/TriangleMesh.h"`

			`namespace open3d {`
			`namespace t {`
			`namespace geometry {`

			`/// A voxel block grid is a sparse grid of voxel blocks.`
			`/// Each voxel block is a dense 3D array, preserving local data distribution.`
			`/// If the block_resolution is set to 1, then the VoxelBlockGrid degenerates to`
			`/// a sparse voxel grid.`
			`class VoxelBlockGrid {`
			`public:`
			`VoxelBlockGrid() = default;`

			`/// \brief Default Constructor.`
			`/// Example:`
			`/// VoxelBlockGrid({"tsdf", "weight", "color"},`
			`/// {core::Float32, core::UInt16, core::UInt16},`
			`/// {{1}, {1}, {3}},`
			`/// 0.005,`
			`/// 16,`
			`/// 10000,`
			`/// core::Device("CUDA:0"),`
			`/// core::HashBackendType::Default);`
			`VoxelBlockGrid(const std::vector<std::string> &attr_names,`
			`const std::vector<core::Dtype> &attr_dtypes,`
			`const std::vector<core::SizeVector> &attr_channels,`
			`float voxel_size = 0.0058,`
			`int64_t block_resolution = 16,`
			`int64_t block_count = 10000,`
			`const core::Device &device = core::Device("CPU:0"),`
			`const core::HashBackendType &backend =`
			`core::HashBackendType::Default);`

			`/// Get the underlying hash map that stores values in structure of arrays`
			`/// (SoA).`
			`core::HashMap GetHashMap() { return *block_hashmap_; }`

			`/// Get the attribute tensor corresponding to the attribute name.`
			`/// A sugar for hashmap.GetValueTensor(i)`
			`core::Tensor GetAttribute(const std::string &attr_name) const;`

			`/// Get a (4, N), Int64 index tensor for active voxels, used for advanced`
			`/// indexing.`
			`/// Returned index tensor can access selected value buffers in order of`
			`/// (buf_index, index_voxel_x, index_voxel_y, index_voxel_z).`
			`///`
			`/// Example:`
			`/// For a voxel block grid with (2, 2, 2) block resolution,`
			`/// if the active block coordinates are at buffer index {(2, 4)} given by`
			`/// GetActiveIndices() from the underlying hash map,`
			`/// the returned result will be a (4, 2 x 8) tensor:`
			`/// {`
			`/// (2, 0, 0, 0), (2, 1, 0, 0), (2, 0, 1, 0), (2, 1, 1, 0),`
			`/// (2, 0, 0, 1), (2, 1, 0, 1), (2, 0, 1, 1), (2, 1, 1, 1),`
			`/// (4, 0, 0, 0), (4, 1, 0, 0), (4, 0, 1, 0), (4, 1, 1, 0),`
			`/// (4, 0, 0, 1), (4, 1, 0, 1), (4, 0, 1, 1), (4, 1, 1, 1),`
			`/// }`
			`/// Note: the slicing order is z-y-x.`
			`core::Tensor GetVoxelIndices(const core::Tensor &buf_indices) const;`

			`/// Get all active voxel indices.`
			`core::Tensor GetVoxelIndices() const;`

			`/// Get a (3, hashmap.Size() * resolution^3) coordinate tensor of active`
			`/// voxels per block, used for geometry transformation jointly with`
			`/// indices from GetVoxelIndices.`
			`///`
			`/// Example:`
			`/// For a voxel block grid with (2, 2, 2) block resolution,`
			`/// if the active block coordinates are {(-1, 3, 2), (0, 2, 4)},`
			`/// the returned result will be a (3, 2 x 8) tensor given by:`
			`/// {`
			`/// key_tensor[voxel_indices[0]] * block_resolution_ + voxel_indices[1]`
			`/// key_tensor[voxel_indices[0]] * block_resolution_ + voxel_indices[2]`
			`/// key_tensor[voxel_indices[0]] * block_resolution_ + voxel_indices[3]`
			`/// }`
			`/// Note: the coordinates are VOXEL COORDINATES in Int64. To access metric`
			`/// coordinates, multiply by voxel size.`
			`core::Tensor GetVoxelCoordinates(const core::Tensor &voxel_indices) const;`

			`/// Accelerated combination of GetVoxelIndices and GetVoxelCoordinates.`
			`/// Returns a (N, 3) coordinate in float, and a (N, ) flattened index`
			`/// tensor, where N is the number of active voxels located at buf_indices.`
			`std::pair<core::Tensor, core::Tensor>`
			`GetVoxelCoordinatesAndFlattenedIndices(const core::Tensor &buf_indices);`

			`/// Same as above, but N is the number of all the active voxels with blocks`
			`/// stored in the hash map.`
			`std::pair<core::Tensor, core::Tensor>`
			`GetVoxelCoordinatesAndFlattenedIndices();`

			`/// Get a (3, M) active block coordinates from a depth image, with potential`
			`/// duplicates removed.`
			`/// Note: these coordinates are not activated in the internal sparse voxel`
			`/// block. They need to be inserted in the hash map.`
			`core::Tensor GetUniqueBlockCoordinates(const Image &depth,`
			`const core::Tensor &intrinsic,`
			`const core::Tensor &extrinsic,`
			`float depth_scale = 1000.0f,`
			`float depth_max = 3.0f,`
			`float trunc_voxel_multiplier = 8.0);`

			`/// Obtain active block coordinates from a point cloud.`
			`core::Tensor GetUniqueBlockCoordinates(const PointCloud &pcd,`
			`float trunc_voxel_multiplier = 8.0);`

			`/// Specific operation for TSDF volumes.`
			`/// Integrate an RGB-D frame in the selected block coordinates using pinhole`
			`/// camera model.`
			`/// For built-in kernels, we support efficient hash map types for SLAM:`
			`/// tsdf: float, weight: uint16_t, color: uint16_t`
			`/// and accurate mode for differentiable rendering:`
			`/// tsdf/weight/color: float`
			`/// We assume input data are either raw:`
			`/// depth: uint16_t, color: uint8_t`
			`/// or depth/color: float.`
			`/// To support other types and properties, users should combine`
			`/// GetUniqueBlockCoordinates, GetVoxelIndices, and GetVoxelCoordinates,`
			`/// with self-defined operations.`
			`void Integrate(const core::Tensor &block_coords,`
			`const Image &depth,`
			`const Image &color,`
			`const core::Tensor &depth_intrinsic,`
			`const core::Tensor &color_intrinsic,`
			`const core::Tensor &extrinsic,`
			`float depth_scale = 1000.0f,`
			`float depth_max = 3.0f,`
			`float trunc_voxel_multiplier = 8.0f);`

			`/// Specific operation for TSDF volumes.`
			`/// Similar to RGB-D integration, but uses the same intrinsics for depth and`
			`/// color.`
			`void Integrate(const core::Tensor &block_coords,`
			`const Image &depth,`
			`const Image &color,`
			`const core::Tensor &intrinsic,`
			`const core::Tensor &extrinsic,`
			`float depth_scale = 1000.0f,`
			`float depth_max = 3.0f,`
			`float trunc_voxel_multiplier = 8.0f);`

			`/// Specific operation for TSDF volumes.`
			`/// Similar to RGB-D integration, but only applied to depth.`
			`void Integrate(const core::Tensor &block_coords,`
			`const Image &depth,`
			`const core::Tensor &intrinsic,`
			`const core::Tensor &extrinsic,`
			`float depth_scale = 1000.0f,`
			`float depth_max = 3.0f,`
			`float trunc_voxel_multiplier = 8.0f);`

			`/// Specific operation for TSDF volumes.`
			`/// Perform volumetric ray casting in the selected block coordinates.`
			`/// Return selected properties from the frame.`
			`/// Supported attributes:`
			`/// Conventional rendering: vertex, depth, color, normal, range`
			`/// Differentiable rendering (voxel-wise): mask, index, (interpolation)`
			`/// ratio.`
			`/// The block coordinates in the frustum can be taken from`
			`/// GetUniqueBlockCoordinates.`
			`/// All the block coordinates can be taken from GetHashMap().GetKeyTensor().`
			`TensorMap RayCast(const core::Tensor &block_coords,`
			`const core::Tensor &intrinsic,`
			`const core::Tensor &extrinsic,`
			`int width,`
			`int height,`
			`const std::vector<std::string> attrs = {"depth", "color"},`
			`float depth_scale = 1000.0f,`
			`float depth_min = 0.1f,`
			`float depth_max = 3.0f,`
			`float weight_threshold = 3.0f,`
			`float trunc_voxel_multiplier = 8.0f,`
			`int range_map_down_factor = 8);`

			`/// Specific operation for TSDF volumes.`
			`/// Extract point cloud at isosurface points.`
			`/// Weight threshold is used to filter outliers. By default we use 3.0,`
			`/// where we assume a reliable surface point comes from the fusion of at`
			`/// least 3 viewpoints. Use as low as 0.0 to accept all the possible`
			`/// observations.`
			`/// Estimated point numbers optionally speeds up the process by a one-pass`
			`/// extraction with pre-allocated buffers. Use -1 when no estimate is`
			`/// available.`
			`PointCloud ExtractPointCloud(float weight_threshold = 3.0f,`
			`int estimated_point_number = -1);`

			`/// Specific operation for TSDF volumes.`
			`/// Extract mesh near iso-surfaces with Marching Cubes.`
			`/// Weight threshold is used to filter outliers. By default we use 3.0,`
			`/// where we assume a reliable surface point comes from the fusion of at`
			`/// least 3 viewpoints. Use as low as 0.0 to accept all the possible`
			`/// observations.`
			`/// Estimated point numbers optionally speeds up the process by a one-pass`
			`/// extraction with pre-allocated buffers. Use -1 when no estimate is`
			`/// available.`
			`TriangleMesh ExtractTriangleMesh(float weight_threshold = 3.0f,`
			`int estimated_vertex_numer = -1);`

			`/// Save a voxel block grid to a .npz file.`
			`void Save(const std::string &file_name) const;`

			`/// Load a voxel block grid from a .npz file.`
			`static VoxelBlockGrid Load(const std::string &file_name);`

			`/// Convert the hash map to another device.`
			`VoxelBlockGrid To(const core::Device &device, bool copy = false) const;`

			`private:`
			`void AssertInitialized() const;`

			`VoxelBlockGrid(float voxelSize,`
			`int64_t blockResolution,`
			`const std::shared_ptr<core::HashMap> &blockHashmap,`
			`const std::unordered_map<std::string, int> &nameAttrMap)`
			`: voxel_size_(voxelSize),`
			`block_resolution_(blockResolution),`
			`block_hashmap_(blockHashmap),`
			`name_attr_map_(nameAttrMap) {}`

			`float voxel_size_ = -1;`
			`int64_t block_resolution_ = -1;`

			`// Global hash map: 3D coords -> voxel blocks in SoA.`
			`std::shared_ptr<core::HashMap> block_hashmap_;`

			`// Local hash map: 3D coords -> indices in block_hashmap_.`
			`std::shared_ptr<core::HashMap> frustum_hashmap_;`

			`// Map: attribute name -> index to access the attribute in SoA.`
			`std::unordered_map<std::string, int> name_attr_map_;`

			`// Allocated fragment buffer for reuse in depth estimation`
			`core::Tensor fragment_buffer_;`
			`};`
			`} // namespace geometry`
			`} // namespace t`
			`} // namespace open3d`