cppapi/_voxelize_8h_source.html

 // ----------------------------------------------------------------------------

 // -                        Open3D: www.open3d.org                            -

 // ----------------------------------------------------------------------------

 // Copyright (c) 2018-2023 www.open3d.org

 // SPDX-License-Identifier: MIT

 // ----------------------------------------------------------------------------


 #pragma once


 #include <tbb/parallel_for.h>
 #include <tbb/parallel_sort.h>

 #include <algorithm>
 #include <cstddef>
 #include <cstdint>
 #include <utility>
 #include <vector>

 #include "open3d/core/Atomic.h"
 #include "open3d/utility/MiniVec.h"
 #include "open3d/utility/ParallelScan.h"


 namespace open3d {

 namespace ml {

 namespace impl {


 /// Voxelizes a batch of point sets on the CPU.
 ///
 /// Every point that lies inside the closed box
 /// [points_range_min, points_range_max] is binned into a regular grid whose
 /// cells have the edge lengths given by voxel_size. Points outside the box are
 /// ignored. For each batch item at most max_voxels voxels are emitted, in
 /// ascending order of their linearized grid index, and every emitted voxel
 /// lists at most max_points_per_voxel point indices in ascending order.
 ///
 /// Points located exactly on points_range_max are assigned to the last voxel
 /// along the affected axis, so that the reported voxel coordinates always lie
 /// inside the grid and never alias a voxel of another row or batch item.
 ///
 /// \tparam T                 Scalar type of the point coordinates.
 /// \tparam NDIM              Number of coordinates per point.
 /// \tparam OUTPUT_ALLOCATOR  Type providing AllocVoxelBatchSplits(),
 ///         AllocVoxelCoords(), AllocVoxelPointRowSplits() and
 ///         AllocVoxelPointIndices(); each receives the address of an output
 ///         pointer followed by the requested size(s).
 ///
 /// \param num_points            Number of points stored in \p points.
 /// \param points                Point coordinates; point i occupies the
 ///        elements [i * NDIM, (i + 1) * NDIM).
 /// \param batch_size            Number of batch items.
 /// \param row_splits            Array with batch_size + 1 entries; the points
 ///        with index in [row_splits[b], row_splits[b + 1]) belong to batch
 ///        item b.
 /// \param voxel_size            Per-axis edge length of a voxel.
 /// \param points_range_min      Per-axis lower bound of the voxelized domain.
 /// \param points_range_max      Per-axis upper bound of the voxelized domain.
 /// \param max_points_per_voxel  Upper limit for the number of point indices
 ///        stored per voxel.
 /// \param max_voxels            Upper limit for the number of voxels emitted
 ///        per batch item.
 /// \param output_allocator      Receives the four output arrays:
 ///        batch splits (batch_size + 1 prefix sums of voxels per batch item),
 ///        voxel coords (total_voxels x NDIM, int32), voxel point row splits
 ///        (total_voxels + 1 prefix sums) and the flat list of point indices.
 template <class T, int NDIM, class OUTPUT_ALLOCATOR>
 void VoxelizeCPU(const size_t num_points,
                  const T* const points,
                  const size_t batch_size,
                  const int64_t* const row_splits,
                  const T* const voxel_size,
                  const T* const points_range_min,
                  const T* const points_range_max,
                  const int64_t max_points_per_voxel,
                  const int64_t max_voxels,
                  OUTPUT_ALLOCATOR& output_allocator) {
     using namespace open3d::utility;
     using Vec_t = MiniVec<T, NDIM>;

     // Signed copies of the sizes; all loop counters below are int64_t and
     // this avoids mixed signed/unsigned comparisons.
     const int64_t num_points_i = static_cast<int64_t>(num_points);
     const int64_t num_batches = static_cast<int64_t>(batch_size);

     const Vec_t inv_voxel_size = T(1) / Vec_t(voxel_size);
     const Vec_t points_range_min_vec(points_range_min);
     const Vec_t points_range_max_vec(points_range_max);

     // Number of voxels along each axis and the strides used to linearize a
     // voxel coordinate (axis 0 is the fastest varying one).
     MiniVec<int32_t, NDIM> extents =
             ceil((points_range_max_vec - points_range_min_vec) * inv_voxel_size)
                     .template cast<int32_t>();
     MiniVec<int64_t, NDIM> strides;
     for (int i = 0; i < NDIM; ++i) {
         strides[i] = 1;
         for (int j = 0; j < i; ++j) {
             strides[i] *= extents[j];
         }
     }
     // Number of grid cells of one batch item. Hashes of batch item b live in
     // [b * batch_hash, (b + 1) * batch_hash).
     const int64_t batch_hash = strides[NDIM - 1] * extents[NDIM - 1];
     // Hash assigned to points outside the range; it is larger than every
     // valid hash, so invalid points end up at the back after sorting.
     const int64_t invalid_hash = batch_hash * num_batches;

     // Batch item index for every point.
     std::vector<int64_t> indices_batches(num_points, 0);
     tbb::parallel_for(tbb::blocked_range<int64_t>(0, num_batches),
                       [&](const tbb::blocked_range<int64_t>& r) {
                           for (int64_t i = r.begin(); i != r.end(); ++i) {
                               for (int64_t idx = row_splits[i];
                                    idx < row_splits[i + 1]; ++idx) {
                                   indices_batches[idx] = i;
                               }
                           }
                       });

     // Integer voxel coordinate of a point that lies inside the range.
     auto CoordFn = [&](const Vec_t& point) {
         auto coords = ((point - points_range_min_vec) * inv_voxel_size)
                               .template cast<int64_t>();
         // A point on the upper boundary (or one pushed there by rounding)
         // yields coords[d] == extents[d], which is outside the grid and would
         // alias another voxel or another batch item in the linear hash.
         // Clamp it into the last voxel of that axis.
         for (int d = 0; d < NDIM; ++d) {
             const int64_t last = static_cast<int64_t>(extents[d]) - 1;
             if (last >= 0 && coords[d] > last) {
                 coords[d] = last;
             }
         }
         return coords;
     };

     // Linearized voxel index including the batch offset, or invalid_hash for
     // points outside of the range.
     auto HashFn = [&](const Vec_t& point, const int64_t& idx) {
         if ((point >= points_range_min_vec && point <= points_range_max_vec)
                     .all()) {
             auto coords = CoordFn(point);
             int64_t hash = coords.dot(strides);
             hash += indices_batches[idx] * batch_hash;
             return hash;
         }
         return invalid_hash;
     };

     // (hash, point index) pairs; sorting them groups the points by voxel and
     // orders the points of a voxel by index.
     std::vector<std::pair<int64_t, int64_t>> hashes_indices(num_points);
     std::vector<uint64_t> num_voxels(batch_size, 0);

     tbb::parallel_for(tbb::blocked_range<int64_t>(0, num_points_i),
                       [&](const tbb::blocked_range<int64_t>& r) {
                           for (int64_t i = r.begin(); i != r.end(); ++i) {
                               Vec_t pos(points + NDIM * i);
                               hashes_indices[i].first = HashFn(pos, i);
                               hashes_indices[i].second = i;
                           }
                       });

     tbb::parallel_sort(hashes_indices);

     // Count the distinct voxels of every batch item. If the grid has no
     // cells (batch_hash <= 0) there cannot be any voxel, and the division by
     // batch_hash below would be a division by zero, so the pass is skipped.
     if (batch_hash > 0) {
         tbb::parallel_for(
                 tbb::blocked_range<int64_t>(0, num_points_i),
                 [&](const tbb::blocked_range<int64_t>& r) {
                     for (int64_t i = r.begin(); i != r.end(); ++i) {
                         const int64_t batch_id =
                                 hashes_indices[i].first / batch_hash;
                         // Sorted order: once an invalid hash is seen all
                         // following entries are invalid as well.
                         if (batch_id >= num_batches) break;
                         if (i == 0) {
                             core::AtomicFetchAddRelaxed(&num_voxels[batch_id],
                                                         1);
                             continue;
                         }
                         const int64_t batch_id_prev =
                                 hashes_indices[i - 1].first / batch_hash;
                         // A voxel starts wherever the hash (or the batch
                         // item) differs from the predecessor.
                         if ((batch_id != batch_id_prev) ||
                             (hashes_indices[i].first !=
                              hashes_indices[i - 1].first)) {
                             core::AtomicFetchAddRelaxed(&num_voxels[batch_id],
                                                         1);
                         }
                     }
                 });
     }

     // Apply the per batch item voxel limit.
     tbb::parallel_for(
             tbb::blocked_range<int64_t>(0, num_batches),
             [&](const tbb::blocked_range<int64_t>& r) {
                 for (int64_t i = r.begin(); i != r.end(); ++i) {
                     num_voxels[i] = std::min(
                             static_cast<int64_t>(num_voxels[i]), max_voxels);
                 }
             });

     int64_t* out_batch_splits = nullptr;
     output_allocator.AllocVoxelBatchSplits(&out_batch_splits, batch_size + 1);
     out_batch_splits[0] = 0;

     // prefix sum for batch_splits
     for (int64_t i = 1; i < num_batches + 1; ++i) {
         out_batch_splits[i] = out_batch_splits[i - 1] + num_voxels[i - 1];
     }

     const uint64_t total_voxels = out_batch_splits[num_batches];
     const int64_t num_out_voxels = static_cast<int64_t>(total_voxels);

     int32_t* out_voxel_coords = nullptr;
     output_allocator.AllocVoxelCoords(&out_voxel_coords, total_voxels, NDIM);

     int64_t* out_voxel_row_splits = nullptr;
     output_allocator.AllocVoxelPointRowSplits(&out_voxel_row_splits,
                                               total_voxels + 1);

     std::vector<int64_t> tmp_point_indices;
     {
         int64_t hash_i = 0;  // index into the vector hashes_indices
         for (int64_t voxel_i = 0; voxel_i < num_out_voxels; ++voxel_i) {
             // compute voxel coord and the prefix sum value
             const auto coord = CoordFn(
                     Vec_t(points + hashes_indices[hash_i].second * NDIM));
             for (int d = 0; d < NDIM; ++d) {
                 out_voxel_coords[voxel_i * NDIM + d] =
                         static_cast<int32_t>(coord[d]);
             }
             out_voxel_row_splits[voxel_i] =
                     static_cast<int64_t>(tmp_point_indices.size());

             // add up to max_points_per_voxel indices for this voxel
             int64_t points_per_voxel = 0;
             const int64_t current_hash = hashes_indices[hash_i].first;
             const int64_t batch_id = current_hash / batch_hash;
             // num_voxels now serves as the countdown of voxels that may
             // still be emitted for this batch item.
             num_voxels[batch_id]--;
             for (; hash_i < num_points_i; ++hash_i) {
                 if (current_hash != hashes_indices[hash_i].first) {
                     // new voxel starts -> break
                     break;
                 }
                 if (points_per_voxel < max_points_per_voxel) {
                     tmp_point_indices.push_back(hashes_indices[hash_i].second);
                     ++points_per_voxel;
                 }
             }

             // skip voxels exceeding max_voxel
             if (num_voxels[batch_id] == 0) {
                 for (; hash_i < num_points_i; ++hash_i) {
                     if (hashes_indices[hash_i].first / batch_hash !=
                         batch_id) {
                         break;
                     }
                 }
             }
         }
         out_voxel_row_splits[total_voxels] =
                 static_cast<int64_t>(tmp_point_indices.size());
     }

     int64_t* out_point_indices = nullptr;
     output_allocator.AllocVoxelPointIndices(&out_point_indices,
                                             tmp_point_indices.size());
     // std::copy is a no-op for an empty range, so a null output pointer
     // returned for a zero-sized allocation is never touched.
     std::copy(tmp_point_indices.begin(), tmp_point_indices.end(),
               out_point_indices);
 }


 }  // namespace impl

 }  // namespace ml

 }  // namespace open3d

Atomic.h

MiniVec.h

ParallelScan.h

points
int points
Definition: FilePCD.cpp:54

open3d::io::k4a_plugin::uint64_t
const char const char value recording_handle imu_sample recording_handle uint8_t size_t data_size k4a_record_configuration_t config target_format k4a_capture_t capture_handle k4a_imu_sample_t imu_sample uint64_t
Definition: K4aPlugin.cpp:343

open3d::io::k4a_plugin::int32_t
const char const char value recording_handle imu_sample recording_handle uint8_t size_t data_size k4a_record_configuration_t config target_format k4a_capture_t capture_handle k4a_imu_sample_t imu_sample playback_handle k4a_logging_message_cb_t void min_level device_handle k4a_imu_sample_t int32_t
Definition: K4aPlugin.cpp:395

open3d::ml::impl::VoxelizeCPU
void VoxelizeCPU(const size_t num_points, const T *const points, const size_t batch_size, const int64_t *const row_splits, const T *const voxel_size, const T *const points_range_min, const T *const points_range_max, const int64_t max_points_per_voxel, const int64_t max_voxels, OUTPUT_ALLOCATOR &output_allocator)
Definition: Voxelize.h:78

open3d::utility
Definition: Dispatch.h:91

open3d::utility::ceil
FN_SPECIFIERS MiniVec< float, N > ceil(const MiniVec< float, N > &a)
Definition: MiniVec.h:89

open3d
Definition: PinholeCameraIntrinsic.cpp:16

open3d::utility::MiniVec
Definition: MiniVec.h:24