Loading [MathJax]/extensions/TeX/AMSsymbols.js
Open3D (C++ API)  0.13.0+8be9a53
All Data Structures Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros
StdGPUHashmap.h
Go to the documentation of this file.
1 // ----------------------------------------------------------------------------
2 // - Open3D: www.open3d.org -
3 // ----------------------------------------------------------------------------
4 // The MIT License (MIT)
5 //
6 // Copyright (c) 2018-2021 www.open3d.org
7 //
8 // Permission is hereby granted, free of charge, to any person obtaining a copy
9 // of this software and associated documentation files (the "Software"), to deal
10 // in the Software without restriction, including without limitation the rights
11 // to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
12 // copies of the Software, and to permit persons to whom the Software is
13 // furnished to do so, subject to the following conditions:
14 //
15 // The above copyright notice and this permission notice shall be included in
16 // all copies or substantial portions of the Software.
17 //
18 // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
19 // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
20 // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
21 // AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
22 // LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
23 // FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
24 // IN THE SOFTWARE.
25 // ----------------------------------------------------------------------------
26 
27 #pragma once
28 
#include <stdgpu/memory.h>
#include <thrust/transform.h>

#include <stdgpu/unordered_map.cuh>
#include <type_traits>

#include "open3d/core/CUDAUtils.h"
#include "open3d/core/StdAllocator.h"
#include "open3d/core/hashmap/CUDAHashmapBufferAccessor.h"
#include "open3d/core/hashmap/DeviceHashmap.h"
40 namespace open3d {
41 namespace core {
42 
48 template <typename T>
50 public:
52  using value_type = T;
53 
55  StdGPUAllocator() = default;
56 
58  explicit StdGPUAllocator(const Device& device) : std_allocator_(device) {}
59 
61  StdGPUAllocator(const StdGPUAllocator&) = default;
62 
64  StdGPUAllocator& operator=(const StdGPUAllocator&) = default;
65 
67  StdGPUAllocator(StdGPUAllocator&&) = default;
68 
71 
73  template <typename U>
75  : std_allocator_(other.std_allocator_) {}
76 
79  if (GetDevice().GetType() != Device::DeviceType::CUDA) {
80  utility::LogError("Unsupported device.");
81  }
82 
83  T* p = std_allocator_.allocate(n);
84  stdgpu::register_memory(p, n, stdgpu::dynamic_memory_type::device);
85  return p;
86  }
87 
89  void deallocate(T* p, std::size_t n) {
90  if (GetDevice().GetType() != Device::DeviceType::CUDA) {
91  utility::LogError("Unsupported device.");
92  }
93 
94  stdgpu::deregister_memory(p, n, stdgpu::dynamic_memory_type::device);
95  std_allocator_.deallocate(p, n);
96  }
97 
99  bool operator==(const StdGPUAllocator& other) {
100  return std_allocator_ == other.std_allocator_;
101  }
102 
104  bool operator!=(const StdGPUAllocator& other) { return !operator==(other); }
105 
107  Device GetDevice() const { return std_allocator_.GetDevice(); }
108 
109 private:
110  // Allow access in rebind constructor.
111  template <typename T2>
112  friend class StdGPUAllocator;
113 
114  StdAllocator<T> std_allocator_;
115 };
116 
117 // These typedefs must be defined outside of StdGPUHashmap to make them
118 // accessible in raw CUDA kernels.
119 template <typename Key>
122 
123 template <typename Key, typename Hash>
124 using InternalStdGPUHashmap =
125  stdgpu::unordered_map<Key,
126  addr_t,
127  Hash,
128  stdgpu::equal_to<Key>,
130 
131 template <typename Key, typename Hash>
132 class StdGPUHashmap : public DeviceHashmap {
133 public:
134  StdGPUHashmap(int64_t init_capacity,
135  int64_t dsize_key,
136  int64_t dsize_value,
137  const Device& device);
138  ~StdGPUHashmap();
139 
140  void Rehash(int64_t buckets) override;
141 
142  void Insert(const void* input_keys,
143  const void* input_values,
144  addr_t* output_addrs,
145  bool* output_masks,
146  int64_t count) override;
147 
148  void Activate(const void* input_keys,
149  addr_t* output_addrs,
150  bool* output_masks,
151  int64_t count) override;
152 
153  void Find(const void* input_keys,
154  addr_t* output_addrs,
155  bool* output_masks,
156  int64_t count) override;
157 
158  void Erase(const void* input_keys,
159  bool* output_masks,
160  int64_t count) override;
161 
162  int64_t GetActiveIndices(addr_t* output_indices) override;
163 
164  void Clear() override;
165 
166  int64_t Size() const override;
167 
168  int64_t GetBucketCount() const override;
169  std::vector<int64_t> BucketSizes() const override;
170  float LoadFactor() const override;
171 
172  InternalStdGPUHashmap<Key, Hash> GetImpl() const { return impl_; }
173 
174 protected:
175  // Use reference, since the structure itself is implicitly handled as a
176  // pointer directly by stdgpu.
178 
180 
181  void InsertImpl(const void* input_keys,
182  const void* input_values,
183  addr_t* output_addrs,
184  bool* output_masks,
185  int64_t count);
186 
187  void Allocate(int64_t capacity);
188  void Free();
189 };
190 
191 template <typename Key, typename Hash>
193  int64_t dsize_key,
194  int64_t dsize_value,
195  const Device& device)
196  : DeviceHashmap(init_capacity, dsize_key, dsize_value, device) {
197  Allocate(init_capacity);
198 }
199 
200 template <typename Key, typename Hash>
202  Free();
203 }
204 
205 template <typename Key, typename Hash>
207  return impl_.size();
208 }
209 
210 template <typename Key, typename Hash>
211 void StdGPUHashmap<Key, Hash>::Insert(const void* input_keys,
212  const void* input_values,
213  addr_t* output_addrs,
214  bool* output_masks,
215  int64_t count) {
216  int64_t new_size = Size() + count;
217  if (new_size > this->capacity_) {
218  int64_t bucket_count = GetBucketCount();
219  float avg_capacity_per_bucket =
220  float(this->capacity_) / float(bucket_count);
221  int64_t expected_buckets = std::max(
222  bucket_count * 2,
223  int64_t(std::ceil(new_size / avg_capacity_per_bucket)));
224  Rehash(expected_buckets);
225  }
226  InsertImpl(input_keys, input_values, output_addrs, output_masks, count);
227 }
228 
229 template <typename Key, typename Hash>
230 void StdGPUHashmap<Key, Hash>::Activate(const void* input_keys,
231  addr_t* output_addrs,
232  bool* output_masks,
233  int64_t count) {
234  Insert(input_keys, nullptr, output_addrs, output_masks, count);
235 }
236 
237 // Need an explicit kernel for non-const access to map
238 template <typename Key, typename Hash>
240  CUDAHashmapBufferAccessor buffer_accessor,
241  const Key* input_keys,
242  addr_t* output_addrs,
243  bool* output_masks,
244  int64_t count) {
245  uint32_t tid = threadIdx.x + blockIdx.x * blockDim.x;
246  if (tid >= count) return;
247 
248  Key key = input_keys[tid];
249  auto iter = map.find(key);
250  bool flag = (iter != map.end());
251  output_masks[tid] = flag;
252  output_addrs[tid] = flag ? iter->second : 0;
253 }
254 
255 template <typename Key, typename Hash>
256 void StdGPUHashmap<Key, Hash>::Find(const void* input_keys,
257  addr_t* output_addrs,
258  bool* output_masks,
259  int64_t count) {
260  uint32_t threads = 128;
261  uint32_t blocks = (count + threads - 1) / threads;
262 
263  STDGPUFindKernel<<<blocks, threads, 0, core::cuda::GetStream()>>>(
264  impl_, buffer_accessor_, static_cast<const Key*>(input_keys),
265  output_addrs, output_masks, count);
266  cuda::Synchronize(this->device_);
267 }
268 
269 // Need an explicit kernel for non-const access to map
270 template <typename Key, typename Hash>
272  CUDAHashmapBufferAccessor buffer_accessor,
273  const Key* input_keys,
274  addr_t* output_addrs,
275  bool* output_masks,
276  int64_t count) {
277  uint32_t tid = threadIdx.x + blockIdx.x * blockDim.x;
278  if (tid >= count) return;
279 
280  Key key = input_keys[tid];
281  auto iter = map.find(key);
282  bool flag = (iter != map.end());
283  output_masks[tid] = flag;
284  output_addrs[tid] = flag ? iter->second : 0;
285 
286  if (output_masks[tid]) {
287  output_masks[tid] = map.erase(key);
288  if (output_masks[tid]) {
289  buffer_accessor.DeviceFree(output_addrs[tid]);
290  }
291  }
292 }
293 
294 template <typename Key, typename Hash>
295 void StdGPUHashmap<Key, Hash>::Erase(const void* input_keys,
296  bool* output_masks,
297  int64_t count) {
298  uint32_t threads = 128;
299  uint32_t blocks = (count + threads - 1) / threads;
300 
301  core::Tensor toutput_addrs =
302  core::Tensor({count}, core::Int32, this->device_);
303  addr_t* output_addrs = static_cast<addr_t*>(toutput_addrs.GetDataPtr());
304 
305  STDGPUEraseKernel<<<blocks, threads, 0, core::cuda::GetStream()>>>(
306  impl_, buffer_accessor_, static_cast<const Key*>(input_keys),
307  output_addrs, output_masks, count);
308  cuda::Synchronize(this->device_);
309 }
310 
311 template <typename Key>
313  OPEN3D_HOST_DEVICE addr_t
314  operator()(const thrust::pair<Key, addr_t>& x) const {
315  return x.second;
316  }
317 };
318 
319 template <typename Key, typename Hash>
320 int64_t StdGPUHashmap<Key, Hash>::GetActiveIndices(addr_t* output_indices) {
321  auto range = impl_.device_range();
322 
323  thrust::transform(range.begin(), range.end(), output_indices,
325 
326  return impl_.size();
327 }
328 
329 template <typename Key, typename Hash>
331  impl_.clear();
333 }
334 
335 template <typename Key, typename Hash>
336 void StdGPUHashmap<Key, Hash>::Rehash(int64_t buckets) {
337  int64_t iterator_count = Size();
338 
339  Tensor active_keys;
340  Tensor active_values;
341 
342  if (iterator_count > 0) {
343  Tensor active_addrs({iterator_count}, core::Int32, this->device_);
344  GetActiveIndices(static_cast<addr_t*>(active_addrs.GetDataPtr()));
345 
346  Tensor active_indices = active_addrs.To(core::Int64);
347  active_keys = this->GetKeyBuffer().IndexGet({active_indices});
348  active_values = this->GetValueBuffer().IndexGet({active_indices});
349  }
350 
351  float avg_capacity_per_bucket =
352  float(this->capacity_) / float(GetBucketCount());
353 
354  Free();
355  int64_t new_capacity =
356  int64_t(std::ceil(buckets * avg_capacity_per_bucket));
357  Allocate(new_capacity);
358 
359  if (iterator_count > 0) {
360  Tensor output_addrs({iterator_count}, core::Int32, this->device_);
361  Tensor output_masks({iterator_count}, core::Bool, this->device_);
362 
363  InsertImpl(active_keys.GetDataPtr(), active_values.GetDataPtr(),
364  static_cast<addr_t*>(output_addrs.GetDataPtr()),
365  output_masks.GetDataPtr<bool>(), iterator_count);
366  }
367 }
368 
369 template <typename Key, typename Hash>
371  return impl_.bucket_count();
372 }
373 
374 template <typename Key, typename Hash>
375 std::vector<int64_t> StdGPUHashmap<Key, Hash>::BucketSizes() const {
376  utility::LogError("Unimplemented");
377 }
378 
379 template <typename Key, typename Hash>
381  return impl_.load_factor();
382 }
383 
384 // Need an explicit kernel for non-const access to map
385 template <typename Key, typename Hash>
387  CUDAHashmapBufferAccessor buffer_accessor,
388  const Key* input_keys,
389  const void* input_values,
390  int64_t dsize_value,
391  addr_t* output_addrs,
392  bool* output_masks,
393  int64_t count) {
394  uint32_t tid = threadIdx.x + blockIdx.x * blockDim.x;
395  if (tid >= count) return;
396 
397  Key key = input_keys[tid];
398  output_addrs[tid] = 0;
399  output_masks[tid] = false;
400 
401  // First apply 'try insert' with a dummy index
402  auto res = map.emplace(key, 0);
403 
404  // If success, change the iterator and provide the actual index
405  if (res.second) {
406  addr_t dst_kv_addr = buffer_accessor.DeviceAllocate();
407  auto dst_kv_iter = buffer_accessor.ExtractIterator(dst_kv_addr);
408 
409  // Copy templated key to buffer (duplicate)
410  // TODO: hack stdgpu inside and take out the buffer directly
411  *static_cast<Key*>(dst_kv_iter.first) = key;
412 
413  // Copy/reset non-templated value in buffer
414  uint8_t* dst_value = static_cast<uint8_t*>(dst_kv_iter.second);
415  if (input_values != nullptr) {
416  const uint8_t* src_value =
417  static_cast<const uint8_t*>(input_values) +
418  dsize_value * tid;
419  for (int byte = 0; byte < dsize_value; ++byte) {
420  dst_value[byte] = src_value[byte];
421  }
422  }
423 
424  // Update from the dummy index
425  res.first->second = dst_kv_addr;
426 
427  // Write to return variables
428  output_addrs[tid] = dst_kv_addr;
429  output_masks[tid] = true;
430  }
431 }
432 
433 template <typename Key, typename Hash>
434 void StdGPUHashmap<Key, Hash>::InsertImpl(const void* input_keys,
435  const void* input_values,
436  addr_t* output_addrs,
437  bool* output_masks,
438  int64_t count) {
439  uint32_t threads = 128;
440  uint32_t blocks = (count + threads - 1) / threads;
441 
442  STDGPUInsertKernel<<<blocks, threads, 0, core::cuda::GetStream()>>>(
443  impl_, buffer_accessor_, static_cast<const Key*>(input_keys),
444  input_values, this->dsize_value_, output_addrs, output_masks,
445  count);
446  cuda::Synchronize(this->device_);
447 }
448 
449 template <typename Key, typename Hash>
450 void StdGPUHashmap<Key, Hash>::Allocate(int64_t capacity) {
451  this->capacity_ = capacity;
452 
453  // Allocate buffer for key values.
454  this->buffer_ =
455  std::make_shared<HashmapBuffer>(this->capacity_, this->dsize_key_,
456  this->dsize_value_, this->device_);
457 
459  buffer_accessor_.Setup(this->capacity_, this->dsize_key_,
460  this->dsize_value_, this->buffer_->GetKeyBuffer(),
461  this->buffer_->GetValueBuffer(),
462  this->buffer_->GetHeap());
464 
465  // stdgpu initializes on the default stream. Set the current stream to
466  // ensure correct behavior.
467  {
468  CUDAScopedStream scoped_stream(cuda::GetDefaultStream());
469 
471  this->capacity_,
473  cuda::Synchronize(this->device_);
474  }
475 }
476 
477 template <typename Key, typename Hash>
479  // Buffer is automatically handled by the smart pointer.
480 
482 
483  // stdgpu initializes on the default stream. Set the current stream to
484  // ensure correct behavior.
485  {
486  CUDAScopedStream scoped_stream(cuda::GetDefaultStream());
487 
489  }
490 }
491 } // namespace core
492 } // namespace open3d
void * first
Definition: SlabTraits.h:54
void Clear() override
Clear stored map without reallocating memory.
Definition: StdGPUHashmap.h:330
void Insert(const void *input_keys, const void *input_values, addr_t *output_addrs, bool *output_masks, int64_t count) override
Parallel insert contiguous arrays of keys and values.
Definition: StdGPUHashmap.h:211
Definition: StdGPUHashmap.h:312
__global__ void STDGPUEraseKernel(InternalStdGPUHashmap< Key, Hash > map, CUDAHashmapBufferAccessor buffer_accessor, const Key *input_keys, addr_t *output_addrs, bool *output_masks, int64_t count)
Definition: StdGPUHashmap.h:271
bool operator==(const StdGPUAllocator &other)
Returns true if the instances are equal, false otherwise.
Definition: StdGPUHashmap.h:99
void Free()
Definition: StdGPUHashmap.h:478
StdGPUAllocator(const StdGPUAllocator< U > &other)
Rebind copy constructor.
Definition: StdGPUHashmap.h:74
bool operator!=(const StdGPUAllocator &other)
Returns true if the instances are not equal, false otherwise.
Definition: StdGPUHashmap.h:104
const Dtype Bool
Definition: Dtype.cpp:72
const Dtype Int64
Definition: Dtype.cpp:67
T value_type
T.
Definition: StdGPUHashmap.h:52
const char const char value recording_handle imu_sample recording_handle uint8_t size_t data_size k4a_record_configuration_t config target_format k4a_capture_t capture_handle k4a_imu_sample_t imu_sample playback_handle k4a_logging_message_cb_t void min_level device_handle k4a_imu_sample_t timeout_in_ms capture_handle capture_handle capture_handle image_handle temperature_c k4a_image_t image_handle uint8_t image_handle image_handle image_handle image_handle uint32_t
Definition: K4aPlugin.cpp:557
StdGPUHashmap(int64_t init_capacity, int64_t dsize_key, int64_t dsize_value, const Device &device)
Definition: StdGPUHashmap.h:192
~StdGPUHashmap()
Definition: StdGPUHashmap.h:201
void Allocate(int64_t capacity)
Definition: StdGPUHashmap.h:450
__host__ void Setup(int64_t capacity, int64_t dsize_key, int64_t dsize_value, Tensor &keys, Tensor &values, Tensor &heap)
Definition: CUDAHashmapBufferAccessor.h:50
__host__ void HostAllocate(const Device &device)
Definition: CUDAHashmapBufferAccessor.h:80
void deallocate(T *p, std::size_t n)
Deallocates memory from pointer p of size n .
Definition: StdGPUHashmap.h:89
Definition: StdGPUHashmap.h:132
FN_SPECIFIERS MiniVec< float, N > ceil(const MiniVec< float, N > &a)
Definition: MiniVec.h:108
Definition: DeviceHashmap.h:39
__device__ addr_t DeviceAllocate()
Definition: CUDAHashmapBufferAccessor.h:92
Definition: StdAllocator.h:42
void Synchronize()
Definition: CUDAUtils.cpp:72
Tensor IndexGet(const std::vector< Tensor > &index_tensors) const
Advanced indexing getter.
Definition: Tensor.cpp:707
Definition: CUDAHashmapBufferAccessor.h:48
#define OPEN3D_HOST_DEVICE
Definition: CUDAUtils.h:63
void Rehash(int64_t buckets) override
Definition: StdGPUHashmap.h:336
const Dtype Int32
Definition: Dtype.cpp:66
__device__ void DeviceFree(addr_t ptr)
Definition: CUDAHashmapBufferAccessor.h:97
InternalStdGPUHashmap< Key, Hash > impl_
Definition: StdGPUHashmap.h:177
Tensor To(Dtype dtype, bool copy=false) const
Definition: Tensor.cpp:541
__device__ iterator_t ExtractIterator(addr_t ptr)
Definition: CUDAHashmapBufferAccessor.h:109
int64_t GetActiveIndices(addr_t *output_indices) override
Parallel collect all iterators in the hash table.
Definition: StdGPUHashmap.h:320
Device device_
Definition: DeviceHashmap.h:113
Definition: Device.h:39
StdGPUAllocator(const Device &device)
Constructor from device.
Definition: StdGPUHashmap.h:58
void Activate(const void *input_keys, addr_t *output_addrs, bool *output_masks, int64_t count) override
Definition: StdGPUHashmap.h:230
Definition: StdGPUHashmap.h:49
int64_t GetBucketCount() const override
Definition: StdGPUHashmap.h:370
T * allocate(std::size_t n)
Allocates memory of size n.
Definition: StdGPUHashmap.h:78
StdGPUAllocator()=default
Default constructor.
int count
Definition: FilePCD.cpp:61
float LoadFactor() const override
Definition: StdGPUHashmap.h:380
int64_t Size() const override
Definition: StdGPUHashmap.h:206
void Erase(const void *input_keys, bool *output_masks, int64_t count) override
Parallel erase a contiguous array of keys.
Definition: StdGPUHashmap.h:295
Definition: PinholeCameraIntrinsic.cpp:35
CUDAHashmapBufferAccessor buffer_accessor_
Definition: StdGPUHashmap.h:179
Definition: Tensor.h:49
__global__ void STDGPUFindKernel(InternalStdGPUHashmap< Key, Hash > map, CUDAHashmapBufferAccessor buffer_accessor, const Key *input_keys, addr_t *output_addrs, bool *output_masks, int64_t count)
Definition: StdGPUHashmap.h:239
const char const char value recording_handle imu_sample recording_handle uint8_t size_t data_size k4a_record_configuration_t config target_format k4a_capture_t capture_handle k4a_imu_sample_t imu_sample playback_handle k4a_logging_message_cb_t void min_level device_handle k4a_imu_sample_t timeout_in_ms capture_handle capture_handle capture_handle image_handle float
Definition: K4aPlugin.cpp:465
int64_t capacity_
Definition: DeviceHashmap.h:109
__global__ void STDGPUInsertKernel(InternalStdGPUHashmap< Key, Hash > map, CUDAHashmapBufferAccessor buffer_accessor, const Key *input_keys, const void *input_values, int64_t dsize_value, addr_t *output_addrs, bool *output_masks, int64_t count)
Definition: StdGPUHashmap.h:386
void InsertImpl(const void *input_keys, const void *input_values, addr_t *output_addrs, bool *output_masks, int64_t count)
Definition: StdGPUHashmap.h:434
Tensor & GetKeyBuffer()
Definition: DeviceHashmap.h:101
uint32_t addr_t
Definition: HashmapBuffer.h:58
int64_t dsize_key_
Definition: DeviceHashmap.h:110
StdGPUAllocator & operator=(const StdGPUAllocator &)=default
Default copy assignment operator.
const char const char value recording_handle imu_sample recording_handle uint8_t size_t data_size k4a_record_configuration_t config target_format k4a_capture_t capture_handle k4a_imu_sample_t imu_sample playback_handle k4a_logging_message_cb_t void min_level device_handle k4a_imu_sample_t timeout_in_ms capture_handle capture_handle capture_handle image_handle temperature_c k4a_image_t image_handle uint8_t image_handle image_handle image_handle image_handle image_handle timestamp_usec white_balance image_handle k4a_device_configuration_t config device_handle char size_t serial_number_size bool int32_t int32_t int32_t int32_t k4a_color_control_mode_t default_mode value const const k4a_calibration_t calibration char size_t
Definition: K4aPlugin.cpp:724
T * GetDataPtr()
Definition: Tensor.h:1004
stdgpu::unordered_map< Key, addr_t, Hash, stdgpu::equal_to< Key >, InternalStdGPUHashmapAllocator< Key > > InternalStdGPUHashmap
Definition: StdGPUHashmap.h:129
OPEN3D_HOST_DEVICE addr_t operator()(const thrust::pair< Key, addr_t > &x) const
Definition: StdGPUHashmap.h:314
__host__ void HostFree(const Device &device)
Definition: CUDAHashmapBufferAccessor.h:85
__host__ void Reset(const Device &device)
Definition: CUDAHashmapBufferAccessor.h:67
int64_t dsize_value_
Definition: DeviceHashmap.h:111
Common CUDA utilities.
Tensor & GetValueBuffer()
Definition: DeviceHashmap.h:102
Device GetDevice() const
Returns the device on which memory is allocated.
Definition: StdGPUHashmap.h:107
InternalStdGPUHashmap< Key, Hash > GetImpl() const
Definition: StdGPUHashmap.h:172
std::shared_ptr< HashmapBuffer > buffer_
Definition: DeviceHashmap.h:115
void Find(const void *input_keys, addr_t *output_addrs, bool *output_masks, int64_t count) override
Parallel find a contiguous array of keys.
Definition: StdGPUHashmap.h:256
std::vector< int64_t > BucketSizes() const override
Definition: StdGPUHashmap.h:375
#define LogError(...)
Definition: Logging.h:78