|
uint32_t | AtomicFetchAddRelaxed (uint32_t *address, uint32_t val) |
|
uint64_t | AtomicFetchAddRelaxed (uint64_t *address, uint64_t val) |
|
std::shared_ptr< DefaultDeviceHashmap > | CreateDefaultCPUHashmap (size_t init_buckets, size_t init_capacity, size_t dsize_key, size_t dsize_value, const Device &device) |
| Non-templated factory. More...
|
|
void | UnpackIteratorsStep (const iterator_t *input_iterators, const bool *input_masks, void *output_keys, void *output_values, const Device &device, size_t dsize_key, size_t dsize_value, size_t tid) |
|
void | AssignIteratorsStep (iterator_t *input_iterators, const bool *input_masks, const void *input_values, const Device &device, size_t dsize_value, size_t tid) |
|
template<typename Hash , typename KeyEq > |
std::shared_ptr< CPUHashmap< Hash, KeyEq > > | CreateTemplateCPUHashmap (size_t init_buckets, size_t init_capacity, size_t dsize_key, size_t dsize_value, const Device &device) |
| Templated factory. More...
|
|
template<typename Hash , typename KeyEq > |
__global__ void | InsertKernelPass0 (CUDAHashmapImplContext< Hash, KeyEq > hash_ctx, const void *input_keys, addr_t *output_iterator_addrs, int heap_counter_prev, size_t count) |
| Kernels. More...
|
|
template<typename Hash , typename KeyEq > |
__global__ void | InsertKernelPass1 (CUDAHashmapImplContext< Hash, KeyEq > hash_ctx, const void *input_keys, addr_t *input_iterator_addrs, bool *output_masks, size_t count) |
|
template<typename Hash , typename KeyEq > |
__global__ void | InsertKernelPass2 (CUDAHashmapImplContext< Hash, KeyEq > hash_ctx, const void *input_values, addr_t *input_iterator_addrs, iterator_t *output_iterators, bool *output_masks, size_t count) |
|
template<typename Hash , typename KeyEq > |
__global__ void | FindKernel (CUDAHashmapImplContext< Hash, KeyEq > hash_ctx, const void *input_keys, iterator_t *output_iterators, bool *output_masks, size_t count) |
|
template<typename Hash , typename KeyEq > |
__global__ void | EraseKernelPass0 (CUDAHashmapImplContext< Hash, KeyEq > hash_ctx, const void *input_keys, addr_t *output_iterator_addrs, bool *output_masks, size_t count) |
|
template<typename Hash , typename KeyEq > |
__global__ void | EraseKernelPass1 (CUDAHashmapImplContext< Hash, KeyEq > hash_ctx, addr_t *input_iterator_addrs, bool *output_masks, size_t count) |
|
template<typename Hash , typename KeyEq > |
__global__ void | GetIteratorsKernel (CUDAHashmapImplContext< Hash, KeyEq > hash_ctx, iterator_t *output_iterators, uint32_t *output_iterator_count) |
|
template<typename Hash , typename KeyEq > |
__global__ void | CountElemsPerBucketKernel (CUDAHashmapImplContext< Hash, KeyEq > hash_ctx, size_t *bucket_elem_counts) |
|
__global__ void | UnpackIteratorsKernel (const iterator_t *input_iterators, const bool *input_masks, void *output_keys, void *output_values, size_t dsize_key, size_t dsize_value, size_t iterator_count) |
|
__global__ void | AssignIteratorsKernel (iterator_t *input_iterators, const bool *input_masks, const void *input_values, size_t dsize_value, size_t iterator_count) |
|
__global__ void | ResetInternalKvPairManagerKernel (InternalKvPairManagerContext ctx) |
|
__global__ void | CountSlabsPerSuperblockKernel (InternalNodeManagerContext context, uint32_t *slabs_per_superblock) |
|
std::shared_ptr< DefaultDeviceHashmap > | CreateDefaultDeviceHashmap (size_t init_buckets, size_t init_capacity, size_t dsize_key, size_t dsize_value, const Device &device) |
|
std::shared_ptr< DefaultDeviceHashmap > | CreateDefaultCUDAHashmap (size_t init_buckets, size_t init_capacity, size_t dsize_key, size_t dsize_value, const Device &device) |
|
template<typename Hash , typename KeyEq > |
std::shared_ptr< DeviceHashmap< Hash, KeyEq > > | CreateTemplateDeviceHashmap (size_t init_buckets, size_t init_capacity, size_t dsize_key, size_t dsize_value, const Device &device) |
|
template<typename First , typename Second > |
OPEN3D_HOST_DEVICE Pair< First, Second > | make_pair (const First &_first, const Second &_second) |
|
template<typename scalar_t > |
void | gemm_cpu (CBLAS_LAYOUT layout, CBLAS_TRANSPOSE trans_A, CBLAS_TRANSPOSE trans_B, OPEN3D_CPU_LINALG_INT m, OPEN3D_CPU_LINALG_INT n, OPEN3D_CPU_LINALG_INT k, scalar_t alpha, const scalar_t *A_data, OPEN3D_CPU_LINALG_INT lda, const scalar_t *B_data, OPEN3D_CPU_LINALG_INT ldb, scalar_t beta, scalar_t *C_data, OPEN3D_CPU_LINALG_INT ldc) |
|
template<> |
void | gemm_cpu< float > (CBLAS_LAYOUT layout, CBLAS_TRANSPOSE trans_A, CBLAS_TRANSPOSE trans_B, OPEN3D_CPU_LINALG_INT m, OPEN3D_CPU_LINALG_INT n, OPEN3D_CPU_LINALG_INT k, float alpha, const float *A_data, OPEN3D_CPU_LINALG_INT lda, const float *B_data, OPEN3D_CPU_LINALG_INT ldb, float beta, float *C_data, OPEN3D_CPU_LINALG_INT ldc) |
|
template<> |
void | gemm_cpu< double > (CBLAS_LAYOUT layout, CBLAS_TRANSPOSE trans_A, CBLAS_TRANSPOSE trans_B, OPEN3D_CPU_LINALG_INT m, OPEN3D_CPU_LINALG_INT n, OPEN3D_CPU_LINALG_INT k, double alpha, const double *A_data, OPEN3D_CPU_LINALG_INT lda, const double *B_data, OPEN3D_CPU_LINALG_INT ldb, double beta, double *C_data, OPEN3D_CPU_LINALG_INT ldc) |
|
void | Inverse (const Tensor &A, Tensor &output) |
| Computes A^{-1} with LU factorization, where A is an N x N square matrix. More...
|
|
void | InverseCPU (void *A_data, void *ipiv_data, void *output_data, int64_t n, Dtype dtype, const Device &device) |
|
void | InverseCUDA (void *A_data, void *ipiv_data, void *output_data, int64_t n, Dtype dtype, const Device &device) |
|
template<typename scalar_t > |
OPEN3D_CPU_LINALG_INT | getrf_cpu (int layout, OPEN3D_CPU_LINALG_INT m, OPEN3D_CPU_LINALG_INT n, scalar_t *A_data, OPEN3D_CPU_LINALG_INT lda, OPEN3D_CPU_LINALG_INT *ipiv_data) |
|
template<typename scalar_t > |
OPEN3D_CPU_LINALG_INT | getri_cpu (int layout, OPEN3D_CPU_LINALG_INT n, scalar_t *A_data, OPEN3D_CPU_LINALG_INT lda, OPEN3D_CPU_LINALG_INT *ipiv_data) |
|
template<typename scalar_t > |
OPEN3D_CPU_LINALG_INT | gesv_cpu (int layout, OPEN3D_CPU_LINALG_INT n, OPEN3D_CPU_LINALG_INT m, scalar_t *A_data, OPEN3D_CPU_LINALG_INT lda, OPEN3D_CPU_LINALG_INT *ipiv_data, scalar_t *B_data, OPEN3D_CPU_LINALG_INT ldb) |
|
template<typename scalar_t > |
OPEN3D_CPU_LINALG_INT | gels_cpu (int matrix_layout, char trans, OPEN3D_CPU_LINALG_INT m, OPEN3D_CPU_LINALG_INT n, OPEN3D_CPU_LINALG_INT nrhs, scalar_t *A_data, OPEN3D_CPU_LINALG_INT lda, scalar_t *B_data, OPEN3D_CPU_LINALG_INT ldb) |
|
template<typename scalar_t > |
OPEN3D_CPU_LINALG_INT | gesvd_cpu (int matrix_layout, char jobu, char jobvt, OPEN3D_CPU_LINALG_INT m, OPEN3D_CPU_LINALG_INT n, scalar_t *A_data, OPEN3D_CPU_LINALG_INT lda, scalar_t *S_data, scalar_t *U_data, OPEN3D_CPU_LINALG_INT ldu, scalar_t *VT_data, OPEN3D_CPU_LINALG_INT ldvt, scalar_t *superb) |
|
template<> |
OPEN3D_CPU_LINALG_INT | getrf_cpu< float > (int layout, OPEN3D_CPU_LINALG_INT m, OPEN3D_CPU_LINALG_INT n, float *A_data, OPEN3D_CPU_LINALG_INT lda, OPEN3D_CPU_LINALG_INT *ipiv_data) |
|
template<> |
OPEN3D_CPU_LINALG_INT | getrf_cpu< double > (int layout, OPEN3D_CPU_LINALG_INT m, OPEN3D_CPU_LINALG_INT n, double *A_data, OPEN3D_CPU_LINALG_INT lda, OPEN3D_CPU_LINALG_INT *ipiv_data) |
|
template<> |
OPEN3D_CPU_LINALG_INT | getri_cpu< float > (int layout, OPEN3D_CPU_LINALG_INT n, float *A_data, OPEN3D_CPU_LINALG_INT lda, OPEN3D_CPU_LINALG_INT *ipiv_data) |
|
template<> |
OPEN3D_CPU_LINALG_INT | getri_cpu< double > (int layout, OPEN3D_CPU_LINALG_INT n, double *A_data, OPEN3D_CPU_LINALG_INT lda, OPEN3D_CPU_LINALG_INT *ipiv_data) |
|
template<> |
OPEN3D_CPU_LINALG_INT | gesv_cpu< float > (int layout, OPEN3D_CPU_LINALG_INT n, OPEN3D_CPU_LINALG_INT m, float *A_data, OPEN3D_CPU_LINALG_INT lda, OPEN3D_CPU_LINALG_INT *ipiv_data, float *B_data, OPEN3D_CPU_LINALG_INT ldb) |
|
template<> |
OPEN3D_CPU_LINALG_INT | gesv_cpu< double > (int layout, OPEN3D_CPU_LINALG_INT n, OPEN3D_CPU_LINALG_INT m, double *A_data, OPEN3D_CPU_LINALG_INT lda, OPEN3D_CPU_LINALG_INT *ipiv_data, double *B_data, OPEN3D_CPU_LINALG_INT ldb) |
|
template<> |
OPEN3D_CPU_LINALG_INT | gels_cpu< float > (int layout, char trans, OPEN3D_CPU_LINALG_INT m, OPEN3D_CPU_LINALG_INT n, OPEN3D_CPU_LINALG_INT nrhs, float *A_data, OPEN3D_CPU_LINALG_INT lda, float *B_data, OPEN3D_CPU_LINALG_INT ldb) |
|
template<> |
OPEN3D_CPU_LINALG_INT | gels_cpu< double > (int layout, char trans, OPEN3D_CPU_LINALG_INT m, OPEN3D_CPU_LINALG_INT n, OPEN3D_CPU_LINALG_INT nrhs, double *A_data, OPEN3D_CPU_LINALG_INT lda, double *B_data, OPEN3D_CPU_LINALG_INT ldb) |
|
template<> |
OPEN3D_CPU_LINALG_INT | gesvd_cpu< float > (int layout, char jobu, char jobvt, OPEN3D_CPU_LINALG_INT m, OPEN3D_CPU_LINALG_INT n, float *A_data, OPEN3D_CPU_LINALG_INT lda, float *S_data, float *U_data, OPEN3D_CPU_LINALG_INT ldu, float *VT_data, OPEN3D_CPU_LINALG_INT ldvt, float *superb) |
|
template<> |
OPEN3D_CPU_LINALG_INT | gesvd_cpu< double > (int layout, char jobu, char jobvt, OPEN3D_CPU_LINALG_INT m, OPEN3D_CPU_LINALG_INT n, double *A_data, OPEN3D_CPU_LINALG_INT lda, double *S_data, double *U_data, OPEN3D_CPU_LINALG_INT ldu, double *VT_data, OPEN3D_CPU_LINALG_INT ldvt, double *superb) |
|
void | LeastSquares (const Tensor &A, const Tensor &B, Tensor &X) |
| Solves AX = B with QR decomposition, where A is a full-rank m x n matrix (m >= n). More...
|
|
void | LeastSquaresCPU (void *A_data, void *B_data, int64_t m, int64_t n, int64_t k, Dtype dtype, const Device &device) |
|
void | LeastSquaresCUDA (void *A_data, void *B_data, int64_t m, int64_t n, int64_t k, Dtype dtype, const Device &device) |
|
void | OPEN3D_LAPACK_CHECK (OPEN3D_CPU_LINALG_INT info, const std::string &msg) |
|
void | Matmul (const Tensor &A, const Tensor &B, Tensor &C) |
| Computes matrix multiplication C = AB. More...
|
|
void | MatmulCPU (void *A_data, void *B_data, void *C_data, int64_t m, int64_t k, int64_t n, Dtype dtype) |
|
void | MatmulCUDA (void *A_data, void *B_data, void *C_data, int64_t m, int64_t k, int64_t n, Dtype dtype) |
|
void | Solve (const Tensor &A, const Tensor &B, Tensor &X) |
| Solves AX = B with LU decomposition, where A is a square matrix. More...
|
|
void | SolveCPU (void *A_data, void *B_data, void *ipiv_data, int64_t n, int64_t k, Dtype dtype, const Device &device) |
|
void | SolveCUDA (void *A_data, void *B_data, void *ipiv_data, int64_t n, int64_t k, Dtype dtype, const Device &device) |
|
void | SVD (const Tensor &A, Tensor &U, Tensor &S, Tensor &VT) |
|
void | SVDCPU (const void *A_data, void *U_data, void *S_data, void *VT_data, void *superb_data, int64_t m, int64_t n, Dtype dtype, const Device &device) |
|
void | SVDCUDA (const void *A_data, void *U_data, void *S_data, void *VT_data, void *superb_data, int64_t m, int64_t n, Dtype dtype, const Device &device) |
|
template<typename T > |
Tensor | operator+ (T scalar_lhs, const Tensor &rhs) |
|
template<typename T > |
Tensor | operator- (T scalar_lhs, const Tensor &rhs) |
|
template<typename T > |
Tensor | operator* (T scalar_lhs, const Tensor &rhs) |
|
template<typename T > |
Tensor | operator/ (T scalar_lhs, const Tensor &rhs) |
|