Home
last modified time | relevance | path

Searched refs:load_vector (Results 1 – 2 of 2) sorted by relevance

/external/pytorch/aten/src/ATen/native/cuda/
DMemoryAccess.cuh165 __device__ aligned_vector<scalar_t, vec_size> load_vector(const scalar_t *base_ptr, uint32_t offset… in load_vector() function
172 __device__ aligned_vector<bool, vec_size> load_vector(const bool *base_ptr, uint32_t offset) { in load_vector() function
174 auto tmp = load_vector<vec_size>(reinterpret_cast<const uint8_t*>(base_ptr), offset); in load_vector()
260 auto v = load_vector<vec_size>(from, index); in load_single_arg()
DReduce.cuh537 const auto values_vec = memory::load_vector<input_vec_size>(data, idx); in input_vectorized_thread_reduce_impl()
589 values[i] = memory::load_vector<output_vec_size>(data_, offset); in thread_reduce_impl()
609 values[i] = memory::load_vector<output_vec_size>(data_, offset); in thread_reduce_impl()