Home
last modified time | relevance | path

Searched refs:workspace_size_list_ (Results 1 – 25 of 337) sorted by relevance

12345678910>>...14

/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/cpu/ps/
Dsparse_apply_adam_ps_kernel.cc74 …(void)workspace_size_list_.emplace_back(indices_size_ * var_outer_dim_size_ * sizeof(float) * work… in InitKernel()
75 (void)workspace_size_list_.emplace_back(indices_size_ * sizeof(int) * worker_num_); in InitKernel()
76 …(void)workspace_size_list_.emplace_back(indices_size_ * var_outer_dim_size_ * sizeof(float) * work… in InitKernel()
77 (void)workspace_size_list_.emplace_back(indices_size_ * sizeof(int) * worker_num_); in InitKernel()
78 …(void)workspace_size_list_.emplace_back(var_first_dim_size_ * var_outer_dim_size_ * sizeof(float) … in InitKernel()
87 workspace_size_list_[0] = indices_size_ * var_outer_dim_size_ * sizeof(float) * worker_num_; in ReInit()
88 workspace_size_list_[1] = indices_size_ * sizeof(int) * worker_num_; in ReInit()
98 workspace_size_list_[0] = indices_size_ * var_outer_dim_size_ * sizeof(float); in ReInit()
99 workspace_size_list_[1] = indices_size_ * sizeof(int); in ReInit()
Dsparse_apply_lazy_adam_ps_kernel.cc76 …(void)workspace_size_list_.emplace_back(indices_size_ * var_outer_dim_size_ * sizeof(float) * work… in InitKernel()
77 (void)workspace_size_list_.emplace_back(indices_size_ * sizeof(int) * worker_num_); in InitKernel()
78 …(void)workspace_size_list_.emplace_back(indices_size_ * var_outer_dim_size_ * sizeof(float) * work… in InitKernel()
79 (void)workspace_size_list_.emplace_back(indices_size_ * sizeof(int) * worker_num_); in InitKernel()
88 workspace_size_list_[0] = indices_size_ * var_outer_dim_size_ * sizeof(float) * worker_num_; in ReInit()
89 workspace_size_list_[1] = indices_size_ * sizeof(int) * worker_num_; in ReInit()
99 workspace_size_list_[0] = indices_size_ * var_outer_dim_size_ * sizeof(float) * worker_num_; in ReInit()
100 workspace_size_list_[1] = indices_size_ * sizeof(int) * worker_num_; in ReInit()
Dsparse_apply_ftrl_ps_kernel.cc86 …(void)workspace_size_list_.emplace_back(indices_size_ * var_outer_dim_size_ * sizeof(float) * work… in InitKernel()
87 (void)workspace_size_list_.emplace_back(indices_size_ * sizeof(int) * worker_num_); in InitKernel()
88 …(void)workspace_size_list_.emplace_back(indices_size_ * var_outer_dim_size_ * sizeof(float) * work… in InitKernel()
89 (void)workspace_size_list_.emplace_back(indices_size_ * sizeof(int) * worker_num_); in InitKernel()
98 workspace_size_list_[0] = indices_size_ * var_outer_dim_size_ * sizeof(float) * worker_num_; in ReInit()
99 workspace_size_list_[1] = indices_size_ * sizeof(int) * worker_num_; in ReInit()
109 workspace_size_list_[0] = indices_size_ * var_outer_dim_size_ * sizeof(float) * worker_num_; in ReInit()
110 workspace_size_list_[1] = indices_size_ * sizeof(int) * worker_num_; in ReInit()
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/gpu/arrays/
Dreverse_v2_gpu_kernel.h37 const std::vector<size_t> &GetWorkspaceSizeList() const override { return workspace_size_list_; } in GetWorkspaceSizeList()
51 … cudaMemcpyAsync(input_shape_device, &input_shape_[0], workspace_size_list_[0], in Launch()
56 … cudaMemcpyAsync(strides_device, &strides_[0], workspace_size_list_[1], in Launch()
61 … cudaMemcpyAsync(axis_device, &axis_[0], workspace_size_list_[2], cudaMemcpyHostToDevice, in Launch()
131 workspace_size_list_.clear(); in ResetResource()
139 workspace_size_list_.push_back(input_rank_ * sizeof(size_t)); in InitSizeLists()
140 workspace_size_list_.push_back(input_rank_ * sizeof(int64_t)); in InitSizeLists()
141 workspace_size_list_.push_back(axis_.size() * sizeof(int64_t)); in InitSizeLists()
154 std::vector<size_t> workspace_size_list_; variable
Dsort_gpu_kernel.h41 const std::vector<size_t> &GetWorkspaceSizeList() const override { return workspace_size_list_; } in GetWorkspaceSizeList()
60 … cudaMemcpyAsync(input_shape_device, &input_shape_[0], workspace_size_list_[2], in Launch()
65 … cudaMemcpyAsync(perm_device, &perm_[0], workspace_size_list_[3], cudaMemcpyHostToDevice, in Launch()
97 … cudaMemcpyAsync(transposed_shape_device, &transposed_shape_[0], workspace_size_list_[4], in Launch()
200 workspace_size_list_.clear(); in ResetResource()
214 workspace_size_list_.push_back(input_bytes); in InitSizeLists()
215 workspace_size_list_.push_back(indices_bytes); in InitSizeLists()
216 workspace_size_list_.push_back(input_rank_ * sizeof(size_t)); in InitSizeLists()
217 workspace_size_list_.push_back(input_rank_ * sizeof(size_t)); in InitSizeLists()
218 workspace_size_list_.push_back(input_rank_ * sizeof(size_t)); in InitSizeLists()
[all …]
Din_top_k_gpu_kernel.h39 const std::vector<size_t> &GetWorkspaceSizeList() const override { return workspace_size_list_; } in GetWorkspaceSizeList()
156 workspace_size_list_.clear(); in ResetResource()
165 workspace_size_list_.push_back(input_shape_[0] * k_ * sizeof(T)); in InitSizeLists()
166 workspace_size_list_.push_back(input_shape_[0] * k_ * sizeof(int32_t)); in InitSizeLists()
171 workspace_size_list_.push_back(input_size_ * sizeof(float)); in InitSizeLists()
173 workspace_size_list_.push_back(input_shape_[0] * k_ * sizeof(float)); in InitSizeLists()
192 std::vector<size_t> workspace_size_list_; variable
Dextract_image_patches_gpu_kernel.h39 const std::vector<size_t> &GetWorkspaceSizeList() const override { return workspace_size_list_; } in GetWorkspaceSizeList()
209 workspace_size_list_.clear(); in ResetResource()
216 workspace_size_list_.push_back(input_size_ * sizeof(T)); in InitSizeLists()
217 workspace_size_list_.push_back(output_size_ * sizeof(T)); in InitSizeLists()
218 workspace_size_list_.push_back(4 * sizeof(size_t)); in InitSizeLists()
219 workspace_size_list_.push_back(4 * sizeof(size_t)); in InitSizeLists()
220 workspace_size_list_.push_back(4 * sizeof(size_t)); in InitSizeLists()
221 workspace_size_list_.push_back(4 * sizeof(size_t)); in InitSizeLists()
252 std::vector<size_t> workspace_size_list_; variable
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/gpu/nn/
Dpad_gpu_kernel.h39 const std::vector<size_t> &GetWorkspaceSizeList() const override { return workspace_size_list_; } in GetWorkspaceSizeList()
57 … cudaMemcpyAsync(input_shape_device, &input_shape_[0], workspace_size_list_[0], in Launch()
62 … cudaMemcpyAsync(strides_device, &strides_[0], workspace_size_list_[1], in Launch()
67 … cudaMemcpyAsync(paddings_device, &flattened_paddings_[0], workspace_size_list_[2], in Launch()
144 workspace_size_list_.clear(); in ResetResource()
151 workspace_size_list_.push_back(input_rank_ * sizeof(size_t)); // input shape in InitSizeLists()
152 workspace_size_list_.push_back(input_rank_ * sizeof(size_t)); // strides in InitSizeLists()
153 workspace_size_list_.push_back(input_rank_ * sizeof(int32_t) * 2); // paddings in InitSizeLists()
183 std::vector<size_t> workspace_size_list_; variable
Dlocal_response_norm_grad_gpu_kernel.h39 const std::vector<size_t> &GetWorkspaceSizeList() const override { return workspace_size_list_; } in GetWorkspaceSizeList()
180 workspace_size_list_.clear(); in ResetResource()
211 workspace_size_list_.push_back(shape_size); in InitSizeLists()
212 workspace_size_list_.push_back(shape_size); in InitSizeLists()
213 workspace_size_list_.push_back(shape_size); in InitSizeLists()
214 workspace_size_list_.push_back(shape_size); in InitSizeLists()
215 workspace_size_list_.push_back(input_size_); in InitSizeLists()
216 workspace_size_list_.push_back(input_size_); in InitSizeLists()
217 workspace_size_list_.push_back(input_size_); in InitSizeLists()
218 workspace_size_list_.push_back(input_size_); in InitSizeLists()
[all …]
Dlocal_response_norm_gpu_kernel.h39 const std::vector<size_t> &GetWorkspaceSizeList() const override { return workspace_size_list_; } in GetWorkspaceSizeList()
168 workspace_size_list_.clear(); in ResetResource()
195 workspace_size_list_.push_back(shape_size); in InitSizeLists()
196 workspace_size_list_.push_back(shape_size); in InitSizeLists()
197 workspace_size_list_.push_back(shape_size); in InitSizeLists()
198 workspace_size_list_.push_back(shape_size); in InitSizeLists()
199 workspace_size_list_.push_back(input_size_); in InitSizeLists()
200 workspace_size_list_.push_back(input_size_); in InitSizeLists()
201 workspace_size_list_.push_back(num_elements_ * sizeof(float)); in InitSizeLists()
267 std::vector<size_t> workspace_size_list_; variable
Dbce_with_logits_loss_kernel.h35 const std::vector<size_t> &GetWorkspaceSizeList() const override { return workspace_size_list_; } in GetWorkspaceSizeList()
138 workspace_size_list_.clear(); in ResetResource()
147 workspace_size_list_.push_back(input_shape_.size() * sizeof(size_t)); in InitSizeLists()
148 workspace_size_list_.push_back(weight_shape_.size() * sizeof(size_t)); in InitSizeLists()
149 workspace_size_list_.push_back(pos_weight_shape_.size() * sizeof(size_t)); in InitSizeLists()
152 workspace_size_list_.push_back(input_size_ * sizeof(T)); in InitSizeLists()
184 std::vector<size_t> workspace_size_list_; variable
Dsoftmax_grad_gpu_kernel.h52 const std::vector<size_t> &GetWorkspaceSizeList() const override { return workspace_size_list_; } in GetWorkspaceSizeList()
169 workspace_size_list_.push_back(input_size_); in InitSizeLists()
170 workspace_size_list_.push_back(input_size_); in InitSizeLists()
171 workspace_size_list_.push_back(output_size_); in InitSizeLists()
172 workspace_size_list_.push_back(workspace_size_); in InitSizeLists()
173 workspace_size_list_.push_back(workspace_size_); in InitSizeLists()
174 workspace_size_list_.push_back(workspace_size_); in InitSizeLists()
218 std::vector<size_t> workspace_size_list_; variable
Dctcloss_gpu_kernel.h67 const std::vector<size_t> &GetWorkspaceSizeList() const override { return workspace_size_list_; } in GetWorkspaceSizeList()
225 workspace_size_list_.push_back(probs_dims_[0] * probs_dims_[1] * probs_dims_[2] * sizeof(T)); in InitSizeLists()
226 workspace_size_list_.push_back(sequence_lengths_size_); in InitSizeLists()
227 workspace_size_list_.push_back(sequence_lengths_size_); in InitSizeLists()
228 workspace_size_list_.push_back(label_size_); in InitSizeLists()
229 workspace_size_list_.push_back(label_size_); in InitSizeLists()
230 workspace_size_list_.push_back(probs_dims_[0] * probs_dims_[1] * probs_dims_[2] * sizeof(T)); in InitSizeLists()
231 workspace_size_list_.push_back(sequence_lengths_size_); in InitSizeLists()
232 workspace_size_list_.push_back(sizeof(int)); in InitSizeLists()
281 std::vector<size_t> workspace_size_list_; variable
Dinstance_norm_gpu_kernel.h54 const std::vector<size_t> &GetWorkspaceSizeList() const override { return workspace_size_list_; } in GetWorkspaceSizeList()
172 workspace_size_list_.push_back(para_size_); // ws gamma in InitSizeLists()
173 workspace_size_list_.push_back(para_size_); // ws beta in InitSizeLists()
174 workspace_size_list_.push_back(para_size_); // ws mean in InitSizeLists()
175 workspace_size_list_.push_back(para_size_); // ws variance in InitSizeLists()
176 workspace_size_list_.push_back(workspace_size_); in InitSizeLists()
222 std::vector<size_t> workspace_size_list_; variable
Dl2normalize_grad_gpu_kernel.h54 const std::vector<size_t> &GetWorkspaceSizeList() const override { return workspace_size_list_; } in GetWorkspaceSizeList()
81 …nsor(cudnn_handle_, reduce_tensor_descriptor_, nullptr, 0, workspace_addr, workspace_size_list_[2], in Launch()
85 GetMaxWithEpsAndValue(workspace_size_list_[0] / sizeof(T), epsilon_, reduce_workspace_addr, in Launch()
98workspace_size_list_[3], &alpha, inputA_descriptor_, dx_addr, &beta, outputC_descriptor_, in Launch()
227 workspace_size_list_.push_back(workspace_size_); in InitSizeLists()
228 workspace_size_list_.push_back(workspace_size_); in InitSizeLists()
235 workspace_size_list_.push_back(workspace_size_); in InitSizeLists()
242 workspace_size_list_.push_back(workspace_size_); in InitSizeLists()
320 std::vector<size_t> workspace_size_list_; variable
Dnll_loss_gpu_kernel.h36 const std::vector<size_t> &GetWorkspaceSizeList() const override { return workspace_size_list_; } in GetWorkspaceSizeList()
107 workspace_size_list_.clear(); in ResetResource()
122 workspace_size_list_.push_back(tmp_loss_size_); in InitSizeLists()
123 workspace_size_list_.push_back(tmp_target_weight_size_); in InitSizeLists()
136 std::vector<size_t> workspace_size_list_; variable
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/gpu/random/
Drandom_choice_with_mask_gpu_kernel.h38 const std::vector<size_t> &GetWorkspaceSizeList() const override { return workspace_size_list_; } in GetWorkspaceSizeList()
132 workspace_size_list_.push_back(input_size_ * input_shape_size_ * sizeof(S)); in InitSizeLists()
133 workspace_size_list_.push_back(ceil_power2_ * sizeof(S)); in InitSizeLists()
134 workspace_size_list_.push_back(ceil_power2_ * sizeof(S)); in InitSizeLists()
136 workspace_size_list_.push_back(blocknum * sizeof(S)); in InitSizeLists()
137 workspace_size_list_.push_back(ceil_power2_ * sizeof(S)); in InitSizeLists()
138 workspace_size_list_.push_back(ceil_power2_ * sizeof(curandState)); in InitSizeLists()
155 std::vector<size_t> workspace_size_list_; variable
Drandom_categorical_gpu_kernel.h37 const std::vector<size_t> &GetWorkspaceSizeList() const override { return workspace_size_list_; } in GetWorkspaceSizeList()
138 workspace_size_list_.push_back(sizeof(double) * num_classes_); in InitSizeLists()
140 workspace_size_list_.push_back(sizeof(double *) * batch_size_); in InitSizeLists()
143 workspace_size_list_.push_back(sizeof(double) * num_samples_); in InitSizeLists()
145 workspace_size_list_.push_back(sizeof(double *) * batch_size_); in InitSizeLists()
156 std::vector<size_t> workspace_size_list_; variable
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/gpu/math/
Dmatrix_inverse_gpu_kernel.h37 const std::vector<size_t> &GetWorkspaceSizeList() const override { return workspace_size_list_; } in GetWorkspaceSizeList()
134 workspace_size_list_.emplace_back(input_size_); in InitSizeLists()
136 workspace_size_list_.emplace_back(lu_size); in InitSizeLists()
138 workspace_size_list_.emplace_back(inv_size); in InitSizeLists()
140 workspace_size_list_.emplace_back(pivo_size); in InitSizeLists()
142 workspace_size_list_.emplace_back(info_size); in InitSizeLists()
148 std::vector<size_t> workspace_size_list_; variable
Dcholesky_solve_gpu_kernel.h52 const std::vector<size_t> &GetWorkspaceSizeList() const override { return workspace_size_list_; } in GetWorkspaceSizeList()
245 workspace_size_list_.push_back(workspace_size); in InitSizeLists()
251 (void)workspace_size_list_.insert(workspace_size_list_.begin(), workspace_size); in InitSizeLists()
253 (void)workspace_size_list_.insert(workspace_size_list_.begin(), workspace_size); in InitSizeLists()
255 (void)workspace_size_list_.insert(workspace_size_list_.begin(), workspace_size); in InitSizeLists()
277 std::vector<size_t> workspace_size_list_; variable
Dnms_with_mask_gpu_kernel.h45 const std::vector<size_t> &GetWorkspaceSizeList() const override { return workspace_size_list_; } in GetWorkspaceSizeList()
112 workspace_size_list_.push_back(ceil_power_2 * sizeof(T)); // data buff in InitSizeLists()
113 workspace_size_list_.push_back(ceil_power_2 * sizeof(int)); // index buff in InitSizeLists()
114 workspace_size_list_.push_back(num_input_ * num_input_ * sizeof(bool)); // mask list in InitSizeLists()
129 std::vector<size_t> workspace_size_list_; variable
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/gpu/nccl/
Dsync_batch_norm_gpu_kernel.h40 const std::vector<size_t> &GetWorkspaceSizeList() const override { return workspace_size_list_; } in GetWorkspaceSizeList()
178 workspace_size_list_.clear(); in ResetResource()
194 workspace_size_list_.push_back(workspace_size_ * sizeof(float)); // mean_local in InitSizeLists()
195 workspace_size_list_.push_back(workspace_size_ * sizeof(float)); // invstd_local in InitSizeLists()
196 workspace_size_list_.push_back(workspace_size_ * sizeof(int)); // count_local in InitSizeLists()
198 workspace_size_list_.push_back(workspace_size_ * sizeof(int) * group_size_); // gathered mean in InitSizeLists()
199workspace_size_list_.push_back(workspace_size_ * sizeof(float) * group_size_); // gathered invstd in InitSizeLists()
200workspace_size_list_.push_back(workspace_size_ * sizeof(float) * group_size_); // gathered count in InitSizeLists()
237 std::vector<size_t> workspace_size_list_; variable
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/gpu/sponge/pme/
Dpme_energy_update_kernel.h125 const std::vector<size_t> &GetWorkspaceSizeList() const override { return workspace_size_list_; } in GetWorkspaceSizeList()
197 workspace_size_list_.push_back(atom_numbers * sizeof(UNSIGNED_INT_VECTOR)); in InitSizeLists()
198 workspace_size_list_.push_back(atom_numbers * sizeof(VECTOR)); in InitSizeLists()
199 workspace_size_list_.push_back(PME_Nall * sizeof(T)); in InitSizeLists()
200 workspace_size_list_.push_back(PME_Nfft * sizeof(cufftComplex)); in InitSizeLists()
201 workspace_size_list_.push_back(atom_numbers * 64 * sizeof(int)); in InitSizeLists()
202 workspace_size_list_.push_back(PME_Nfft * sizeof(float)); in InitSizeLists()
203 workspace_size_list_.push_back(64 * sizeof(UNSIGNED_INT_VECTOR)); in InitSizeLists()
204 workspace_size_list_.push_back(atom_numbers * max_neighbor_numbers * sizeof(T1)); in InitSizeLists()
205 workspace_size_list_.push_back(sizeof(T)); in InitSizeLists()
[all …]
Dpme_energy_kernel.h115 const std::vector<size_t> &GetWorkspaceSizeList() const override { return workspace_size_list_; } in GetWorkspaceSizeList()
168 workspace_size_list_.push_back(atom_numbers * sizeof(UNSIGNED_INT_VECTOR)); in InitSizeLists()
169 workspace_size_list_.push_back(atom_numbers * sizeof(VECTOR)); in InitSizeLists()
170 workspace_size_list_.push_back(PME_Nall * sizeof(T)); in InitSizeLists()
171 workspace_size_list_.push_back(PME_Nfft * sizeof(cufftComplex)); in InitSizeLists()
172 workspace_size_list_.push_back(atom_numbers * 64 * sizeof(int)); in InitSizeLists()
173 workspace_size_list_.push_back(PME_Nfft * sizeof(float)); in InitSizeLists()
174 workspace_size_list_.push_back(64 * sizeof(UNSIGNED_INT_VECTOR)); in InitSizeLists()
175 workspace_size_list_.push_back(atom_numbers * max_nl_numbers * sizeof(T1)); in InitSizeLists()
237 std::vector<size_t> workspace_size_list_; variable
Dpme_reciprocal_force_kernel.h121 const std::vector<size_t> &GetWorkspaceSizeList() const override { return workspace_size_list_; } in GetWorkspaceSizeList()
154 workspace_size_list_.push_back(atom_numbers * sizeof(UNSIGNED_INT_VECTOR)); in InitSizeLists()
155 workspace_size_list_.push_back(atom_numbers * sizeof(VECTOR)); in InitSizeLists()
156 workspace_size_list_.push_back(PME_Nall * sizeof(T)); in InitSizeLists()
157 workspace_size_list_.push_back(PME_Nfft * sizeof(cufftComplex)); in InitSizeLists()
158 workspace_size_list_.push_back(atom_numbers * 64 * sizeof(int)); in InitSizeLists()
159 workspace_size_list_.push_back(PME_Nfft * sizeof(float)); in InitSizeLists()
160 workspace_size_list_.push_back(64 * sizeof(UNSIGNED_INT_VECTOR)); in InitSizeLists()
219 std::vector<size_t> workspace_size_list_; variable

12345678910>>...14