Home
last modified time | relevance | path

Searched refs:cudaMemcpyHostToDevice (Results 1 – 25 of 50) sorted by relevance

12

/third_party/boost/libs/fiber/examples/cuda/
Dmultiple_streams.cu62 … cudaMemcpyAsync( dev_a0, host_a + i, size * sizeof( int), cudaMemcpyHostToDevice, stream0); in main()
63 … cudaMemcpyAsync( dev_a1, host_a + i + size, size * sizeof( int), cudaMemcpyHostToDevice, stream1); in main()
64 … cudaMemcpyAsync( dev_b0, host_b + i, size * sizeof( int), cudaMemcpyHostToDevice, stream0); in main()
65 … cudaMemcpyAsync( dev_b1, host_b + i + size, size * sizeof( int), cudaMemcpyHostToDevice, stream1); in main()
Dsingle_stream.cu56 … cudaMemcpyAsync( dev_a, host_a + i, size * sizeof( int), cudaMemcpyHostToDevice, stream); in main()
57 … cudaMemcpyAsync( dev_b, host_b + i, size * sizeof( int), cudaMemcpyHostToDevice, stream); in main()
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/gpu/math/
Dcholesky_solve_gpu_kernel.h71 cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
76cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
80cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
99cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
103cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
Dcast_all_gpu_kernel.h55 …cudaMemcpyAsync(inputs_dev, in_addr.get(), sizeof(T *) * num_input_, cudaMemcpyHostToDevice, strea… in Launch()
59 …cudaMemcpyAsync(outputs_dev, out_addr.get(), sizeof(S *) * num_input_, cudaMemcpyHostToDevice, str… in Launch()
62 …udaMemcpyAsync(size_dev, size_.get(), sizeof(size_t) * num_input_, cudaMemcpyHostToDevice, stream), in Launch()
Dcholesky_trsm_solve_gpu_kernel.h141 cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in LaunchNonSplitMatrix()
146cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in LaunchNonSplitMatrix()
150cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in LaunchNonSplitMatrix()
179cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in LaunchSplitMatrix()
183cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in LaunchSplitMatrix()
Dmatrix_inverse_gpu_kernel.h64cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
68cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/gpu/arrays/
Dreverse_v2_gpu_kernel.h52cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
57cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
61 … cudaMemcpyAsync(axis_device, &axis_[0], workspace_size_list_[2], cudaMemcpyHostToDevice, in Launch()
Dextract_image_patches_gpu_kernel.h60 … cudaMemcpyAsync(input_shape, &input_shape_[0], shape_size, cudaMemcpyHostToDevice, in Launch()
64 … cudaMemcpyAsync(input_to_nhwc_axis, &to_nhwc_axis[0], shape_size, cudaMemcpyHostToDevice, in Launch()
68 … cudaMemcpyAsync(t_output_shape, &t_output_shape_[0], shape_size, cudaMemcpyHostToDevice, in Launch()
73cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
Dsort_gpu_kernel.h61cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
65 … cudaMemcpyAsync(perm_device, &perm_[0], workspace_size_list_[3], cudaMemcpyHostToDevice, in Launch()
98cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
Dtile_gpu_kernel.h49cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
54 cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
Dtranspose_gpu_kernel.h48 … cudaMemcpyAsync(input_shape, &input_shape_[0], workspace_size_, cudaMemcpyHostToDevice, in Launch()
52 … cudaMemcpyAsync(input_axis, &input_axis_[0], workspace_size_, cudaMemcpyHostToDevice, in Launch()
Dconcatv2_gpu_kernel.h63cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
67cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
Dgathernd_gpu_kernel.h60cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
64cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/gpu/nn/
Dpad_gpu_kernel.h58cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
63cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
68cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
Dlocal_response_norm_gpu_kernel.h64 … cudaMemcpyAsync(ws_input_shape, &input_shape_[0], shape_size, cudaMemcpyHostToDevice, in Launch()
69cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
72 … cudaMemcpyAsync(ws_to_nhwc_axis, &to_nhwc_axis[0], shape_size, cudaMemcpyHostToDevice, in Launch()
76 … cudaMemcpyAsync(ws_to_nchw_axis, &to_nchw_axis[0], shape_size, cudaMemcpyHostToDevice, in Launch()
Dbce_with_logits_loss_kernel.h53cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
57cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
62 cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
Dlocal_response_norm_grad_gpu_kernel.h70 … cudaMemcpyAsync(ws_input_shape, &input_shape_[0], shape_size, cudaMemcpyHostToDevice, in Launch()
75cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
78 … cudaMemcpyAsync(ws_to_nhwc_axis, &to_nhwc_axis[0], shape_size, cudaMemcpyHostToDevice, in Launch()
82 … cudaMemcpyAsync(ws_to_nchw_axis, &to_nchw_axis[0], shape_size, cudaMemcpyHostToDevice, in Launch()
Dsoftmax_grad_gpu_kernel.h79 … cudaMemcpyAsync(input_shape, &input_shape_[0], workspace_size_, cudaMemcpyHostToDevice, in Launch()
84cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
88cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
Dsoftmax_gpu_kernel.h77 … cudaMemcpyAsync(input_shape, &input_shape_[0], workspace_size_, cudaMemcpyHostToDevice, in Launch()
82cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
86cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/gpu/random/
Drandom_categorical_gpu_kernel.h55 … host_cdf.get(), sizeof(double *) * batch_size_, cudaMemcpyHostToDevice, in Launch()
78cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
83 … host_rand.get(), sizeof(double *) * batch_size_, cudaMemcpyHostToDevice, in Launch()
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/gpu/quant/
Dfake_learned_scale_quant_perlayer_grad_gpu_kernel.cc106 … cudaMemcpyAsync(grad_alpha, alpha_no_grad, sizeof(float), cudaMemcpyHostToDevice, in Launch()
115 … cudaMemcpyAsync(grad_alpha, alpha_no_grad, sizeof(float), cudaMemcpyHostToDevice, in Launch()
Dfake_learned_scale_quant_perchannel_grad_gpu_kernel.cc112cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
121cudaMemcpyHostToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)), in Launch()
/third_party/mindspore/tests/ut/cpp/stub/runtime/
Dcuda_runtime_api.h26 cudaMemcpyHostToDevice = 1, enumerator
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/gpu/sponge/neighbor_list/
Dneighbor_list_update_kernel.h97 …aMemcpyAsync(d_bucket, h_bucket.data(), sizeof(GRID_BUCKET) * grid_numbers, cudaMemcpyHostToDevice, in Launch()
99 …pyAsync(d_gpointer, h_gpointer.data(), sizeof(GRID_POINTER) * grid_numbers, cudaMemcpyHostToDevice, in Launch()
Dneighbor_list_update_new_kernel.h98 …aMemcpyAsync(d_bucket, h_bucket.data(), sizeof(GRID_BUCKET) * grid_numbers, cudaMemcpyHostToDevice, in Launch()
100 …pyAsync(d_gpointer, h_gpointer.data(), sizeof(GRID_POINTER) * grid_numbers, cudaMemcpyHostToDevice, in Launch()

12