Home
last modified time | relevance | path

Searched defs:dprops (Results 1 – 7 of 7) sorted by relevance

/external/pytorch/aten/src/ATen/native/transformers/cuda/
Dsdp_utils.cpp57 bool use_tensor_cores(sdp_params const& params, cudaDeviceProp* dprops, bool is_half) { in use_tensor_cores()
67 auto dprops = at::cuda::getCurrentDeviceProperties(); in minimum_gemm_alignment() local
173 bool check_sm_version(cudaDeviceProp * dprops) { in check_sm_version()
190 auto dprops = at::cuda::getCurrentDeviceProperties(); in check_flash_attention_hardware_support() local
198 auto dprops = at::cuda::getCurrentDeviceProperties(); in check_flash_attention_hardware_support() local
221 auto dprops = at::cuda::getCurrentDeviceProperties(); in check_mem_efficient_hardware_support() local
229 auto dprops = at::cuda::getCurrentDeviceProperties(); in check_mem_efficient_hardware_support() local
252 auto dprops = at::cuda::getCurrentDeviceProperties(); in check_requires_grad_and_head_dim_gt192_constraints_on_sm86_89() local
439 auto dprops = at::cuda::getCurrentDeviceProperties(); in check_cudnn_hardware_support() local
/external/pytorch/aten/src/ATen/native/transformers/cuda/flash_attn/
Dflash_fwd_launch_template.h209 auto dprops = at::cuda::getCurrentDeviceProperties(); in run_mha_fwd_hdim96() local
235 auto dprops = at::cuda::getCurrentDeviceProperties(); in run_mha_fwd_hdim128() local
272 auto dprops = at::cuda::getCurrentDeviceProperties(); in run_mha_fwd_hdim160() local
Dflash_api.cpp300 const int num_splits, cudaDeviceProp *dprops, struct c10::TensorOptions opts) { in set_params_splitkv()
363 auto dprops = at::cuda::getCurrentDeviceProperties(); in mha_fwd() local
563 auto dprops = at::cuda::getCurrentDeviceProperties(); in mha_varlen_fwd() local
830 auto dprops = at::cuda::getCurrentDeviceProperties(); in mha_bwd() local
1048 auto dprops = at::cuda::getCurrentDeviceProperties(); in mha_varlen_bwd() local
1273 auto dprops = at::cuda::getCurrentDeviceProperties(); in mha_fwd_kvcache() local
Dflash_bwd_launch_template.h80 auto dprops = at::cuda::getCurrentDeviceProperties(); in run_flash_bwd_seqk_parallel() local
/external/pytorch/aten/src/ATen/native/sparse/cuda/
DSparseSemiStructuredLinear.cu636 const auto dprops = at::cuda::getCurrentDeviceProperties(); in _sparse_semi_structured_linear() local
/external/pytorch/aten/src/ATen/native/nested/cuda/
DNestedTensorMatmul.cu373 auto dprops = at::cuda::getCurrentDeviceProperties(); in bmm_nested_cuda() local
/external/pytorch/aten/src/ATen/native/cuda/
DBlas.cpp863 auto dprops = at::cuda::getCurrentDeviceProperties(); in _scaled_mm_allowed_device() local