Searched refs:device_sqrt (Results 1 – 4 of 4) sorted by relevance
8 static __forceinline__ __device__ scalar_t device_sqrt(scalar_t val);11 __forceinline__ __device__ float device_sqrt(float val) { in device_sqrt() function16 __forceinline__ __device__ double device_sqrt(double val) { in device_sqrt() function21 __forceinline__ __device__ double device_sqrt(scalar_t val) {
60 …e__ scalar_t finish(const scalar_t agg, const scalar_t /*p*/) { return device_sqrt<scalar_t>(agg);… in finish()102 int64_t i = static_cast<int64_t>((n2 - device_sqrt<double>(n2_squared_minus_1 - 2 * k))); in pdist_kernel_cuda_impl()166 int64_t i = static_cast<int64_t>((n2 - device_sqrt<double>(n2_squared_minus_1 - 2 * k))); in pdist_backward_kernel_cuda_impl()
234 …invstd = static_cast<stat_accscalar_t>(1) / device_sqrt(static_cast<stat_accscalar_t>(var_or_invst… in batch_norm_transform_input_kernel()255 invstd = static_cast<T>(1) / device_sqrt(var + epsilon); in operator ()()379 …invstd = static_cast<stat_accscalar_t>(1) / device_sqrt(static_cast<stat_accscalar_t>(running_var[… in batch_norm_backward_kernel()460 invstd[i] = static_cast<accscalar_t>(1) / device_sqrt(var_n / n + epsilon); in batch_norm_reduce_statistics_kernel()
21 #define device_sqrt std::sqrt macro139 res_t results(take_sqrt ? device_sqrt(var) : var, mean); in project()378 return device_sqrt(a); in project()