/external/tensorflow/tensorflow/compiler/xla/service/gpu/ |
D | kernel_mapping_scheme.h | 116 return CeilOfRatio(dims_in_elems_[0], GetTileSizeZ()) * in GetNumberOfBlocks() 117 CeilOfRatio(dims_in_elems_[1], GetTileSizeY()) * in GetNumberOfBlocks() 118 CeilOfRatio(dims_in_elems_[2], GetTileSizeX()); in GetNumberOfBlocks()
|
D | launch_dimensions.cc | 92 int64 block_count = CeilOfRatio(num_elements, threads_per_block); in CalculateLaunchDimensions()
|
D | ir_emission_utils.cc | 526 int num_segments = CeilOfRatio(bit_width, 32); in EmitFullWarpShuffleDown()
|
/external/tensorflow/tensorflow/compiler/xla/client/ |
D | padding.cc | 123 tensorflow::MathUtil::CeilOfRatio(input_dimension, window_stride); in MakePadding() 130 tensorflow::MathUtil::CeilOfRatio(padding_size, int64{2})); in MakePadding()
|
D | sharding_builder.cc | 64 tile_dimension = CeilOfRatio(static_cast<int64>(tile_dimension), num_tiles); in Tile1D()
|
/external/tensorflow/tensorflow/compiler/xla/ |
D | reference_util.h | 345 CeilOfRatio(limits[0] - starts[0], strides[0]), in Slice2D() 346 CeilOfRatio(limits[1] - starts[1], strides[1])); in Slice2D() 371 CeilOfRatio(limits[0] - starts[0], strides[0]), in Slice3D() 372 CeilOfRatio(limits[1] - starts[1], strides[1]), in Slice3D() 373 CeilOfRatio(limits[2] - starts[2], strides[2])); in Slice3D() 405 CeilOfRatio(limits[0] - starts[0], strides[0]), in Slice4D() 406 CeilOfRatio(limits[1] - starts[1], strides[1]), in Slice4D() 407 CeilOfRatio(limits[2] - starts[2], strides[2]), in Slice4D() 408 CeilOfRatio(limits[3] - starts[3], strides[3])); in Slice4D()
|
D | util.h | 410 T CeilOfRatio(T dividend, T divisor) { in CeilOfRatio() function 411 return tensorflow::MathUtil::CeilOfRatio<T>(dividend, divisor); in CeilOfRatio() 418 return CeilOfRatio(value, divisor) * divisor; in RoundUpToNearest()
|
/external/tensorflow/tensorflow/core/lib/math/ |
D | math_util_test.cc | 50 IntegralType ceil_1 = MathUtil::CeilOfRatio(numerator, denominator); in TestCeilOfRatio() 172 const int64 correct_result = MathUtil::CeilOfRatio(numerator, denominator); in TestThatCeilOfRatioDenomMinusOneIsIncorrect() 189 TEST(MathUtil, CeilOfRatio) { in TEST() argument
|
D | math_util.h | 51 static IntegralType CeilOfRatio(IntegralType numerator, in CeilOfRatio() function
|
/external/tensorflow/tensorflow/stream_executor/ |
D | device_description.cc | 151 return port::MathUtil::CeilOfRatio(x, y); in DivideCeil() 158 *block_count = port::MathUtil::CeilOfRatio(element_count, *threads_per_block); in CalculateDimensionality()
|
/external/tensorflow/tensorflow/compiler/xla/client/lib/ |
D | sorting.cc | 42 CeilOfRatio(last_dim_size - k, kPerPartitionSize - k); in TopK() 84 const int64 per_partition_size = CeilOfRatio(last_dim_size, num_partitions); in TopKWithPartitions()
|
D | quantize_test.cc | 58 int64 padded_output_width = CeilOfRatio(width, size_per_pack); in PackLargeInput() 85 int64 padded_output_width = CeilOfRatio(width, size_per_pack) * size_per_pack; in GenerateLargeSizeMinCombinedOutput() 152 CeilOfRatio(output_size, pack_size) * pack_size - output_size; in GenerateMinCombinedOutput()
|
D | quantize.h | 53 const int64 output_size = CeilOfRatio(input_size, kElementsPerPack); in PackToUint32()
|
D | prng.cc | 202 half_shape_dims.push_back(CeilOfRatio<int64>(shape.dimensions(i), 2)); in SplitShapeIntoHalves() 395 const int64 num_vector4 = CeilOfRatio<int64>(num_elems, 4); in GeneratePhiloxBits()
|
/external/tensorflow/tensorflow/compiler/xla/service/ |
D | hlo_sharding.cc | 280 index[i] * CeilOfRatio(shape_dim, tile_assignment_.dim(i)), shape_dim); in TileOffsetForDevice() 301 (index[i] + 1) * CeilOfRatio(shape_dim, tile_assignment_.dim(i)), in TileLimitForDevice() 574 i, CeilOfRatio<int64>(shape.dimensions(i), tile_assignment_.dim(i))); in TileShape() 589 index[i] * CeilOfRatio(shape_dim, tile_assignment_.dim(i)), shape_dim); in TileShape() 591 (index[i] + 1) * CeilOfRatio(shape_dim, tile_assignment_.dim(i)), in TileShape()
|
D | space_to_batch_converter.cc | 336 if (c.halo_size > CeilOfRatio(c.spatial_size, kNumSplits)) { in IsConvSuitableForSpaceToBatch() 1913 CeilOfRatio(output_offsets, num_splits); in PropagateOnConv() 1916 CeilOfRatio(output_offsets_per_split, c.base_dilation_factor) * c.stride; in PropagateOnConv() 2238 CeilOfRatio(new_split_dim_size, rhs_dilation); in PropagateOnBackpropFilterConv() 2517 ->set_size(CeilOfRatio(new_split_dim_size, rhs_dilation)); in PropagateOnBackpropFilterConv() 2679 CeilOfRatio(output_offsets, kNumSplits); in PerformSpaceToBatchOnConvolution() 2682 CeilOfRatio(output_offsets_per_split, c.base_dilation_factor) * c.stride; in PerformSpaceToBatchOnConvolution()
|
D | sharding_propagation.cc | 1187 const int64 tile_shape = CeilOfRatio(user.shape().dimensions(cdim), in GetShardingFromUser() 1192 end_indices[cdim] = CeilOfRatio( in GetShardingFromUser()
|
/external/tensorflow/tensorflow/stream_executor/lib/ |
D | mathutil.h | 34 static IntegralType CeilOfRatio(IntegralType numerator, in CeilOfRatio() function
|
/external/tensorflow/tensorflow/stream_executor/gpu/ |
D | redzone_allocator.cc | 39 return tensorflow::MathUtil::CeilOfRatio(value, divisor) * divisor; in RoundUpToNearest() 226 tensorflow::MathUtil::CeilOfRatio(num_elements, threads_per_block); in RunRedzoneChecker()
|
/external/tensorflow/tensorflow/compiler/tf2xla/kernels/ |
D | spmd_manual_sharding_ops.cc | 56 xla::CeilOfRatio(output_shape.dimensions(i), partitions_i); in Compile()
|
/external/tensorflow/tensorflow/core/kernels/ |
D | conv_2d_gpu.h | 969 MathUtil::CeilOfRatio<int>(input_dims[1], requested_tile_size_i), 970 MathUtil::CeilOfRatio<int>(input_dims[2], requested_tile_size_j), 1009 MathUtil::CeilOfRatio<int>(input_dims[1], kTileSize), 1010 MathUtil::CeilOfRatio<int>(input_dims[2], kTileSize),
|
D | clustering_ops.cc | 67 int64 CeilOfRatio(int64 a, int64 b) { return (a + b - 1) / b; } in CeilOfRatio() function 390 NextMultiple(num_threads, CeilOfRatio(num_points, rows_per_block)); in Compute()
|
/external/tensorflow/tensorflow/compiler/xla/service/spmd/ |
D | convolution_handler.cc | 332 CeilOfRatio(lhs.base_shape().dimensions(lhs_dimension), shard_count); in PartitionConvolutionWithSpatialDimensionHaloExchangeOnRHS() 334 CeilOfRatio(rhs.base_shape().dimensions(rhs_dimension), shard_count); in PartitionConvolutionWithSpatialDimensionHaloExchangeOnRHS() 641 CeilOfRatio(lhs.base_shape().dimensions(lhs_dimension), shard_count); in PartitionConvolutionWithSpatialDimensionHaloExchangeOnLHS() 643 CeilOfRatio(rhs.base_shape().dimensions(rhs_dimension), shard_count); in PartitionConvolutionWithSpatialDimensionHaloExchangeOnLHS()
|
D | fft_handler.cc | 58 CeilOfRatio(size_per_partition, num_partitions) * num_partitions; in PadEachPartitionWithHaloExchange()
|
D | spmd_partitioner_util.cc | 819 for (int64 i = CeilOfRatio(max_left_halo_size, input_shard_size) - 1; i >= 0; in ExchangeHalo() 853 for (int64 i = 0; i < CeilOfRatio(max_right_halo_size, input_shard_size); in ExchangeHalo() 1251 const int64 per_partition_size = CeilOfRatio(input_size, shard_count); in GetKValueInTopKWhenPartitionSortDim()
|