Searched refs:bytes_accessed (Results 1 – 9 of 9) sorted by relevance
/external/tensorflow/tensorflow/compiler/xla/service/ |
D | human_readable_profile_builder.cc | 41 if (op.cycles <= 0 || op.bytes_accessed < 0) { in ToString() 46 HumanReadableNumBytes(op.bytes_accessed / CyclesToSeconds(op.cycles)); in ToString() 47 if (op.bytes_accessed > op.cycles) { in ToString() 48 bytes_per_cycle = HumanReadableNumBytes(op.bytes_accessed / op.cycles); in ToString() 51 Printf("%.3fB", static_cast<float>(op.bytes_accessed) / op.cycles); in ToString() 84 total_bytes += op.bytes_accessed; in ToString()
|
D | human_readable_profile_builder.h | 48 int64 transcendental_count, int64 bytes_accessed, in AddOp() argument 52 flop_count, transcendental_count, bytes_accessed, optimal_seconds}); in AddOp() 66 int64 bytes_accessed; member
|
D | hlo_cost_analysis_test.cc | 165 EXPECT_EQ(analysis.bytes_accessed(), in TEST_F() 183 EXPECT_EQ(analysis.bytes_accessed(), 80); in TEST_F() 209 EXPECT_EQ(analysis.bytes_accessed(), in TEST_F() 388 constexpr int64 bytes_accessed = sizeof(float) * 4 * 2 * 2; in TEST_F() local 389 static_assert(bytes_accessed == 64, ""); in TEST_F() 390 EXPECT_EQ(fusion_analysis.bytes_accessed(), bytes_accessed); in TEST_F() 440 EXPECT_EQ(analysis.bytes_accessed(), kPointerSize * 2); in TEST_F()
|
D | hlo_cost_analysis.cc | 51 float bytes_accessed = shape_size_(hlo->shape()); in Preprocess() local 53 bytes_accessed += shape_size_(operand->shape()); in Preprocess() 55 current_properties_[kBytesAccessedKey] = bytes_accessed; in Preprocess() 553 float HloCostAnalysis::bytes_accessed() const { in bytes_accessed() function in xla::HloCostAnalysis 569 int64 HloCostAnalysis::bytes_accessed(const HloInstruction& hlo) const { in bytes_accessed() function in xla::HloCostAnalysis
|
D | hlo_cost_analysis.h | 124 float bytes_accessed() const; 131 int64 bytes_accessed(const HloInstruction& hlo) const;
|
D | hlo_profile_printer.cc | 55 instruction_info.bytes_accessed(), in PrintHloProfile()
|
D | hlo_execution_profile.cc | 97 instruction_info->set_bytes_accessed(cost_analysis.bytes_accessed(*hlo)); in CreateHloProfilePrinterData()
|
D | hlo_profile_printer_data.proto | 34 float bytes_accessed = 6; field
|
/external/tensorflow/tensorflow/compiler/xla/service/cpu/ |
D | parallel_task_assignment.cc | 65 const int64 bytes_accessed = in GetParallelTaskCount() local 66 std::max(1LL, cost_analysis_->bytes_accessed(*instruction)); in GetParallelTaskCount() 69 static_cast<float>(bytes_accessed); in GetParallelTaskCount() 90 10 * cost_analysis_->bytes_accessed(*instruction); in GetParallelTaskCount()
|