Home
last modified time | relevance | path

Searched refs:bytes_accessed (Results 1 – 9 of 9) sorted by relevance

/external/tensorflow/tensorflow/compiler/xla/service/
Dhuman_readable_profile_builder.cc41 if (op.cycles <= 0 || op.bytes_accessed < 0) { in ToString()
46 HumanReadableNumBytes(op.bytes_accessed / CyclesToSeconds(op.cycles)); in ToString()
47 if (op.bytes_accessed > op.cycles) { in ToString()
48 bytes_per_cycle = HumanReadableNumBytes(op.bytes_accessed / op.cycles); in ToString()
51 Printf("%.3fB", static_cast<float>(op.bytes_accessed) / op.cycles); in ToString()
84 total_bytes += op.bytes_accessed; in ToString()
Dhuman_readable_profile_builder.h48 int64 transcendental_count, int64 bytes_accessed, in AddOp() argument
52 flop_count, transcendental_count, bytes_accessed, optimal_seconds}); in AddOp()
66 int64 bytes_accessed; member
Dhlo_cost_analysis_test.cc165 EXPECT_EQ(analysis.bytes_accessed(), in TEST_F()
183 EXPECT_EQ(analysis.bytes_accessed(), 80); in TEST_F()
209 EXPECT_EQ(analysis.bytes_accessed(), in TEST_F()
388 constexpr int64 bytes_accessed = sizeof(float) * 4 * 2 * 2; in TEST_F() local
389 static_assert(bytes_accessed == 64, ""); in TEST_F()
390 EXPECT_EQ(fusion_analysis.bytes_accessed(), bytes_accessed); in TEST_F()
440 EXPECT_EQ(analysis.bytes_accessed(), kPointerSize * 2); in TEST_F()
Dhlo_cost_analysis.cc51 float bytes_accessed = shape_size_(hlo->shape()); in Preprocess() local
53 bytes_accessed += shape_size_(operand->shape()); in Preprocess()
55 current_properties_[kBytesAccessedKey] = bytes_accessed; in Preprocess()
553 float HloCostAnalysis::bytes_accessed() const { in bytes_accessed() function in xla::HloCostAnalysis
569 int64 HloCostAnalysis::bytes_accessed(const HloInstruction& hlo) const { in bytes_accessed() function in xla::HloCostAnalysis
Dhlo_cost_analysis.h124 float bytes_accessed() const;
131 int64 bytes_accessed(const HloInstruction& hlo) const;
Dhlo_profile_printer.cc55 instruction_info.bytes_accessed(), in PrintHloProfile()
Dhlo_execution_profile.cc97 instruction_info->set_bytes_accessed(cost_analysis.bytes_accessed(*hlo)); in CreateHloProfilePrinterData()
Dhlo_profile_printer_data.proto34 float bytes_accessed = 6; field
/external/tensorflow/tensorflow/compiler/xla/service/cpu/
Dparallel_task_assignment.cc65 const int64 bytes_accessed = in GetParallelTaskCount() local
66 std::max(1LL, cost_analysis_->bytes_accessed(*instruction)); in GetParallelTaskCount()
69 static_cast<float>(bytes_accessed); in GetParallelTaskCount()
90 10 * cost_analysis_->bytes_accessed(*instruction); in GetParallelTaskCount()