/external/tensorflow/tensorflow/compiler/xla/service/ |
hlo_profile_printer_data.proto | 34 float bytes_accessed = 6;
|
human_readable_profile_builder.h | 50 int64 transcendental_count, int64 bytes_accessed, 54 bytes_accessed, optimal_seconds}); 68 int64 bytes_accessed; // -1 if unknown member in struct:xla::HumanReadableProfileBuilder::OpInfo
|
hlo_profile_printer.cc | 62 instruction_info.bytes_accessed(),
|
human_readable_profile_builder.cc | 51 if (op.cycles > 0 && op.bytes_accessed >= 0) { 53 HumanReadableNumBytes(op.bytes_accessed / CyclesToSeconds(op.cycles)), 55 double bpc = static_cast<double>(op.bytes_accessed) / op.cycles; 56 if (op.bytes_accessed > op.cycles) { 119 total_bytes += std::max(op.bytes_accessed, int64{0}); 211 entry.metric = static_cast<double>(op.bytes_accessed) / (1 << 20);
|
hlo_cost_analysis_test.cc | 157 EXPECT_EQ(analysis.bytes_accessed(), 186 EXPECT_EQ(analysis.bytes_accessed(), 215 EXPECT_EQ(analysis.bytes_accessed(), 238 EXPECT_EQ(analysis.bytes_accessed(), 256 EXPECT_EQ(analysis.bytes_accessed(), 80); 284 EXPECT_EQ(analysis.bytes_accessed(), 313 EXPECT_EQ(analysis.bytes_accessed(), 489 constexpr int64 bytes_accessed = sizeof(float) * 4 * 2 * 2; local 490 static_assert(bytes_accessed == 64, ""); 491 EXPECT_EQ(fusion_analysis.bytes_accessed(), bytes_accessed) [all...] |
hlo_cost_analysis.cc | 52 float bytes_accessed = GetShapeSize(hlo->shape()); local 54 bytes_accessed += GetShapeSize(operand->shape()); 56 current_properties_[kBytesAccessedKey] = bytes_accessed; 551 float bytes_accessed = GetShapeSize(hlo->operand(0)->shape()) / 2.0f; local 552 bytes_accessed += GetShapeSize(hlo->operand(1)->shape()); 553 current_properties_[kBytesAccessedKey] = bytes_accessed; 565 float bytes_accessed = GetShapeSize(hlo->operand(0)->shape()) / 2.0f; local 566 current_properties_[kBytesAccessedKey] = bytes_accessed; 753 float HloCostAnalysis::bytes_accessed() const { function in class:xla::HloCostAnalysis 769 int64 HloCostAnalysis::bytes_accessed(const HloInstruction& hlo) const function in class:xla::HloCostAnalysis [all...] |
hlo_execution_profile.cc | 105 instruction_info->set_bytes_accessed(cost_analysis.bytes_accessed(*hlo));
|
hlo_cost_analysis.h | 135 float bytes_accessed() const; 142 int64 bytes_accessed(const HloInstruction& hlo) const; 200 // including nested elements, if any). If null then bytes_accessed methods
|
/external/tensorflow/tensorflow/compiler/xla/service/cpu/ |
parallel_task_assignment.cc | 67 const int64 bytes_accessed = variable 68 std::max(int64{1}, cost_analysis_->bytes_accessed(*instruction)); 71 static_cast<float>(bytes_accessed); 92 10 * cost_analysis_->bytes_accessed(*instruction);
|
/external/tensorflow/tensorflow/compiler/xla/service/gpu/ |
nvptx_compiler.cc | [all...] |