Home
last modified time | relevance | path

Searched refs:flops (Results 1 – 16 of 16) sorted by relevance

/external/tensorflow/tensorflow/core/profiler/g3doc/
Dprofile_model_architecture.md48 * It must have `RegisterStatistics('flops')` defined in TensorFlow. tfprof
51 * It must have known "shape" information for RegisterStatistics('flops')
70 _TFProfRoot (--/17.63b flops)
71 gradients/pool_logit/xw_plus_b/MatMul_grad/MatMul (163.84k/163.84k flops)
72 gradients/pool_logit/xw_plus_b/MatMul_grad/MatMul_1 (163.84k/163.84k flops)
73 init/init_conv/Conv2D (113.25m/113.25m flops)
74 pool_logit/xw_plus_b (1.28k/165.12k flops)
75 pool_logit/xw_plus_b/MatMul (163.84k/163.84k flops)
76 unit_1_0/sub1/conv1/Conv2D (603.98m/603.98m flops)
77 unit_1_0/sub2/conv2/Conv2D (603.98m/603.98m flops)
[all …]
Dcommand_line.md299 # Get run-time shape information in order to fill shapes and get flops.
/external/eigen/bench/perf_monitoring/gemm/
Dgemm.cpp43 double flops = 2. * m * n * k; in bench() local
44 long rep = std::max(1., std::min(100., up/flops) ); in bench()
45 long tries = std::max(tm0, std::min(tm1, up/flops) ); in bench()
49 return 1e-9 * rep * flops / t.best(); in bench()
Dlazy_gemm.cpp44 double flops = 2. * m * n * k; in bench() local
45 long rep = std::max(10., std::min(10000., up/flops) ); in bench()
46 long tries = std::max(tm0, std::min(tm1, up/flops) ); in bench()
50 return 1e-9 * rep * flops / t.best(); in bench()
/external/tensorflow/tensorflow/contrib/tpu/profiler/
Dop_profile.proto58 // - utilization is flops/time
59 // - wasted potential flops is proportional to time - flops
61 double flops = 2; field
/external/tensorflow/tensorflow/compiler/xla/tests/
Dxla_hlo_profile_test.cc45 string flops; member
54 if (RE2::FullMatch(parsed_line.flops, "[0-9.TGMk]+FLOP/s")) { in HasFlops()
57 << parsed_line.flops << "'"; in HasFlops()
62 << parsed_line.flops << "'"; in HasFlops()
105 &parsed_line.usec, &parsed_line.flops, &parsed_line.trops, in ParseOneProfileOutputLine()
/external/tensorflow/tensorflow/python/kernel_tests/
Dmatmul_op_test.py143 flops = ops.get_stats_for_node_def(g, op.node_def, "flops").value
145 self.assertEqual(7200, flops)
154 flops = ops.get_stats_for_node_def(g, op.node_def, "flops").value
156 self.assertEqual(7200, flops)
/external/tensorflow/tensorflow/compiler/xla/
Dutil.cc237 string HumanReadableNumOps(double flops, double nanoseconds, in HumanReadableNumOps() argument
242 double nano_flops = flops / nanoseconds; in HumanReadableNumOps()
256 string HumanReadableNumFlops(double flops, double nanoseconds) { in HumanReadableNumFlops() argument
257 return HumanReadableNumOps(flops, nanoseconds, "FL"); in HumanReadableNumFlops()
Dutil.h380 string HumanReadableNumFlops(double flops, double nanoseconds);
/external/tensorflow/tensorflow/compiler/xla/service/
Dhlo_cost_analysis.cc420 double flops = 0.0; in HandleCrossReplicaSum() local
424 flops += ShapeUtil::ElementsIn(subshape); in HandleCrossReplicaSum()
427 current_properties_[kFlopsKey] = flops; in HandleCrossReplicaSum()
/external/llvm/test/CodeGen/X86/
Dbreak-false-dep.ll109 ; flops-6. Make sure the unused register read by vcvtsi2sdq is zeroed
/external/eigen/unsupported/Eigen/
DMatrixFunctions455 cost is approximately \f$ 25 n^3 \f$ real flops for the real Schur
456 decomposition and \f$ 3\frac13 n^3 \f$ real flops for the remainder
/external/tensorflow/tensorflow/python/framework/
Dops_test.py2368 flops = ops.get_stats_for_node_def(graph, node, "flops")
2369 self.assertEqual(20, flops.value)
/external/llvm/lib/Target/X86/
DREADME.txt1011 From flops:
/external/swiftshader/third_party/LLVM/lib/Target/X86/
DREADME.txt1174 From flops:
/external/jline/src/src/test/resources/jline/example/
Denglish.gz