Home
last modified time | relevance | path

Searched refs:flops (Results 1 – 23 of 23) sorted by relevance

/external/tensorflow/tensorflow/core/profiler/g3doc/
Dprofile_model_architecture.md48 * It must have `RegisterStatistics('flops')` defined in TensorFlow. tfprof
52 * It must have known "shape" information for RegisterStatistics('flops') to
70 _TFProfRoot (--/17.63b flops)
71 gradients/pool_logit/xw_plus_b/MatMul_grad/MatMul (163.84k/163.84k flops)
72 gradients/pool_logit/xw_plus_b/MatMul_grad/MatMul_1 (163.84k/163.84k flops)
73 init/init_conv/Conv2D (113.25m/113.25m flops)
74 pool_logit/xw_plus_b (1.28k/165.12k flops)
75 pool_logit/xw_plus_b/MatMul (163.84k/163.84k flops)
76 unit_1_0/sub1/conv1/Conv2D (603.98m/603.98m flops)
77 unit_1_0/sub2/conv2/Conv2D (603.98m/603.98m flops)
[all …]
Dcommand_line.md299 # Get run-time shape information in order to fill shapes and get flops.
/external/eigen/bench/perf_monitoring/gemm/
Dgemm.cpp43 double flops = 2. * m * n * k; in bench() local
44 long rep = std::max(1., std::min(100., up/flops) ); in bench()
45 long tries = std::max(tm0, std::min(tm1, up/flops) ); in bench()
49 return 1e-9 * rep * flops / t.best(); in bench()
Dlazy_gemm.cpp44 double flops = 2. * m * n * k; in bench() local
45 long rep = std::max(10., std::min(10000., up/flops) ); in bench()
46 long tries = std::max(tm0, std::min(tm1, up/flops) ); in bench()
50 return 1e-9 * rep * flops / t.best(); in bench()
/external/tensorflow/tensorflow/core/kernels/
Deigen_benchmark_cpu_test.cc53 auto flops = in SpatialConvolution() local
55 ::tensorflow::testing::ItemsProcessed(flops * iters); in SpatialConvolution()
81 auto flops = in SpatialConvolutionBackwardInput() local
83 ::tensorflow::testing::ItemsProcessed(flops * iters); in SpatialConvolutionBackwardInput()
109 auto flops = in SpatialConvolutionBackwardKernel() local
111 ::tensorflow::testing::ItemsProcessed(flops * iters); in SpatialConvolutionBackwardKernel()
275 auto flops = num_computed_elements * in CuboidConvolution() local
277 ::tensorflow::testing::ItemsProcessed(flops * iters); in CuboidConvolution()
304 auto flops = num_computed_elements * in CuboidConvolutionBackwardInput() local
306 ::tensorflow::testing::ItemsProcessed(flops * iters); in CuboidConvolutionBackwardInput()
[all …]
/external/tensorflow/tensorflow/core/profiler/
Dop_profile.proto64 // - utilization is flops/time
65 // - wasted potential flops is proportional to time - flops
67 double flops = 2; field
/external/tensorflow/tensorflow/compiler/xla/
Dutil.cc151 string HumanReadableNumOps(double flops, double nanoseconds, in HumanReadableNumOps() argument
156 double nano_flops = flops / nanoseconds; in HumanReadableNumOps()
170 string HumanReadableNumFlops(double flops, double nanoseconds) { in HumanReadableNumFlops() argument
171 return HumanReadableNumOps(flops, nanoseconds, "FL"); in HumanReadableNumFlops()
Dutil.h437 string HumanReadableNumFlops(double flops, double nanoseconds);
/external/tensorflow/tensorflow/compiler/xla/tests/
Dxla_hlo_profile_test.cc49 string flops; member
58 if (RE2::FullMatch(parsed_line.flops, "[0-9.TGMk]+FLOP/s")) { in HasFlops()
61 << parsed_line.flops << "'"; in HasFlops()
66 << parsed_line.flops << "'"; in HasFlops()
110 &parsed_line.usec, &parsed_line.flops, &parsed_line.trops,
/external/tensorflow/tensorflow/python/kernel_tests/
Dmatmul_op_test.py155 flops = ops.get_stats_for_node_def(g, op.node_def, "flops").value
157 self.assertEqual(7200, flops)
166 flops = ops.get_stats_for_node_def(g, op.node_def, "flops").value
168 self.assertEqual(7200, flops)
/external/tensorflow/tensorflow/compiler/xla/service/
Dhlo_cost_analysis.cc582 double flops = 0.0; in HandleAllReduce() local
586 flops += ShapeUtil::ElementsIn(subshape); in HandleAllReduce()
589 current_properties_[kFlopsKey] = flops; in HandleAllReduce()
/external/llvm/test/CodeGen/X86/
Dbreak-false-dep.ll109 ; flops-6. Make sure the unused register read by vcvtsi2sdq is zeroed
/external/eigen/unsupported/Eigen/
DMatrixFunctions455 cost is approximately \f$ 25 n^3 \f$ real flops for the real Schur
456 decomposition and \f$ 3\frac13 n^3 \f$ real flops for the remainder
/external/swiftshader/third_party/llvm-7.0/llvm/test/CodeGen/X86/
Dbreak-false-dep.ll110 ; flops-6. Make sure the unused register read by vcvtsi2sdq is zeroed
/external/tensorflow/tensorflow/python/framework/
Dops_test.py2669 flops = ops.get_stats_for_node_def(graph, node, "flops")
2670 self.assertEqual(20, flops.value)
/external/skqp/src/compute/skc/platforms/cl_12/kernels/
Drender.cl817 // evaluation might save some flops.
/external/llvm/lib/Target/X86/
DREADME.txt1011 From flops:
/external/swiftshader/third_party/llvm-7.0/llvm/lib/Target/X86/
DREADME.txt1011 From flops:
/external/skia/src/compute/skc/platforms/cl_12/kernels/
Drender.cl817 // evaluation might save some flops.
/external/swiftshader/third_party/LLVM/lib/Target/X86/
DREADME.txt1174 From flops:
/external/jline/src/src/test/resources/jline/example/
Denglish.gz
/external/cldr/tools/java/org/unicode/cldr/util/data/transforms/
Dinternal_raw_IPA.txt60974 flops %32310 flɑps
Dinternal_raw_IPA-old.txt72240 flops %21123 flɑps