Home
last modified time | relevance | path

Searched refs:vectorized (Results 1 – 25 of 88) sorted by relevance

1234

/external/eigen/unsupported/Eigen/CXX11/src/Tensor/
DTensorEvaluator.h106 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE TensorOpCost costPerCoeff(bool vectorized) const { in costPerCoeff()
107 return TensorOpCost(sizeof(CoeffReturnType), 0, 0, vectorized, in costPerCoeff()
205 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE TensorOpCost costPerCoeff(bool vectorized) const {
206 return TensorOpCost(sizeof(CoeffReturnType), 0, 0, vectorized,
269 costPerCoeff(bool vectorized) const {
270 return TensorOpCost(sizeof(CoeffReturnType), 0, 0, vectorized,
338 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE TensorOpCost costPerCoeff(bool vectorized) const {
340 return m_argImpl.costPerCoeff(vectorized) +
341 TensorOpCost(0, 0, functor_cost, vectorized, PacketSize);
417 costPerCoeff(bool vectorized) const {
[all …]
DTensorAssign.h154 costPerCoeff(bool vectorized) const {
158 TensorOpCost left = m_leftImpl.costPerCoeff(vectorized);
159 return m_rightImpl.costPerCoeff(vectorized) +
163 TensorOpCost(0, sizeof(CoeffReturnType), 0, vectorized, PacketSize);
DTensorArgMax.h116 costPerCoeff(bool vectorized) const {
117 return m_impl.costPerCoeff(vectorized) + TensorOpCost(0, 0, 1);
258 costPerCoeff(bool vectorized) const {
261 return m_orig_impl.costPerCoeff(vectorized) +
262 m_impl.costPerCoeff(vectorized) + TensorOpCost(0, 0, compute_cost);
DTensorEvalTo.h155 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE TensorOpCost costPerCoeff(bool vectorized) const {
158 return m_impl.costPerCoeff(vectorized) +
159 TensorOpCost(0, sizeof(CoeffReturnType), 0, vectorized, PacketSize);
DTensorCustomOp.h136 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE TensorOpCost costPerCoeff(bool vectorized) const {
138 return TensorOpCost(sizeof(CoeffReturnType), 0, 0, vectorized, PacketSize);
291 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE TensorOpCost costPerCoeff(bool vectorized) const {
293 return TensorOpCost(sizeof(CoeffReturnType), 0, 0, vectorized, PacketSize);
DTensorConversion.h233 costPerCoeff(bool vectorized) const {
235 if (vectorized) {
240 return m_impl.costPerCoeff(vectorized) * (SrcCoeffRatio / PacketSize) +
243 return m_impl.costPerCoeff(vectorized) + TensorOpCost(0, 0, cast_cost);
DTensorInflation.h203 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE TensorOpCost costPerCoeff(bool vectorized) const {
211 return m_impl.costPerCoeff(vectorized) +
213 compute_cost, vectorized, PacketSize);
DTensorStriding.h211 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE TensorOpCost costPerCoeff(bool vectorized) const {
216 if (vectorized) {
220 return m_impl.costPerCoeff(vectorized && m_inputStrides[innerDim] == 1) +
222 TensorOpCost(0, 0, compute_cost, vectorized, PacketSize);
DTensorCostModel.h64 bool vectorized, double packet_size) in TensorOpCost() argument
67 compute_cycles_(vectorized ? compute_cycles / packet_size in TensorOpCost()
DTensorConvolution.h452 costPerCoeff(bool vectorized) const {
461 return TensorOpCost(0, 0, firstIndex_compute_cost, vectorized, PacketSize) +
462 kernel_size * (m_inputImpl.costPerCoeff(vectorized) +
463 m_kernelImpl.costPerCoeff(vectorized) +
464 TensorOpCost(0, 0, convolve_compute_cost, vectorized,
1066 costPerCoeff(bool vectorized) const {
1077 return TensorOpCost(0, 0, firstIndex_compute_cost, vectorized, PacketSize) +
1078 kernel_size * (m_inputImpl.costPerCoeff(vectorized) +
1079 m_kernelImpl.costPerCoeff(vectorized) +
1080 TensorOpCost(0, 0, convolve_compute_cost, vectorized,
DTensorPatch.h248 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE TensorOpCost costPerCoeff(bool vectorized) const {
252 return m_impl.costPerCoeff(vectorized) +
253 TensorOpCost(0, 0, compute_cost, vectorized, PacketSize);
DTensorForcedEval.h147 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE TensorOpCost costPerCoeff(bool vectorized) const {
148 return TensorOpCost(sizeof(CoeffReturnType), 0, 0, vectorized, PacketSize);
/external/llvm/test/Transforms/LoopVectorize/
Dno_switch.ll5 ; CHECK: remark: source.cpp:4:5: loop not vectorized: loop contains a switch statement
6 ; CHECK: warning: source.cpp:4:5: loop not vectorized: failed explicitly specified loop vectorizati…
11 ; MOREINFO: remark: source.cpp:4:5: loop not vectorized: loop contains a switch statement
12 ; MOREINFO: remark: source.cpp:4:5: loop not vectorized: use -Rpass-analysis=loop-vectorize for mor…
13 ; MOREINFO: warning: source.cpp:4:5: loop not vectorized: failed explicitly specified loop vectoriz…
Druntime-limit.ll7 ;CHECK: remark: {{.*}}:0:0: vectorized loop (vectorization width: 4, interleaved count: 1)
9 ;CHECK: remark: {{.*}}:0:0: loop not vectorized: cannot prove it is safe to reorder memory operatio…
12 ;OVERRIDE: remark: {{.*}}:0:0: vectorized loop (vectorization width: 4, interleaved count: 1)
14 ;OVERRIDE: remark: {{.*}}:0:0: vectorized loop (vectorization width: 4, interleaved count: 1)
Dinterleaved-accesses-pred-stores.ll8 ; vectorized.
56 ; groups are separately vectorized. The store group contains gaps and is not
57 ; vectorized.
115 ; predicated block. The load group is vectorized, and the store groups contain
116 ; gaps and are not vectorized.
Dvect.stats.ll9 ; CHECK: 1 loop-vectorize - Number of loops vectorized
14 define void @vectorized(float* nocapture %a, i64 %size) {
Dmemdep.ll8 ; No plausible dependence - can be vectorized.
34 ; Plausible dependence of distance 1 - can't be vectorized.
60 ; Plausible dependence of distance 2 - can be vectorized with a width of 2.
92 ; Plausible dependence of distance 1 - cannot be vectorized (without reordering
Dcontrol-flow.ll13 ; CHECK: remark: source.cpp:5:9: loop not vectorized: loop control flow is not understood by vector…
14 ; CHECK: remark: source.cpp:5:9: loop not vectorized: use -Rpass-analysis=loop-vectorize for more i…
/external/llvm/test/Transforms/LoopVectorize/X86/
Dvect.omp.force.small-tc.ll9 ; CHECK: 1 loop-vectorize - Number of loops vectorized
24 ; This loop will be vectorized, although the trip count is below the threshold, but vectorization i…
26 define void @vectorized(float* noalias nocapture %A, float* noalias nocapture readonly %B) {
50 ; This loop will not be vectorized as the trip count is below the threshold.
Dvect.omp.force.ll9 ; CHECK: 1 loop-vectorize - Number of loops vectorized
25 ; This loop will be vectorized, although the scalar cost is lower than any of vector costs, but vec…
28 define void @vectorized(float* noalias nocapture %A, float* noalias nocapture %B) {
55 ; This method will not be vectorized, as scalar cost is lower than any of vector costs.
Dalready-vectorized.ll4 ; The vectorizer used to mark the un-vectorized loop only as already vectorized
5 ; thus, trying to vectorize the vectorized loop again
Dvectorization-remarks-missed.ll26 ; CHECK: remark: source.cpp:4:5: loop not vectorized: could not determine number of loop iterations
27 ; CHECK: remark: source.cpp:4:5: loop not vectorized: use -Rpass-analysis=loop-vectorize for more i…
28 ; CHECK: remark: source.cpp:13:5: loop not vectorized: vectorization and interleaving are explicitl…
29 ; CHECK: remark: source.cpp:19:5: loop not vectorized: cannot identify array bounds
30 ; CHECK: remark: source.cpp:19:5: loop not vectorized: use -Rpass-analysis=loop-vectorize for more …
31 ; CHECK: warning: source.cpp:19:5: loop not vectorized: failed explicitly specified loop vectorizat…
Dno_fpmath.ll3 ; CHECK: remark: no_fpmath.c:6:11: loop not vectorized: cannot prove it is safe to reorder floating…
4 ; CHECK: remark: no_fpmath.c:6:14: loop not vectorized:
5 ; CHECK: remark: no_fpmath.c:17:14: vectorized loop (vectorization width: 2, interleaved count: 2)
/external/llvm/docs/
DVectorizers.rst89 Many loops cannot be vectorized including loops with complicated control flow,
96 ``-Rpass=loop-vectorize`` identifies loops that were successfully vectorized.
117 The command line ``-Rpass-missed=loop-vectorized`` prints the remark:
121 …no_switch.cpp:4:5: remark: loop not vectorized: vectorization is explicitly enabled [-Rpass-missed…
124 switch statement cannot be vectorized.
128 …no_switch.cpp:4:5: remark: loop not vectorized: loop contains a switch statement [-Rpass-analysis=…
293 Access to global structures can also be vectorized, with alias analysis being
298 ignored (as other compilers do) are still being left un-vectorized.
331 example, the loop below will be vectorized on Intel x86 if the SSE4.1 roundps
394 operations, PHI-nodes, can all be vectorized using this technique.
/external/eigen/doc/
DUnalignedArrayAssert.dox116vectorized and non-vectorized code are not mutually ABI-compatible. This ABI compatibility is very…

1234