/external/eigen/Eigen/src/Core/arch/SSE/ |
D | PacketMath.h | 51 typedef eigen_packet_wrapper<__m128> Packet4f; typedef 55 typedef __m128 Packet4f; 80 const Packet4f p4f_##NAME = pset1<Packet4f>(X) 86 const Packet4f p4f_##NAME = _mm_castsi128_ps(pset1<Packet4i>(X)) 97 typedef Packet4f type; 98 typedef Packet4f half; 161 template<> struct unpacket_traits<Packet4f> { typedef float type; enum {size=4, alignment=Aligned1… 174 template<> EIGEN_STRONG_INLINE Packet4f pset1<Packet4f>(const float& from) { return _mm_set_ps(fro… 178 template<> EIGEN_STRONG_INLINE Packet4f pset1<Packet4f>(const float& from) { return _mm_set_ps1(fr… 189 template<> EIGEN_STRONG_INLINE Packet4f pload1<Packet4f>(const float *from) { [all …]
|
D | MathFunctions.h | 23 Packet4f plog<Packet4f>(const Packet4f& _x) 25 Packet4f x = _x; 55 …Packet4f invalid_mask = _mm_cmpnge_ps(x, _mm_setzero_ps()); // not greater equal is true if x is N… 56 Packet4f iszero_mask = _mm_cmpeq_ps(x, _mm_setzero_ps()); 66 Packet4f e = padd(Packet4f(_mm_cvtepi32_ps(emm0)), p4f_1); 74 Packet4f mask = _mm_cmplt_ps(x, p4f_cephes_SQRTHF); 75 Packet4f tmp = pand(x, mask); 80 Packet4f x2 = pmul(x,x); 81 Packet4f x3 = pmul(x2,x); 83 Packet4f y, y1, y2; [all …]
|
D | TypeCasting.h | 26 template<> EIGEN_STRONG_INLINE Packet4i pcast<Packet4f, Packet4i>(const Packet4f& a) { 40 template<> EIGEN_STRONG_INLINE Packet4f pcast<Packet4i, Packet4f>(const Packet4i& a) { 54 template<> EIGEN_STRONG_INLINE Packet4f pcast<Packet2d, Packet4f>(const Packet2d& a, const Packet2d… 67 template<> EIGEN_STRONG_INLINE Packet2d pcast<Packet4f, Packet2d>(const Packet4f& a) {
|
D | Complex.h | 90 …complex<float>* from) { EIGEN_DEBUG_ALIGNED_LOAD return Packet2cf(pload<Packet4f>(&numext::real_re… 91 …plex<float>* from) { EIGEN_DEBUG_UNALIGNED_LOAD return Packet2cf(ploadu<Packet4f>(&numext::real_re… 113 …st Packet2cf& from) { EIGEN_DEBUG_ALIGNED_STORE pstore(&numext::real_ref(*to), Packet4f(from.v)); } 114 …Packet2cf& from) { EIGEN_DEBUG_UNALIGNED_STORE pstoreu(&numext::real_ref(*to), Packet4f(from.v)); } 232 template<> struct conj_helper<Packet4f, Packet2cf, false,false> 234 …EIGEN_STRONG_INLINE Packet2cf pmadd(const Packet4f& x, const Packet2cf& y, const Packet2cf& c) con… 237 EIGEN_STRONG_INLINE Packet2cf pmul(const Packet4f& x, const Packet2cf& y) const 238 { return Packet2cf(Eigen::internal::pmul<Packet4f>(x, y.v)); } 241 template<> struct conj_helper<Packet2cf, Packet4f, false,false> 243 …EIGEN_STRONG_INLINE Packet2cf pmadd(const Packet2cf& x, const Packet4f& y, const Packet2cf& c) con… [all …]
|
/external/eigen/Eigen/src/Core/arch/AltiVec/ |
D | PacketMath.h | 34 typedef __vector float Packet4f; typedef 45 Packet4f p4f_##NAME = reinterpret_cast<Packet4f>(vec_splat_s32(X)) 51 Packet4f p4f_##NAME = pset1<Packet4f>(X) 63 const Packet4f p4f_##NAME = reinterpret_cast<Packet4f>(pset1<Packet4i>(X)) 75 static Packet4f p4f_MZERO = (Packet4f) vec_sl((Packet4ui)p4i_MINUS1, (Packet4ui)p4i_MINUS1); //{ 0x… 77 static Packet4f p4f_ONE = vec_ctf(p4i_ONE, 0); //{ 1.0, 1.0, 1.0, 1.0} 80 static Packet4f p4f_COUNTDOWN = { 0.0, 1.0, 2.0, 3.0 }; 134 typedef Packet4f type; 135 typedef Packet4f half; 190 template<> struct unpacket_traits<Packet4f> { typedef float type; enum {size=4, alignment=Aligned1… [all …]
|
D | MathFunctions.h | 95 Packet4f plog<Packet4f>(const Packet4f& _x) 97 Packet4f x = _x; 114 Packet4f e = padd(vec_ctf(emm0, 0), p4f_1); 122 Packet4f mask = reinterpret_cast<Packet4f>(vec_cmplt(x, p4f_cephes_SQRTHF)); 123 Packet4f tmp = pand(x, mask); 128 Packet4f x2 = pmul(x,x); 129 Packet4f x3 = pmul(x2,x); 131 Packet4f y, y1, y2; 156 Packet4f pexp<Packet4f>(const Packet4f& _x) 158 Packet4f x = _x; [all …]
|
D | Complex.h | 33 EIGEN_STRONG_INLINE explicit Packet2cf(const Packet4f& a) : v(a) {} in Packet2cf() 34 Packet4f v; 69 res.v = pload<Packet4f>((const float *)&from); 71 res.v = ploadu<Packet4f>((const float *)&from); 76 …et2cf>(const std::complex<float>* from) { return Packet2cf(pload<Packet4f>((const float *) … 77 …et2cf>(const std::complex<float>* from) { return Packet2cf(ploadu<Packet4f>((const float*) f… 101 …et2cf pconj(const Packet2cf& a) { return Packet2cf(pxor<Packet4f>(a.v, reinterpret_cast<Packet4f>(… 105 Packet4f v1, v2; 115 v2 = reinterpret_cast<Packet4f>(pxor(v2, reinterpret_cast<Packet4f>(p4ui_CONJ_XOR))); 119 return Packet2cf(padd<Packet4f>(v1, v2)); [all …]
|
/external/eigen/Eigen/src/Core/arch/NEON/ |
D | PacketMath.h | 40 typedef float32x4_t Packet4f; typedef 46 const Packet4f p4f_##NAME = pset1<Packet4f>(X) 49 const Packet4f p4f_##NAME = vreinterpretq_f32_u32(pset1<int32_t>(X)) 72 typedef Packet4f type; 73 typedef Packet4f half; // Packet2f intrinsics not implemented yet 111 …emplate<> struct unpacket_traits<Packet4f> { typedef float type; enum {size=4, alignment=Aligned… 114 template<> EIGEN_STRONG_INLINE Packet4f pset1<Packet4f>(const float& from) { return vdupq_n_f32(fr… 117 template<> EIGEN_STRONG_INLINE Packet4f plset<Packet4f>(const float& a) 120 Packet4f countdown = vld1q_f32(f); 121 return vaddq_f32(pset1<Packet4f>(a), countdown); [all …]
|
D | MathFunctions.h | 20 Packet4f pexp<Packet4f>(const Packet4f& _x) 22 Packet4f x = _x; 23 Packet4f tmp, fx; 56 Packet4f z = vmulq_f32(fx, p4f_cephes_exp_C2); 60 Packet4f y = vmulq_f32(p4f_cephes_exp_p0, x); 81 Packet4f pow2n = vreinterpretq_f32_s32(mm);
|
D | Complex.h | 38 EIGEN_STRONG_INLINE explicit Packet2cf(const Packet4f& a) : v(a) {} in Packet2cf() 39 Packet4f v; 75 …d<Packet2cf>(const Packet2cf& a, const Packet2cf& b) { return Packet2cf(padd<Packet4f>(a.v,b.v)); } 76 …b<Packet2cf>(const Packet2cf& a, const Packet2cf& b) { return Packet2cf(psub<Packet4f>(a.v,b.v)); } 77 …N_STRONG_INLINE Packet2cf pnegate(const Packet2cf& a) { return Packet2cf(pnegate<Packet4f>(a.v)); } 86 Packet4f v1, v2; 121 …complex<float>* from) { EIGEN_DEBUG_ALIGNED_LOAD return Packet2cf(pload<Packet4f>((const float*)fr… 122 …plex<float>* from) { EIGEN_DEBUG_UNALIGNED_LOAD return Packet2cf(ploadu<Packet4f>((const float*)fr… 131 Packet4f res = pset1<Packet4f>(0.f); 157 Packet4f a_r128; [all …]
|
/external/eigen/Eigen/src/Core/arch/ZVector/ |
D | PacketMath.h | 46 } Packet4f; typedef 94 static Packet4f p4f_COUNTDOWN = { 0.0, 1.0, 2.0, 3.0 }; 154 typedef Packet4f type; 155 typedef Packet4f half; 215 template<> struct unpacket_traits<Packet4f> { typedef float type; enum {size=4, alignment=Aligned1… 219 EIGEN_DEVICE_FUNC inline void ptranspose(PacketBlock<Packet4f,4>& kernel); 263 template<int element> EIGEN_STRONG_INLINE Packet4f vec_splat_packet4f(const Packet4f& from) 265 Packet4f splat; 306 struct palign_impl<Offset,Packet4f> 308 static EIGEN_STRONG_INLINE void run(Packet4f& first, const Packet4f& second) [all …]
|
D | MathFunctions.h | 96 Packet4f pexp<Packet4f>(const Packet4f& x) 98 Packet4f res; 111 Packet4f psqrt<Packet4f>(const Packet4f& x) 113 Packet4f res; 126 Packet4f prsqrt<Packet4f>(const Packet4f& x) { 127 Packet4f res;
|
D | Complex.h | 31 EIGEN_STRONG_INLINE explicit Packet2cf(const Packet4f& a) : v(a) {} in Packet2cf() 33 Packet4f v; 92 …omplex<float>* from) { EIGEN_DEBUG_ALIGNED_LOAD return Packet2cf(pload<Packet4f>((const float*)fr… 94 …lex<float>* from) { EIGEN_DEBUG_UNALIGNED_LOAD return Packet2cf(ploadu<Packet4f>((const float*)fr… 134 …<Packet2cf>(const Packet2cf& a, const Packet2cf& b) { return Packet2cf(padd<Packet4f>(a.v, b.v)); } 136 …<Packet2cf>(const Packet2cf& a, const Packet2cf& b) { return Packet2cf(psub<Packet4f>(a.v, b.v)); } 139 …N_STRONG_INLINE Packet2cf pnegate(const Packet2cf& a) { return Packet2cf(pnegate(Packet4f(a.v))); } 175 … <Packet2cf>(const Packet2cf& a, const Packet2cf& b) { return Packet2cf(pand<Packet4f>(a.v,b.v)); } 177 … <Packet2cf>(const Packet2cf& a, const Packet2cf& b) { return Packet2cf(por<Packet4f>(a.v,b.v)); } 179 … <Packet2cf>(const Packet2cf& a, const Packet2cf& b) { return Packet2cf(pxor<Packet4f>(a.v,b.v)); } [all …]
|
/external/eigen/unsupported/Eigen/src/MoreVectorization/ |
D | MathFunctions.h | 23 template<> EIGEN_DONT_INLINE Packet4f pasin(Packet4f x) in pasin() 40 Packet4f a = pabs(x);//got the absolute value in pasin() 42 Packet4f sign_bit= _mm_and_ps(x, p4f_sign_mask);//extracted the sign bit in pasin() 44 Packet4f z1,z2;//will need them during computation in pasin() 50 Packet4f branch_mask= _mm_cmpgt_ps(a, p4f_half);//this is to select which branch to take in pasin() 57 Packet4f x1=psqrt(z1); in pasin() 58 Packet4f s1=pmadd(p4f_asin1, z1, p4f_asin2); in pasin() 59 Packet4f s2=pmadd(s1, z1, p4f_asin3); in pasin() 60 Packet4f s3=pmadd(s2,z1, p4f_asin4); in pasin() 61 Packet4f s4=pmadd(s3,z1, p4f_asin5); in pasin() [all …]
|
/external/tensorflow/tensorflow/core/kernels/ |
D | sparse_matmul_op.h | 61 EIGEN_DEVICE_FUNC inline Packet4f pexpand_bf16_l(const Packet4f& from) { in pexpand_bf16_l() 70 return ploadu<Packet4f>(reinterpret_cast<float*>(p)); in pexpand_bf16_l() 74 EIGEN_DEVICE_FUNC inline Packet4f pexpand_bf16_u(const Packet4f& from) { in pexpand_bf16_u() 83 return ploadu<Packet4f>(reinterpret_cast<float*>(p)); in pexpand_bf16_u() 134 EIGEN_STRONG_INLINE Packet4f pload4bf16<Packet4f>(const float* from) { 142 return ploadu<Packet4f>(reinterpret_cast<float*>(p)); 146 EIGEN_STRONG_INLINE Packet4f pload2bf16<Packet4f>(const float* from) { 154 return ploadu<Packet4f>(reinterpret_cast<float*>(p)); 161 EIGEN_STRONG_INLINE Packet4f pbroadcast_first<Packet4f>(const Packet4f& a) { 167 EIGEN_STRONG_INLINE Packet4f pbroadcast_second<Packet4f>(const Packet4f& a) { [all …]
|
/external/tensorflow/third_party/eigen3/ |
D | gpu_packet_math.patch | 4 Packet4f b = be.template packet<BAlignment,Packet4f>(0); 5 Packet4f s1 = pmul(vec4f_swizzle1(a,1,2,0,2),vec4f_swizzle1(b,2,0,1,2)); 6 Packet4f s2 = pmul(vec4f_swizzle1(a,3,3,3,1),vec4f_swizzle1(b,0,1,2,1)); 7 - pstoret<float,Packet4f,ResAlignment>( 14 + pstoret<float, Packet4f, ResAlignment>( 16 + padd<Packet4f>( 17 + psub<Packet4f>(pmul<Packet4f>(a, vec4f_swizzle1(b, 3, 3, 3, 3)), 18 + pmul<Packet4f>(vec4f_swizzle1(a, 2, 0, 1, 0), 20 + pxor<Packet4f>(mask, padd(s1, s2))));
|
/external/eigen/Eigen/src/Core/arch/AVX512/ |
D | PacketMath.h | 259 Packet4f lane0_a = _mm512_extractf32x4_ps(a, 0); 260 Packet4f lane0_b = _mm512_extractf32x4_ps(b, 0); 263 Packet4f lane1_a = _mm512_extractf32x4_ps(a, 1); 264 Packet4f lane1_b = _mm512_extractf32x4_ps(b, 1); 267 Packet4f lane2_a = _mm512_extractf32x4_ps(a, 2); 268 Packet4f lane2_b = _mm512_extractf32x4_ps(b, 2); 271 Packet4f lane3_a = _mm512_extractf32x4_ps(a, 3); 272 Packet4f lane3_b = _mm512_extractf32x4_ps(b, 3); 303 Packet4f lane0_a = _mm512_extractf32x4_ps(a, 0); 304 Packet4f lane0_b = _mm512_extractf32x4_ps(b, 0); [all …]
|
/external/eigen/Eigen/src/Core/arch/CUDA/ |
D | TypeCasting.h | 171 template<> EIGEN_STRONG_INLINE Packet4f pcast<Packet4h, Packet4f>(const Packet4h& a) { 193 template<> EIGEN_STRONG_INLINE Packet4h pcast<Packet4f, Packet4h>(const Packet4f& a) {
|
/external/eigen/bench/ |
D | bench_norm.cpp | 88 Packet4f plt(const Packet4f& a, Packet4f& b) { return _mm_cmplt_ps(a,b); } in plt() 91 Packet4f pandnot(const Packet4f& a, Packet4f& b) { return _mm_andnot_ps(a,b); } in pandnot()
|
/external/eigen/Eigen/src/Geometry/arch/ |
D | Geometry_SSE.h | 34 pstoret<float,Packet4f,ResAlignment>( 55 …pstoret<float,Packet4f,ResAlignment>(&res.x(), _mm_xor_ps(mask, q.coeffs().template packet<traits<… 75 pstoret<float,Packet4f,ResAlignment>(&res.x(),_mm_sub_ps(mul1,mul2));
|
/external/eigen/Eigen/src/LU/arch/ |
D | Inverse_SSE.h | 158 pstoret<float, Packet4f, ResultAlignment>(res+0, _mm_shuffle_ps(iA,iB,0x77)); 159 pstoret<float, Packet4f, ResultAlignment>(res+res_stride, _mm_shuffle_ps(iA,iB,0x22)); 160 pstoret<float, Packet4f, ResultAlignment>(res+2*res_stride, _mm_shuffle_ps(iC,iD,0x77)); 161 pstoret<float, Packet4f, ResultAlignment>(res+3*res_stride, _mm_shuffle_ps(iC,iD,0x22));
|
/external/eigen/Eigen/src/Core/arch/AVX/ |
D | PacketMath.h | 57 typedef Packet4f half; 116 template<> struct unpacket_traits<Packet8f> { typedef float type; typedef Packet4f half; enum {siz… 398 return predux(Packet4f(_mm_add_ps(_mm256_castps256_ps128(a),_mm256_extractf128_ps(a,1)))); 405 template<> EIGEN_STRONG_INLINE Packet4f predux_downto4<Packet8f>(const Packet8f& a)
|