Home
last modified time | relevance | path

Searched refs:simdscalar (Results 1 – 20 of 20) sorted by relevance

/external/mesa3d/src/gallium/drivers/swr/rasterizer/core/
Ddepthstencil.h33 void StencilOp(SWR_STENCILOP op, simdscalar mask, simdscalar stencilRefps, simdscalar &stencilps) in StencilOp()
73simdscalar stencilinvert = _simd_andnot_ps(stencilps, _simd_cmpeq_ps(_simd_setzero_ps(), _simd_set… in StencilOp()
84 simdscalar QuantizeDepth(simdscalar depth) in QuantizeDepth()
102 simdscalar result = _simd_mul_ps(depth, _simd_set1_ps(quantize)); in QuantizeDepth()
119 simdscalar DepthStencilTest(const API_STATE* pState, in DepthStencilTest()
120 …bool frontFacing, uint32_t viewportIndex, simdscalar interpZ, uint8_t* pDepthBase, simdscalar cove… in DepthStencilTest()
121 uint8_t *pStencilBase, simdscalar* pStencilMask) in DepthStencilTest()
129 simdscalar depthResult = _simd_set1_ps(-1.0f); in DepthStencilTest()
130 simdscalar zbuf; in DepthStencilTest()
133 simdscalar vMinZ = _simd_broadcast_ss(&pViewport->minZ); in DepthStencilTest()
[all …]
Dformat_types.h39 static simdscalar loadSOA(const uint8_t *pSrc) = delete;
40 static void storeSOA(uint8_t *pDst, simdscalar src) = delete;
41 static simdscalar unpack(simdscalar &in) = delete;
42 static simdscalar pack(simdscalar &in) = delete;
59 static simdscalar loadSOA(const uint8_t *pSrc) { return _simd_setzero_ps(); }
60 static void storeSOA(uint8_t *pDst, simdscalar src) { return; }
61 static simdscalar unpack(simdscalar &in) { return _simd_setzero_ps(); }
62 static simdscalar pack(simdscalar &in) { return _simd_setzero_ps(); }
79 static simdscalar loadSOA(const uint8_t *pSrc)
90 static void storeSOA(uint8_t *pDst, simdscalar src)
[all …]
Dclip.h66 void ComputeClipCodes(const API_STATE& state, const simdvector& vertex, simdscalar& clipCodes, simd… in ComputeClipCodes()
71 simdscalar vNegW = _simd_mul_ps(vertex.w, _simd_set1_ps(-1.0f)); in ComputeClipCodes()
74 simdscalar vRes = _simd_cmplt_ps(vertex.x, vNegW); in ComputeClipCodes()
113simdscalar gbMult = _simd_mul_ps(vNegW, _simd_i32gather_ps(&state.gbState.left[0], viewportIndexes… in ComputeClipCodes()
151 simdscalar ComputeClipCodeIntersection() in ComputeClipCodeIntersection()
153 simdscalar result = this->clipCodes[0]; in ComputeClipCodeIntersection()
161 simdscalar ComputeClipCodeUnion() in ComputeClipCodeUnion()
163 simdscalar result = this->clipCodes[0]; in ComputeClipCodeUnion()
173 simdscalar clipCodeUnion = ComputeClipCodeUnion(); in ComputeNegWMask()
180 simdscalar clipUnion = ComputeClipCodeUnion(); in ComputeClipMask()
[all …]
Dmultisample.h66 INLINE static simdscalar vX(uint32_t sampleNum) = delete;
67 INLINE static simdscalar vY(uint32_t sampleNum) = delete;
92 INLINE static simdscalar vX(uint32_t sampleNum)
94 static const simdscalar X = _simd_set1_ps(0.5f);
98 INLINE static simdscalar vY(uint32_t sampleNum)
100 static const simdscalar Y = _simd_set1_ps(0.5f);
149 INLINE static simdscalar vX(uint32_t sampleNum)
154 INLINE static simdscalar vY(uint32_t sampleNum)
200 INLINE static simdscalar vX(uint32_t sampleNum)
202 static const simdscalar X[numSamples] {_simd_set1_ps(0.75f), _simd_set1_ps(0.25f)};
[all …]
Dcontext.h317 simdscalar vIa;
318 simdscalar vIb;
319 simdscalar vIc;
321 simdscalar vJa;
322 simdscalar vJb;
323 simdscalar vJc;
325 simdscalar vZa;
326 simdscalar vZb;
327 simdscalar vZc;
329 simdscalar vRecipDet;
[all …]
Dfrontend.h66 void triangleSetupABVertical(const simdscalar vX[3], const simdscalar vY[3], simdscalar (&vA)[3], s… in triangleSetupABVertical()
207 simdscalar m00 = _simd_load1_ps(&vpMatrices.m00[0]); in viewportTransform()
208 simdscalar m30 = _simd_load1_ps(&vpMatrices.m30[0]); in viewportTransform()
209 simdscalar m11 = _simd_load1_ps(&vpMatrices.m11[0]); in viewportTransform()
210 simdscalar m31 = _simd_load1_ps(&vpMatrices.m31[0]); in viewportTransform()
211 simdscalar m22 = _simd_load1_ps(&vpMatrices.m22[0]); in viewportTransform()
212 simdscalar m32 = _simd_load1_ps(&vpMatrices.m32[0]); in viewportTransform()
227 simdscalar m00 = _simd_i32gather_ps(&vpMatrices.m00[0], vViewportIdx, 4); in viewportTransform()
228 simdscalar m30 = _simd_i32gather_ps(&vpMatrices.m30[0], vViewportIdx, 4); in viewportTransform()
229 simdscalar m11 = _simd_i32gather_ps(&vpMatrices.m11[0], vViewportIdx, 4); in viewportTransform()
[all …]
Dformat_conversion.h44 simdscalar vComp = _simd_load_ps((const float*)(pSrc + comp*sizeof(simdscalar))); in LoadSOA()
56 simdscalar vComp = FormatTraits<SrcFormat>::loadSOA(comp, pSrc); in LoadSOA()
82 INLINE simdscalar Clamp(simdscalar vComp, uint32_t Component) in Clamp()
128 INLINE simdscalar Normalize(simdscalar vComp, uint32_t Component) in Normalize()
151 simdscalar vComp = src.v[FormatTraits<DstFormat>::swizzle(comp)]; in StoreSOA()
162 _simd_store_ps((float*)(pDst + comp*sizeof(simdscalar)), vComp); in StoreSOA()
169 simdscalar vComp = src.v[FormatTraits<DstFormat>::swizzle(comp)]; in StoreSOA()
Dstate.h268 simdscalar* pDomainU; // IN: (SIMD) Domain Point U coords
269 simdscalar* pDomainV; // IN: (SIMD) Domain Point V coords
271simdscalar* pOutputData; // OUT: (SIMD) Vertex Attributes (2D array of vectors, one row per…
291 simdscalar UL;
292 simdscalar center;
293 simdscalar sample;
294 simdscalar centroid;
307 simdscalar vZ; // INOUT: z location of pixels
309 simdscalar inputMask; // IN: input coverage mask for all samples
813 simdvector& vSrc, simdvector& vSrc1, simdscalar& vSrc0Alpha, uint32_t sample,
[all …]
Dbackend.cpp160 simdscalar vComp; in ClearMacroTile()
430 simdmask ComputeUserClipMask(uint8_t clipMask, float* pUserClipBuffer, simdscalar vI, simdscalar vJ) in ComputeUserClipMask()
432 simdscalar vClipMask = _simd_setzero_ps(); in ComputeUserClipMask()
438 simdscalar vA = _simd_broadcast_ss(pUserClipBuffer++); in ComputeUserClipMask()
439 simdscalar vB = _simd_broadcast_ss(pUserClipBuffer++); in ComputeUserClipMask()
440 simdscalar vC = _simd_broadcast_ss(pUserClipBuffer++); in ComputeUserClipMask()
443 simdscalar vInterp = vplaneps(vA, vB, vC, vI, vJ); in ComputeUserClipMask()
446 simdscalar vCull = _simd_cmp_ps(_simd_setzero_ps(), vInterp, _CMP_NLE_UQ); in ComputeUserClipMask()
478 const simdscalar dy = _simd_set1_ps(static_cast<float>(SIMD_TILE_Y_DIM)); in BackendSingleSample()
485 const simdscalar dx = _simd_set1_ps(static_cast<float>(SIMD_TILE_X_DIM)); in BackendSingleSample()
[all …]
Dbackend.h44 simdmask ComputeUserClipMask(uint8_t clipMask, float* pUserClipBuffer, simdscalar vI, simdscalar vJ…
327 const simdscalar vXSamplePosUL, const simdscalar vYSamplePosUL)
401 const simdscalar vXSamplePosUL, const simdscalar vYSamplePosUL)
413 INLINE simdmask CalcDepthBoundsAcceptMask(simdscalar z, float minz, float maxz)
415 const simdscalar minzMask = _simd_cmpge_ps(z, _simd_set1_ps(minz));
416 const simdscalar maxzMask = _simd_cmple_ps(z, _simd_set1_ps(maxz));
554 uint32_t operator()(simdscalar& activeLanes, SWR_PS_CONTEXT& psContext,
560 simdscalar anyDepthSamplePassed = _simd_setzero_ps();
580 const simdscalar z = _simd_load_ps(reinterpret_cast<const float *>(pDepthSample));
651 simdscalar vZ[T::MultisampleT::numCoverageSamples];
[all …]
Dpa.h254 simdscalar tmp0 = _mm256_unpacklo_ps(a.x, a.z); in swizzleLane0()
255 simdscalar tmp1 = _mm256_unpacklo_ps(a.y, a.w); in swizzleLane0()
261 simdscalar tmp0 = _mm256_unpacklo_ps(a.x, a.z); in swizzleLane1()
262 simdscalar tmp1 = _mm256_unpacklo_ps(a.y, a.w); in swizzleLane1()
268 simdscalar tmp0 = _mm256_unpackhi_ps(a.x, a.z); in swizzleLane2()
269 simdscalar tmp1 = _mm256_unpackhi_ps(a.y, a.w); in swizzleLane2()
275 simdscalar tmp0 = _mm256_unpackhi_ps(a.x, a.z); in swizzleLane3()
276 simdscalar tmp1 = _mm256_unpackhi_ps(a.y, a.w); in swizzleLane3()
282 simdscalar tmp0 = _mm256_unpacklo_ps(a.x, a.z); in swizzleLane4()
283 simdscalar tmp1 = _mm256_unpacklo_ps(a.y, a.w); in swizzleLane4()
[all …]
Dbinner.cpp38 …AW_CONTEXT *pDC, PA_STATE& pa, uint32_t workerId, simdvector prims[3], simdscalar vRecipW[2], uint…
43 static const simdscalar g_pixelOffsets[SWR_PIXEL_LOCATION_UL + 1] =
53 INLINE simdscalari fpToFixedPointVertical(const simdscalar vIn) in fpToFixedPointVertical()
55 simdscalar vFixed = _simd_mul_ps(vIn, _simd_set1_ps(PT::ScaleT::value)); in fpToFixedPointVertical()
454 simdscalar vRecipW0 = _simd_set1_ps(1.0f); in BinTriangles()
455 simdscalar vRecipW1 = _simd_set1_ps(1.0f); in BinTriangles()
456 simdscalar vRecipW2 = _simd_set1_ps(1.0f); in BinTriangles()
496 simdscalar offset = g_pixelOffsets[rastState.pixelLocation]; in BinTriangles()
573 simdscalar recipW[2]; in BinTriangles()
912 simdscalar vRecipW0 = _simd_div_ps(_simd_set1_ps(1.0f), primVerts.w); in BinPoints()
[all …]
Dtilemgr.cpp297 simdscalar valR = _simd_broadcast_ss(&pClearData[0]); in ClearColorHotTile()
298 simdscalar valG = _simd_broadcast_ss(&pClearData[1]); in ClearColorHotTile()
299 simdscalar valB = _simd_broadcast_ss(&pClearData[2]); in ClearColorHotTile()
300 simdscalar valA = _simd_broadcast_ss(&pClearData[3]); in ClearColorHotTile()
328 simdscalar valZ = _simd_broadcast_ss(&pClearData[0]); in ClearDepthHotTile()
Dpa_avx.cpp205 simdscalar s; in PaTriList2()
341 simdscalar s; in PaTriStrip1()
345 simdscalar a0 = a[i]; in PaTriStrip1()
346 simdscalar b0 = b[i]; in PaTriStrip1()
454 simdscalar s; in PaTriFan1()
459 simdscalar a0 = a[i]; in PaTriFan1()
460 simdscalar b0 = b[i]; in PaTriFan1()
519 simdscalar s1, s2; in PaQuadList1()
523 simdscalar a0 = a[i]; in PaQuadList1()
524 simdscalar b0 = b[i]; in PaQuadList1()
Dutils.h412 simdscalar src0 = _simd_load_ps((const float*)pSrc); in Transpose()
413 simdscalar src1 = _simd_load_ps((const float*)pSrc + 8); in Transpose()
414 simdscalar src2 = _simd_load_ps((const float*)pSrc + 16); in Transpose()
415 simdscalar src3 = _simd_load_ps((const float*)pSrc + 24); in Transpose()
464 simdscalar src0 = _simd_load_ps((const float*)pSrc); in Transpose()
465 simdscalar src1 = _simd_load_ps((const float*)pSrc + 8); in Transpose()
466 simdscalar src2 = _simd_load_ps((const float*)pSrc + 16); in Transpose()
708 simdscalar src = _simd_load_ps((const float*)pSrc); in Transpose()
Dblend.h82 simdscalar oneMinusSrcA = _simd_sub_ps(_simd_set1_ps(1.0), src.w); in GenerateBlendFactor()
98 simdscalar oneMinusDstA = _simd_sub_ps(_simd_set1_ps(1.0), dst.w); in GenerateBlendFactor()
108 simdscalar sat = _simd_min_ps(src.w, _simd_sub_ps(_simd_set1_ps(1.0), dst.w)); in GenerateBlendFactor()
Dfrontend.cpp912 simdscalar* pDSOutput;
1046 … gt_pTessellationThreadData->pDSOutput = (simdscalar*)AlignedMalloc(requiredAllocSize, 64); in TessellationStages()
1060 dsContext.pDomainU = (simdscalar*)tsData.pDomainPointsU; in TessellationStages()
1061 dsContext.pDomainV = (simdscalar*)tsData.pDomainPointsV; in TessellationStages()
/external/mesa3d/src/gallium/drivers/swr/rasterizer/common/
Dsimdintrin.h36 typedef __m256 simdscalar; typedef
46 simdscalar v[4]; in OSALIGNSIMD()
49 simdscalar x, y, z, w; in OSALIGNSIMD()
52 simdscalar& operator[] (const int i) { return v[i]; } in OSALIGNSIMD()
53 const simdscalar& operator[] (const int i) const { return v[i]; } in OSALIGNSIMD()
370 simdscalar vResult; in _simd_i32gather_ps()
386 simdscalar vResult = vSrc; in _simd_mask_i32gather_ps()
640 simdscalari _simd_blendv_epi32(simdscalari a, simdscalari b, simdscalar mask) in _simd_blendv_epi32()
653 simdscalar vMask(int32_t mask) in vMask()
663 void _simd_mov(simdscalar &r, unsigned int rlane, simdscalar& s, unsigned int slane) in _simd_mov()
[all …]
Dsimd16intrin.h290 INLINE simdscalar _simd16_extract_ps(simd16scalar a, int imm8) in _simd16_extract_ps()
314 INLINE simd16scalar _simd16_insert_ps(simd16scalar a, simdscalar b, int imm8) in _simd16_insert_ps()
641 simdscalar lolo = _simd_permute_ps(a.lo, _simd_and_si(i.lo, mask)); in SIMD16_EMU_AVX512_2()
642 simdscalar lohi = _simd_permute_ps(a.hi, _simd_and_si(i.lo, mask)); in SIMD16_EMU_AVX512_2()
644 simdscalar hilo = _simd_permute_ps(a.lo, _simd_and_si(i.hi, mask)); in SIMD16_EMU_AVX512_2()
645 simdscalar hihi = _simd_permute_ps(a.hi, _simd_and_si(i.hi, mask)); in SIMD16_EMU_AVX512_2()
/external/mesa3d/src/gallium/drivers/swr/rasterizer/memory/
DStoreTile.h694 static const uint32_t offset = sizeof(simdscalar);
697simdscalar vComp0 = _simd_load_ps((const float*)(pSrc + (FormatTraits<DstFormat>::swizzle(0))*offs…
698simdscalar vComp1 = _simd_load_ps((const float*)(pSrc + (FormatTraits<DstFormat>::swizzle(1))*offs…
699simdscalar vComp2 = _simd_load_ps((const float*)(pSrc + (FormatTraits<DstFormat>::swizzle(2))*offs…
700simdscalar vComp3 = _simd_load_ps((const float*)(pSrc + (FormatTraits<DstFormat>::swizzle(3))*offs…
866 static const uint32_t offset = sizeof(simdscalar);
869simdscalar vComp0 = _simd_load_ps((const float*)(pSrc + (FormatTraits<DstFormat>::swizzle(0))*offs…
870simdscalar vComp1 = _simd_load_ps((const float*)(pSrc + (FormatTraits<DstFormat>::swizzle(1))*offs…
871simdscalar vComp2 = _simd_load_ps((const float*)(pSrc + (FormatTraits<DstFormat>::swizzle(2))*offs…