Home
last modified time | relevance | path

Searched refs:KNOB_SIMD_WIDTH (Results 1 – 17 of 17) sorted by relevance

/external/mesa3d/src/gallium/drivers/swr/rasterizer/core/
Dknobs.h54 #define KNOB_SIMD_WIDTH 8 macro
59 #define KNOB_SIMD_WIDTH 8 macro
66 #define KNOB_SIMD_WIDTH 16
71 #define KNOB_SIMD_WIDTH 8 macro
142 #if KNOB_SIMD_WIDTH==8 && KNOB_TILE_X_DIM < 4
152 #if KNOB_SIMD_WIDTH == 8
Dfifo.hpp58 T* pNewBlock = (T*)arena.AllocAligned(sizeof(T)*mBlockSize, KNOB_SIMD_WIDTH*4); in clear()
112 __m256 vSrc = _simd_load_ps(pSrc + i*KNOB_SIMD_WIDTH); in enqueue_try_nosync()
113 _simd_stream_ps(pDst + i*KNOB_SIMD_WIDTH, vSrc); in enqueue_try_nosync()
116 const uint32_t numSimdLines = sizeof(T) / (KNOB_SIMD_WIDTH*4); in enqueue_try_nosync()
117 static_assert(numSimdLines * KNOB_SIMD_WIDTH * 4 == sizeof(T), in enqueue_try_nosync()
131 T* newBlock = (T*)arena.AllocAligned(sizeof(T)*mBlockSize, KNOB_SIMD_WIDTH*4); in enqueue_try_nosync()
Dpa.h177 const uint32_t numSimdVerts = this->streamSizeInVerts / KNOB_SIMD_WIDTH; in GetNextVsOutput()
202 …(KNOB_SIMD_WIDTH - (this->numPrimsComplete + this->nextNumPrimsIncrement - this->numPrims)) : KNOB… in NumPrims()
234 … _simd_set1_epi32(startID + this->primIDIncr * (this->numPrimsComplete / KNOB_SIMD_WIDTH))); in GetPrimID()
341 …OSALIGNSIMD(uint32_t) indices[MAX_NUM_VERTS_PER_PRIM][KNOB_SIMD_WIDTH]; // current index buffer…
415 uint32_t vertexIndex = this->headVertex / KNOB_SIMD_WIDTH; in GetNextVsOutput()
416 this->headVertex = (this->headVertex + KNOB_SIMD_WIDTH) % this->numVerts; in GetNextVsOutput()
423 uint32_t vertexIndex = this->headVertex / KNOB_SIMD_WIDTH; in GetNextVsIndices()
437 this->headVertex += KNOB_SIMD_WIDTH; in GetNextStreamOutput()
467 return ((this->headVertex + KNOB_SIMD_WIDTH) % this->numVerts) == this->tailVertex; in IsVertexStoreFull()
479 uint32_t vertexIndex = vertex / KNOB_SIMD_WIDTH; in IsCutIndex()
[all …]
Dfrontend.cpp482 … uint32_t numActive = (numItemsRemaining >= KNOB_SIMD_WIDTH) ? KNOB_SIMD_WIDTH : numItemsRemaining; in GenerateMask()
590 return (remainder >= KNOB_SIMD_WIDTH) ? KNOB_SIMD_WIDTH : remainder; in GetNumInvocations()
695 …onst uint32_t numSimdBatches = (state.gsState.maxNumVerts + KNOB_SIMD_WIDTH - 1) / KNOB_SIMD_WIDTH; in GeometryShaderStage()
697 const uint32_t instanceStride = inputPrimStride * KNOB_SIMD_WIDTH; in GeometryShaderStage()
704 cutInstanceStride = cutPrimStride * KNOB_SIMD_WIDTH; in GeometryShaderStage()
709 cutInstanceStride = cutPrimStride * KNOB_SIMD_WIDTH; in GeometryShaderStage()
876 …onst uint32_t numSimdBatches = (state.gsState.maxNumVerts + KNOB_SIMD_WIDTH - 1) / KNOB_SIMD_WIDTH; in AllocateGsBuffers()
877 uint32_t size = state.gsState.instanceCount * numSimdBatches * vertexStride * KNOB_SIMD_WIDTH; in AllocateGsBuffers()
878 *ppGsOut = pArena->AllocAligned(size, KNOB_SIMD_WIDTH * sizeof(float)); in AllocateGsBuffers()
882 const uint32_t cutBufferSize = cutPrimStride * state.gsState.instanceCount * KNOB_SIMD_WIDTH; in AllocateGsBuffers()
[all …]
Dbinner.cpp522 int cullZeroAreaMask = maskLo | (maskHi << (KNOB_SIMD_WIDTH / 2)); in BinTriangles()
547 frontWindingTris = maskLo | (maskHi << (KNOB_SIMD_WIDTH / 2)); in BinTriangles()
626 SWR_ASSERT(KNOB_SIMD_WIDTH == 8, "Need to update degenerate mask code for avx512"); in BinTriangles()
701 GatherScissors<KNOB_SIMD_WIDTH>::Gather(&state.scissorsInFixedPoint[0], pViewportIndex, in BinTriangles()
747 …SALIGNSIMD(uint32_t) aMTLeft[KNOB_SIMD_WIDTH], aMTRight[KNOB_SIMD_WIDTH], aMTTop[KNOB_SIMD_WIDTH],… in BinTriangles()
762 OSALIGNSIMD(uint32_t) aRTAI[KNOB_SIMD_WIDTH]; in BinTriangles()
952 OSALIGNSIMD(uint32_t) aMacroX[KNOB_SIMD_WIDTH], aMacroY[KNOB_SIMD_WIDTH]; in BinPoints()
967 OSALIGNSIMD(uint32_t) aTileRelativeX[KNOB_SIMD_WIDTH]; in BinPoints()
968 OSALIGNSIMD(uint32_t) aTileRelativeY[KNOB_SIMD_WIDTH]; in BinPoints()
972 OSALIGNSIMD(uint32_t) aTileAlignedX[KNOB_SIMD_WIDTH]; in BinPoints()
[all …]
Dpa_avx.cpp35 #if (KNOB_SIMD_WIDTH == 8)
87 uint32_t input_vec = input_cp / KNOB_SIMD_WIDTH; in PaPatchListSingle()
88 uint32_t input_lane = input_cp % KNOB_SIMD_WIDTH; in PaPatchListSingle()
124 float vec[KNOB_SIMD_WIDTH]; in PaPatchListTerm()
125 for (uint32_t lane = 0; lane < KNOB_SIMD_WIDTH; ++lane) in PaPatchListTerm()
128 uint32_t input_vec = input_cp / KNOB_SIMD_WIDTH; in PaPatchListTerm()
129 uint32_t input_lane = input_cp % KNOB_SIMD_WIDTH; in PaPatchListTerm()
143 KNOB_SIMD_WIDTH, in PaPatchListTerm()
268 SetNextPaState(pa, PaTriList0, PaTriListSingle0, 0, KNOB_SIMD_WIDTH, true); in PaTriList2()
369 SetNextPaState(pa, PaTriStrip1, PaTriStripSingle0, 0, KNOB_SIMD_WIDTH); in PaTriStrip1()
[all …]
Dformat_types.h81 #if KNOB_SIMD_WIDTH == 8
93 #if KNOB_SIMD_WIDTH == 8
102 #if KNOB_SIMD_WIDTH == 8
122 #if KNOB_SIMD_WIDTH == 8
195 #if KNOB_SIMD_WIDTH == 8
207 #if KNOB_SIMD_WIDTH == 8
216 #if KNOB_SIMD_WIDTH == 8
237 #if KNOB_SIMD_WIDTH == 8
310 #if KNOB_SIMD_WIDTH == 8
321 #if KNOB_SIMD_WIDTH == 8
[all …]
Dtilemgr.cpp103 hotTile.pBuffer = (uint8_t*)AllocHotTileMem(size, KNOB_SIMD_WIDTH * 4, numaNode); in GetHotTile()
127 hotTile.pBuffer = (uint8_t*)AllocHotTileMem(size, KNOB_SIMD_WIDTH * 4, numaNode); in GetHotTile()
197 hotTile.pBuffer = (uint8_t*)AlignedMalloc(size, KNOB_SIMD_WIDTH * 4); in GetHotTileNoLoad()
312 pfBuf += KNOB_SIMD_WIDTH; in ClearColorHotTile()
314 pfBuf += KNOB_SIMD_WIDTH; in ClearColorHotTile()
316 pfBuf += KNOB_SIMD_WIDTH; in ClearColorHotTile()
318 pfBuf += KNOB_SIMD_WIDTH; in ClearColorHotTile()
340 pfBuf += KNOB_SIMD_WIDTH; in ClearDepthHotTile()
Dbackend.cpp105 pTileBuffer += (KNOB_SIMD_WIDTH * FormatTraits<format>::GetBPC(comp) / 8); in ClearRasterTile()
421 #if KNOB_SIMD_WIDTH == 8
624 … pColorBuffer[rt] += (2 * KNOB_SIMD_WIDTH * FormatTraits<KNOB_COLOR_HOT_TILE_FORMAT>::bpp) / 8; in BackendSingleSample()
630 … pColorBuffer[rt] += (KNOB_SIMD_WIDTH * FormatTraits<KNOB_COLOR_HOT_TILE_FORMAT>::bpp) / 8; in BackendSingleSample()
633 pDepthBuffer += (KNOB_SIMD_WIDTH * FormatTraits<KNOB_DEPTH_HOT_TILE_FORMAT>::bpp) / 8; in BackendSingleSample()
634 … pStencilBuffer += (KNOB_SIMD_WIDTH * FormatTraits<KNOB_STENCIL_HOT_TILE_FORMAT>::bpp) / 8; in BackendSingleSample()
841 … pColorBuffer[rt] += (2 * KNOB_SIMD_WIDTH * FormatTraits<KNOB_COLOR_HOT_TILE_FORMAT>::bpp) / 8; in BackendSampleRate()
847 … pColorBuffer[rt] += (KNOB_SIMD_WIDTH * FormatTraits<KNOB_COLOR_HOT_TILE_FORMAT>::bpp) / 8; in BackendSampleRate()
850 pDepthBuffer += (KNOB_SIMD_WIDTH * FormatTraits<KNOB_DEPTH_HOT_TILE_FORMAT>::bpp) / 8; in BackendSampleRate()
851 … pStencilBuffer += (KNOB_SIMD_WIDTH * FormatTraits<KNOB_STENCIL_HOT_TILE_FORMAT>::bpp) / 8; in BackendSampleRate()
[all …]
Dbackend.h57 #if KNOB_SIMD_WIDTH == 8
140 …utCoverage(const uint64_t *const coverageMask, uint32_t (&inputMask)[KNOB_SIMD_WIDTH], const uint3… in generateInputCoverage()
143 assert(KNOB_SIMD_WIDTH == 8); in generateInputCoverage()
263 for(int32_t i = KNOB_SIMD_WIDTH - 1; i >= 0; i--) in generateInputCoverage()
281 uint32_t inputMask[KNOB_SIMD_WIDTH]; in generateInputCoverage()
294 assert(KNOB_SIMD_WIDTH == 8);
303 …utCoverage(const uint64_t *const coverageMask, uint32_t (&inputMask)[KNOB_SIMD_WIDTH], const uint3…
307 for(int i = 0; i < KNOB_SIMD_WIDTH; i++)
329 uint32_t inputMask[KNOB_SIMD_WIDTH];
335 unsigned long sampleNum[KNOB_SIMD_WIDTH];
[all …]
Dutils.h143 #if KNOB_SIMD_WIDTH == 8
148 #if KNOB_SIMD_WIDTH == 8
269 memcpy(pDst, pSrc, (bpp * KNOB_SIMD_WIDTH) / 8); in Transpose()
293 #if KNOB_SIMD_WIDTH == 8 in Transpose()
370 #if KNOB_SIMD_WIDTH == 8 in Transpose()
411 #if KNOB_SIMD_WIDTH == 8 in Transpose()
463 #if KNOB_SIMD_WIDTH == 8 in Transpose()
514 #if KNOB_SIMD_WIDTH == 8 in Transpose()
568 #if KNOB_SIMD_WIDTH == 8 in Transpose()
638 #if KNOB_SIMD_WIDTH == 8 in Transpose()
[all …]
Dformat_conversion.h70 pSrc += (FormatTraits<SrcFormat>::GetBPC(comp) * KNOB_SIMD_WIDTH) / 8; in LoadSOA()
192 pDst += (FormatTraits<DstFormat>::GetBPC(comp) * KNOB_SIMD_WIDTH) / 8; in StoreSOA()
Dapi.cpp72 void* pContextMem = AlignedMalloc(sizeof(SWR_CONTEXT), KNOB_SIMD_WIDTH * 4); in SwrCreateContext()
132 … pContext->ppScratch[i] = (uint8_t*)AlignedMalloc(32 * sizeof(KILOBYTE), KNOB_SIMD_WIDTH * 4); in SwrCreateContext()
1537 …vateState = pState->pArena->AllocAligned(pContext->privateStateSize, KNOB_SIMD_WIDTH*sizeof(float)… in SwrGetPrivateContextState()
/external/mesa3d/src/gallium/drivers/swr/rasterizer/memory/
DStoreTile.h519 for (uint32_t t = 0; t < KNOB_SIMD_WIDTH; ++t)
1224 ppRows[0] += KNOB_SIMD_WIDTH * DST_BYTES_PER_PIXEL / 2;
1225 ppRows[1] += KNOB_SIMD_WIDTH * DST_BYTES_PER_PIXEL / 2;
1226 pSrc += SRC_BYTES_PER_PIXEL * KNOB_SIMD_WIDTH;
1311 ppRows[0] += KNOB_SIMD_WIDTH * DST_BYTES_PER_PIXEL / 2;
1312 ppRows[1] += KNOB_SIMD_WIDTH * DST_BYTES_PER_PIXEL / 2;
1313 pSrc += SRC_BYTES_PER_PIXEL * KNOB_SIMD_WIDTH;
1398 ppRows[0] += KNOB_SIMD_WIDTH * DST_BYTES_PER_PIXEL / 2;
1399 ppRows[1] += KNOB_SIMD_WIDTH * DST_BYTES_PER_PIXEL / 2;
1400 pSrc += SRC_BYTES_PER_PIXEL * KNOB_SIMD_WIDTH;
[all …]
DTilingFunctions.h47 float color[FormatTraits<HotTileFormat>::numComps][KNOB_SIMD_WIDTH];
103 uint8_t color[FormatTraits<R8_UINT>::numComps][KNOB_SIMD_WIDTH];
/external/mesa3d/src/gallium/drivers/swr/rasterizer/common/
Dsimdintrin.h35 #if KNOB_SIMD_WIDTH == 8
56 #if KNOB_SIMD_WIDTH == 8
372 for (uint32_t i = 0; i < KNOB_SIMD_WIDTH; ++i) in _simd_i32gather_ps()
665 OSALIGNSIMD(float) rArray[KNOB_SIMD_WIDTH], sArray[KNOB_SIMD_WIDTH]; in _simd_mov()
/external/mesa3d/src/gallium/drivers/swr/
Dswr_screen.cpp975 screen->hJitMgr = JitCreateContext(KNOB_SIMD_WIDTH, KNOB_ARCH_STR, "swr"); in swr_create_screen_internal()