/external/mesa3d/src/gallium/drivers/swr/rasterizer/core/ |
D | knobs.h | 54 #define KNOB_SIMD_WIDTH 8 macro 59 #define KNOB_SIMD_WIDTH 8 macro 66 #define KNOB_SIMD_WIDTH 16 71 #define KNOB_SIMD_WIDTH 8 macro 142 #if KNOB_SIMD_WIDTH==8 && KNOB_TILE_X_DIM < 4 152 #if KNOB_SIMD_WIDTH == 8
|
D | fifo.hpp | 58 T* pNewBlock = (T*)arena.AllocAligned(sizeof(T)*mBlockSize, KNOB_SIMD_WIDTH*4); in clear() 112 __m256 vSrc = _simd_load_ps(pSrc + i*KNOB_SIMD_WIDTH); in enqueue_try_nosync() 113 _simd_stream_ps(pDst + i*KNOB_SIMD_WIDTH, vSrc); in enqueue_try_nosync() 116 const uint32_t numSimdLines = sizeof(T) / (KNOB_SIMD_WIDTH*4); in enqueue_try_nosync() 117 static_assert(numSimdLines * KNOB_SIMD_WIDTH * 4 == sizeof(T), in enqueue_try_nosync() 131 T* newBlock = (T*)arena.AllocAligned(sizeof(T)*mBlockSize, KNOB_SIMD_WIDTH*4); in enqueue_try_nosync()
|
D | pa.h | 177 const uint32_t numSimdVerts = this->streamSizeInVerts / KNOB_SIMD_WIDTH; in GetNextVsOutput() 202 …(KNOB_SIMD_WIDTH - (this->numPrimsComplete + this->nextNumPrimsIncrement - this->numPrims)) : KNOB… in NumPrims() 234 … _simd_set1_epi32(startID + this->primIDIncr * (this->numPrimsComplete / KNOB_SIMD_WIDTH))); in GetPrimID() 341 …OSALIGNSIMD(uint32_t) indices[MAX_NUM_VERTS_PER_PRIM][KNOB_SIMD_WIDTH]; // current index buffer… 415 uint32_t vertexIndex = this->headVertex / KNOB_SIMD_WIDTH; in GetNextVsOutput() 416 this->headVertex = (this->headVertex + KNOB_SIMD_WIDTH) % this->numVerts; in GetNextVsOutput() 423 uint32_t vertexIndex = this->headVertex / KNOB_SIMD_WIDTH; in GetNextVsIndices() 437 this->headVertex += KNOB_SIMD_WIDTH; in GetNextStreamOutput() 467 return ((this->headVertex + KNOB_SIMD_WIDTH) % this->numVerts) == this->tailVertex; in IsVertexStoreFull() 479 uint32_t vertexIndex = vertex / KNOB_SIMD_WIDTH; in IsCutIndex() [all …]
|
D | frontend.cpp | 482 … uint32_t numActive = (numItemsRemaining >= KNOB_SIMD_WIDTH) ? KNOB_SIMD_WIDTH : numItemsRemaining; in GenerateMask() 590 return (remainder >= KNOB_SIMD_WIDTH) ? KNOB_SIMD_WIDTH : remainder; in GetNumInvocations() 695 …onst uint32_t numSimdBatches = (state.gsState.maxNumVerts + KNOB_SIMD_WIDTH - 1) / KNOB_SIMD_WIDTH; in GeometryShaderStage() 697 const uint32_t instanceStride = inputPrimStride * KNOB_SIMD_WIDTH; in GeometryShaderStage() 704 cutInstanceStride = cutPrimStride * KNOB_SIMD_WIDTH; in GeometryShaderStage() 709 cutInstanceStride = cutPrimStride * KNOB_SIMD_WIDTH; in GeometryShaderStage() 876 …onst uint32_t numSimdBatches = (state.gsState.maxNumVerts + KNOB_SIMD_WIDTH - 1) / KNOB_SIMD_WIDTH; in AllocateGsBuffers() 877 uint32_t size = state.gsState.instanceCount * numSimdBatches * vertexStride * KNOB_SIMD_WIDTH; in AllocateGsBuffers() 878 *ppGsOut = pArena->AllocAligned(size, KNOB_SIMD_WIDTH * sizeof(float)); in AllocateGsBuffers() 882 const uint32_t cutBufferSize = cutPrimStride * state.gsState.instanceCount * KNOB_SIMD_WIDTH; in AllocateGsBuffers() [all …]
|
D | binner.cpp | 522 int cullZeroAreaMask = maskLo | (maskHi << (KNOB_SIMD_WIDTH / 2)); in BinTriangles() 547 frontWindingTris = maskLo | (maskHi << (KNOB_SIMD_WIDTH / 2)); in BinTriangles() 626 SWR_ASSERT(KNOB_SIMD_WIDTH == 8, "Need to update degenerate mask code for avx512"); in BinTriangles() 701 GatherScissors<KNOB_SIMD_WIDTH>::Gather(&state.scissorsInFixedPoint[0], pViewportIndex, in BinTriangles() 747 …SALIGNSIMD(uint32_t) aMTLeft[KNOB_SIMD_WIDTH], aMTRight[KNOB_SIMD_WIDTH], aMTTop[KNOB_SIMD_WIDTH],… in BinTriangles() 762 OSALIGNSIMD(uint32_t) aRTAI[KNOB_SIMD_WIDTH]; in BinTriangles() 952 OSALIGNSIMD(uint32_t) aMacroX[KNOB_SIMD_WIDTH], aMacroY[KNOB_SIMD_WIDTH]; in BinPoints() 967 OSALIGNSIMD(uint32_t) aTileRelativeX[KNOB_SIMD_WIDTH]; in BinPoints() 968 OSALIGNSIMD(uint32_t) aTileRelativeY[KNOB_SIMD_WIDTH]; in BinPoints() 972 OSALIGNSIMD(uint32_t) aTileAlignedX[KNOB_SIMD_WIDTH]; in BinPoints() [all …]
|
D | pa_avx.cpp | 35 #if (KNOB_SIMD_WIDTH == 8) 87 uint32_t input_vec = input_cp / KNOB_SIMD_WIDTH; in PaPatchListSingle() 88 uint32_t input_lane = input_cp % KNOB_SIMD_WIDTH; in PaPatchListSingle() 124 float vec[KNOB_SIMD_WIDTH]; in PaPatchListTerm() 125 for (uint32_t lane = 0; lane < KNOB_SIMD_WIDTH; ++lane) in PaPatchListTerm() 128 uint32_t input_vec = input_cp / KNOB_SIMD_WIDTH; in PaPatchListTerm() 129 uint32_t input_lane = input_cp % KNOB_SIMD_WIDTH; in PaPatchListTerm() 143 KNOB_SIMD_WIDTH, in PaPatchListTerm() 268 SetNextPaState(pa, PaTriList0, PaTriListSingle0, 0, KNOB_SIMD_WIDTH, true); in PaTriList2() 369 SetNextPaState(pa, PaTriStrip1, PaTriStripSingle0, 0, KNOB_SIMD_WIDTH); in PaTriStrip1() [all …]
|
D | format_types.h | 81 #if KNOB_SIMD_WIDTH == 8 93 #if KNOB_SIMD_WIDTH == 8 102 #if KNOB_SIMD_WIDTH == 8 122 #if KNOB_SIMD_WIDTH == 8 195 #if KNOB_SIMD_WIDTH == 8 207 #if KNOB_SIMD_WIDTH == 8 216 #if KNOB_SIMD_WIDTH == 8 237 #if KNOB_SIMD_WIDTH == 8 310 #if KNOB_SIMD_WIDTH == 8 321 #if KNOB_SIMD_WIDTH == 8 [all …]
|
D | tilemgr.cpp | 103 hotTile.pBuffer = (uint8_t*)AllocHotTileMem(size, KNOB_SIMD_WIDTH * 4, numaNode); in GetHotTile() 127 hotTile.pBuffer = (uint8_t*)AllocHotTileMem(size, KNOB_SIMD_WIDTH * 4, numaNode); in GetHotTile() 197 hotTile.pBuffer = (uint8_t*)AlignedMalloc(size, KNOB_SIMD_WIDTH * 4); in GetHotTileNoLoad() 312 pfBuf += KNOB_SIMD_WIDTH; in ClearColorHotTile() 314 pfBuf += KNOB_SIMD_WIDTH; in ClearColorHotTile() 316 pfBuf += KNOB_SIMD_WIDTH; in ClearColorHotTile() 318 pfBuf += KNOB_SIMD_WIDTH; in ClearColorHotTile() 340 pfBuf += KNOB_SIMD_WIDTH; in ClearDepthHotTile()
|
D | backend.cpp | 105 pTileBuffer += (KNOB_SIMD_WIDTH * FormatTraits<format>::GetBPC(comp) / 8); in ClearRasterTile() 421 #if KNOB_SIMD_WIDTH == 8 624 … pColorBuffer[rt] += (2 * KNOB_SIMD_WIDTH * FormatTraits<KNOB_COLOR_HOT_TILE_FORMAT>::bpp) / 8; in BackendSingleSample() 630 … pColorBuffer[rt] += (KNOB_SIMD_WIDTH * FormatTraits<KNOB_COLOR_HOT_TILE_FORMAT>::bpp) / 8; in BackendSingleSample() 633 pDepthBuffer += (KNOB_SIMD_WIDTH * FormatTraits<KNOB_DEPTH_HOT_TILE_FORMAT>::bpp) / 8; in BackendSingleSample() 634 … pStencilBuffer += (KNOB_SIMD_WIDTH * FormatTraits<KNOB_STENCIL_HOT_TILE_FORMAT>::bpp) / 8; in BackendSingleSample() 841 … pColorBuffer[rt] += (2 * KNOB_SIMD_WIDTH * FormatTraits<KNOB_COLOR_HOT_TILE_FORMAT>::bpp) / 8; in BackendSampleRate() 847 … pColorBuffer[rt] += (KNOB_SIMD_WIDTH * FormatTraits<KNOB_COLOR_HOT_TILE_FORMAT>::bpp) / 8; in BackendSampleRate() 850 pDepthBuffer += (KNOB_SIMD_WIDTH * FormatTraits<KNOB_DEPTH_HOT_TILE_FORMAT>::bpp) / 8; in BackendSampleRate() 851 … pStencilBuffer += (KNOB_SIMD_WIDTH * FormatTraits<KNOB_STENCIL_HOT_TILE_FORMAT>::bpp) / 8; in BackendSampleRate() [all …]
|
D | backend.h | 57 #if KNOB_SIMD_WIDTH == 8 140 …utCoverage(const uint64_t *const coverageMask, uint32_t (&inputMask)[KNOB_SIMD_WIDTH], const uint3… in generateInputCoverage() 143 assert(KNOB_SIMD_WIDTH == 8); in generateInputCoverage() 263 for(int32_t i = KNOB_SIMD_WIDTH - 1; i >= 0; i--) in generateInputCoverage() 281 uint32_t inputMask[KNOB_SIMD_WIDTH]; in generateInputCoverage() 294 assert(KNOB_SIMD_WIDTH == 8); 303 …utCoverage(const uint64_t *const coverageMask, uint32_t (&inputMask)[KNOB_SIMD_WIDTH], const uint3… 307 for(int i = 0; i < KNOB_SIMD_WIDTH; i++) 329 uint32_t inputMask[KNOB_SIMD_WIDTH]; 335 unsigned long sampleNum[KNOB_SIMD_WIDTH]; [all …]
|
D | utils.h | 143 #if KNOB_SIMD_WIDTH == 8 148 #if KNOB_SIMD_WIDTH == 8 269 memcpy(pDst, pSrc, (bpp * KNOB_SIMD_WIDTH) / 8); in Transpose() 293 #if KNOB_SIMD_WIDTH == 8 in Transpose() 370 #if KNOB_SIMD_WIDTH == 8 in Transpose() 411 #if KNOB_SIMD_WIDTH == 8 in Transpose() 463 #if KNOB_SIMD_WIDTH == 8 in Transpose() 514 #if KNOB_SIMD_WIDTH == 8 in Transpose() 568 #if KNOB_SIMD_WIDTH == 8 in Transpose() 638 #if KNOB_SIMD_WIDTH == 8 in Transpose() [all …]
|
D | format_conversion.h | 70 pSrc += (FormatTraits<SrcFormat>::GetBPC(comp) * KNOB_SIMD_WIDTH) / 8; in LoadSOA() 192 pDst += (FormatTraits<DstFormat>::GetBPC(comp) * KNOB_SIMD_WIDTH) / 8; in StoreSOA()
|
D | api.cpp | 72 void* pContextMem = AlignedMalloc(sizeof(SWR_CONTEXT), KNOB_SIMD_WIDTH * 4); in SwrCreateContext() 132 … pContext->ppScratch[i] = (uint8_t*)AlignedMalloc(32 * sizeof(KILOBYTE), KNOB_SIMD_WIDTH * 4); in SwrCreateContext() 1537 …vateState = pState->pArena->AllocAligned(pContext->privateStateSize, KNOB_SIMD_WIDTH*sizeof(float)… in SwrGetPrivateContextState()
|
/external/mesa3d/src/gallium/drivers/swr/rasterizer/memory/ |
D | StoreTile.h | 519 for (uint32_t t = 0; t < KNOB_SIMD_WIDTH; ++t) 1224 ppRows[0] += KNOB_SIMD_WIDTH * DST_BYTES_PER_PIXEL / 2; 1225 ppRows[1] += KNOB_SIMD_WIDTH * DST_BYTES_PER_PIXEL / 2; 1226 pSrc += SRC_BYTES_PER_PIXEL * KNOB_SIMD_WIDTH; 1311 ppRows[0] += KNOB_SIMD_WIDTH * DST_BYTES_PER_PIXEL / 2; 1312 ppRows[1] += KNOB_SIMD_WIDTH * DST_BYTES_PER_PIXEL / 2; 1313 pSrc += SRC_BYTES_PER_PIXEL * KNOB_SIMD_WIDTH; 1398 ppRows[0] += KNOB_SIMD_WIDTH * DST_BYTES_PER_PIXEL / 2; 1399 ppRows[1] += KNOB_SIMD_WIDTH * DST_BYTES_PER_PIXEL / 2; 1400 pSrc += SRC_BYTES_PER_PIXEL * KNOB_SIMD_WIDTH; [all …]
|
D | TilingFunctions.h | 47 float color[FormatTraits<HotTileFormat>::numComps][KNOB_SIMD_WIDTH]; 103 uint8_t color[FormatTraits<R8_UINT>::numComps][KNOB_SIMD_WIDTH];
|
/external/mesa3d/src/gallium/drivers/swr/rasterizer/common/ |
D | simdintrin.h | 35 #if KNOB_SIMD_WIDTH == 8 56 #if KNOB_SIMD_WIDTH == 8 372 for (uint32_t i = 0; i < KNOB_SIMD_WIDTH; ++i) in _simd_i32gather_ps() 665 OSALIGNSIMD(float) rArray[KNOB_SIMD_WIDTH], sArray[KNOB_SIMD_WIDTH]; in _simd_mov()
|
/external/mesa3d/src/gallium/drivers/swr/ |
D | swr_screen.cpp | 975 screen->hJitMgr = JitCreateContext(KNOB_SIMD_WIDTH, KNOB_ARCH_STR, "swr"); in swr_create_screen_internal()
|