Searched refs:koff (Results 1 – 3 of 3) sorted by relevance
674 for (int koff = 0; koff < 16; koff ++) { in EigenFloatContractionKernelInternal16x16() local676 float2 fl1 = lhs_shmem2[koff][threadIdx.x]; in EigenFloatContractionKernelInternal16x16()677 float2 fl2 = lhs_shmem2[koff + 16][threadIdx.x]; in EigenFloatContractionKernelInternal16x16()680 float2 fr1 = rhs_shmem2[(start_feature>>1) + 32*((koff%4)/2)][koff/4 + (koff%2)*4]; in EigenFloatContractionKernelInternal16x16()681 float2 fr2 = rhs_shmem2[(start_feature>>1) + 1 + 32*((koff%4)/2)][koff/4 + (koff%2)*4]; in EigenFloatContractionKernelInternal16x16()1048 for (int koff = 0; koff < 32; koff ++) { in EigenFloatContractionKernelInternal() local1049 float2 a3 = lhs_shmem2[koff][threadIdx.x + (threadIdx.y % 4) * 8]; in EigenFloatContractionKernelInternal()1050 float2 a4 = lhs_shmem2[koff + 32][threadIdx.x + (threadIdx.y % 4) * 8]; in EigenFloatContractionKernelInternal()1055 float2 br1 = rhs_shmem2[start_feature/2 + (koff % 4) * 32][koff/4]; in EigenFloatContractionKernelInternal()1056 float2 br2 = rhs_shmem2[start_feature/2 + 1 + (koff % 4) * 32][koff/4]; in EigenFloatContractionKernelInternal()[all …]
91741 koff %35036 kɔf
108816 koff kɔf