• Home
  • Raw
  • Download

Lines Matching refs:vi

72       __m128 vi${M}x6024 = _mm_setzero_ps();
75 __m128 vi${M}x7135 = _mm_setzero_ps();
78 const __m128 vi${M}x89AB = _mm_loadu_ps(i${M});
79 const __m128 vi${M}xCDEF = _mm_loadu_ps(i${M} + 4);
83 __m128 vi${M}x8ACE = _mm_shuffle_ps(vi${M}x89AB, vi${M}xCDEF, _MM_SHUFFLE(2, 0, 2, 0));
84 __m128 vi${M}x9BDF = _mm_shuffle_ps(vi${M}x89AB, vi${M}xCDEF, _MM_SHUFFLE(3, 1, 3, 1));
91 __m128 vo${M}p0 = _mm_add_ps(vbias, _mm_mul_ps(vi${2*M+K}x8ACE, vk${K}2));
93 __m128 vo${M}p${K} = _mm_mul_ps(vi${2*M+K}x8ACE, vk${K}2);
95 …vo${M}p${K % ACCUMULATORS} = _mm_add_ps(vo${M}p${K % ACCUMULATORS}, _mm_mul_ps(vi${2*M+K}x8ACE, vk…
98 … const __m128 vi${M}xE8AC = _mm_shuffle_ps(vi${M}x8ACE, vi${M}x8ACE, _MM_SHUFFLE(2, 1, 0, 3));
102 …vo${M}p${(K+5) % ACCUMULATORS} = _mm_add_ps(vo${M}p${(K+5) % ACCUMULATORS}, _mm_mul_ps(vi${2*M+K}x…
105 const __m128 vi${M}x68AC = _mm_move_ss(vi${M}xE8AC, vi${M}x6024);
106 vi${M}x6024 = vi${M}xE8AC;
109 … const __m128 vi${M}xF9BD = _mm_shuffle_ps(vi${M}x9BDF, vi${M}x9BDF, _MM_SHUFFLE(2, 1, 0, 3));
113 …) % ACCUMULATORS} = _mm_add_ps(vo${M}p${(K+10) % ACCUMULATORS}, _mm_mul_ps(vi${2*M+K}x68AC, vk${K}…
116 const __m128 vi${M}xGHIJ = _mm_loadu_ps(i${M});
117 const __m128 vi${M}xKLMN = _mm_loadu_ps(i${M} + 4);
121 const __m128 vi${M}x79BD = _mm_move_ss(vi${M}xF9BD, vi${M}x7135);
122 vi${M}x7135 = vi${M}xF9BD;
125 … const __m128 vi${M}xGIKM = _mm_shuffle_ps(vi${M}xGHIJ, vi${M}xKLMN, _MM_SHUFFLE(2, 0, 2, 0));
126 … const __m128 vi${M}xHJLN = _mm_shuffle_ps(vi${M}xGHIJ, vi${M}xKLMN, _MM_SHUFFLE(3, 1, 3, 1));
127 vi${M}x9BDF = vi${M}xHJLN;
131 …) % ACCUMULATORS} = _mm_add_ps(vo${M}p${(K+15) % ACCUMULATORS}, _mm_mul_ps(vi${2*M+K}x79BD, vk${K}…
134 const __m128 vi${M}xGACE = _mm_move_ss(vi${M}x8ACE, vi${M}xGIKM);
135 vi${M}x8ACE = vi${M}xGIKM;
138 … const __m128 vi${M}xACEG = _mm_shuffle_ps(vi${M}xGACE, vi${M}xGACE, _MM_SHUFFLE(0, 3, 2, 1));
142 …) % ACCUMULATORS} = _mm_add_ps(vo${M}p${(K+20) % ACCUMULATORS}, _mm_mul_ps(vi${2*M+K}xACEG, vk${K}…
168 vi${M}x8ACE = _mm_and_ps(vi${M}x8ACE, vmask_even);
169 vi${M}x9BDF = _mm_and_ps(vi${M}x9BDF, vmask_odd);
174 __m128 vo${M}p0 = _mm_add_ps(vbias, _mm_mul_ps(vi${2*M+K}x8ACE, vk${K}2));
176 __m128 vo${M}p${K} = _mm_mul_ps(vi${2*M+K}x8ACE, vk${K}2);
178 …vo${M}p${K % ACCUMULATORS} = _mm_add_ps(vo${M}p${K % ACCUMULATORS}, _mm_mul_ps(vi${2*M+K}x8ACE, vk…
181 … const __m128 vi${M}xE8AC = _mm_shuffle_ps(vi${M}x8ACE, vi${M}x8ACE, _MM_SHUFFLE(2, 1, 0, 3));
185 …vo${M}p${(K+5) % ACCUMULATORS} = _mm_add_ps(vo${M}p${(K+5) % ACCUMULATORS}, _mm_mul_ps(vi${2*M+K}x…
188 const __m128 vi${M}x68AC = _mm_move_ss(vi${M}xE8AC, vi${M}x6024);
191 … const __m128 vi${M}xF9BD = _mm_shuffle_ps(vi${M}x9BDF, vi${M}x9BDF, _MM_SHUFFLE(2, 1, 0, 3));
195 …) % ACCUMULATORS} = _mm_add_ps(vo${M}p${(K+10) % ACCUMULATORS}, _mm_mul_ps(vi${2*M+K}x68AC, vk${K}…
198 const __m128 vi${M}x79BD = _mm_move_ss(vi${M}xF9BD, vi${M}x7135);
202 …) % ACCUMULATORS} = _mm_add_ps(vo${M}p${(K+15) % ACCUMULATORS}, _mm_mul_ps(vi${2*M+K}x79BD, vk${K}…
206 const __m128 vi${M}xGACE = _mm_move_ss(vi${M}x8ACE, vzero);
209 … const __m128 vi${M}xACEG = _mm_shuffle_ps(vi${M}xGACE, vi${M}xGACE, _MM_SHUFFLE(0, 3, 2, 1));
213 …) % ACCUMULATORS} = _mm_add_ps(vo${M}p${(K+20) % ACCUMULATORS}, _mm_mul_ps(vi${2*M+K}xACEG, vk${K}…