Lines Matching refs:vfloat
118 vfloat sample = loada(dec_weight_ideal_value + i) * (SINCOS_STEPS - 1.0f) + vfloat(12582912.0f); in compute_angular_offsets()
124 vfloat mult = vfloat(1.0f / (2.0f * astc::PI)); in compute_angular_offsets()
128 vfloat anglesum_x = vfloat::zero(); in compute_angular_offsets()
129 vfloat anglesum_y = vfloat::zero(); in compute_angular_offsets()
138 vfloat angle = atan2(anglesum_y, anglesum_x); in compute_angular_offsets()
139 vfloat ofs = angle * mult; in compute_angular_offsets()
177 vfloat rcp_stepsize = vfloat::lane_id() + vfloat(1.0f); in compute_lowest_and_highest_weight()
182 vfloat minidx(128.0f); in compute_lowest_and_highest_weight()
183 vfloat maxidx(-128.0f); in compute_lowest_and_highest_weight()
184 vfloat errval = vfloat::zero(); in compute_lowest_and_highest_weight()
185 vfloat cut_low_weight_err = vfloat::zero(); in compute_lowest_and_highest_weight()
186 vfloat cut_high_weight_err = vfloat::zero(); in compute_lowest_and_highest_weight()
187 vfloat offset = loada(&offsets[sp]); in compute_lowest_and_highest_weight()
191 vfloat sval = load1(&dec_weight_ideal_value[j]) * rcp_stepsize - offset; in compute_lowest_and_highest_weight()
192 vfloat svalrte = round(sval); in compute_lowest_and_highest_weight()
193 vfloat diff = sval - svalrte; in compute_lowest_and_highest_weight()
199 cut_low_weight_err = select(cut_low_weight_err, vfloat::zero(), mask); in compute_lowest_and_highest_weight()
203 vfloat accum = cut_low_weight_err + vfloat(1.0f) - vfloat(2.0f) * diff; in compute_lowest_and_highest_weight()
209 cut_high_weight_err = select(cut_high_weight_err, vfloat::zero(), mask); in compute_lowest_and_highest_weight()
213 accum = cut_high_weight_err + vfloat(1.0f) + vfloat(2.0f) * diff; in compute_lowest_and_highest_weight()
218 vint span = float_to_int(maxidx - minidx + vfloat(1)); in compute_lowest_and_highest_weight()
226 vfloat ssize = 1.0f / rcp_stepsize; in compute_lowest_and_highest_weight()
227 vfloat errscale = ssize * ssize; in compute_lowest_and_highest_weight()
232 rcp_stepsize = rcp_stepsize + vfloat(ASTCENC_SIMD_WIDTH); in compute_lowest_and_highest_weight()
375 vfloat rcp_stepsize = vfloat::lane_id() + vfloat(1.0f); in compute_lowest_and_highest_weight_lwc()
380 vfloat minidx(128.0f); in compute_lowest_and_highest_weight_lwc()
381 vfloat maxidx(-128.0f); in compute_lowest_and_highest_weight_lwc()
382 vfloat errval = vfloat::zero(); in compute_lowest_and_highest_weight_lwc()
383 vfloat offset = loada(&offsets[sp]); in compute_lowest_and_highest_weight_lwc()
387 vfloat sval = load1(&dec_weight_quant_uvalue[j]) * rcp_stepsize - offset; in compute_lowest_and_highest_weight_lwc()
388 vfloat svalrte = round(sval); in compute_lowest_and_highest_weight_lwc()
389 vfloat diff = sval - svalrte; in compute_lowest_and_highest_weight_lwc()
402 vint span = float_to_int(maxidx - minidx + vfloat(1.0f)); in compute_lowest_and_highest_weight_lwc()
410 vfloat ssize = 1.0f / rcp_stepsize; in compute_lowest_and_highest_weight_lwc()
411 vfloat errscale = ssize * ssize; in compute_lowest_and_highest_weight_lwc()
414 rcp_stepsize = rcp_stepsize + vfloat(ASTCENC_SIMD_WIDTH); in compute_lowest_and_highest_weight_lwc()