/external/XNNPACK/src/f32-argmaxpool/ |
D | 9p8x-wasmsimd-c4.c | 79 vmax = wasm_v128_bitselect(vi1, vmax, vm1); in xnn_f32_argmaxpool_ukernel_9p8x__wasmsimd_c4() 80 vidx = wasm_v128_bitselect(wasm_i32x4_splat(1), vidx, vm1); in xnn_f32_argmaxpool_ukernel_9p8x__wasmsimd_c4() 83 vmax = wasm_v128_bitselect(vi2, vmax, vm2); in xnn_f32_argmaxpool_ukernel_9p8x__wasmsimd_c4() 84 vidx = wasm_v128_bitselect(wasm_i32x4_splat(2), vidx, vm2); in xnn_f32_argmaxpool_ukernel_9p8x__wasmsimd_c4() 87 vmax = wasm_v128_bitselect(vi3, vmax, vm3); in xnn_f32_argmaxpool_ukernel_9p8x__wasmsimd_c4() 88 vidx = wasm_v128_bitselect(wasm_i32x4_splat(3), vidx, vm3); in xnn_f32_argmaxpool_ukernel_9p8x__wasmsimd_c4() 91 vmax = wasm_v128_bitselect(vi4, vmax, vm4); in xnn_f32_argmaxpool_ukernel_9p8x__wasmsimd_c4() 92 vidx = wasm_v128_bitselect(wasm_i32x4_splat(4), vidx, vm4); in xnn_f32_argmaxpool_ukernel_9p8x__wasmsimd_c4() 95 vmax = wasm_v128_bitselect(vi5, vmax, vm5); in xnn_f32_argmaxpool_ukernel_9p8x__wasmsimd_c4() 96 vidx = wasm_v128_bitselect(wasm_i32x4_splat(5), vidx, vm5); in xnn_f32_argmaxpool_ukernel_9p8x__wasmsimd_c4() [all …]
|
D | 9x-wasmsimd-c4.c | 99 vmax = wasm_v128_bitselect(vi1, vmax, vm1); in xnn_f32_argmaxpool_ukernel_9x__wasmsimd_c4() 100 vidx = wasm_v128_bitselect(wasm_i32x4_splat(1), vidx, vm1); in xnn_f32_argmaxpool_ukernel_9x__wasmsimd_c4() 103 vmax = wasm_v128_bitselect(vi2, vmax, vm2); in xnn_f32_argmaxpool_ukernel_9x__wasmsimd_c4() 104 vidx = wasm_v128_bitselect(wasm_i32x4_splat(2), vidx, vm2); in xnn_f32_argmaxpool_ukernel_9x__wasmsimd_c4() 107 vmax = wasm_v128_bitselect(vi3, vmax, vm3); in xnn_f32_argmaxpool_ukernel_9x__wasmsimd_c4() 108 vidx = wasm_v128_bitselect(wasm_i32x4_splat(3), vidx, vm3); in xnn_f32_argmaxpool_ukernel_9x__wasmsimd_c4() 111 vmax = wasm_v128_bitselect(vi4, vmax, vm4); in xnn_f32_argmaxpool_ukernel_9x__wasmsimd_c4() 112 vidx = wasm_v128_bitselect(wasm_i32x4_splat(4), vidx, vm4); in xnn_f32_argmaxpool_ukernel_9x__wasmsimd_c4() 115 vmax = wasm_v128_bitselect(vi5, vmax, vm5); in xnn_f32_argmaxpool_ukernel_9x__wasmsimd_c4() 116 vidx = wasm_v128_bitselect(wasm_i32x4_splat(5), vidx, vm5); in xnn_f32_argmaxpool_ukernel_9x__wasmsimd_c4() [all …]
|
D | 4x-wasmsimd-c4.c | 64 vmax = wasm_v128_bitselect(vi1, vmax, vm1); in xnn_f32_argmaxpool_ukernel_4x__wasmsimd_c4() 65 vidx = wasm_v128_bitselect(wasm_i32x4_splat(1), vidx, vm1); in xnn_f32_argmaxpool_ukernel_4x__wasmsimd_c4() 68 vmax = wasm_v128_bitselect(vi2, vmax, vm2); in xnn_f32_argmaxpool_ukernel_4x__wasmsimd_c4() 69 vidx = wasm_v128_bitselect(wasm_i32x4_splat(2), vidx, vm2); in xnn_f32_argmaxpool_ukernel_4x__wasmsimd_c4() 72 vmax = wasm_v128_bitselect(vi3, vmax, vm3); in xnn_f32_argmaxpool_ukernel_4x__wasmsimd_c4() 73 vidx = wasm_v128_bitselect(wasm_i32x4_splat(3), vidx, vm3); in xnn_f32_argmaxpool_ukernel_4x__wasmsimd_c4() 90 vmax = wasm_v128_bitselect(vi1, vmax, vm1); in xnn_f32_argmaxpool_ukernel_4x__wasmsimd_c4() 91 vidx = wasm_v128_bitselect(wasm_i32x4_splat(1), vidx, vm1); in xnn_f32_argmaxpool_ukernel_4x__wasmsimd_c4() 94 vmax = wasm_v128_bitselect(vi2, vmax, vm2); in xnn_f32_argmaxpool_ukernel_4x__wasmsimd_c4() 95 vidx = wasm_v128_bitselect(wasm_i32x4_splat(2), vidx, vm2); in xnn_f32_argmaxpool_ukernel_4x__wasmsimd_c4() [all …]
|
/external/XNNPACK/src/f32-maxpool/ |
D | 9p8x-minmax-wasmsimd-x86-c4.c | 97 const v128_t vmax01 = wasm_v128_bitselect(vi1, vi0, wasm_f32x4_lt(vi0, vi1)); in xnn_f32_maxpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() 98 const v128_t vmax23 = wasm_v128_bitselect(vi3, vi2, wasm_f32x4_lt(vi2, vi3)); in xnn_f32_maxpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() 99 const v128_t vmax45 = wasm_v128_bitselect(vi5, vi4, wasm_f32x4_lt(vi4, vi5)); in xnn_f32_maxpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() 100 const v128_t vmax018 = wasm_v128_bitselect(vi8, vmax01, wasm_f32x4_lt(vmax01, vi8)); in xnn_f32_maxpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() 101 const v128_t vmax67 = wasm_v128_bitselect(vi7, vi6, wasm_f32x4_lt(vi6, vi7)); in xnn_f32_maxpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() 103 const v128_t vmax2345 = wasm_v128_bitselect(vmax45, vmax23, wasm_f32x4_lt(vmax23, vmax45)); in xnn_f32_maxpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() 104 … const v128_t vmax01678 = wasm_v128_bitselect(vmax67, vmax018, wasm_f32x4_lt(vmax018, vmax67)); in xnn_f32_maxpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() 105 … const v128_t vmax = wasm_v128_bitselect(vmax2345, vmax01678, wasm_f32x4_lt(vmax01678, vmax2345)); in xnn_f32_maxpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() 110 v128_t vout = wasm_v128_bitselect(voutput_min, vmax, vmaskmin); in xnn_f32_maxpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() 111 vout = wasm_v128_bitselect(vout, voutput_max, vmaskmax); in xnn_f32_maxpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() [all …]
|
/external/XNNPACK/src/f32-spmm/gen/ |
D | 32x1-minmax-wasmsimd-x86.c | 73 v128_t vout0123 = wasm_v128_bitselect(vacc0123, vmax, wasm_f32x4_le(vacc0123, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86() 74 v128_t vout4567 = wasm_v128_bitselect(vacc4567, vmax, wasm_f32x4_le(vacc4567, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86() 75 v128_t vout89AB = wasm_v128_bitselect(vacc89AB, vmax, wasm_f32x4_le(vacc89AB, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86() 76 v128_t voutCDEF = wasm_v128_bitselect(vaccCDEF, vmax, wasm_f32x4_le(vaccCDEF, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86() 77 v128_t voutGHIJ = wasm_v128_bitselect(vaccGHIJ, vmax, wasm_f32x4_le(vaccGHIJ, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86() 78 v128_t voutKLMN = wasm_v128_bitselect(vaccKLMN, vmax, wasm_f32x4_le(vaccKLMN, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86() 79 v128_t voutOPQR = wasm_v128_bitselect(vaccOPQR, vmax, wasm_f32x4_le(vaccOPQR, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86() 80 v128_t voutSTUV = wasm_v128_bitselect(vaccSTUV, vmax, wasm_f32x4_le(vaccSTUV, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86() 81 vout0123 = wasm_v128_bitselect(vmin, vout0123, wasm_f32x4_lt(vout0123, vmin)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86() 82 vout4567 = wasm_v128_bitselect(vmin, vout4567, wasm_f32x4_lt(vout4567, vmin)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86() [all …]
|
D | 32x1-minmax-wasmsimd-x86-pipelined.c | 87 v128_t vout0123 = wasm_v128_bitselect(vacc0123, vmax, wasm_f32x4_le(vacc0123, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_pipelined() 88 v128_t vout4567 = wasm_v128_bitselect(vacc4567, vmax, wasm_f32x4_le(vacc4567, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_pipelined() 89 v128_t vout89AB = wasm_v128_bitselect(vacc89AB, vmax, wasm_f32x4_le(vacc89AB, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_pipelined() 90 v128_t voutCDEF = wasm_v128_bitselect(vaccCDEF, vmax, wasm_f32x4_le(vaccCDEF, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_pipelined() 91 v128_t voutGHIJ = wasm_v128_bitselect(vaccGHIJ, vmax, wasm_f32x4_le(vaccGHIJ, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_pipelined() 92 v128_t voutKLMN = wasm_v128_bitselect(vaccKLMN, vmax, wasm_f32x4_le(vaccKLMN, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_pipelined() 93 v128_t voutOPQR = wasm_v128_bitselect(vaccOPQR, vmax, wasm_f32x4_le(vaccOPQR, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_pipelined() 94 v128_t voutSTUV = wasm_v128_bitselect(vaccSTUV, vmax, wasm_f32x4_le(vaccSTUV, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_pipelined() 95 vout0123 = wasm_v128_bitselect(vmin, vout0123, wasm_f32x4_lt(vout0123, vmin)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_pipelined() 96 vout4567 = wasm_v128_bitselect(vmin, vout4567, wasm_f32x4_lt(vout4567, vmin)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_pipelined() [all …]
|
D | 32x1-minmax-wasmsimd-x86-pipelined-x2.c | 127 v128_t vout0123 = wasm_v128_bitselect(vacc0123, vmax, wasm_f32x4_le(vacc0123, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_pipelined_x2() 128 v128_t vout4567 = wasm_v128_bitselect(vacc4567, vmax, wasm_f32x4_le(vacc4567, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_pipelined_x2() 129 v128_t vout89AB = wasm_v128_bitselect(vacc89AB, vmax, wasm_f32x4_le(vacc89AB, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_pipelined_x2() 130 v128_t voutCDEF = wasm_v128_bitselect(vaccCDEF, vmax, wasm_f32x4_le(vaccCDEF, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_pipelined_x2() 131 v128_t voutGHIJ = wasm_v128_bitselect(vaccGHIJ, vmax, wasm_f32x4_le(vaccGHIJ, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_pipelined_x2() 132 v128_t voutKLMN = wasm_v128_bitselect(vaccKLMN, vmax, wasm_f32x4_le(vaccKLMN, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_pipelined_x2() 133 v128_t voutOPQR = wasm_v128_bitselect(vaccOPQR, vmax, wasm_f32x4_le(vaccOPQR, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_pipelined_x2() 134 v128_t voutSTUV = wasm_v128_bitselect(vaccSTUV, vmax, wasm_f32x4_le(vaccSTUV, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_pipelined_x2() 135 vout0123 = wasm_v128_bitselect(vmin, vout0123, wasm_f32x4_lt(vout0123, vmin)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_pipelined_x2() 136 vout4567 = wasm_v128_bitselect(vmin, vout4567, wasm_f32x4_lt(vout4567, vmin)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_pipelined_x2() [all …]
|
D | 32x1-minmax-wasmsimd-x86-x2.c | 142 v128_t vout0123 = wasm_v128_bitselect(vacc0123, vmax, wasm_f32x4_le(vacc0123, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_x2() 143 v128_t vout4567 = wasm_v128_bitselect(vacc4567, vmax, wasm_f32x4_le(vacc4567, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_x2() 144 v128_t vout89AB = wasm_v128_bitselect(vacc89AB, vmax, wasm_f32x4_le(vacc89AB, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_x2() 145 v128_t voutCDEF = wasm_v128_bitselect(vaccCDEF, vmax, wasm_f32x4_le(vaccCDEF, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_x2() 146 v128_t voutGHIJ = wasm_v128_bitselect(vaccGHIJ, vmax, wasm_f32x4_le(vaccGHIJ, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_x2() 147 v128_t voutKLMN = wasm_v128_bitselect(vaccKLMN, vmax, wasm_f32x4_le(vaccKLMN, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_x2() 148 v128_t voutOPQR = wasm_v128_bitselect(vaccOPQR, vmax, wasm_f32x4_le(vaccOPQR, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_x2() 149 v128_t voutSTUV = wasm_v128_bitselect(vaccSTUV, vmax, wasm_f32x4_le(vaccSTUV, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_x2() 150 vout0123 = wasm_v128_bitselect(vmin, vout0123, wasm_f32x4_lt(vout0123, vmin)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_x2() 151 vout4567 = wasm_v128_bitselect(vmin, vout4567, wasm_f32x4_lt(vout4567, vmin)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_x2() [all …]
|
/external/XNNPACK/src/f32-gemm/gen/ |
D | 6x8-minmax-wasmsimd-x86-loadsplat.c | 122 vacc0x0123 = wasm_v128_bitselect(vmin, vacc0x0123, wasm_f32x4_lt(vacc0x0123, vmin)); in xnn_f32_gemm_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() 123 vacc1x0123 = wasm_v128_bitselect(vmin, vacc1x0123, wasm_f32x4_lt(vacc1x0123, vmin)); in xnn_f32_gemm_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() 124 vacc2x0123 = wasm_v128_bitselect(vmin, vacc2x0123, wasm_f32x4_lt(vacc2x0123, vmin)); in xnn_f32_gemm_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() 125 vacc3x0123 = wasm_v128_bitselect(vmin, vacc3x0123, wasm_f32x4_lt(vacc3x0123, vmin)); in xnn_f32_gemm_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() 126 vacc4x0123 = wasm_v128_bitselect(vmin, vacc4x0123, wasm_f32x4_lt(vacc4x0123, vmin)); in xnn_f32_gemm_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() 127 vacc5x0123 = wasm_v128_bitselect(vmin, vacc5x0123, wasm_f32x4_lt(vacc5x0123, vmin)); in xnn_f32_gemm_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() 128 vacc0x4567 = wasm_v128_bitselect(vmin, vacc0x4567, wasm_f32x4_lt(vacc0x4567, vmin)); in xnn_f32_gemm_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() 129 vacc1x4567 = wasm_v128_bitselect(vmin, vacc1x4567, wasm_f32x4_lt(vacc1x4567, vmin)); in xnn_f32_gemm_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() 130 vacc2x4567 = wasm_v128_bitselect(vmin, vacc2x4567, wasm_f32x4_lt(vacc2x4567, vmin)); in xnn_f32_gemm_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() 131 vacc3x4567 = wasm_v128_bitselect(vmin, vacc3x4567, wasm_f32x4_lt(vacc3x4567, vmin)); in xnn_f32_gemm_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() [all …]
|
D | 5x8-minmax-wasmsimd-x86-loadsplat.c | 110 vacc0x0123 = wasm_v128_bitselect(vmin, vacc0x0123, wasm_f32x4_lt(vacc0x0123, vmin)); in xnn_f32_gemm_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() 111 vacc1x0123 = wasm_v128_bitselect(vmin, vacc1x0123, wasm_f32x4_lt(vacc1x0123, vmin)); in xnn_f32_gemm_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() 112 vacc2x0123 = wasm_v128_bitselect(vmin, vacc2x0123, wasm_f32x4_lt(vacc2x0123, vmin)); in xnn_f32_gemm_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() 113 vacc3x0123 = wasm_v128_bitselect(vmin, vacc3x0123, wasm_f32x4_lt(vacc3x0123, vmin)); in xnn_f32_gemm_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() 114 vacc4x0123 = wasm_v128_bitselect(vmin, vacc4x0123, wasm_f32x4_lt(vacc4x0123, vmin)); in xnn_f32_gemm_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() 115 vacc0x4567 = wasm_v128_bitselect(vmin, vacc0x4567, wasm_f32x4_lt(vacc0x4567, vmin)); in xnn_f32_gemm_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() 116 vacc1x4567 = wasm_v128_bitselect(vmin, vacc1x4567, wasm_f32x4_lt(vacc1x4567, vmin)); in xnn_f32_gemm_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() 117 vacc2x4567 = wasm_v128_bitselect(vmin, vacc2x4567, wasm_f32x4_lt(vacc2x4567, vmin)); in xnn_f32_gemm_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() 118 vacc3x4567 = wasm_v128_bitselect(vmin, vacc3x4567, wasm_f32x4_lt(vacc3x4567, vmin)); in xnn_f32_gemm_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() 119 vacc4x4567 = wasm_v128_bitselect(vmin, vacc4x4567, wasm_f32x4_lt(vacc4x4567, vmin)); in xnn_f32_gemm_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() [all …]
|
/external/XNNPACK/src/f32-gemm/gen-inc/ |
D | 6x8inc-minmax-wasmsimd-x86-loadsplat.c | 124 vacc0x0123 = wasm_v128_bitselect(vmin, vacc0x0123, wasm_f32x4_lt(vacc0x0123, vmin)); in xnn_f32_gemminc_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() 125 vacc1x0123 = wasm_v128_bitselect(vmin, vacc1x0123, wasm_f32x4_lt(vacc1x0123, vmin)); in xnn_f32_gemminc_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() 126 vacc2x0123 = wasm_v128_bitselect(vmin, vacc2x0123, wasm_f32x4_lt(vacc2x0123, vmin)); in xnn_f32_gemminc_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() 127 vacc3x0123 = wasm_v128_bitselect(vmin, vacc3x0123, wasm_f32x4_lt(vacc3x0123, vmin)); in xnn_f32_gemminc_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() 128 vacc4x0123 = wasm_v128_bitselect(vmin, vacc4x0123, wasm_f32x4_lt(vacc4x0123, vmin)); in xnn_f32_gemminc_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() 129 vacc5x0123 = wasm_v128_bitselect(vmin, vacc5x0123, wasm_f32x4_lt(vacc5x0123, vmin)); in xnn_f32_gemminc_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() 130 vacc0x4567 = wasm_v128_bitselect(vmin, vacc0x4567, wasm_f32x4_lt(vacc0x4567, vmin)); in xnn_f32_gemminc_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() 131 vacc1x4567 = wasm_v128_bitselect(vmin, vacc1x4567, wasm_f32x4_lt(vacc1x4567, vmin)); in xnn_f32_gemminc_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() 132 vacc2x4567 = wasm_v128_bitselect(vmin, vacc2x4567, wasm_f32x4_lt(vacc2x4567, vmin)); in xnn_f32_gemminc_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() 133 vacc3x4567 = wasm_v128_bitselect(vmin, vacc3x4567, wasm_f32x4_lt(vacc3x4567, vmin)); in xnn_f32_gemminc_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() [all …]
|
D | 5x8inc-minmax-wasmsimd-x86-loadsplat.c | 112 vacc0x0123 = wasm_v128_bitselect(vmin, vacc0x0123, wasm_f32x4_lt(vacc0x0123, vmin)); in xnn_f32_gemminc_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() 113 vacc1x0123 = wasm_v128_bitselect(vmin, vacc1x0123, wasm_f32x4_lt(vacc1x0123, vmin)); in xnn_f32_gemminc_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() 114 vacc2x0123 = wasm_v128_bitselect(vmin, vacc2x0123, wasm_f32x4_lt(vacc2x0123, vmin)); in xnn_f32_gemminc_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() 115 vacc3x0123 = wasm_v128_bitselect(vmin, vacc3x0123, wasm_f32x4_lt(vacc3x0123, vmin)); in xnn_f32_gemminc_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() 116 vacc4x0123 = wasm_v128_bitselect(vmin, vacc4x0123, wasm_f32x4_lt(vacc4x0123, vmin)); in xnn_f32_gemminc_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() 117 vacc0x4567 = wasm_v128_bitselect(vmin, vacc0x4567, wasm_f32x4_lt(vacc0x4567, vmin)); in xnn_f32_gemminc_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() 118 vacc1x4567 = wasm_v128_bitselect(vmin, vacc1x4567, wasm_f32x4_lt(vacc1x4567, vmin)); in xnn_f32_gemminc_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() 119 vacc2x4567 = wasm_v128_bitselect(vmin, vacc2x4567, wasm_f32x4_lt(vacc2x4567, vmin)); in xnn_f32_gemminc_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() 120 vacc3x4567 = wasm_v128_bitselect(vmin, vacc3x4567, wasm_f32x4_lt(vacc3x4567, vmin)); in xnn_f32_gemminc_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() 121 vacc4x4567 = wasm_v128_bitselect(vmin, vacc4x4567, wasm_f32x4_lt(vacc4x4567, vmin)); in xnn_f32_gemminc_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() [all …]
|
/external/XNNPACK/src/f32-igemm/gen/ |
D | 6x8-minmax-wasmsimd-x86-loadsplat.c | 151 vacc0x0123 = wasm_v128_bitselect(vmin, vacc0x0123, wasm_f32x4_lt(vacc0x0123, vmin)); in xnn_f32_igemm_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() 152 vacc1x0123 = wasm_v128_bitselect(vmin, vacc1x0123, wasm_f32x4_lt(vacc1x0123, vmin)); in xnn_f32_igemm_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() 153 vacc2x0123 = wasm_v128_bitselect(vmin, vacc2x0123, wasm_f32x4_lt(vacc2x0123, vmin)); in xnn_f32_igemm_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() 154 vacc3x0123 = wasm_v128_bitselect(vmin, vacc3x0123, wasm_f32x4_lt(vacc3x0123, vmin)); in xnn_f32_igemm_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() 155 vacc4x0123 = wasm_v128_bitselect(vmin, vacc4x0123, wasm_f32x4_lt(vacc4x0123, vmin)); in xnn_f32_igemm_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() 156 vacc5x0123 = wasm_v128_bitselect(vmin, vacc5x0123, wasm_f32x4_lt(vacc5x0123, vmin)); in xnn_f32_igemm_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() 157 vacc0x4567 = wasm_v128_bitselect(vmin, vacc0x4567, wasm_f32x4_lt(vacc0x4567, vmin)); in xnn_f32_igemm_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() 158 vacc1x4567 = wasm_v128_bitselect(vmin, vacc1x4567, wasm_f32x4_lt(vacc1x4567, vmin)); in xnn_f32_igemm_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() 159 vacc2x4567 = wasm_v128_bitselect(vmin, vacc2x4567, wasm_f32x4_lt(vacc2x4567, vmin)); in xnn_f32_igemm_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() 160 vacc3x4567 = wasm_v128_bitselect(vmin, vacc3x4567, wasm_f32x4_lt(vacc3x4567, vmin)); in xnn_f32_igemm_minmax_ukernel_6x8__wasmsimd_x86_loadsplat() [all …]
|
D | 5x8-minmax-wasmsimd-x86-loadsplat.c | 136 vacc0x0123 = wasm_v128_bitselect(vmin, vacc0x0123, wasm_f32x4_lt(vacc0x0123, vmin)); in xnn_f32_igemm_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() 137 vacc1x0123 = wasm_v128_bitselect(vmin, vacc1x0123, wasm_f32x4_lt(vacc1x0123, vmin)); in xnn_f32_igemm_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() 138 vacc2x0123 = wasm_v128_bitselect(vmin, vacc2x0123, wasm_f32x4_lt(vacc2x0123, vmin)); in xnn_f32_igemm_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() 139 vacc3x0123 = wasm_v128_bitselect(vmin, vacc3x0123, wasm_f32x4_lt(vacc3x0123, vmin)); in xnn_f32_igemm_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() 140 vacc4x0123 = wasm_v128_bitselect(vmin, vacc4x0123, wasm_f32x4_lt(vacc4x0123, vmin)); in xnn_f32_igemm_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() 141 vacc0x4567 = wasm_v128_bitselect(vmin, vacc0x4567, wasm_f32x4_lt(vacc0x4567, vmin)); in xnn_f32_igemm_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() 142 vacc1x4567 = wasm_v128_bitselect(vmin, vacc1x4567, wasm_f32x4_lt(vacc1x4567, vmin)); in xnn_f32_igemm_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() 143 vacc2x4567 = wasm_v128_bitselect(vmin, vacc2x4567, wasm_f32x4_lt(vacc2x4567, vmin)); in xnn_f32_igemm_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() 144 vacc3x4567 = wasm_v128_bitselect(vmin, vacc3x4567, wasm_f32x4_lt(vacc3x4567, vmin)); in xnn_f32_igemm_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() 145 vacc4x4567 = wasm_v128_bitselect(vmin, vacc4x4567, wasm_f32x4_lt(vacc4x4567, vmin)); in xnn_f32_igemm_minmax_ukernel_5x8__wasmsimd_x86_loadsplat() [all …]
|
/external/XNNPACK/src/f32-vmulcaddc/gen/ |
D | c8-minmax-wasmsimd-x86-2x.c | 68 vacc0x0123 = wasm_v128_bitselect(vmin, vacc0x0123, wasm_f32x4_lt(vacc0x0123, vmin)); in xnn_f32_vmulcaddc_minmax_ukernel_c8__wasmsimd_x86_2x() 69 vacc0x4567 = wasm_v128_bitselect(vmin, vacc0x4567, wasm_f32x4_lt(vacc0x4567, vmin)); in xnn_f32_vmulcaddc_minmax_ukernel_c8__wasmsimd_x86_2x() 70 vacc1x0123 = wasm_v128_bitselect(vmin, vacc1x0123, wasm_f32x4_lt(vacc1x0123, vmin)); in xnn_f32_vmulcaddc_minmax_ukernel_c8__wasmsimd_x86_2x() 71 vacc1x4567 = wasm_v128_bitselect(vmin, vacc1x4567, wasm_f32x4_lt(vacc1x4567, vmin)); in xnn_f32_vmulcaddc_minmax_ukernel_c8__wasmsimd_x86_2x() 73 vacc0x0123 = wasm_v128_bitselect(vacc0x0123, vmax, wasm_f32x4_le(vacc0x0123, vmax)); in xnn_f32_vmulcaddc_minmax_ukernel_c8__wasmsimd_x86_2x() 74 vacc0x4567 = wasm_v128_bitselect(vacc0x4567, vmax, wasm_f32x4_le(vacc0x4567, vmax)); in xnn_f32_vmulcaddc_minmax_ukernel_c8__wasmsimd_x86_2x() 75 vacc1x0123 = wasm_v128_bitselect(vacc1x0123, vmax, wasm_f32x4_le(vacc1x0123, vmax)); in xnn_f32_vmulcaddc_minmax_ukernel_c8__wasmsimd_x86_2x() 76 vacc1x4567 = wasm_v128_bitselect(vacc1x4567, vmax, wasm_f32x4_le(vacc1x4567, vmax)); in xnn_f32_vmulcaddc_minmax_ukernel_c8__wasmsimd_x86_2x() 100 vacc0 = wasm_v128_bitselect(vmin, vacc0, wasm_f32x4_lt(vacc0, vmin)); in xnn_f32_vmulcaddc_minmax_ukernel_c8__wasmsimd_x86_2x() 101 vacc1 = wasm_v128_bitselect(vmin, vacc1, wasm_f32x4_lt(vacc1, vmin)); in xnn_f32_vmulcaddc_minmax_ukernel_c8__wasmsimd_x86_2x() [all …]
|
/external/XNNPACK/src/f32-vbinary/gen/ |
D | vmulc-minmax-wasmsimd-x86-x16.c | 53 vy0123 = wasm_v128_bitselect(vy_min, vy0123, vltmask0123); in xnn_f32_vmulc_minmax_ukernel__wasmsimd_x86_x16() 55 vy4567 = wasm_v128_bitselect(vy_min, vy4567, vltmask4567); in xnn_f32_vmulc_minmax_ukernel__wasmsimd_x86_x16() 57 vy89AB = wasm_v128_bitselect(vy_min, vy89AB, vltmask89AB); in xnn_f32_vmulc_minmax_ukernel__wasmsimd_x86_x16() 59 vyCDEF = wasm_v128_bitselect(vy_min, vyCDEF, vltmaskCDEF); in xnn_f32_vmulc_minmax_ukernel__wasmsimd_x86_x16() 61 vy0123 = wasm_v128_bitselect(vy0123, vy_max, vngtmask0123); in xnn_f32_vmulc_minmax_ukernel__wasmsimd_x86_x16() 62 vy4567 = wasm_v128_bitselect(vy4567, vy_max, vngtmask4567); in xnn_f32_vmulc_minmax_ukernel__wasmsimd_x86_x16() 63 vy89AB = wasm_v128_bitselect(vy89AB, vy_max, vngtmask89AB); in xnn_f32_vmulc_minmax_ukernel__wasmsimd_x86_x16() 64 vyCDEF = wasm_v128_bitselect(vyCDEF, vy_max, vngtmaskCDEF); in xnn_f32_vmulc_minmax_ukernel__wasmsimd_x86_x16() 80 vy = wasm_v128_bitselect(vy_min, vy, vltmask); in xnn_f32_vmulc_minmax_ukernel__wasmsimd_x86_x16() 81 vy = wasm_v128_bitselect(vy, vy_max, vngtmask); in xnn_f32_vmulc_minmax_ukernel__wasmsimd_x86_x16() [all …]
|
D | vrsubc-minmax-wasmsimd-x86-x16.c | 53 vy0123 = wasm_v128_bitselect(vy_min, vy0123, vltmask0123); in xnn_f32_vrsubc_minmax_ukernel__wasmsimd_x86_x16() 55 vy4567 = wasm_v128_bitselect(vy_min, vy4567, vltmask4567); in xnn_f32_vrsubc_minmax_ukernel__wasmsimd_x86_x16() 57 vy89AB = wasm_v128_bitselect(vy_min, vy89AB, vltmask89AB); in xnn_f32_vrsubc_minmax_ukernel__wasmsimd_x86_x16() 59 vyCDEF = wasm_v128_bitselect(vy_min, vyCDEF, vltmaskCDEF); in xnn_f32_vrsubc_minmax_ukernel__wasmsimd_x86_x16() 61 vy0123 = wasm_v128_bitselect(vy0123, vy_max, vngtmask0123); in xnn_f32_vrsubc_minmax_ukernel__wasmsimd_x86_x16() 62 vy4567 = wasm_v128_bitselect(vy4567, vy_max, vngtmask4567); in xnn_f32_vrsubc_minmax_ukernel__wasmsimd_x86_x16() 63 vy89AB = wasm_v128_bitselect(vy89AB, vy_max, vngtmask89AB); in xnn_f32_vrsubc_minmax_ukernel__wasmsimd_x86_x16() 64 vyCDEF = wasm_v128_bitselect(vyCDEF, vy_max, vngtmaskCDEF); in xnn_f32_vrsubc_minmax_ukernel__wasmsimd_x86_x16() 80 vy = wasm_v128_bitselect(vy_min, vy, vltmask); in xnn_f32_vrsubc_minmax_ukernel__wasmsimd_x86_x16() 81 vy = wasm_v128_bitselect(vy, vy_max, vngtmask); in xnn_f32_vrsubc_minmax_ukernel__wasmsimd_x86_x16() [all …]
|
D | vsubc-minmax-wasmsimd-x86-x16.c | 53 vy0123 = wasm_v128_bitselect(vy_min, vy0123, vltmask0123); in xnn_f32_vsubc_minmax_ukernel__wasmsimd_x86_x16() 55 vy4567 = wasm_v128_bitselect(vy_min, vy4567, vltmask4567); in xnn_f32_vsubc_minmax_ukernel__wasmsimd_x86_x16() 57 vy89AB = wasm_v128_bitselect(vy_min, vy89AB, vltmask89AB); in xnn_f32_vsubc_minmax_ukernel__wasmsimd_x86_x16() 59 vyCDEF = wasm_v128_bitselect(vy_min, vyCDEF, vltmaskCDEF); in xnn_f32_vsubc_minmax_ukernel__wasmsimd_x86_x16() 61 vy0123 = wasm_v128_bitselect(vy0123, vy_max, vngtmask0123); in xnn_f32_vsubc_minmax_ukernel__wasmsimd_x86_x16() 62 vy4567 = wasm_v128_bitselect(vy4567, vy_max, vngtmask4567); in xnn_f32_vsubc_minmax_ukernel__wasmsimd_x86_x16() 63 vy89AB = wasm_v128_bitselect(vy89AB, vy_max, vngtmask89AB); in xnn_f32_vsubc_minmax_ukernel__wasmsimd_x86_x16() 64 vyCDEF = wasm_v128_bitselect(vyCDEF, vy_max, vngtmaskCDEF); in xnn_f32_vsubc_minmax_ukernel__wasmsimd_x86_x16() 80 vy = wasm_v128_bitselect(vy_min, vy, vltmask); in xnn_f32_vsubc_minmax_ukernel__wasmsimd_x86_x16() 81 vy = wasm_v128_bitselect(vy, vy_max, vngtmask); in xnn_f32_vsubc_minmax_ukernel__wasmsimd_x86_x16() [all …]
|
D | vrdivc-minmax-wasmsimd-x86-x16.c | 53 vy0123 = wasm_v128_bitselect(vy_min, vy0123, vltmask0123); in xnn_f32_vrdivc_minmax_ukernel__wasmsimd_x86_x16() 55 vy4567 = wasm_v128_bitselect(vy_min, vy4567, vltmask4567); in xnn_f32_vrdivc_minmax_ukernel__wasmsimd_x86_x16() 57 vy89AB = wasm_v128_bitselect(vy_min, vy89AB, vltmask89AB); in xnn_f32_vrdivc_minmax_ukernel__wasmsimd_x86_x16() 59 vyCDEF = wasm_v128_bitselect(vy_min, vyCDEF, vltmaskCDEF); in xnn_f32_vrdivc_minmax_ukernel__wasmsimd_x86_x16() 61 vy0123 = wasm_v128_bitselect(vy0123, vy_max, vngtmask0123); in xnn_f32_vrdivc_minmax_ukernel__wasmsimd_x86_x16() 62 vy4567 = wasm_v128_bitselect(vy4567, vy_max, vngtmask4567); in xnn_f32_vrdivc_minmax_ukernel__wasmsimd_x86_x16() 63 vy89AB = wasm_v128_bitselect(vy89AB, vy_max, vngtmask89AB); in xnn_f32_vrdivc_minmax_ukernel__wasmsimd_x86_x16() 64 vyCDEF = wasm_v128_bitselect(vyCDEF, vy_max, vngtmaskCDEF); in xnn_f32_vrdivc_minmax_ukernel__wasmsimd_x86_x16() 80 vy = wasm_v128_bitselect(vy_min, vy, vltmask); in xnn_f32_vrdivc_minmax_ukernel__wasmsimd_x86_x16() 81 vy = wasm_v128_bitselect(vy, vy_max, vngtmask); in xnn_f32_vrdivc_minmax_ukernel__wasmsimd_x86_x16() [all …]
|
D | vdivc-minmax-wasmsimd-x86-x16.c | 53 vy0123 = wasm_v128_bitselect(vy_min, vy0123, vltmask0123); in xnn_f32_vdivc_minmax_ukernel__wasmsimd_x86_x16() 55 vy4567 = wasm_v128_bitselect(vy_min, vy4567, vltmask4567); in xnn_f32_vdivc_minmax_ukernel__wasmsimd_x86_x16() 57 vy89AB = wasm_v128_bitselect(vy_min, vy89AB, vltmask89AB); in xnn_f32_vdivc_minmax_ukernel__wasmsimd_x86_x16() 59 vyCDEF = wasm_v128_bitselect(vy_min, vyCDEF, vltmaskCDEF); in xnn_f32_vdivc_minmax_ukernel__wasmsimd_x86_x16() 61 vy0123 = wasm_v128_bitselect(vy0123, vy_max, vngtmask0123); in xnn_f32_vdivc_minmax_ukernel__wasmsimd_x86_x16() 62 vy4567 = wasm_v128_bitselect(vy4567, vy_max, vngtmask4567); in xnn_f32_vdivc_minmax_ukernel__wasmsimd_x86_x16() 63 vy89AB = wasm_v128_bitselect(vy89AB, vy_max, vngtmask89AB); in xnn_f32_vdivc_minmax_ukernel__wasmsimd_x86_x16() 64 vyCDEF = wasm_v128_bitselect(vyCDEF, vy_max, vngtmaskCDEF); in xnn_f32_vdivc_minmax_ukernel__wasmsimd_x86_x16() 80 vy = wasm_v128_bitselect(vy_min, vy, vltmask); in xnn_f32_vdivc_minmax_ukernel__wasmsimd_x86_x16() 81 vy = wasm_v128_bitselect(vy, vy_max, vngtmask); in xnn_f32_vdivc_minmax_ukernel__wasmsimd_x86_x16() [all …]
|
D | vaddc-minmax-wasmsimd-x86-x16.c | 53 vy0123 = wasm_v128_bitselect(vy_min, vy0123, vltmask0123); in xnn_f32_vaddc_minmax_ukernel__wasmsimd_x86_x16() 55 vy4567 = wasm_v128_bitselect(vy_min, vy4567, vltmask4567); in xnn_f32_vaddc_minmax_ukernel__wasmsimd_x86_x16() 57 vy89AB = wasm_v128_bitselect(vy_min, vy89AB, vltmask89AB); in xnn_f32_vaddc_minmax_ukernel__wasmsimd_x86_x16() 59 vyCDEF = wasm_v128_bitselect(vy_min, vyCDEF, vltmaskCDEF); in xnn_f32_vaddc_minmax_ukernel__wasmsimd_x86_x16() 61 vy0123 = wasm_v128_bitselect(vy0123, vy_max, vngtmask0123); in xnn_f32_vaddc_minmax_ukernel__wasmsimd_x86_x16() 62 vy4567 = wasm_v128_bitselect(vy4567, vy_max, vngtmask4567); in xnn_f32_vaddc_minmax_ukernel__wasmsimd_x86_x16() 63 vy89AB = wasm_v128_bitselect(vy89AB, vy_max, vngtmask89AB); in xnn_f32_vaddc_minmax_ukernel__wasmsimd_x86_x16() 64 vyCDEF = wasm_v128_bitselect(vyCDEF, vy_max, vngtmaskCDEF); in xnn_f32_vaddc_minmax_ukernel__wasmsimd_x86_x16() 80 vy = wasm_v128_bitselect(vy_min, vy, vltmask); in xnn_f32_vaddc_minmax_ukernel__wasmsimd_x86_x16() 81 vy = wasm_v128_bitselect(vy, vy_max, vngtmask); in xnn_f32_vaddc_minmax_ukernel__wasmsimd_x86_x16() [all …]
|
D | vsub-minmax-wasmsimd-x86-x16.c | 59 vy0123 = wasm_v128_bitselect(vy_min, vy0123, vltmask0123); in xnn_f32_vsub_minmax_ukernel__wasmsimd_x86_x16() 61 vy4567 = wasm_v128_bitselect(vy_min, vy4567, vltmask4567); in xnn_f32_vsub_minmax_ukernel__wasmsimd_x86_x16() 63 vy89AB = wasm_v128_bitselect(vy_min, vy89AB, vltmask89AB); in xnn_f32_vsub_minmax_ukernel__wasmsimd_x86_x16() 65 vyCDEF = wasm_v128_bitselect(vy_min, vyCDEF, vltmaskCDEF); in xnn_f32_vsub_minmax_ukernel__wasmsimd_x86_x16() 67 vy0123 = wasm_v128_bitselect(vy0123, vy_max, vngtmask0123); in xnn_f32_vsub_minmax_ukernel__wasmsimd_x86_x16() 68 vy4567 = wasm_v128_bitselect(vy4567, vy_max, vngtmask4567); in xnn_f32_vsub_minmax_ukernel__wasmsimd_x86_x16() 69 vy89AB = wasm_v128_bitselect(vy89AB, vy_max, vngtmask89AB); in xnn_f32_vsub_minmax_ukernel__wasmsimd_x86_x16() 70 vyCDEF = wasm_v128_bitselect(vyCDEF, vy_max, vngtmaskCDEF); in xnn_f32_vsub_minmax_ukernel__wasmsimd_x86_x16() 89 vy = wasm_v128_bitselect(vy_min, vy, vltmask); in xnn_f32_vsub_minmax_ukernel__wasmsimd_x86_x16() 90 vy = wasm_v128_bitselect(vy, vy_max, vngtmask); in xnn_f32_vsub_minmax_ukernel__wasmsimd_x86_x16() [all …]
|
D | vmul-minmax-wasmsimd-x86-x16.c | 59 vy0123 = wasm_v128_bitselect(vy_min, vy0123, vltmask0123); in xnn_f32_vmul_minmax_ukernel__wasmsimd_x86_x16() 61 vy4567 = wasm_v128_bitselect(vy_min, vy4567, vltmask4567); in xnn_f32_vmul_minmax_ukernel__wasmsimd_x86_x16() 63 vy89AB = wasm_v128_bitselect(vy_min, vy89AB, vltmask89AB); in xnn_f32_vmul_minmax_ukernel__wasmsimd_x86_x16() 65 vyCDEF = wasm_v128_bitselect(vy_min, vyCDEF, vltmaskCDEF); in xnn_f32_vmul_minmax_ukernel__wasmsimd_x86_x16() 67 vy0123 = wasm_v128_bitselect(vy0123, vy_max, vngtmask0123); in xnn_f32_vmul_minmax_ukernel__wasmsimd_x86_x16() 68 vy4567 = wasm_v128_bitselect(vy4567, vy_max, vngtmask4567); in xnn_f32_vmul_minmax_ukernel__wasmsimd_x86_x16() 69 vy89AB = wasm_v128_bitselect(vy89AB, vy_max, vngtmask89AB); in xnn_f32_vmul_minmax_ukernel__wasmsimd_x86_x16() 70 vyCDEF = wasm_v128_bitselect(vyCDEF, vy_max, vngtmaskCDEF); in xnn_f32_vmul_minmax_ukernel__wasmsimd_x86_x16() 89 vy = wasm_v128_bitselect(vy_min, vy, vltmask); in xnn_f32_vmul_minmax_ukernel__wasmsimd_x86_x16() 90 vy = wasm_v128_bitselect(vy, vy_max, vngtmask); in xnn_f32_vmul_minmax_ukernel__wasmsimd_x86_x16() [all …]
|
/external/XNNPACK/src/f32-ppmm/gen/ |
D | 4x8-minmax-wasmsimd-x86-splat.c | 86 vacc0x0123 = wasm_v128_bitselect(vmin, vacc0x0123, wasm_f32x4_lt(vacc0x0123, vmin)); in xnn_f32_ppmm_minmax_ukernel_4x8__wasmsimd_x86_splat() 87 vacc1x0123 = wasm_v128_bitselect(vmin, vacc1x0123, wasm_f32x4_lt(vacc1x0123, vmin)); in xnn_f32_ppmm_minmax_ukernel_4x8__wasmsimd_x86_splat() 88 vacc2x0123 = wasm_v128_bitselect(vmin, vacc2x0123, wasm_f32x4_lt(vacc2x0123, vmin)); in xnn_f32_ppmm_minmax_ukernel_4x8__wasmsimd_x86_splat() 89 vacc3x0123 = wasm_v128_bitselect(vmin, vacc3x0123, wasm_f32x4_lt(vacc3x0123, vmin)); in xnn_f32_ppmm_minmax_ukernel_4x8__wasmsimd_x86_splat() 90 vacc0x4567 = wasm_v128_bitselect(vmin, vacc0x4567, wasm_f32x4_lt(vacc0x4567, vmin)); in xnn_f32_ppmm_minmax_ukernel_4x8__wasmsimd_x86_splat() 91 vacc1x4567 = wasm_v128_bitselect(vmin, vacc1x4567, wasm_f32x4_lt(vacc1x4567, vmin)); in xnn_f32_ppmm_minmax_ukernel_4x8__wasmsimd_x86_splat() 92 vacc2x4567 = wasm_v128_bitselect(vmin, vacc2x4567, wasm_f32x4_lt(vacc2x4567, vmin)); in xnn_f32_ppmm_minmax_ukernel_4x8__wasmsimd_x86_splat() 93 vacc3x4567 = wasm_v128_bitselect(vmin, vacc3x4567, wasm_f32x4_lt(vacc3x4567, vmin)); in xnn_f32_ppmm_minmax_ukernel_4x8__wasmsimd_x86_splat() 96 vacc0x0123 = wasm_v128_bitselect(vacc0x0123, vmax, wasm_f32x4_le(vacc0x0123, vmax)); in xnn_f32_ppmm_minmax_ukernel_4x8__wasmsimd_x86_splat() 97 vacc1x0123 = wasm_v128_bitselect(vacc1x0123, vmax, wasm_f32x4_le(vacc1x0123, vmax)); in xnn_f32_ppmm_minmax_ukernel_4x8__wasmsimd_x86_splat() [all …]
|
/external/XNNPACK/src/f32-prelu/gen/ |
D | wasmsimd-bitselect-4x16.c | 120 vacc0x0123 = wasm_v128_bitselect(vacc0x0123, vi0x0123, vmask0x0123); in xnn_f32_prelu_ukernel__wasmsimd_bitselect_4x16() 121 vacc0x4567 = wasm_v128_bitselect(vacc0x4567, vi0x4567, vmask0x4567); in xnn_f32_prelu_ukernel__wasmsimd_bitselect_4x16() 122 vacc0x89AB = wasm_v128_bitselect(vacc0x89AB, vi0x89AB, vmask0x89AB); in xnn_f32_prelu_ukernel__wasmsimd_bitselect_4x16() 123 vacc0xCDEF = wasm_v128_bitselect(vacc0xCDEF, vi0xCDEF, vmask0xCDEF); in xnn_f32_prelu_ukernel__wasmsimd_bitselect_4x16() 124 vacc1x0123 = wasm_v128_bitselect(vacc1x0123, vi1x0123, vmask1x0123); in xnn_f32_prelu_ukernel__wasmsimd_bitselect_4x16() 125 vacc1x4567 = wasm_v128_bitselect(vacc1x4567, vi1x4567, vmask1x4567); in xnn_f32_prelu_ukernel__wasmsimd_bitselect_4x16() 126 vacc1x89AB = wasm_v128_bitselect(vacc1x89AB, vi1x89AB, vmask1x89AB); in xnn_f32_prelu_ukernel__wasmsimd_bitselect_4x16() 127 vacc1xCDEF = wasm_v128_bitselect(vacc1xCDEF, vi1xCDEF, vmask1xCDEF); in xnn_f32_prelu_ukernel__wasmsimd_bitselect_4x16() 128 vacc2x0123 = wasm_v128_bitselect(vacc2x0123, vi2x0123, vmask2x0123); in xnn_f32_prelu_ukernel__wasmsimd_bitselect_4x16() 129 vacc2x4567 = wasm_v128_bitselect(vacc2x4567, vi2x4567, vmask2x4567); in xnn_f32_prelu_ukernel__wasmsimd_bitselect_4x16() [all …]
|