/external/XNNPACK/src/f32-velu/gen/ |
D | velu-wasmsimd-arm-rr2-p6-x4.c | 69 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_p6_x4() local 71 const v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_p6_x4() 99 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_p6_x4() local 101 v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_p6_x4()
|
D | velu-wasmsimd-x86-rr2-p6-x4.c | 72 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_p6_x4() local 74 const v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_p6_x4() 105 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_p6_x4() local 107 v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_p6_x4()
|
D | velu-wasmsimd-arm-rr2-lut16-p3-x4.c | 77 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_lut16_p3_x4() local 79 const v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_lut16_p3_x4() 115 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_lut16_p3_x4() local 117 v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_lut16_p3_x4()
|
D | velu-wasmsimd-x86-rr2-lut16-p3-x4.c | 80 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_lut16_p3_x4() local 82 const v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_lut16_p3_x4() 121 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_lut16_p3_x4() local 123 v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_lut16_p3_x4()
|
D | velu-wasmsimd-arm-rr2-p6-x8.c | 130 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_p6_x8() local 132 const v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_p6_x8() 160 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_p6_x8() local 162 v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_p6_x8()
|
D | velu-wasmsimd-x86-rr2-p6-x8.c | 139 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_p6_x8() local 141 const v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_p6_x8() 172 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_p6_x8() local 174 v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_p6_x8()
|
D | velu-wasmsimd-arm-rr2-lut16-p3-x8.c | 148 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_lut16_p3_x8() local 150 const v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_lut16_p3_x8() 186 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_lut16_p3_x8() local 188 v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_lut16_p3_x8()
|
D | velu-wasmsimd-arm-rr2-p6-x12.c | 150 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_p6_x12() local 152 const v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_p6_x12() 180 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_p6_x12() local 182 v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_p6_x12()
|
D | velu-wasmsimd-arm-rr2-p6-x16.c | 170 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_p6_x16() local 172 const v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_p6_x16() 200 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_p6_x16() local 202 v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_p6_x16()
|
D | velu-wasmsimd-x86-rr2-lut16-p3-x8.c | 157 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_lut16_p3_x8() local 159 const v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_lut16_p3_x8() 198 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_lut16_p3_x8() local 200 v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_lut16_p3_x8()
|
D | velu-wasmsimd-x86-rr2-p6-x12.c | 162 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_p6_x12() local 164 const v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_p6_x12() 195 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_p6_x12() local 197 v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_p6_x12()
|
D | velu-wasmsimd-arm-rr2-lut16-p3-x12.c | 174 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_lut16_p3_x12() local 176 const v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_lut16_p3_x12() 212 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_lut16_p3_x12() local 214 v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_lut16_p3_x12()
|
D | velu-wasmsimd-x86-rr2-lut16-p3-x12.c | 186 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_lut16_p3_x12() local 188 const v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_lut16_p3_x12() 227 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_lut16_p3_x12() local 229 v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_lut16_p3_x12()
|
D | velu-wasmsimd-arm-rr2-p6-x20.c | 190 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_p6_x20() local 192 const v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_p6_x20() 220 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_p6_x20() local 222 v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_p6_x20()
|
D | velu-wasmsimd-x86-rr2-p6-x16.c | 185 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_p6_x16() local 187 const v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_p6_x16() 218 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_p6_x16() local 220 v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_p6_x16()
|
D | velu-wasmsimd-arm-rr2-lut16-p3-x16.c | 200 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_lut16_p3_x16() local 202 const v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_lut16_p3_x16() 238 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_lut16_p3_x16() local 240 v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_lut16_p3_x16()
|
D | velu-wasmsimd-x86-rr2-p6-x20.c | 208 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_p6_x20() local 210 const v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_p6_x20() 241 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_p6_x20() local 243 v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_p6_x20()
|
D | velu-wasmsimd-x86-rr2-lut16-p3-x16.c | 215 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_lut16_p3_x16() local 217 const v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_lut16_p3_x16() 256 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_lut16_p3_x16() local 258 v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_lut16_p3_x16()
|
D | velu-wasmsimd-arm-rr2-p6-x24.c | 210 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_p6_x24() local 212 const v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_p6_x24() 240 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_p6_x24() local 242 v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_p6_x24()
|
D | velu-wasmsimd-x86-rr2-p6-x24.c | 231 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_p6_x24() local 233 const v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_p6_x24() 264 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_p6_x24() local 266 v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_p6_x24()
|
D | velu-wasmsimd-arm-rr2-lut16-p3-x20.c | 226 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_lut16_p3_x20() local 228 const v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_lut16_p3_x20() 264 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_lut16_p3_x20() local 266 v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_lut16_p3_x20()
|
D | velu-wasmsimd-arm-rr2-lut16-p3-x24.c | 252 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_lut16_p3_x24() local 254 const v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_lut16_p3_x24() 290 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_lut16_p3_x24() local 292 v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_arm_rr2_lut16_p3_x24()
|
D | velu-wasmsimd-x86-rr2-lut16-p3-x20.c | 244 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_lut16_p3_x20() local 246 const v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_lut16_p3_x20() 285 const v128_t vsignm = wasm_i32x4_shr(vx, 31); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_lut16_p3_x20() local 287 v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); in xnn_f32_velu_ukernel__wasmsimd_x86_rr2_lut16_p3_x20()
|
/external/XNNPACK/src/f32-velu/ |
D | wasmsimd-rr2-p6.c.in | 104 const v128_t vsignm${ABC[N:N+4]} = wasm_i32x4_shr(vx${ABC[N:N+4]}, 31); 108 …const v128_t vy${ABC[N:N+4]} = wasm_v128_bitselect(ve${ABC[N:N+4]}, vx${ABC[N:N+4]}, vsignm${ABC[N… 147 const v128_t vsignm = wasm_i32x4_shr(vx, 31); 149 const v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); 185 const v128_t vsignm = wasm_i32x4_shr(vx, 31); 187 v128_t vy = wasm_v128_bitselect(ve, vx, vsignm);
|
D | wasmsimd-rr2-lut16-p3.c.in | 106 const v128_t vsignm${ABC[N:N+4]} = wasm_i32x4_shr(vx${ABC[N:N+4]}, 31); 110 …const v128_t vy${ABC[N:N+4]} = wasm_v128_bitselect(ve${ABC[N:N+4]}, vx${ABC[N:N+4]}, vsignm${ABC[N… 157 const v128_t vsignm = wasm_i32x4_shr(vx, 31); 159 const v128_t vy = wasm_v128_bitselect(ve, vx, vsignm); 203 const v128_t vsignm = wasm_i32x4_shr(vx, 31); 205 v128_t vy = wasm_v128_bitselect(ve, vx, vsignm);
|