/external/XNNPACK/src/qs8-gemm/gen/ |
D | 8x8c4-minmax-neondot.c | 356 vst1q_lane_s8(c0, vout0x01234567_1x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_8x8c4__neondot() 357 vst1q_lane_s8(c1, vout0x01234567_1x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_8x8c4__neondot() 358 vst1q_lane_s8(c2, vout2x01234567_3x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_8x8c4__neondot() 359 vst1q_lane_s8(c3, vout2x01234567_3x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_8x8c4__neondot() 360 vst1q_lane_s8(c4, vout4x01234567_5x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_8x8c4__neondot() 361 vst1q_lane_s8(c5, vout4x01234567_5x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_8x8c4__neondot() 362 vst1q_lane_s8(c6, vout6x01234567_7x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_8x8c4__neondot() 363 vst1q_lane_s8(c7, vout6x01234567_7x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_8x8c4__neondot()
|
D | 6x8c4-minmax-neondot.c | 292 vst1q_lane_s8(c0, vout0x01234567_1x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_6x8c4__neondot() 293 vst1q_lane_s8(c1, vout0x01234567_1x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_6x8c4__neondot() 294 vst1q_lane_s8(c2, vout2x01234567_3x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_6x8c4__neondot() 295 vst1q_lane_s8(c3, vout2x01234567_3x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_6x8c4__neondot() 296 vst1q_lane_s8(c4, vout4x01234567_5x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_6x8c4__neondot() 297 vst1q_lane_s8(c5, vout4x01234567_5x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_6x8c4__neondot()
|
D | 4x8c4-minmax-neondot.c | 228 vst1q_lane_s8(c0, vout0x01234567_1x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_4x8c4__neondot() 229 vst1q_lane_s8(c1, vout0x01234567_1x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_4x8c4__neondot() 230 vst1q_lane_s8(c2, vout2x01234567_3x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_4x8c4__neondot() 231 vst1q_lane_s8(c3, vout2x01234567_3x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_4x8c4__neondot()
|
D | 8x16c4-minmax-neondot.c | 524 vst1q_lane_s8(c0, vout0x01234567_1x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_8x16c4__neondot() 525 vst1q_lane_s8(c1, vout0x01234567_1x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_8x16c4__neondot() 526 vst1q_lane_s8(c2, vout2x01234567_3x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_8x16c4__neondot() 527 vst1q_lane_s8(c3, vout2x01234567_3x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_8x16c4__neondot() 528 vst1q_lane_s8(c4, vout4x01234567_5x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_8x16c4__neondot() 529 vst1q_lane_s8(c5, vout4x01234567_5x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_8x16c4__neondot() 530 vst1q_lane_s8(c6, vout6x01234567_7x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_8x16c4__neondot() 531 vst1q_lane_s8(c7, vout6x01234567_7x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_8x16c4__neondot()
|
D | 6x16c4-minmax-neondot.c | 420 vst1q_lane_s8(c0, vout0x01234567_1x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_6x16c4__neondot() 421 vst1q_lane_s8(c1, vout0x01234567_1x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_6x16c4__neondot() 422 vst1q_lane_s8(c2, vout2x01234567_3x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_6x16c4__neondot() 423 vst1q_lane_s8(c3, vout2x01234567_3x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_6x16c4__neondot() 424 vst1q_lane_s8(c4, vout4x01234567_5x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_6x16c4__neondot() 425 vst1q_lane_s8(c5, vout4x01234567_5x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_6x16c4__neondot()
|
D | 4x16c4-minmax-neondot.c | 316 vst1q_lane_s8(c0, vout0x01234567_1x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_4x16c4__neondot() 317 vst1q_lane_s8(c1, vout0x01234567_1x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_4x16c4__neondot() 318 vst1q_lane_s8(c2, vout2x01234567_3x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_4x16c4__neondot() 319 vst1q_lane_s8(c3, vout2x01234567_3x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_4x16c4__neondot()
|
D | 4x8c2-minmax-neon-mull-padal-dup.c | 319 vst1q_lane_s8(c0, vout0x01234567_1x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_4x8c2__neon_mull_padal_dup() 320 vst1q_lane_s8(c1, vout0x01234567_1x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_4x8c2__neon_mull_padal_dup() 321 vst1q_lane_s8(c2, vout2x01234567_3x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_4x8c2__neon_mull_padal_dup() 322 vst1q_lane_s8(c3, vout2x01234567_3x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_4x8c2__neon_mull_padal_dup()
|
D | 4x8c8-minmax-neon-mull-padal.c | 355 vst1q_lane_s8(c0, vout0x01234567_1x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_4x8c8__neon_mull_padal() 356 vst1q_lane_s8(c1, vout0x01234567_1x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_4x8c8__neon_mull_padal() 357 vst1q_lane_s8(c2, vout2x01234567_3x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_4x8c8__neon_mull_padal() 358 vst1q_lane_s8(c3, vout2x01234567_3x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_4x8c8__neon_mull_padal()
|
D | 4x8-minmax-neon-mlal-lane.c | 372 vst1q_lane_s8(c0, vout0x01234567_1x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_4x8__neon_mlal_lane() 373 vst1q_lane_s8(c1, vout0x01234567_1x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_4x8__neon_mlal_lane() 374 vst1q_lane_s8(c2, vout2x01234567_3x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_4x8__neon_mlal_lane() 375 vst1q_lane_s8(c3, vout2x01234567_3x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_4x8__neon_mlal_lane()
|
D | 4x8-minmax-neon-mull-addw-dup.c | 407 vst1q_lane_s8(c0, vout0x01234567_1x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_4x8__neon_mull_addw_dup() 408 vst1q_lane_s8(c1, vout0x01234567_1x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_4x8__neon_mull_addw_dup() 409 vst1q_lane_s8(c2, vout2x01234567_3x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_4x8__neon_mull_addw_dup() 410 vst1q_lane_s8(c3, vout2x01234567_3x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_4x8__neon_mull_addw_dup()
|
D | 4x8c16-minmax-neon-mlal-padal.c | 387 vst1q_lane_s8(c0, vout0x01234567_1x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_4x8c16__neon_mlal_padal() 388 vst1q_lane_s8(c1, vout0x01234567_1x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_4x8c16__neon_mlal_padal() 389 vst1q_lane_s8(c2, vout2x01234567_3x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_4x8c16__neon_mlal_padal() 390 vst1q_lane_s8(c3, vout2x01234567_3x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_4x8c16__neon_mlal_padal()
|
D | 2x8c2-minmax-neon-mull-padal-dup.c | 211 vst1q_lane_s8(c0, vout0x01234567_1x01234567, 0); in xnn_qs8_gemm_minmax_ukernel_2x8c2__neon_mull_padal_dup() 212 vst1q_lane_s8(c1, vout0x01234567_1x01234567, 8); in xnn_qs8_gemm_minmax_ukernel_2x8c2__neon_mull_padal_dup()
|
/external/XNNPACK/src/qs8-igemm/gen/ |
D | 8x8c4-minmax-neondot.c | 370 vst1q_lane_s8(c7, vout6x01234567_7x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_8x8c4__neondot() 371 vst1q_lane_s8(c6, vout6x01234567_7x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_8x8c4__neondot() 372 vst1q_lane_s8(c5, vout4x01234567_5x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_8x8c4__neondot() 373 vst1q_lane_s8(c4, vout4x01234567_5x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_8x8c4__neondot() 374 vst1q_lane_s8(c3, vout2x01234567_3x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_8x8c4__neondot() 375 vst1q_lane_s8(c2, vout2x01234567_3x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_8x8c4__neondot() 376 vst1q_lane_s8(c1, vout0x01234567_1x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_8x8c4__neondot() 377 vst1q_lane_s8(c0, vout0x01234567_1x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_8x8c4__neondot()
|
D | 6x8c4-minmax-neondot.c | 304 vst1q_lane_s8(c5, vout4x01234567_5x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_6x8c4__neondot() 305 vst1q_lane_s8(c4, vout4x01234567_5x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_6x8c4__neondot() 306 vst1q_lane_s8(c3, vout2x01234567_3x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_6x8c4__neondot() 307 vst1q_lane_s8(c2, vout2x01234567_3x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_6x8c4__neondot() 308 vst1q_lane_s8(c1, vout0x01234567_1x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_6x8c4__neondot() 309 vst1q_lane_s8(c0, vout0x01234567_1x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_6x8c4__neondot()
|
D | 4x8c4-minmax-neondot.c | 238 vst1q_lane_s8(c3, vout2x01234567_3x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_4x8c4__neondot() 239 vst1q_lane_s8(c2, vout2x01234567_3x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_4x8c4__neondot() 240 vst1q_lane_s8(c1, vout0x01234567_1x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_4x8c4__neondot() 241 vst1q_lane_s8(c0, vout0x01234567_1x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_4x8c4__neondot()
|
D | 8x16c4-minmax-neondot.c | 538 vst1q_lane_s8(c7, vout6x01234567_7x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_8x16c4__neondot() 539 vst1q_lane_s8(c6, vout6x01234567_7x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_8x16c4__neondot() 540 vst1q_lane_s8(c5, vout4x01234567_5x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_8x16c4__neondot() 541 vst1q_lane_s8(c4, vout4x01234567_5x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_8x16c4__neondot() 542 vst1q_lane_s8(c3, vout2x01234567_3x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_8x16c4__neondot() 543 vst1q_lane_s8(c2, vout2x01234567_3x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_8x16c4__neondot() 544 vst1q_lane_s8(c1, vout0x01234567_1x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_8x16c4__neondot() 545 vst1q_lane_s8(c0, vout0x01234567_1x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_8x16c4__neondot()
|
D | 6x16c4-minmax-neondot.c | 432 vst1q_lane_s8(c5, vout4x01234567_5x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_6x16c4__neondot() 433 vst1q_lane_s8(c4, vout4x01234567_5x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_6x16c4__neondot() 434 vst1q_lane_s8(c3, vout2x01234567_3x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_6x16c4__neondot() 435 vst1q_lane_s8(c2, vout2x01234567_3x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_6x16c4__neondot() 436 vst1q_lane_s8(c1, vout0x01234567_1x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_6x16c4__neondot() 437 vst1q_lane_s8(c0, vout0x01234567_1x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_6x16c4__neondot()
|
D | 4x16c4-minmax-neondot.c | 326 vst1q_lane_s8(c3, vout2x01234567_3x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_4x16c4__neondot() 327 vst1q_lane_s8(c2, vout2x01234567_3x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_4x16c4__neondot() 328 vst1q_lane_s8(c1, vout0x01234567_1x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_4x16c4__neondot() 329 vst1q_lane_s8(c0, vout0x01234567_1x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_4x16c4__neondot()
|
D | 4x8c2-minmax-neon-mull-padal-dup.c | 336 vst1q_lane_s8(c3, vout2x01234567_3x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_4x8c2__neon_mull_padal_dup() 337 vst1q_lane_s8(c2, vout2x01234567_3x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_4x8c2__neon_mull_padal_dup() 338 vst1q_lane_s8(c1, vout0x01234567_1x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_4x8c2__neon_mull_padal_dup() 339 vst1q_lane_s8(c0, vout0x01234567_1x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_4x8c2__neon_mull_padal_dup()
|
D | 4x8c8-minmax-neon-mull-padal.c | 372 vst1q_lane_s8(c3, vout2x01234567_3x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_4x8c8__neon_mull_padal() 373 vst1q_lane_s8(c2, vout2x01234567_3x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_4x8c8__neon_mull_padal() 374 vst1q_lane_s8(c1, vout0x01234567_1x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_4x8c8__neon_mull_padal() 375 vst1q_lane_s8(c0, vout0x01234567_1x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_4x8c8__neon_mull_padal()
|
D | 4x8-minmax-neon-mlal-lane.c | 388 vst1q_lane_s8(c3, vout2x01234567_3x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_4x8__neon_mlal_lane() 389 vst1q_lane_s8(c2, vout2x01234567_3x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_4x8__neon_mlal_lane() 390 vst1q_lane_s8(c1, vout0x01234567_1x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_4x8__neon_mlal_lane() 391 vst1q_lane_s8(c0, vout0x01234567_1x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_4x8__neon_mlal_lane()
|
D | 4x8c16-minmax-neon-mlal-padal.c | 404 vst1q_lane_s8(c3, vout2x01234567_3x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_4x8c16__neon_mlal_padal() 405 vst1q_lane_s8(c2, vout2x01234567_3x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_4x8c16__neon_mlal_padal() 406 vst1q_lane_s8(c1, vout0x01234567_1x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_4x8c16__neon_mlal_padal() 407 vst1q_lane_s8(c0, vout0x01234567_1x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_4x8c16__neon_mlal_padal()
|
D | 4x8-minmax-neon-mull-addw-dup.c | 424 vst1q_lane_s8(c3, vout2x01234567_3x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_4x8__neon_mull_addw_dup() 425 vst1q_lane_s8(c2, vout2x01234567_3x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_4x8__neon_mull_addw_dup() 426 vst1q_lane_s8(c1, vout0x01234567_1x01234567, 8); in xnn_qs8_igemm_minmax_ukernel_4x8__neon_mull_addw_dup() 427 vst1q_lane_s8(c0, vout0x01234567_1x01234567, 0); in xnn_qs8_igemm_minmax_ukernel_4x8__neon_mull_addw_dup()
|
/external/llvm-project/clang/test/Sema/ |
D | aarch64-neon-ranges.c | 65 vst1q_lane_s8(addr, big, 15); in test_ld1st1() 75 …vst1q_lane_s8(addr, big, 16); // expected-error-re {{argument value {{.*}} is outside the valid ra… in test_ld1st1()
|
/external/clang/test/Sema/ |
D | aarch64-neon-ranges.c | 65 vst1q_lane_s8(addr, big, 15); in test_ld1st1() 75 vst1q_lane_s8(addr, big, 16); // expected-error {{argument should be a value from 0 to 15}} in test_ld1st1()
|