• Home
  • Raw
  • Download

Lines Matching refs:GEMMBenchmark

34 static void GEMMBenchmark(benchmark::State& state,  in GEMMBenchmark()  function
354 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_1x8__aarch64_neonfma_ld64, 1, 8, 1, 1); in f32_gemm_1x8__aarch64_neonfma_ld64()
357 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_1x12__aarch64_neonfma_cortex_a53, 1, 12, 1, 1); in f32_gemm_1x12__aarch64_neonfma_cortex_a53()
360 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_1x8__aarch64_neonfma_cortex_a53, 1, 8, 1, 1); in f32_gemm_1x8__aarch64_neonfma_cortex_a53()
363 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_1x8__aarch64_neonfma_cortex_a57, 1, 8, 1, 1); in f32_gemm_1x8__aarch64_neonfma_cortex_a57()
366 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_1x8__aarch64_neonfma_cortex_a75, 1, 8, 1, 1); in f32_gemm_1x8__aarch64_neonfma_cortex_a75()
369 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x12__aarch64_neonfma_cortex_a53, 4, 12, 1, 1); in f32_gemm_4x12__aarch64_neonfma_cortex_a53()
372 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8__aarch64_neonfma_cortex_a53, 4, 8, 1, 1); in f32_gemm_4x8__aarch64_neonfma_cortex_a53()
375 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8__aarch64_neonfma_cortex_a55, 4, 8, 1, 1); in f32_gemm_4x8__aarch64_neonfma_cortex_a55()
378 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8__aarch64_neonfma_cortex_a57, 4, 8, 1, 1); in f32_gemm_4x8__aarch64_neonfma_cortex_a57()
381 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8__aarch64_neonfma_cortex_a75, 4, 8, 1, 1); in f32_gemm_4x8__aarch64_neonfma_cortex_a75()
384 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8__aarch64_neonfma_ld64, 4, 8, 1, 1); in f32_gemm_4x8__aarch64_neonfma_ld64()
387 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8__aarch64_neonfma_ld128, 4, 8, 1, 1); in f32_gemm_4x8__aarch64_neonfma_ld128()
390 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_5x8__aarch64_neonfma_cortex_a57, 5, 8, 1, 1); in f32_gemm_5x8__aarch64_neonfma_cortex_a57()
393 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_5x8__aarch64_neonfma_cortex_a75, 5, 8, 1, 1); in f32_gemm_5x8__aarch64_neonfma_cortex_a75()
396 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_6x8__aarch64_neonfma_ld64, 6, 8, 1, 1); in f32_gemm_6x8__aarch64_neonfma_ld64()
399 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_6x8__aarch64_neonfma_ld128, 6, 8, 1, 1); in f32_gemm_6x8__aarch64_neonfma_ld128()
402 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_6x8__aarch64_neonfma_cortex_a53, 6, 8, 1, 1); in f32_gemm_6x8__aarch64_neonfma_cortex_a53()
405 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_6x8__aarch64_neonfma_cortex_a55, 6, 8, 1, 1); in f32_gemm_6x8__aarch64_neonfma_cortex_a55()
408 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_6x8__aarch64_neonfma_cortex_a73, 6, 8, 1, 1); in f32_gemm_6x8__aarch64_neonfma_cortex_a73()
411 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_6x8__aarch64_neonfma_cortex_a57, 6, 8, 1, 1); in f32_gemm_6x8__aarch64_neonfma_cortex_a57()
414 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_6x8__aarch64_neonfma_cortex_a75, 6, 8, 1, 1); in f32_gemm_6x8__aarch64_neonfma_cortex_a75()
417 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_1x8__neonfma_lane_ld64, 1, 8, 1, 1); in f32_gemm_1x8__neonfma_lane_ld64()
420 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8__neonfma_lane_ld64, 4, 8, 1, 1); in f32_gemm_4x8__neonfma_lane_ld64()
423 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8__neonfma_lane_ld128, 4, 8, 1, 1); in f32_gemm_4x8__neonfma_lane_ld128()
426 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_5x8__neonfma_lane_ld64, 5, 8, 1, 1); in f32_gemm_5x8__neonfma_lane_ld64()
429 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_6x8__neonfma_lane_ld64, 6, 8, 1, 1); in f32_gemm_6x8__neonfma_lane_ld64()
432 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_6x8__neonfma_lane_ld128, 6, 8, 1, 1); in f32_gemm_6x8__neonfma_lane_ld128()
465GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x4__aarch32_vfp_ld64, 4, 4, 1, 1, benchmark::uti… in BENCHMARK_GEMM()
468GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8__aarch32_neon_ld64, 4, 8, 1, 1, benchmark::ut… in f32_gemm_4x8__aarch32_neon_ld64()
471GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8__aarch32_neon_cortex_a7, 4, 8, 1, 1, benchmar… in f32_gemm_4x8__aarch32_neon_cortex_a7()
474GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8__aarch32_neon_cortex_a53, 4, 8, 1, 1, benchma… in f32_gemm_4x8__aarch32_neon_cortex_a53()
477GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8__aarch32_neon_cortex_a55, 4, 8, 1, 1, benchma… in f32_gemm_4x8__aarch32_neon_cortex_a55()
480GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8__aarch32_neon_cortex_a75, 4, 8, 1, 1, benchma… in f32_gemm_4x8__aarch32_neon_cortex_a75()
483GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8__aarch32_neon_pld_cortex_a75, 4, 8, 1, 1, ben… in f32_gemm_4x8__aarch32_neon_pld_cortex_a75()
497GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_1x8__neon_lane_ld64, 1, 8, 1, 1, benchmark::utils… in BENCHMARK_GEMM()
500GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8__neon_lane_ld64, 4, 8, 1, 1, benchmark::utils… in f32_gemm_4x8__neon_lane_ld64()
503GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8__neon_lane_ld128, 4, 8, 1, 1, benchmark::util… in f32_gemm_4x8__neon_lane_ld128()
506GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_5x8__neon_lane_ld64, 5, 8, 1, 1, benchmark::utils… in f32_gemm_5x8__neon_lane_ld64()
509GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_6x8__neon_lane_ld64, 6, 8, 1, 1, benchmark::utils… in f32_gemm_6x8__neon_lane_ld64()
512GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_6x8__neon_lane_ld128, 6, 8, 1, 1, benchmark::util… in f32_gemm_6x8__neon_lane_ld128()
515GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_1x8__neonfma_dup_ld64, 1, 8, 1, 1, benchmark::uti… in f32_gemm_1x8__neonfma_dup_ld64()
518GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8__neonfma_dup_ld64, 4, 8, 1, 1, benchmark::uti… in f32_gemm_4x8__neonfma_dup_ld64()
521GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8__neonfma_dup_ld128, 4, 8, 1, 1, benchmark::ut… in f32_gemm_4x8__neonfma_dup_ld128()
524GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_6x8__neonfma_dup_ld64, 6, 8, 1, 1, benchmark::uti… in f32_gemm_6x8__neonfma_dup_ld64()
527GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_6x8__neonfma_dup_ld128, 6, 8, 1, 1, benchmark::ut… in f32_gemm_6x8__neonfma_dup_ld128()
530GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_1x8s4__neon, 1, 8, 1, 4, benchmark::utils::CheckN… in f32_gemm_1x8s4__neon()
533GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_1x8s4__neonfma, 1, 8, 1, 4, benchmark::utils::Che… in f32_gemm_1x8s4__neonfma()
536GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8s4__neon, 4, 8, 1, 4, benchmark::utils::CheckN… in f32_gemm_4x8s4__neon()
539GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8s4__neonfma, 4, 8, 1, 4, benchmark::utils::Che… in f32_gemm_4x8s4__neonfma()
542GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_6x8s4__neon, 6, 8, 1, 4, benchmark::utils::CheckN… in f32_gemm_6x8s4__neon()
545GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_6x8s4__neonfma, 6, 8, 1, 4, benchmark::utils::Che… in f32_gemm_6x8s4__neonfma()
548GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_8x8s4__neon, 8, 8, 1, 4, benchmark::utils::CheckN… in f32_gemm_8x8s4__neon()
551GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_8x8s4__neonfma, 8, 8, 1, 4, benchmark::utils::Che… in f32_gemm_8x8s4__neonfma()
585 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_1x8__sse_load1, 1, 8, 1, 1); in BENCHMARK_GEMM()
588 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_3x8__sse_load1, 3, 8, 1, 1); in f32_gemm_3x8__sse_load1()
591 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8__sse_load1, 4, 8, 1, 1); in f32_gemm_4x8__sse_load1()
594 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_5x8__sse_load1, 5, 8, 1, 1); in f32_gemm_5x8__sse_load1()
598 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_1x8__sse_dup, 1, 8, 1, 1); in f32_gemm_1x8__sse_dup()
601 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_3x8__sse_dup, 3, 8, 1, 1); in f32_gemm_3x8__sse_dup()
604 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8__sse_dup, 4, 8, 1, 1); in f32_gemm_4x8__sse_dup()
607 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_5x8__sse_dup, 5, 8, 1, 1); in f32_gemm_5x8__sse_dup()
611 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_1x8s4__sse, 1, 8, 1, 4); in f32_gemm_1x8s4__sse()
614 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_3x8s4__sse, 3, 8, 1, 4); in f32_gemm_3x8s4__sse()
617 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8s4__sse, 4, 8, 1, 4); in f32_gemm_4x8s4__sse()
620 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_5x8s4__sse, 5, 8, 1, 4); in f32_gemm_5x8s4__sse()
624 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_1x8__sse2_dup, 1, 8, 1, 1); in f32_gemm_1x8__sse2_dup()
627 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_3x8__sse2_dup, 3, 8, 1, 1); in f32_gemm_3x8__sse2_dup()
630 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8__sse2_dup, 4, 8, 1, 1); in f32_gemm_4x8__sse2_dup()
633 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_5x8__sse2_dup, 5, 8, 1, 1); in f32_gemm_5x8__sse2_dup()
644GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_1x8__avx_broadcast, 1, 8, 1, 1, benchmark::utils:… in f32_gemm_1x8__avx_broadcast()
647GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8__avx_broadcast, 4, 8, 1, 1, benchmark::utils:… in f32_gemm_4x8__avx_broadcast()
650GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_5x8__avx_broadcast, 5, 8, 1, 1, benchmark::utils:… in f32_gemm_5x8__avx_broadcast()
653GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_6x8__avx_broadcast, 6, 8, 1, 1, benchmark::utils:… in f32_gemm_6x8__avx_broadcast()
656GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_7x8__avx_broadcast, 7, 8, 1, 1, benchmark::utils:… in f32_gemm_7x8__avx_broadcast()
659GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_1x16__avx_broadcast, 1, 16, 1, 1, benchmark::util… in f32_gemm_1x16__avx_broadcast()
662GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_3x16__avx_broadcast, 4, 16, 1, 1, benchmark::util… in f32_gemm_3x16__avx_broadcast()
665GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x16__avx_broadcast, 4, 16, 1, 1, benchmark::util… in f32_gemm_4x16__avx_broadcast()
668GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_5x16__avx_broadcast, 5, 16, 1, 1, benchmark::util… in f32_gemm_5x16__avx_broadcast()
672GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_1x8__fma3_broadcast, 1, 8, 1, 1, benchmark::utils… in f32_gemm_1x8__fma3_broadcast()
675GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8__fma3_broadcast, 4, 8, 1, 1, benchmark::utils… in f32_gemm_4x8__fma3_broadcast()
678GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_5x8__fma3_broadcast, 5, 8, 1, 1, benchmark::utils… in f32_gemm_5x8__fma3_broadcast()
681GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_6x8__fma3_broadcast, 6, 8, 1, 1, benchmark::utils… in f32_gemm_6x8__fma3_broadcast()
684GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_7x8__fma3_broadcast, 7, 8, 1, 1, benchmark::utils… in f32_gemm_7x8__fma3_broadcast()
687GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_8x8__fma3_broadcast, 8, 8, 1, 1, benchmark::utils… in f32_gemm_8x8__fma3_broadcast()
690GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_1x16__fma3_broadcast, 1, 16, 1, 1, benchmark::uti… in f32_gemm_1x16__fma3_broadcast()
693GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_3x16__fma3_broadcast, 4, 16, 1, 1, benchmark::uti… in f32_gemm_3x16__fma3_broadcast()
696GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x16__fma3_broadcast, 4, 16, 1, 1, benchmark::uti… in f32_gemm_4x16__fma3_broadcast()
699GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_5x16__fma3_broadcast, 5, 16, 1, 1, benchmark::uti… in f32_gemm_5x16__fma3_broadcast()
703GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_1x16s4__fma3_broadcast, 1, 16, 1, 4, benchmark::u… in f32_gemm_1x16s4__fma3_broadcast()
706GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_3x16s4__fma3_broadcast, 4, 16, 1, 4, benchmark::u… in f32_gemm_3x16s4__fma3_broadcast()
709GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x16s4__fma3_broadcast, 4, 16, 1, 4, benchmark::u… in f32_gemm_4x16s4__fma3_broadcast()
712GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_5x16s4__fma3_broadcast, 5, 16, 1, 4, benchmark::u… in f32_gemm_5x16s4__fma3_broadcast()
716GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_1x16__avx512f_broadcast, 1, 16, 1, 1, benchmark::… in f32_gemm_1x16__avx512f_broadcast()
719GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x16__avx512f_broadcast, 4, 16, 1, 1, benchmark::… in f32_gemm_4x16__avx512f_broadcast()
722GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_5x16__avx512f_broadcast, 5, 16, 1, 1, benchmark::… in f32_gemm_5x16__avx512f_broadcast()
725GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_6x16__avx512f_broadcast, 6, 16, 1, 1, benchmark::… in f32_gemm_6x16__avx512f_broadcast()
728GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_7x16__avx512f_broadcast, 7, 16, 1, 1, benchmark::… in f32_gemm_7x16__avx512f_broadcast()
731GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_8x16__avx512f_broadcast, 8, 16, 1, 1, benchmark::… in f32_gemm_8x16__avx512f_broadcast()
793 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_3x8__wasmsimd_arm_loadsplat, 3, 8, 1, 1); in BENCHMARK_GEMM()
797 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8__wasmsimd_arm_loadsplat, 4, 8, 1, 1); in f32_gemm_4x8__wasmsimd_arm_loadsplat()
801 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_5x8__wasmsimd_arm_loadsplat, 5, 8, 1, 1); in f32_gemm_5x8__wasmsimd_arm_loadsplat()
805 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_6x8__wasmsimd_arm_loadsplat, 6, 8, 1, 1); in f32_gemm_6x8__wasmsimd_arm_loadsplat()
809 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_3x8__wasmsimd_x86_loadsplat, 3, 8, 1, 1); in f32_gemm_3x8__wasmsimd_x86_loadsplat()
813 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8__wasmsimd_x86_loadsplat, 4, 8, 1, 1); in f32_gemm_4x8__wasmsimd_x86_loadsplat()
817 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_5x8__wasmsimd_x86_loadsplat, 5, 8, 1, 1); in f32_gemm_5x8__wasmsimd_x86_loadsplat()
821 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_6x8__wasmsimd_x86_loadsplat, 6, 8, 1, 1); in f32_gemm_6x8__wasmsimd_x86_loadsplat()
825 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_3x8__wasmsimd_arm_splat, 3, 8, 1, 1); in f32_gemm_3x8__wasmsimd_arm_splat()
829 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8__wasmsimd_arm_splat, 4, 8, 1, 1); in f32_gemm_4x8__wasmsimd_arm_splat()
833 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_5x8__wasmsimd_arm_splat, 5, 8, 1, 1); in f32_gemm_5x8__wasmsimd_arm_splat()
837 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_6x8__wasmsimd_arm_splat, 6, 8, 1, 1); in f32_gemm_6x8__wasmsimd_arm_splat()
841 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_3x8__wasmsimd_x86_splat, 3, 8, 1, 1); in f32_gemm_3x8__wasmsimd_x86_splat()
845 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8__wasmsimd_x86_splat, 4, 8, 1, 1); in f32_gemm_4x8__wasmsimd_x86_splat()
849 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_5x8__wasmsimd_x86_splat, 5, 8, 1, 1); in f32_gemm_5x8__wasmsimd_x86_splat()
853 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_6x8__wasmsimd_x86_splat, 6, 8, 1, 1); in f32_gemm_6x8__wasmsimd_x86_splat()
857 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_3x8s4__wasmsimd_arm, 3, 8, 1, 4); in f32_gemm_3x8s4__wasmsimd_arm()
861 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8s4__wasmsimd_arm, 4, 8, 1, 4); in f32_gemm_4x8s4__wasmsimd_arm()
865 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_5x8s4__wasmsimd_arm, 5, 8, 1, 4); in f32_gemm_5x8s4__wasmsimd_arm()
869 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_6x8s4__wasmsimd_arm, 6, 8, 1, 4); in f32_gemm_6x8s4__wasmsimd_arm()
873 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_3x8s4__wasmsimd_x86, 3, 8, 1, 4); in f32_gemm_3x8s4__wasmsimd_x86()
877 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x8s4__wasmsimd_x86, 4, 8, 1, 4); in f32_gemm_4x8s4__wasmsimd_x86()
881 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_5x8s4__wasmsimd_x86, 5, 8, 1, 4); in f32_gemm_5x8s4__wasmsimd_x86()
885 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_6x8s4__wasmsimd_x86, 6, 8, 1, 4); in f32_gemm_6x8s4__wasmsimd_x86()
933 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_1x4__scalar, 1, 4, 1, 1); in BENCHMARK_GEMM()
937 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_2x4__scalar, 2, 4, 1, 1); in f32_gemm_2x4__scalar()
941 GEMMBenchmark(state, xnn_f32_gemm_minmax_ukernel_4x4__scalar, 4, 4, 1, 1); in f32_gemm_4x4__scalar()