Home
last modified time | relevance | path

Searched refs:GCN (Results 1 – 25 of 807) sorted by relevance

12345678910>>...33

/external/llvm/test/CodeGen/AMDGPU/
Dload-global-i32.ll1 ; RUN: llc -march=amdgcn -verify-machineinstrs < %s | FileCheck -check-prefix=GCN -check-prefix=GCN
2 …-mcpu=kaveri -verify-machineinstrs < %s | FileCheck -check-prefix=GCN -check-prefix=GCN-HSA -check…
3 … -mcpu=tonga -verify-machineinstrs < %s | FileCheck -check-prefix=GCN -check-prefix=GCN-NOHSA -che…
8 ; GCN-NOHSA: buffer_load_dword v{{[0-9]+}}
9 ; GCN-HSA: flat_load_dword
20 ; GCN-NOHSA: buffer_load_dwordx2
21 ; GCN-HSA: flat_load_dwordx2
32 ; GCN-NOHSA: buffer_load_dwordx4
33 ; GCN-HSA: flat_load_dwordx4
44 ; GCN-NOHSA: buffer_load_dwordx4
[all …]
Dhalf.ll1 ; RUN: llc -march=amdgcn -verify-machineinstrs < %s | FileCheck -check-prefix=GCN -check-prefix=SI …
2 ; RUN: llc -march=amdgcn -mcpu=tonga -verify-machineinstrs < %s | FileCheck -check-prefix=GCN -chec…
6 ; GCN-LABEL: {{^}}load_f16_arg:
7 ; GCN: s_load_dword [[ARG:s[0-9]+]]
8 ; GCN: v_cvt_f16_f32_e32 [[CVT:v[0-9]+]], [[ARG]]
9 ; GCN: buffer_store_short [[CVT]]
15 ; GCN-LABEL: {{^}}load_v2f16_arg:
16 ; GCN-DAG: buffer_load_ushort [[V0:v[0-9]+]], off, s{{\[[0-9]+:[0-9]+\]}}, 0 offset:44
17 ; GCN-DAG: buffer_load_ushort [[V1:v[0-9]+]], off, s{{\[[0-9]+:[0-9]+\]}}, 0 offset:46
18 ; GCN: v_lshlrev_b32_e32 [[HI:v[0-9]+]], 16, [[V1]]
[all …]
Dstore-v3i64.ll1 ; RUN: llc -march=amdgcn -verify-machineinstrs < %s | FileCheck -check-prefix=GCN -check-prefix=SI …
2 ; RUN: llc -march=amdgcn -mcpu=bonaire -verify-machineinstrs < %s | FileCheck -check-prefix=GCN -ch…
3 ; RUN: llc -march=amdgcn -mcpu=tonga -verify-machineinstrs < %s | FileCheck -check-prefix=GCN -chec…
5 ; GCN-LABEL: {{^}}global_store_v3i64:
6 ; GCN-DAG: buffer_store_dwordx2 v{{\[[0-9]+:[0-9]+\]}}, off, s{{\[[0-9]+:[0-9]+\]}}, 0 offset:16
7 ; GCN-DAG: buffer_store_dwordx4 v{{\[[0-9]+:[0-9]+\]}}, off, s{{\[[0-9]+:[0-9]+\]}}, 0{{$}}
13 ; GCN-LABEL: {{^}}global_store_v3i64_unaligned:
14 ; GCN: buffer_store_byte
15 ; GCN: buffer_store_byte
16 ; GCN: buffer_store_byte
[all …]
Dload-constant-i32.ll1 ; RUN: llc -march=amdgcn -verify-machineinstrs < %s | FileCheck -check-prefix=GCN -check-prefix=GCN
2 …-mcpu=kaveri -verify-machineinstrs < %s | FileCheck -check-prefix=GCN -check-prefix=GCN-HSA -check…
3 … -mcpu=tonga -verify-machineinstrs < %s | FileCheck -check-prefix=GCN -check-prefix=GCN-NOHSA -che…
7 ; GCN: s_load_dword s{{[0-9]+}}
18 ; GCN: s_load_dwordx2
29 ; GCN: s_load_dwordx4
40 ; GCN: s_load_dwordx4
51 ; GCN: s_load_dwordx8
63 ; GCN: s_load_dwordx16
77 ; GCN-DAG: s_load_dword s[[SLO:[0-9]+]],
[all …]
Dsdivrem64.ll1 ;RUN: llc -march=amdgcn -verify-machineinstrs < %s | FileCheck --check-prefix=SI --check-prefix=GCN
2 …ga -verify-machineinstrs < %s | FileCheck --check-prefix=VI --check-prefix=GCN --check-prefix=FUNC…
39 ; GCN: s_bfe_u32
40 ; GCN: s_bfe_u32
41 ; GCN: s_bfe_u32
42 ; GCN: s_bfe_u32
43 ; GCN: s_bfe_u32
44 ; GCN: s_bfe_u32
45 ; GCN: s_bfe_u32
46 ; GCN: s_bfe_u32
[all …]
Dudivrem64.ll1 ;RUN: llc -march=amdgcn -verify-machineinstrs < %s | FileCheck --check-prefix=SI --check-prefix=GCN
2 …ga -verify-machineinstrs < %s | FileCheck --check-prefix=VI --check-prefix=GCN --check-prefix=FUNC…
39 ;GCN: s_bfe_u32
40 ;GCN: s_bfe_u32
41 ;GCN: s_bfe_u32
42 ;GCN: s_bfe_u32
43 ;GCN: s_bfe_u32
44 ;GCN: s_bfe_u32
45 ;GCN: s_bfe_u32
46 ;GCN: s_bfe_u32
[all …]
/external/swiftshader/third_party/llvm-7.0/llvm/test/CodeGen/AMDGPU/
Dpartial-sgpr-to-vgpr-spills.ll1 …ii -verify-machineinstrs < %s | FileCheck -check-prefix=ALL -check-prefix=VGPR -check-prefix=GCN %s
11 ; GCN-LABEL: {{^}}spill_sgprs_to_multiple_vgprs:
13 ; GCN: def s[4:11]
14 ; GCN: def s[12:19]
15 ; GCN: def s[20:27]
16 ; GCN: def s[28:35]
17 ; GCN: def s[36:43]
18 ; GCN: def s[44:51]
19 ; GCN: def s[52:59]
20 ; GCN: def s[60:67]
[all …]
Dload-global-i32.ll1 …strs < %s | FileCheck -allow-deprecated-dag-overlap -check-prefix=GCN -check-prefix=GCN-NOHSA -che…
2 …strs < %s | FileCheck -allow-deprecated-dag-overlap -check-prefix=GCN -check-prefix=GCN-HSA -check…
3 …strs < %s | FileCheck -allow-deprecated-dag-overlap -check-prefix=GCN -check-prefix=GCN-NOHSA -che…
8 ; GCN-NOHSA: buffer_load_dword v{{[0-9]+}}
9 ; GCN-HSA: flat_load_dword
20 ; GCN-NOHSA: buffer_load_dwordx2
21 ; GCN-HSA: flat_load_dwordx2
32 ; GCN-NOHSA: buffer_load_dwordx4
33 ; GCN-HSA: flat_load_dwordx4
44 ; GCN-NOHSA: buffer_load_dwordx4
[all …]
Dcall-preserved-registers.ll1 …cn-amd-amdhsa -mcpu=fiji -enable-ipra=0 -verify-machineinstrs < %s | FileCheck -check-prefix=GCN %s
2 …-amd-amdhsa -mcpu=hawaii -enable-ipra=0 -verify-machineinstrs < %s | FileCheck -check-prefix=GCN %s
3 …-amd-amdhsa -mcpu=gfx900 -enable-ipra=0 -verify-machineinstrs < %s | FileCheck -check-prefix=GCN %s
7 ; GCN-LABEL: {{^}}test_kernel_call_external_void_func_void_clobber_s30_s31_call_external_void_func_…
8 ; GCN: s_mov_b32 s33, s7
9 ; GCN: s_getpc_b64 s[34:35]
10 ; GCN-NEXT: s_add_u32 s34, s34,
11 ; GCN-NEXT: s_addc_u32 s35, s35,
12 ; GCN-NEXT: s_mov_b32 s4, s33
13 ; GCN-NEXT: s_mov_b32 s32, s33
[all …]
Dfdiv32-to-rcp-folding.ll1 …arch=amdgcn -mcpu=gfx900 -mattr=+fp32-denormals < %s | FileCheck --check-prefixes=GCN,GCN-DENORM %s
2 …march=amdgcn -mcpu=gfx900 -mattr=-fp32-denormals < %s | FileCheck --check-prefixes=GCN,GCN-FLUSH %s
4 ; GCN-LABEL: {{^}}div_1_by_x_25ulp:
5 ; GCN-DENORM-DAG: v_mov_b32_e32 [[L:v[0-9]+]], 0x6f800000
6 ; GCN-DENORM-DAG: v_mov_b32_e32 [[S:v[0-9]+]], 0x2f800000
7 ; GCN-DAG: s_load_dword [[VAL:s[0-9]+]], s[{{[0-9:]+}}], 0x0{{$}}
8 ; GCN-DENORM-DAG: v_cmp_gt_f32_e64 vcc, |[[VAL]]|, [[L]]
9 ; GCN-DENORM-DAG: v_cndmask_b32_e32 [[SCALE:v[0-9]+]], 1.0, [[S]], vcc
10 ; GCN-DENORM: v_mul_f32_e32 [[PRESCALED:v[0-9]+]], [[VAL]], [[SCALE]]
11 ; GCN-DENORM: v_rcp_f32_e32 [[RCP:v[0-9]+]], [[PRESCALED]]
[all …]
Dcallee-special-input-sgprs.ll1 …instrs < %s | FileCheck -allow-deprecated-dag-overlap -enable-var-scope -check-prefixes=GCN,CIVI %s
2 …instrs < %s | FileCheck -allow-deprecated-dag-overlap -enable-var-scope -check-prefixes=GCN,GFX9 %s
4 ; GCN-LABEL: {{^}}use_dispatch_ptr:
5 ; GCN: v_mov_b32_e32 v[[LO:[0-9]+]], s6
6 ; GCN: v_mov_b32_e32 v[[HI:[0-9]+]], s7
7 ; GCN: {{flat|global}}_load_dword v{{[0-9]+}}, v{{\[}}[[LO]]:[[HI]]{{\]}}
15 ; GCN-LABEL: {{^}}kern_indirect_use_dispatch_ptr:
16 ; GCN: enable_sgpr_dispatch_ptr = 1
17 ; GCN: s_mov_b64 s[6:7], s[4:5]
23 ; GCN-LABEL: {{^}}use_queue_ptr:
[all …]
Dbranch-relaxation.ll1 …cn -mcpu=tahiti -verify-machineinstrs -amdgpu-s-branch-bits=4 < %s | FileCheck -check-prefix=GCN %s
21 ; GCN-LABEL: {{^}}uniform_conditional_max_short_forward_branch:
22 ; GCN: s_load_dword [[CND:s[0-9]+]]
23 ; GCN: s_cmp_eq_u32 [[CND]], 0
24 ; GCN-NEXT: s_cbranch_scc1 [[BB3:BB[0-9]+_[0-9]+]]
27 ; GCN-NEXT: ; %bb.1: ; %bb2
28 ; GCN-NEXT: ;;#ASMSTART
29 ; GCN-NEXT: v_nop_e64
30 ; GCN-NEXT: v_nop_e64
31 ; GCN-NEXT: v_nop_e64
[all …]
Dstore-v3i64.ll1 …-machineinstrs < %s | FileCheck -allow-deprecated-dag-overlap -check-prefix=GCN -check-prefix=SI %s
2 …-machineinstrs < %s | FileCheck -allow-deprecated-dag-overlap -check-prefix=GCN -check-prefix=CI %s
3 …-machineinstrs < %s | FileCheck -allow-deprecated-dag-overlap -check-prefix=GCN -check-prefix=VI %s
5 ; GCN-LABEL: {{^}}global_store_v3i64:
6 ; GCN-DAG: buffer_store_dwordx2 v{{\[[0-9]+:[0-9]+\]}}, off, s{{\[[0-9]+:[0-9]+\]}}, 0 offset:16
7 ; GCN-DAG: buffer_store_dwordx4 v{{\[[0-9]+:[0-9]+\]}}, off, s{{\[[0-9]+:[0-9]+\]}}, 0{{$}}
13 ; GCN-LABEL: {{^}}global_store_v3i64_unaligned:
14 ; GCN: buffer_store_byte
15 ; GCN: buffer_store_byte
16 ; GCN: buffer_store_byte
[all …]
Dload-constant-i32.ll1 …strs < %s | FileCheck -allow-deprecated-dag-overlap -check-prefix=GCN -check-prefix=GCN-NOHSA -che…
2 …strs < %s | FileCheck -allow-deprecated-dag-overlap -check-prefix=GCN -check-prefix=GCN-HSA -check…
3 …strs < %s | FileCheck -allow-deprecated-dag-overlap -check-prefix=GCN -check-prefix=GCN-NOHSA -che…
7 ; GCN: s_load_dword s{{[0-9]+}}
18 ; GCN: s_load_dwordx2
29 ; GCN: s_load_dwordx4
40 ; GCN: s_load_dwordx4
51 ; GCN: s_load_dwordx8
63 ; GCN: s_load_dwordx16
77 ; GCN-DAG: s_load_dword s[[SLO:[0-9]+]],
[all …]
Dinserted-wait-states.mir1 …-march=amdgcn -mcpu=tahiti -run-pass post-RA-hazard-rec %s -o - | FileCheck %s -check-prefixes=GCN
2 …h=amdgcn -mcpu=hawaii -run-pass post-RA-hazard-rec %s -o - | FileCheck %s -check-prefixes=GCN,CIVI
3 …=amdgcn -mcpu=fiji -run-pass post-RA-hazard-rec %s -o - | FileCheck %s -check-prefixes=GCN,CIVI,VI
4 … -mcpu=gfx900 -run-pass post-RA-hazard-rec %s -o - | FileCheck %s -check-prefixes=GCN,CIVI,VI,GFX9
47 # GCN-LABEL: name: div_fmas
49 # GCN-LABEL: bb.0:
50 # GCN: S_MOV_B64
51 # GCN-NOT: S_NOP
52 # GCN: V_DIV_FMAS
54 # GCN-LABEL: bb.1:
[all …]
Dcall-argument-types.ll1 …bal-loads=0 -verify-machineinstrs < %s | FileCheck -enable-var-scope -check-prefixes=GCN,VI,MESA %s
2 …bal-loads=0 -verify-machineinstrs < %s | FileCheck -enable-var-scope -check-prefixes=GCN,CI,MESA %s
3 …oads=0 -verify-machineinstrs < %s | FileCheck -enable-var-scope -check-prefixes=GCN,GFX9,VI,MESA %s
4 …obal-loads=0 -verify-machineinstrs < %s | FileCheck -enable-var-scope -check-prefixes=GCN,VI,HSA %s
59 ; GCN-LABEL: {{^}}test_call_external_void_func_i1_imm:
64 ; GCN: s_getpc_b64 s{{\[}}[[PC_LO:[0-9]+]]:[[PC_HI:[0-9]+]]{{\]}}
65 ; GCN-NEXT: s_add_u32 s[[PC_LO]], s[[PC_LO]], external_void_func_i1@rel32@lo+4
66 ; GCN-NEXT: s_addc_u32 s[[PC_HI]], s[[PC_HI]], external_void_func_i1@rel32@hi+4
67 ; GCN-DAG: v_mov_b32_e32 v0, 1{{$}}
70 ; GCN: s_swappc_b64 s[30:31], s{{\[}}[[PC_LO]]:[[PC_HI]]{{\]}}
[all …]
Didiv-licm.ll1 ; RUN: llc -march=amdgcn -verify-machineinstrs < %s | FileCheck -enable-var-scope -check-prefix=GCN
3 ; GCN-LABEL: {{^}}udiv32_invariant_denom:
4 ; GCN: v_cvt_f32_u32
5 ; GCN: v_rcp_iflag_f32
6 ; GCN: v_mul_f32_e32 v{{[0-9]+}}, 0x4f800000,
7 ; GCN: v_cvt_u32_f32_e32
8 ; GCN-DAG: v_mul_hi_u32
9 ; GCN-DAG: v_mul_lo_i32
10 ; GCN-DAG: v_sub_i32_e32
11 ; GCN-DAG: v_cmp_eq_u32_e64
[all …]
Dfunction-args.ll1 …mcpu=hawaii -verify-machineinstrs < %s | FileCheck -enable-var-scope -check-prefixes=GCN,CI,CIVI %s
2 …lobal -verify-machineinstrs < %s | FileCheck -enable-var-scope -check-prefixes=GCN,VI,CIVI,GFX89 %s
3 …for-global -verify-machineinstrs < %s | FileCheck -enable-var-scope -check-prefixes=GCN,VI,GFX89 %s
5 ; GCN-LABEL: {{^}}void_func_i1:
6 ; GCN: v_and_b32_e32 v0, 1, v0
7 ; GCN: buffer_store_byte v0, off
13 ; GCN-LABEL: {{^}}void_func_i1_zeroext:
14 ; GCN: s_waitcnt
15 ; GCN-NEXT: v_or_b32_e32 v0, 12, v0
16 ; GCN-NOT: v0
[all …]
Dmemory-legalizer-atomic-rmw.ll1 …mtriple=amdgcn-amd- -mcpu=gfx803 -verify-machineinstrs < %s | FileCheck -check-prefixes=GCN,GFX8 %s
2 …e=amdgcn-amd-amdhsa -mcpu=gfx803 -verify-machineinstrs < %s | FileCheck -check-prefixes=GCN,GFX8 %s
4 ; GCN-LABEL: {{^}}system_monotonic:
5 ; GCN-NOT: s_waitcnt vmcnt(0){{$}}
6 ; GCN: flat_atomic_swap v[{{[0-9]+}}:{{[0-9]+}}], v{{[0-9]+}}{{$}}
7 ; GCN-NOT: s_waitcnt vmcnt(0){{$}}
8 ; GCN-NOT: buffer_wbinvl1_vol
16 ; GCN-LABEL: {{^}}system_acquire:
17 ; GCN-NOT: s_waitcnt vmcnt(0){{$}}
18 ; GCN: flat_atomic_swap v[{{[0-9]+}}:{{[0-9]+}}], v{{[0-9]+}}{{$}}
[all …]
Dhalf.ll1 …neinstrs < %s | FileCheck -allow-deprecated-dag-overlap -enable-var-scope -check-prefixes=GCN,SI %s
2 …neinstrs < %s | FileCheck -allow-deprecated-dag-overlap -enable-var-scope -check-prefixes=GCN,VI %s
6 ; GCN-LABEL: {{^}}load_f16_arg:
7 ; GCN: s_load_dword [[ARG:s[0-9]+]]
8 ; GCN: v_mov_b32_e32 [[V_ARG:v[0-9]+]], [[ARG]]
9 ; GCN: flat_store_short v{{\[[0-9]+:[0-9]+\]}}, [[V_ARG]]
15 ; GCN-LABEL: {{^}}load_v2f16_arg:
16 ; GCN: s_load_dword [[ARG:s[0-9]+]]
17 ; GCN: v_mov_b32_e32 [[V_ARG:v[0-9]+]], [[ARG]]
18 ; GCN: flat_store_dword v{{\[[0-9]+:[0-9]+\]}}, [[V_ARG]]
[all …]
Dipra.ll1 …-amd-amdhsa -verify-machineinstrs -enable-ipra -amdgpu-sroa=0 < %s | FileCheck -check-prefix=GCN %s
2 …triple=amdgcn-amd-amdhsa -verify-machineinstrs -amdgpu-sroa=0 < %s | FileCheck -check-prefix=GCN %s
5 ; GCN-LABEL: {{^}}kernel:
6 ; GCN: flat_store_dword
13 ; GCN-LABEL: {{^}}func:
14 ; GCN: ; NumVgprs: 8
20 ; GCN-LABEL: {{^}}kernel_call:
21 ; GCN-NOT: buffer_store
22 ; GCN-NOT: buffer_load
23 ; GCN-NOT: readlane
[all …]
Dllvm.amdgcn.ubfe.ll1 …s=false -march=amdgcn -verify-machineinstrs < %s | FileCheck -check-prefix=GCN -check-prefix=SI %s
2 …mattr=-flat-for-global -verify-machineinstrs < %s | FileCheck -check-prefix=GCN -check-prefix=VI %s
4 ; GCN-LABEL: {{^}}bfe_u32_arg_arg_arg:
5 ; GCN: v_bfe_u32
12 ; GCN-LABEL: {{^}}bfe_u32_arg_arg_imm:
13 ; GCN: v_bfe_u32
20 ; GCN-LABEL: {{^}}bfe_u32_arg_imm_arg:
21 ; GCN: v_bfe_u32
28 ; GCN-LABEL: {{^}}bfe_u32_imm_arg_arg:
29 ; GCN: v_bfe_u32
[all …]
Dbitreverse-inline-immediates.ll1 ; RUN: llc -march=amdgcn -verify-machineinstrs < %s | FileCheck -check-prefix=GCN %s
7 ; GCN-LABEL: {{^}}materialize_0_i32:
8 ; GCN: v_mov_b32_e32 [[K:v[0-9]+]], 0{{$}}
9 ; GCN: buffer_store_dword [[K]]
15 ; GCN-LABEL: {{^}}materialize_0_i64:
16 ; GCN: v_mov_b32_e32 v[[LOK:[0-9]+]], 0{{$}}
17 ; GCN: v_mov_b32_e32 v[[HIK:[0-9]+]], v[[LOK]]{{$}}
18 ; GCN: buffer_store_dwordx2 v{{\[}}[[LOK]]:[[HIK]]{{\]}}
24 ; GCN-LABEL: {{^}}materialize_neg1_i32:
25 ; GCN: v_mov_b32_e32 [[K:v[0-9]+]], -1{{$}}
[all …]
Dbreak-smem-soft-clauses.mir1 …verify-machineinstrs -run-pass post-RA-hazard-rec %s -o - | FileCheck -check-prefixes=GCN,XNACK %s
2 …rify-machineinstrs -run-pass post-RA-hazard-rec %s -o - | FileCheck -check-prefixes=GCN,NOXNACK %s
10 ; GCN-LABEL: name: trivial_smem_clause_load_smrd4_x1
11 ; GCN: $sgpr0 = S_LOAD_DWORD_IMM $sgpr10_sgpr11, 0, 0
12 ; GCN-NEXT: S_ENDPGM
22 ; GCN-LABEL: name: trivial_smem_clause_load_smrd4_x2
23 ; GCN: $sgpr0 = S_LOAD_DWORD_IMM $sgpr10_sgpr11, 0, 0
24 ; GCN-NEXT: $sgpr1 = S_LOAD_DWORD_IMM $sgpr12_sgpr13, 0, 0
25 ; GCN-NEXT: S_ENDPGM
36 ; GCN-LABEL: name: trivial_smem_clause_load_smrd4_x3
[all …]
Dimm.ll1 …erde -verify-machineinstrs < %s | FileCheck -enable-var-scope -check-prefix=GCN -check-prefix=SI %s
2 …obal -verify-machineinstrs < %s | FileCheck -enable-var-scope -check-prefix=GCN -check-prefix=VI %s
5 ; GCN-LABEL: {{^}}i64_imm_inline_lo:
6 ; GCN: v_mov_b32_e32 v[[LO_VGPR:[0-9]+]], 5
7 ; GCN: buffer_store_dwordx2 v{{\[}}[[LO_VGPR]]:
15 ; GCN-LABEL: {{^}}i64_imm_inline_hi:
16 ; GCN: v_mov_b32_e32 v[[HI_VGPR:[0-9]+]], 5
17 ; GCN: buffer_store_dwordx2 v{{\[[0-9]+:}}[[HI_VGPR]]
24 ; GCN-LABEL: {{^}}store_imm_neg_0.0_i64:
25 ; GCN-DAG: v_mov_b32_e32 v[[LO_VREG:[0-9]+]], 0{{$}}
[all …]

12345678910>>...33