; Check that a division is bypassed only when appropriate.
; RUN: llc -mtriple=x86_64-unknown-linux-gnu -mcpu=atom       < %s | FileCheck -check-prefixes=ATOM,CHECK %s
; RUN: llc -mtriple=x86_64-unknown-linux-gnu -mcpu=silvermont < %s | FileCheck -check-prefixes=REST,CHECK %s
; RUN: llc -mtriple=x86_64-unknown-linux-gnu -mcpu=skylake    < %s | FileCheck -check-prefixes=REST,CHECK %s
; RUN: llc -profile-summary-huge-working-set-size-threshold=1 -mtriple=x86_64-unknown-linux-gnu -mcpu=skylake    < %s | FileCheck -check-prefixes=HUGEWS %s

; Verify that div32 is bypassed only for Atoms.
;
; 32-bit signed division. In the -mcpu=atom run the expected output ORs the two
; operands together, tests the result against $-256 (i.e. any bit above the low
; byte), and contains an 8-bit divb for the narrow case. In the silvermont and
; skylake runs no divb may appear anywhere in the function.
define i32 @div32(i32 %a, i32 %b) {
entry:
; ATOM-LABEL: div32:
; ATOM: orl   %{{.*}}, [[REG:%[a-z]+]]
; ATOM: testl $-256, [[REG]]
; ATOM: divb
;
; REST-LABEL: div32:
; REST-NOT: divb
;
  %div = sdiv i32 %a, %b
  ret i32 %div
}

; Verify that div64 is always bypassed.
;
; 64-bit signed division, checked identically in the atom, silvermont and
; skylake runs: the operands are OR-ed together, the result is shifted right by
; 32 to inspect the upper half, and a 32-bit divl is present for the narrow case.
define i64 @div64(i64 %a, i64 %b) {
entry:
; CHECK-LABEL: div64:
; CHECK:     orq     %{{.*}}, [[REG:%[a-z]+]]
; CHECK:     shrq    $32, [[REG]]
; CHECK:     divl
;
  %div = sdiv i64 %a, %b
  ret i64 %div
}


; Verify that no extra code is generated when optimizing for size.
;
; Same 64-bit division as div64, but the function carries the optsize
; attribute: no 32-bit divl may appear before the return, i.e. the bypass
; sequence must not be emitted.
define i64 @div64_optsize(i64 %a, i64 %b) optsize {
; CHECK-LABEL: div64_optsize:
; CHECK-NOT: divl
; CHECK: ret
  %div = sdiv i64 %a, %b
  ret i64 %div
}

; Verify that div64 is not bypassed in the huge-working-set run.
;
; This function has no size attributes; it is only checked by the skylake run
; that passes -profile-summary-huge-working-set-size-threshold=1. With that
; threshold the module's profile summary is presumably classified as a huge
; working set, and no 32-bit divl may appear before the return.
define i64 @div64_hugews(i64 %a, i64 %b) {
; HUGEWS-LABEL: div64_hugews:
; HUGEWS-NOT: divl
; HUGEWS: ret
  %div = sdiv i64 %a, %b
  ret i64 %div
}

; Verify that div32 is not bypassed when optimizing for size.
;
; The check uses the prefix shared by the atom, silvermont and skylake runs, so
; it also covers Atom, the only CPU for which div32 above expects a bypass:
; with optsize no 8-bit divb may appear before the return.
define i32 @div32_optsize(i32 %a, i32 %b) optsize {
; CHECK-LABEL: div32_optsize:
; CHECK-NOT: divb
; CHECK: ret
  %div = sdiv i32 %a, %b
  ret i32 %div
}

; Verify that div32 is not bypassed when minimizing size.
;
; Same as div32_optsize, but with the minsize attribute: in the atom,
; silvermont and skylake runs no 8-bit divb may appear before the return.
define i32 @div32_minsize(i32 %a, i32 %b) minsize {
; CHECK-LABEL: div32_minsize:
; CHECK-NOT: divb
; CHECK: ret
  %div = sdiv i32 %a, %b
  ret i32 %div
}

; Synthetic profile summary attached to the module as a "ProfileSummary"
; module flag. It is what the run passing
; -profile-summary-huge-working-set-size-threshold=1 evaluates; the other runs
; use the default threshold.
; NOTE(review): each DetailedSummary entry is presumably
; {cutoff, min count, number of counts} -- confirm against the LLVM
; profile-summary documentation before changing the values.
!llvm.module.flags = !{!1}
!1 = !{i32 1, !"ProfileSummary", !2}
!2 = !{!3, !4, !5, !6, !7, !8, !9, !10}
!3 = !{!"ProfileFormat", !"InstrProf"}
!4 = !{!"TotalCount", i64 10000}
!5 = !{!"MaxCount", i64 1000}
!6 = !{!"MaxInternalCount", i64 1}
!7 = !{!"MaxFunctionCount", i64 1000}
!8 = !{!"NumCounts", i64 3}
!9 = !{!"NumFunctions", i64 3}
!10 = !{!"DetailedSummary", !11}
!11 = !{!12, !13, !14}
!12 = !{i32 10000, i64 1000, i32 1}
!13 = !{i32 999000, i64 1000, i32 3}
!14 = !{i32 999999, i64 5, i32 3}
