; Exercises PGO instrumentation generation (pgo-instr-gen) and profile
; annotation (pgo-instr-use) on a function containing a doubly nested counted
; loop. Each pass is invoked twice: once via its bare flag and once via the
; -passes= pipeline syntax; both invocations share the same expectations.
; The profile consumed by the annotation step is merged from
; Inputs/loop2.proftext, so the expected branch weights at the bottom of this
; file must stay in sync with that input.
;
; RUN: opt < %s -pgo-instr-gen -S | FileCheck %s --check-prefix=GEN
; RUN: opt < %s -passes=pgo-instr-gen -S | FileCheck %s --check-prefix=GEN
; RUN: llvm-profdata merge %S/Inputs/loop2.proftext -o %t.profdata
; RUN: opt < %s -pgo-instr-use -pgo-test-profile-file=%t.profdata -S | FileCheck %s --check-prefix=USE
; RUN: opt < %s -passes=pgo-instr-use -pgo-test-profile-file=%t.profdata -S | FileCheck %s --check-prefix=USE
target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
target triple = "x86_64-unknown-linux-gnu"

; Instrumentation is expected to emit the raw-version variable and a private
; name constant for the function (15 bytes: "test_nested_for").
; GEN: $__llvm_profile_raw_version = comdat any
; GEN: @__llvm_profile_raw_version = constant i64 {{[0-9]+}}, comdat
; GEN: @__profn_test_nested_for = private constant [15 x i8] c"test_nested_for"

; Nested loop under test: the outer loop runs while %i.0 < %r, the inner loop
; runs while %j.0 < %s, and the running sum starts at 1 and is bumped once per
; inner-body execution. The function returns the sum as seen by the outer
; header (%sum.0).
;
; Expected instrumentation: exactly three counters (the i32 3 argument), placed
; in for.inc.inner (index 0), for.inc.outer (index 1) and for.end.outer
; (index 2). Every other block must stay free of counter increments.
define i32 @test_nested_for(i32 %r, i32 %s) {
entry:
; GEN: entry:
; GEN-NOT: call void @llvm.instrprof.increment
  br label %for.cond.outer

; Outer loop header: carries the outer induction variable and the running sum.
for.cond.outer:
; GEN: for.cond.outer:
; GEN-NOT: call void @llvm.instrprof.increment
  %i.0 = phi i32 [ 0, %entry ], [ %inc.2, %for.inc.outer ]
  %sum.0 = phi i32 [ 1, %entry ], [ %sum.1, %for.inc.outer ]
  %cmp = icmp slt i32 %i.0, %r
  br i1 %cmp, label %for.body.outer, label %for.end.outer
; USE: br i1 %cmp, label %for.body.outer, label %for.end.outer
; USE-SAME: !prof ![[BW_FOR_COND_OUTER:[0-9]+]]

for.body.outer:
; GEN: for.body.outer:
; GEN-NOT: call void @llvm.instrprof.increment
  br label %for.cond.inner

; Inner loop header: carries the inner induction variable and the running sum.
for.cond.inner:
; GEN: for.cond.inner:
; GEN-NOT: call void @llvm.instrprof.increment
  %j.0 = phi i32 [ 0, %for.body.outer ], [ %inc.1, %for.inc.inner ]
  %sum.1 = phi i32 [ %sum.0, %for.body.outer ], [ %inc, %for.inc.inner ]
  %cmp2 = icmp slt i32 %j.0, %s
  br i1 %cmp2, label %for.body.inner, label %for.end.inner
; USE: br i1 %cmp2, label %for.body.inner, label %for.end.inner
; USE-SAME: !prof ![[BW_FOR_COND_INNER:[0-9]+]]

for.body.inner:
; GEN: for.body.inner:
; GEN-NOT: call void @llvm.instrprof.increment
  %inc = add nsw i32 %sum.1, 1
  br label %for.inc.inner

; Inner back-edge block: expected to hold counter index 0.
for.inc.inner:
; GEN: for.inc.inner:
; GEN: call void @llvm.instrprof.increment(i8* getelementptr inbounds ([15 x i8], [15 x i8]* @__profn_test_nested_for, i32 0, i32 0), i64 53929068288, i32 3, i32 0)
  %inc.1 = add nsw i32 %j.0, 1
  br label %for.cond.inner

for.end.inner:
; GEN: for.end.inner:
  br label %for.inc.outer

; Outer back-edge block: expected to hold counter index 1.
for.inc.outer:
; GEN: for.inc.outer:
; GEN: call void @llvm.instrprof.increment(i8* getelementptr inbounds ([15 x i8], [15 x i8]* @__profn_test_nested_for, i32 0, i32 0), i64 53929068288, i32 3, i32 1)
  %inc.2 = add nsw i32 %i.0, 1
  br label %for.cond.outer

; Function exit block: expected to hold counter index 2.
for.end.outer:
; GEN: for.end.outer:
; GEN: call void @llvm.instrprof.increment(i8* getelementptr inbounds ([15 x i8], [15 x i8]* @__profn_test_nested_for, i32 0, i32 0), i64 53929068288, i32 3, i32 2)
  ret i32 %sum.0
}

; Branch weights the annotation step is expected to attach to the two loop
; header branches; the concrete numbers derive from Inputs/loop2.proftext.
; USE-DAG: ![[BW_FOR_COND_OUTER]] = !{!"branch_weights", i32 10, i32 6}
; USE-DAG: ![[BW_FOR_COND_INNER]] = !{!"branch_weights", i32 33, i32 10}