1; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
2; RUN: opt < %s -force-vector-width=2 -force-vector-interleave=1 -loop-vectorize -S | FileCheck %s
3
4; Test case for PR44488. Checks that the correct predicates are created for
5; branches where true and false successors are equal. See the checks involving
6; CMP1 and CMP2.
7
8@v_38 = global i16 12061, align 1
9@v_39 = global i16 11333, align 1
10
11define i16 @test_true_and_false_branch_equal() {
12; CHECK-LABEL: @test_true_and_false_branch_equal(
13; CHECK-NEXT:  entry:
14; CHECK-NEXT:    br i1 false, label [[SCALAR_PH:%.*]], label [[VECTOR_PH:%.*]]
15; CHECK:       vector.ph:
16; CHECK-NEXT:    br label [[VECTOR_BODY:%.*]]
17; CHECK:       vector.body:
18; CHECK-NEXT:    [[INDEX:%.*]] = phi i32 [ 0, [[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], [[PRED_SREM_CONTINUE4:%.*]] ]
19; CHECK-NEXT:    [[TMP0:%.*]] = trunc i32 [[INDEX]] to i16
20; CHECK-NEXT:    [[OFFSET_IDX:%.*]] = add i16 99, [[TMP0]]
21; CHECK-NEXT:    [[BROADCAST_SPLATINSERT:%.*]] = insertelement <2 x i16> undef, i16 [[OFFSET_IDX]], i32 0
22; CHECK-NEXT:    [[BROADCAST_SPLAT:%.*]] = shufflevector <2 x i16> [[BROADCAST_SPLATINSERT]], <2 x i16> undef, <2 x i32> zeroinitializer
23; CHECK-NEXT:    [[INDUCTION:%.*]] = add <2 x i16> [[BROADCAST_SPLAT]], <i16 0, i16 1>
24; CHECK-NEXT:    [[TMP1:%.*]] = add i16 [[OFFSET_IDX]], 0
25; CHECK-NEXT:    [[TMP2:%.*]] = load i16, i16* @v_38, align 1
26; CHECK-NEXT:    [[BROADCAST_SPLATINSERT1:%.*]] = insertelement <2 x i16> undef, i16 [[TMP2]], i32 0
27; CHECK-NEXT:    [[BROADCAST_SPLAT2:%.*]] = shufflevector <2 x i16> [[BROADCAST_SPLATINSERT1]], <2 x i16> undef, <2 x i32> zeroinitializer
28; CHECK-NEXT:    [[TMP3:%.*]] = icmp eq <2 x i16> [[BROADCAST_SPLAT2]], <i16 32767, i16 32767>
29; CHECK-NEXT:    [[TMP4:%.*]] = icmp eq <2 x i16> [[BROADCAST_SPLAT2]], zeroinitializer
30; CHECK-NEXT:    [[TMP5:%.*]] = xor <2 x i1> [[TMP4]], <i1 true, i1 true>
31; CHECK-NEXT:    [[TMP6:%.*]] = extractelement <2 x i1> [[TMP5]], i32 0
32; CHECK-NEXT:    br i1 [[TMP6]], label [[PRED_SREM_IF:%.*]], label [[PRED_SREM_CONTINUE:%.*]]
33; CHECK:       pred.srem.if:
34; CHECK-NEXT:    [[TMP7:%.*]] = srem i16 5786, [[TMP2]]
35; CHECK-NEXT:    [[TMP8:%.*]] = insertelement <2 x i16> undef, i16 [[TMP7]], i32 0
36; CHECK-NEXT:    br label [[PRED_SREM_CONTINUE]]
37; CHECK:       pred.srem.continue:
38; CHECK-NEXT:    [[TMP9:%.*]] = phi <2 x i16> [ undef, [[VECTOR_BODY]] ], [ [[TMP8]], [[PRED_SREM_IF]] ]
39; CHECK-NEXT:    [[TMP10:%.*]] = extractelement <2 x i1> [[TMP5]], i32 1
40; CHECK-NEXT:    br i1 [[TMP10]], label [[PRED_SREM_IF3:%.*]], label [[PRED_SREM_CONTINUE4]]
41; CHECK:       pred.srem.if3:
42; CHECK-NEXT:    [[TMP11:%.*]] = srem i16 5786, [[TMP2]]
43; CHECK-NEXT:    [[TMP12:%.*]] = insertelement <2 x i16> [[TMP9]], i16 [[TMP11]], i32 1
44; CHECK-NEXT:    br label [[PRED_SREM_CONTINUE4]]
45; CHECK:       pred.srem.continue4:
46; CHECK-NEXT:    [[TMP13:%.*]] = phi <2 x i16> [ [[TMP9]], [[PRED_SREM_CONTINUE]] ], [ [[TMP12]], [[PRED_SREM_IF3]] ]
47; CHECK-NEXT:    [[PREDPHI:%.*]] = select <2 x i1> [[TMP4]], <2 x i16> <i16 5786, i16 5786>, <2 x i16> [[TMP13]]
48; CHECK-NEXT:    [[TMP14:%.*]] = extractelement <2 x i16> [[PREDPHI]], i32 0
49; CHECK-NEXT:    store i16 [[TMP14]], i16* @v_39, align 1
50; CHECK-NEXT:    [[TMP15:%.*]] = extractelement <2 x i16> [[PREDPHI]], i32 1
51; CHECK-NEXT:    store i16 [[TMP15]], i16* @v_39, align 1
52; CHECK-NEXT:    [[INDEX_NEXT]] = add i32 [[INDEX]], 2
53; CHECK-NEXT:    [[TMP16:%.*]] = icmp eq i32 [[INDEX_NEXT]], 12
54; CHECK-NEXT:    br i1 [[TMP16]], label [[MIDDLE_BLOCK:%.*]], label [[VECTOR_BODY]], [[LOOP0:!llvm.loop !.*]]
55; CHECK:       middle.block:
56; CHECK-NEXT:    [[CMP_N:%.*]] = icmp eq i32 12, 12
57; CHECK-NEXT:    br i1 [[CMP_N]], label [[EXIT:%.*]], label [[SCALAR_PH]]
58; CHECK:       scalar.ph:
59; CHECK-NEXT:    [[BC_RESUME_VAL:%.*]] = phi i16 [ 111, [[MIDDLE_BLOCK]] ], [ 99, [[ENTRY:%.*]] ]
60; CHECK-NEXT:    br label [[FOR_BODY:%.*]]
61; CHECK:       for.body:
62; CHECK-NEXT:    [[I_07:%.*]] = phi i16 [ [[BC_RESUME_VAL]], [[SCALAR_PH]] ], [ [[INC7:%.*]], [[FOR_LATCH:%.*]] ]
63; CHECK-NEXT:    [[LV:%.*]] = load i16, i16* @v_38, align 1
64; CHECK-NEXT:    [[CMP1:%.*]] = icmp eq i16 [[LV]], 32767
65; CHECK-NEXT:    br i1 [[CMP1]], label [[COND_END:%.*]], label [[COND_END]]
66; CHECK:       cond.end:
67; CHECK-NEXT:    [[CMP2:%.*]] = icmp eq i16 [[LV]], 0
68; CHECK-NEXT:    br i1 [[CMP2]], label [[FOR_LATCH]], label [[COND_FALSE4:%.*]]
69; CHECK:       cond.false4:
70; CHECK-NEXT:    [[REM:%.*]] = srem i16 5786, [[LV]]
71; CHECK-NEXT:    br label [[FOR_LATCH]]
72; CHECK:       for.latch:
73; CHECK-NEXT:    [[COND6:%.*]] = phi i16 [ [[REM]], [[COND_FALSE4]] ], [ 5786, [[COND_END]] ]
74; CHECK-NEXT:    store i16 [[COND6]], i16* @v_39, align 1
75; CHECK-NEXT:    [[INC7]] = add nsw i16 [[I_07]], 1
76; CHECK-NEXT:    [[CMP:%.*]] = icmp slt i16 [[INC7]], 111
77; CHECK-NEXT:    br i1 [[CMP]], label [[FOR_BODY]], label [[EXIT]], [[LOOP2:!llvm.loop !.*]]
78; CHECK:       exit:
79; CHECK-NEXT:    [[RV:%.*]] = load i16, i16* @v_39, align 1
80; CHECK-NEXT:    ret i16 [[RV]]
81;
82entry:
83  br label %for.body
84
85for.body:                                         ; preds = %entry, %for.latch
86  %i.07 = phi i16 [ 99, %entry ], [ %inc7, %for.latch ]
87  %lv = load i16, i16* @v_38, align 1
88  %cmp1 = icmp eq i16 %lv, 32767
89  br i1 %cmp1, label %cond.end, label %cond.end
90
91cond.end:                                         ; preds = %for.body, %for.body
92  %cmp2 = icmp eq i16 %lv, 0
93  br i1 %cmp2, label %for.latch, label %cond.false4
94
95cond.false4:                                      ; preds = %cond.end
96  %rem = srem i16 5786, %lv
97  br label %for.latch
98
99for.latch:                                        ; preds = %cond.end, %cond.false4
100  %cond6 = phi i16 [ %rem, %cond.false4 ], [ 5786, %cond.end ]
101  store i16 %cond6, i16* @v_39, align 1
102  %inc7 = add nsw i16 %i.07, 1
103  %cmp = icmp slt i16 %inc7, 111
104  br i1 %cmp, label %for.body, label %exit
105
106exit:                                 ; preds = %for.latch
107  %rv = load i16, i16* @v_39, align 1
108  ret i16 %rv
109}
110