summaryrefslogtreecommitdiff
path: root/test/CodeGen/PowerPC/licm-remat.ll
blob: f9c1405245210ee079344a6f7621d29ecfb4dff3 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
; RUN: llc -verify-machineinstrs -ppc-reduce-cr-logicals \
; RUN:   -mtriple=powerpc64le-unknown-linux-gnu < %s | FileCheck %s

; Test case is reduced from the snappy benchmark.
; Verify MachineLICM will always hoist trivially rematerializable instructions even when register pressure is high.

%"class.snappy::SnappyDecompressor" = type <{ %"class.snappy::Source"*, i8*, i8*, i32, i8, [5 x i8], [6 x i8] }>
%"class.snappy::Source" = type { i32 (...)** }
%"struct.snappy::iovec" = type { i8*, i64 }
%"class.snappy::SnappyIOVecWriter" = type { %"struct.snappy::iovec"*, i64, i64, i64, i64, i64 }

@_ZN6snappy8internalL10char_tableE = internal unnamed_addr constant [5 x i16] [i16 1, i16 2052, i16 4097, i16 8193, i16 2], align 2
@_ZN6snappy8internalL8wordmaskE = internal unnamed_addr constant [5 x i32] [i32 0, i32 255, i32 65535, i32 16777215, i32 -1], align 4

; Function Attrs: argmemonly nounwind
declare void @llvm.memmove.p0i8.p0i8.i64(i8* nocapture, i8* nocapture readonly, i64, i32, i1) #2
; Function Attrs: argmemonly nounwind
declare void @llvm.memcpy.p0i8.p0i8.i64(i8* nocapture writeonly, i8* nocapture readonly, i64, i32, i1) #2

define linkonce_odr void @ZN6snappyDecompressor_(%"class.snappy::SnappyDecompressor"* %this, %"class.snappy::SnappyIOVecWriter"* %writer) {
; CHECK-LABEL: ZN6snappyDecompressor_:
; CHECK:       # %bb.0: # %entry
; CHECK:       addis 3, 2, _ZN6snappy8internalL8wordmaskE@toc@ha
; CHECK-DAG:   addi 25, 3, _ZN6snappy8internalL8wordmaskE@toc@l
; CHECK-DAG:   addis 5, 2, _ZN6snappy8internalL10char_tableE@toc@ha
; CHECK-DAG:   addi 24, 5, _ZN6snappy8internalL10char_tableE@toc@l
; CHECK:       b .LBB0_2
; CHECK:       .LBB0_2: # %for.cond
; CHECK-NOT:   addis {{[0-9]+}}, 2, _ZN6snappy8internalL8wordmaskE@toc@ha
; CHECK-NOT:   addis {{[0-9]+}}, 2, _ZN6snappy8internalL10char_tableE@toc@ha
; CHECK:       bctrl
entry:
  %ip_limit_ = getelementptr inbounds %"class.snappy::SnappyDecompressor", %"class.snappy::SnappyDecompressor"* %this, i64 0, i32 2
  %0 = bitcast i8** %ip_limit_ to i64*
  %curr_iov_index_.i = getelementptr inbounds %"class.snappy::SnappyIOVecWriter", %"class.snappy::SnappyIOVecWriter"* %writer, i64 0, i32 2
  %curr_iov_written_.i = getelementptr inbounds %"class.snappy::SnappyIOVecWriter", %"class.snappy::SnappyIOVecWriter"* %writer, i64 0, i32 3
  %1 = bitcast i64* %curr_iov_written_.i to <2 x i64>*
  br label %for.cond

for.cond:                                         ; preds = %if.end82, %if.then56, %if.end49, %entry
  %ip.0 = phi i8* [ null, %entry ], [ %add.ptr50, %if.end49 ], [ null, %if.then56 ], [ undef, %if.end82 ]
  %incdec.ptr = getelementptr inbounds i8, i8* %ip.0, i64 1
  %2 = load i8, i8* %ip.0, align 1
  %conv = zext i8 %2 to i32
  br i1 undef, label %if.then7, label %if.else

if.then7:                                         ; preds = %for.cond
  %3 = lshr i32 %conv, 2
  %add = add nuw nsw i32 %3, 1
  %conv9 = zext i32 %add to i64
  %4 = load i64, i64* %0, align 8
  %sub.ptr.sub13 = sub i64 %4, 0
  %5 = load i64, i64* undef, align 8
  %6 = load i64, i64* null, align 8
  %sub.i = sub i64 %5, %6
  %cmp.i = icmp ult i32 %add, 17
  %cmp2.i = icmp ugt i64 %sub.ptr.sub13, 20
  %or.cond.i = and i1 %cmp.i, %cmp2.i
  %cmp4.i = icmp ugt i64 %sub.i, 15
  %or.cond13.i = and i1 %or.cond.i, %cmp4.i
  br i1 %or.cond13.i, label %land.lhs.true5.i, label %if.end17

land.lhs.true5.i:                                 ; preds = %if.then7
  %7 = load %"struct.snappy::iovec"*, %"struct.snappy::iovec"** undef, align 8
  %8 = load i64, i64* %curr_iov_index_.i, align 8
  %9 = load i64, i64* %curr_iov_written_.i, align 8
  %sub6.i = sub i64 0, %9
  %cmp7.i = icmp ugt i64 %sub6.i, 15
  br i1 %cmp7.i, label %cleanup102, label %if.end17

if.end17:                                         ; preds = %land.lhs.true5.i, %if.then7
  %sub = add nsw i64 %conv9, -60
  %10 = load i32, i32* undef, align 4
  %arrayidx = getelementptr inbounds [5 x i32], [5 x i32]* @_ZN6snappy8internalL8wordmaskE, i64 0, i64 %sub
  %11 = load i32, i32* %arrayidx, align 4
  %and21 = and i32 %11, %10
  %add22 = add i32 %and21, 1
  %conv23 = zext i32 %add22 to i64
  %add.ptr24 = getelementptr inbounds i8, i8* %incdec.ptr, i64 %sub
  br label %if.end25

if.end25:                                         ; preds = %if.end17
  %sub.ptr.rhs.cast28 = ptrtoint i8* %add.ptr24 to i64
  %cmp30233 = icmp ugt i64 %conv23, 0
  br i1 %cmp30233, label %while.body.preheader, label %while.end

while.body.preheader:                             ; preds = %if.end25
  %add.i158256 = add i64 %6, 0
  %cmp.i160257 = icmp ugt i64 %add.i158256, %5
  br i1 %cmp.i160257, label %cleanup105, label %while.cond.preheader.i

while.cond.preheader.i:                           ; preds = %while.body.preheader
  %call39 = call i8* undef(%"class.snappy::Source"* undef, i64* nonnull undef)
  unreachable

while.end:                                        ; preds = %if.end25
  br label %while.cond.preheader.i176

while.cond.preheader.i176:                        ; preds = %while.end
  br i1 undef, label %if.end49, label %while.body.lr.ph.i182

while.body.lr.ph.i182:                            ; preds = %while.cond.preheader.i176
  %.pre.i181 = load i64, i64* %curr_iov_written_.i, align 8
  %12 = load %"struct.snappy::iovec"*, %"struct.snappy::iovec"** undef, align 8
  %13 = load i64, i64* %curr_iov_index_.i, align 8
  %iov_len.i185 = getelementptr inbounds %"struct.snappy::iovec", %"struct.snappy::iovec"* %12, i64 %13, i32 1
  %14 = load i64, i64* %iov_len.i185, align 8
  br label %cond.end.i190

cond.end.i190:                                    ; preds = %while.body.lr.ph.i182
  br i1 undef, label %if.end18.i207, label %if.then10.i193

if.then10.i193:                                   ; preds = %cond.end.i190
  %add12.i191 = add i64 %13, 1
  %iov_len22.phi.trans.insert.i194 = getelementptr inbounds %"struct.snappy::iovec", %"struct.snappy::iovec"* %12, i64 %add12.i191, i32 1
  %.pre48.i195 = load i64, i64* %iov_len22.phi.trans.insert.i194, align 8
  br label %if.end18.i207

if.end18.i207:                                    ; preds = %if.then10.i193, %cond.end.i190
  %15 = phi i64 [ %.pre.i181, %cond.end.i190 ], [ 0, %if.then10.i193 ]
  %16 = phi i64 [ %14, %cond.end.i190 ], [ %.pre48.i195, %if.then10.i193 ]
  %17 = phi i64 [ %13, %cond.end.i190 ], [ %add12.i191, %if.then10.i193 ]
  %sub.i197 = sub i64 %16, %15
  %cmp.i.i198 = icmp ult i64 %sub.i197, %conv23
  %.sroa.speculated.i199 = select i1 %cmp.i.i198, i64 %sub.i197, i64 %conv23
  %iov_base.i.i200 = getelementptr inbounds %"struct.snappy::iovec", %"struct.snappy::iovec"* %12, i64 %17, i32 0
  %18 = load i8*, i8** %iov_base.i.i200, align 8
  %add.ptr.i.i201 = getelementptr inbounds i8, i8* %18, i64 %15
  call void @llvm.memcpy.p0i8.p0i8.i64(i8* %add.ptr.i.i201, i8* %add.ptr24, i64 %.sroa.speculated.i199, i32 1, i1 false) #12
  %add30.i203 = add i64 0, %.sroa.speculated.i199
  store i64 %add30.i203, i64* null, align 8
  %.pre245 = load i64, i64* %0, align 8
  br label %if.end49

if.end49:                                         ; preds = %if.end18.i207, %while.cond.preheader.i176
  %19 = phi i64 [ %.pre245, %if.end18.i207 ], [ %4, %while.cond.preheader.i176 ]
  %add.ptr50 = getelementptr inbounds i8, i8* %add.ptr24, i64 %conv23
  %sub.ptr.sub54 = sub i64 %19, 0
  %cmp55 = icmp slt i64 %sub.ptr.sub54, 5
  br i1 %cmp55, label %if.then56, label %for.cond

if.then56:                                        ; preds = %if.end49
  br label %for.cond

if.else:                                          ; preds = %for.cond
  %idxprom = zext i8 %2 to i64
  %arrayidx68 = getelementptr inbounds [5 x i16], [5 x i16]* @_ZN6snappy8internalL10char_tableE, i64 0, i64 %idxprom
  %20 = load i16, i16* %arrayidx68, align 2
  %conv69 = zext i16 %20 to i64
  %21 = load i32, i32* undef, align 4
  %shr71 = lshr i64 %conv69, 11
  %arrayidx72 = getelementptr inbounds [5 x i32], [5 x i32]* @_ZN6snappy8internalL8wordmaskE, i64 0, i64 %shr71
  %22 = load i32, i32* %arrayidx72, align 4
  %and73 = and i32 %22, %21
  %conv74 = zext i32 %and73 to i64
  %add79 = add nuw nsw i64 0, %conv74
  %call80 = call zeroext i1 @_ZN6snappy17SnappyIOVecWriterAppendFromSelfEmm(%"class.snappy::SnappyIOVecWriter"* %writer, i64 %add79, i64 undef)
  br i1 %call80, label %if.end82, label %cleanup105

if.end82:                                         ; preds = %if.else
  br label %for.cond

cleanup102:                                       ; preds = %land.lhs.true5.i
  %iov_base.i.i = getelementptr inbounds %"struct.snappy::iovec", %"struct.snappy::iovec"* %7, i64 %8, i32 0
  %23 = load i8*, i8** %iov_base.i.i, align 8
  %add.ptr.i.i = getelementptr inbounds i8, i8* %23, i64 %9
  call void @llvm.memmove.p0i8.p0i8.i64(i8* %add.ptr.i.i, i8* %incdec.ptr, i64 16, i32 1, i1 false) #12
  %24 = load <2 x i64>, <2 x i64>* %1, align 8
  %25 = insertelement <2 x i64> undef, i64 %conv9, i32 0
  %26 = shufflevector <2 x i64> %25, <2 x i64> undef, <2 x i32> zeroinitializer
  %27 = add <2 x i64> %24, %26
  store <2 x i64> %27, <2 x i64>* undef, align 8
  unreachable

cleanup105:                                       ; preds = %if.else, %while.body.preheader
  ret void
}

; Function Attrs: inlinehint
declare zeroext i1 @_ZN6snappy17SnappyIOVecWriterAppendFromSelfEmm(%"class.snappy::SnappyIOVecWriter"*, i64, i64) local_unnamed_addr #10 align 2