1; RUN: llc < %s -asm-verbose=false -disable-wasm-fallthrough-return-opt | FileCheck %s 2 3target datalayout = "e-m:e-p:32:32-i64:64-n32:64-S128" 4target triple = "wasm32-unknown-unknown" 5 6declare void @ext_func(i64* %ptr) 7declare void @ext_func_i32(i32* %ptr) 8 9; CHECK-LABEL: alloca32: 10; Check that there is an extra local for the stack pointer. 11; CHECK: .local i32{{$}} 12define void @alloca32() noredzone { 13 ; CHECK-NEXT: get_global $push[[L2:.+]]=, __stack_pointer{{$}} 14 ; CHECK-NEXT: i32.const $push[[L3:.+]]=, 16 15 ; CHECK-NEXT: i32.sub $push[[L9:.+]]=, $pop[[L2]], $pop[[L3]] 16 ; CHECK-NEXT: tee_local $push[[L8:.+]]=, [[SP:.+]], $pop[[L9]]{{$}} 17 ; CHECK-NEXT: set_global __stack_pointer, $pop[[L8]]{{$}} 18 %retval = alloca i32 19 ; CHECK: get_local $push[[L4:.+]]=, [[SP]]{{$}} 20 ; CHECK: i32.const $push[[L0:.+]]=, 0 21 ; CHECK: i32.store 12($pop[[L4]]), $pop[[L0]] 22 store i32 0, i32* %retval 23 ; CHECK: get_local $push[[L6:.+]]=, [[SP]]{{$}} 24 ; CHECK-NEXT: i32.const $push[[L5:.+]]=, 16 25 ; CHECK-NEXT: i32.add $push[[L7:.+]]=, $pop[[L6]], $pop[[L5]] 26 ; CHECK-NEXT: set_global __stack_pointer, $pop[[L7]] 27 ret void 28} 29 30; CHECK-LABEL: alloca3264: 31; CHECK: .local i32{{$}} 32define void @alloca3264() { 33 ; CHECK: get_global $push[[L3:.+]]=, __stack_pointer{{$}} 34 ; CHECK-NEXT: i32.const $push[[L4:.+]]=, 16 35 ; CHECK-NEXT: i32.sub $push[[L6:.+]]=, $pop[[L3]], $pop[[L4]] 36 ; CHECK-NEXT: tee_local $push[[L5:.+]]=, [[SP:.+]], $pop[[L6]] 37 %r1 = alloca i32 38 %r2 = alloca double 39 store i32 0, i32* %r1 40 store double 0.0, double* %r2 41 ; CHECK-NEXT: i64.const $push[[L1:.+]]=, 0 42 ; CHECK-NEXT: i64.store 0($pop[[L5]]), $pop[[L1]] 43 ; CHECK-NEXT: get_local $push[[L2:.+]]=, [[SP]]{{$}} 44 ; CHECK-NEXT: i32.const $push[[L0:.+]]=, 0 45 ; CHECK-NEXT: i32.store 12($pop[[L2]]), $pop[[L0]] 46 ; CHECK-NEXT: return 47 ret void 48} 49 50; CHECK-LABEL: allocarray: 51; CHECK: .local i32{{$}} 52define void @allocarray() { 53 ; CHECK-NEXT: get_global $push[[L4:.+]]=, __stack_pointer{{$}} 54 ; CHECK-NEXT: i32.const $push[[L5:.+]]=, 144{{$}} 55 ; CHECK-NEXT: i32.sub $push[[L12:.+]]=, $pop[[L4]], $pop[[L5]] 56 ; CHECK-NEXT: tee_local $push[[L11:.+]]=, 0, $pop[[L12]] 57 ; CHECK-NEXT: set_global __stack_pointer, $pop[[L11]] 58 %r = alloca [33 x i32] 59 60 ; CHECK: i32.const $push{{.+}}=, 24 61 ; CHECK-NEXT: i32.add $push[[L3:.+]]=, $pop{{.+}}, $pop{{.+}} 62 ; CHECK-NEXT: i32.const $push[[L1:.+]]=, 1{{$}} 63 ; CHECK-NEXT: i32.store 0($pop[[L3]]), $pop[[L1]]{{$}} 64 ; CHECK-NEXT: get_local $push[[L4:.+]]=, 0{{$}} 65 ; CHECK-NEXT: i32.const $push[[L10:.+]]=, 1{{$}} 66 ; CHECK-NEXT: i32.store 12($pop[[L4]]), $pop[[L10]]{{$}} 67 %p = getelementptr [33 x i32], [33 x i32]* %r, i32 0, i32 0 68 store i32 1, i32* %p 69 %p2 = getelementptr [33 x i32], [33 x i32]* %r, i32 0, i32 3 70 store i32 1, i32* %p2 71 72 ; CHECK-NEXT: get_local $push[[L2:.+]]=, [[SP]]{{$}} 73 ; CHECK-NEXT: i32.const $push[[L7:.+]]=, 144 74 ; CHECK-NEXT: i32.add $push[[L8:.+]]=, $pop[[L2]], $pop[[L7]] 75 ; CHECK-NEXT: set_global __stack_pointer, $pop[[L8]] 76 ret void 77} 78 79; CHECK-LABEL: non_mem_use 80define void @non_mem_use(i8** %addr) { 81 ; CHECK: i32.const $push[[L2:.+]]=, 48 82 ; CHECK-NEXT: i32.sub $push[[L12:.+]]=, {{.+}}, $pop[[L2]] 83 ; CHECK-NEXT: tee_local $push[[L11:.+]]=, [[SP:.+]], $pop[[L12]] 84 ; CHECK-NEXT: set_global __stack_pointer, $pop[[L11]] 85 %buf = alloca [27 x i8], align 16 86 %r = alloca i64 87 %r2 = alloca i64 88 ; %r is at SP+8 89 ; CHECK: get_local $push[[L3:.+]]=, [[SP]] 90 ; CHECK: i32.const $push[[OFF:.+]]=, 8 91 ; CHECK-NEXT: i32.add $push[[ARG1:.+]]=, $pop[[L3]], $pop[[OFF]] 92 ; CHECK-NEXT: call ext_func@FUNCTION, $pop[[ARG1]] 93 call void @ext_func(i64* %r) 94 ; %r2 is at SP+0, no add needed 95 ; CHECK: get_local $push[[L4:.+]]=, [[SP]] 96 ; CHECK-NEXT: call ext_func@FUNCTION, $pop[[L4]] 97 call void @ext_func(i64* %r2) 98 ; Use as a value, but in a store 99 ; %buf is at SP+16 100 ; CHECK: get_local $push[[L5:.+]]=, [[SP]] 101 ; CHECK: i32.const $push[[OFF:.+]]=, 16 102 ; CHECK-NEXT: i32.add $push[[VAL:.+]]=, $pop[[L5]], $pop[[OFF]] 103 ; CHECK-NEXT: i32.store 0($pop{{.+}}), $pop[[VAL]] 104 %gep = getelementptr inbounds [27 x i8], [27 x i8]* %buf, i32 0, i32 0 105 store i8* %gep, i8** %addr 106 ret void 107} 108 109; CHECK-LABEL: allocarray_inbounds: 110; CHECK: .local i32{{$}} 111define void @allocarray_inbounds() { 112 ; CHECK: get_global $push[[L3:.+]]=, __stack_pointer{{$}} 113 ; CHECK-NEXT: i32.const $push[[L4:.+]]=, 32{{$}} 114 ; CHECK-NEXT: i32.sub $push[[L11:.+]]=, $pop[[L3]], $pop[[L4]] 115 ; CHECK-NEXT: tee_local $push[[L10:.+]]=, [[SP:.+]], $pop[[L11]] 116 ; CHECK-NEXT: set_global __stack_pointer, $pop[[L10]]{{$}} 117 %r = alloca [5 x i32] 118 ; CHECK: i32.const $push[[L3:.+]]=, 1 119 ; CHECK-DAG: i32.store 24(${{.+}}), $pop[[L3]] 120 %p = getelementptr inbounds [5 x i32], [5 x i32]* %r, i32 0, i32 0 121 store i32 1, i32* %p 122 ; This store should have both the GEP and the FI folded into it. 123 ; CHECK-DAG: i32.store 12(${{.+}}), $pop 124 %p2 = getelementptr inbounds [5 x i32], [5 x i32]* %r, i32 0, i32 3 125 store i32 1, i32* %p2 126 call void @ext_func(i64* null); 127 ; CHECK: call ext_func 128 ; CHECK: i32.const $push[[L5:.+]]=, 32{{$}} 129 ; CHECK-NEXT: i32.add $push[[L7:.+]]=, ${{.+}}, $pop[[L5]] 130 ; CHECK-NEXT: set_global __stack_pointer, $pop[[L7]] 131 ret void 132} 133 134; CHECK-LABEL: dynamic_alloca: 135define void @dynamic_alloca(i32 %alloc) { 136 ; CHECK: get_global $push[[L13:.+]]=, __stack_pointer{{$}} 137 ; CHECK-NEXT: tee_local $push[[L12:.+]]=, [[SP:.+]], $pop[[L13]]{{$}} 138 ; Target independent codegen bumps the stack pointer. 139 ; CHECK: i32.sub 140 ; Check that SP is written back to memory after decrement 141 ; CHECK: set_global __stack_pointer, 142 %r = alloca i32, i32 %alloc 143 ; Target-independent codegen also calculates the store addr 144 ; CHECK: call ext_func_i32@FUNCTION 145 call void @ext_func_i32(i32* %r) 146 ; CHECK: set_global __stack_pointer, $pop{{.+}} 147 ret void 148} 149 150; CHECK-LABEL: dynamic_alloca_redzone: 151define void @dynamic_alloca_redzone(i32 %alloc) { 152 ; CHECK: get_global $push[[L13:.+]]=, __stack_pointer{{$}} 153 ; CHECK-NEXT: tee_local $push[[L12:.+]]=, [[SP:.+]], $pop[[L13]]{{$}} 154 ; Target independent codegen bumps the stack pointer 155 ; CHECK: i32.sub 156 %r = alloca i32, i32 %alloc 157 ; CHECK-NEXT: tee_local $push[[L8:.+]]=, {{.+}}, $pop 158 ; CHECK: get_local $push[[L7:.+]]=, 0{{$}} 159 ; CHECK-NEXT: i32.const $push[[L6:.+]]=, 0{{$}} 160 ; CHECK-NEXT: i32.store 0($pop[[L7]]), $pop[[L6]]{{$}} 161 store i32 0, i32* %r 162 ; CHECK-NEXT: return 163 ret void 164} 165 166; CHECK-LABEL: dynamic_static_alloca: 167define void @dynamic_static_alloca(i32 %alloc) noredzone { 168 ; Decrement SP in the prolog by the static amount and writeback to memory. 169 ; CHECK: get_global $push[[L11:.+]]=, __stack_pointer{{$}} 170 ; CHECK-NEXT: i32.const $push[[L12:.+]]=, 16 171 ; CHECK-NEXT: i32.sub $push[[L23:.+]]=, $pop[[L11]], $pop[[L12]] 172 ; CHECK-NEXT: tee_local $push[[L22:.+]]=, [[SP:.+]], $pop[[L23]] 173 ; CHECK-NEXT: set_global __stack_pointer, $pop[[L22]] 174 175 ; Alloc and write to a static alloca 176 ; CHECK: get_local $push[[L21:.+]]=, [[SP:.+]] 177 ; CHECK-NEXT: tee_local $push[[pushedFP:.+]]=, [[FP:.+]], $pop[[L21]] 178 ; CHECK-NEXT: i32.const $push[[L0:.+]]=, 101 179 ; CHECK-NEXT: i32.store [[static_offset:.+]]($pop[[pushedFP]]), $pop[[L0]] 180 %static = alloca i32 181 store volatile i32 101, i32* %static 182 183 ; Decrement SP in the body by the dynamic amount. 184 ; CHECK: i32.sub 185 ; CHECK: tee_local $push[[L16:.+]]=, [[dynamic_local:.+]], $pop{{.+}} 186 ; CHECK: tee_local $push[[L15:.+]]=, [[other:.+]], $pop[[L16]]{{$}} 187 ; CHECK: set_global __stack_pointer, $pop[[L15]]{{$}} 188 %dynamic = alloca i32, i32 %alloc 189 190 ; Ensure we don't modify the frame pointer after assigning it. 191 ; CHECK-NOT: $[[FP]]= 192 193 ; Ensure the static address doesn't change after modifying the stack pointer. 194 ; CHECK: get_local $push[[L17:.+]]=, [[FP]] 195 ; CHECK: i32.const $push[[L7:.+]]=, 102 196 ; CHECK-NEXT: i32.store [[static_offset]]($pop[[L17]]), $pop[[L7]] 197 ; CHECK-NEXT: get_local $push[[L9:.+]]=, [[dynamic_local]]{{$}} 198 ; CHECK-NEXT: i32.const $push[[L8:.+]]=, 103 199 ; CHECK-NEXT: i32.store 0($pop[[L9]]), $pop[[L8]] 200 store volatile i32 102, i32* %static 201 store volatile i32 103, i32* %dynamic 202 203 ; Decrement SP in the body by the dynamic amount. 204 ; CHECK: i32.sub 205 ; CHECK: tee_local $push{{.+}}=, [[dynamic2_local:.+]], $pop{{.+}} 206 %dynamic.2 = alloca i32, i32 %alloc 207 208 ; CHECK-NOT: $[[FP]]= 209 210 ; Ensure neither the static nor dynamic address changes after the second 211 ; modification of the stack pointer. 212 ; CHECK: get_local $push[[L22:.+]]=, [[FP]] 213 ; CHECK: i32.const $push[[L9:.+]]=, 104 214 ; CHECK-NEXT: i32.store [[static_offset]]($pop[[L22]]), $pop[[L9]] 215 ; CHECK-NEXT: get_local $push[[L23:.+]]=, [[dynamic_local]] 216 ; CHECK-NEXT: i32.const $push[[L10:.+]]=, 105 217 ; CHECK-NEXT: i32.store 0($pop[[L23]]), $pop[[L10]] 218 ; CHECK-NEXT: get_local $push[[L23:.+]]=, [[dynamic2_local]] 219 ; CHECK-NEXT: i32.const $push[[L11:.+]]=, 106 220 ; CHECK-NEXT: i32.store 0($pop[[L23]]), $pop[[L11]] 221 store volatile i32 104, i32* %static 222 store volatile i32 105, i32* %dynamic 223 store volatile i32 106, i32* %dynamic.2 224 225 ; Writeback to memory. 226 ; CHECK: get_local $push[[L24:.+]]=, [[FP]]{{$}} 227 ; CHECK: i32.const $push[[L18:.+]]=, 16 228 ; CHECK-NEXT: i32.add $push[[L19:.+]]=, $pop[[L24]], $pop[[L18]] 229 ; CHECK-NEXT: set_global __stack_pointer, $pop[[L19]] 230 ret void 231} 232 233declare i8* @llvm.stacksave() 234declare void @llvm.stackrestore(i8*) 235 236; CHECK-LABEL: llvm_stack_builtins: 237define void @llvm_stack_builtins(i32 %alloc) noredzone { 238 ; CHECK: get_global $push[[L11:.+]]=, __stack_pointer{{$}} 239 ; CHECK-NEXT: tee_local $push[[L10:.+]]=, {{.+}}, $pop[[L11]] 240 ; CHECK-NEXT: set_local [[STACK:.+]], $pop[[L10]] 241 %stack = call i8* @llvm.stacksave() 242 243 ; Ensure we don't reassign the stacksave local 244 ; CHECK-NOT: set_local [[STACK]], 245 %dynamic = alloca i32, i32 %alloc 246 247 ; CHECK: get_local $push[[L12:.+]]=, [[STACK]] 248 ; CHECK-NEXT: set_global __stack_pointer, $pop[[L12]] 249 call void @llvm.stackrestore(i8* %stack) 250 251 ret void 252} 253 254; Not actually using the alloca'd variables exposed an issue with register 255; stackification, where copying the stack pointer into the frame pointer was 256; moved after the stack pointer was updated for the dynamic alloca. 257; CHECK-LABEL: dynamic_alloca_nouse: 258define void @dynamic_alloca_nouse(i32 %alloc) noredzone { 259 ; CHECK: get_global $push[[L11:.+]]=, __stack_pointer{{$}} 260 ; CHECK-NEXT: tee_local $push[[L10:.+]]=, {{.+}}, $pop[[L11]] 261 ; CHECK-NEXT: set_local [[FP:.+]], $pop[[L10]] 262 %dynamic = alloca i32, i32 %alloc 263 264 ; CHECK-NOT: set_local [[FP]], 265 266 ; CHECK: get_local $push[[L12:.+]]=, [[FP]] 267 ; CHECK-NEXT: set_global __stack_pointer, $pop[[L12]] 268 ret void 269} 270 271; The use of the alloca in a phi causes a CopyToReg DAG node to be generated, 272; which has to have special handling because CopyToReg can't have a FI operand 273; CHECK-LABEL: copytoreg_fi: 274define void @copytoreg_fi(i1 %cond, i32* %b) { 275entry: 276 ; CHECK: i32.const $push[[L1:.+]]=, 16 277 ; CHECK-NEXT: i32.sub $push[[L3:.+]]=, {{.+}}, $pop[[L1]] 278 %addr = alloca i32 279 ; CHECK: i32.const $push[[OFF:.+]]=, 12 280 ; CHECK-NEXT: i32.add $push[[ADDR:.+]]=, $pop[[L3]], $pop[[OFF]] 281 ; CHECK-NEXT: set_local [[COPY:.+]], $pop[[ADDR]] 282 br label %body 283body: 284 %a = phi i32* [%addr, %entry], [%b, %body] 285 store i32 1, i32* %a 286 ; CHECK: get_local $push[[L12:.+]]=, [[COPY]] 287 ; CHECK: i32.store 0($pop[[L12]]), 288 br i1 %cond, label %body, label %exit 289exit: 290 ret void 291} 292 293declare void @use_i8_star(i8*) 294declare i8* @llvm.frameaddress(i32) 295 296; Test __builtin_frame_address(0). 297; CHECK-LABEL: frameaddress_0: 298; CHECK: get_global $push[[L3:.+]]=, __stack_pointer{{$}} 299; CHECK-NEXT: tee_local $push[[L2:.+]]=, [[FP:.+]], $pop[[L3]]{{$}} 300; CHECK-NEXT: call use_i8_star@FUNCTION, $pop[[L2]] 301; CHECK-NEXT: get_local $push[[L5:.+]]=, [[FP]] 302; CHECK-NEXT: set_global __stack_pointer, $pop[[L5]] 303define void @frameaddress_0() { 304 %t = call i8* @llvm.frameaddress(i32 0) 305 call void @use_i8_star(i8* %t) 306 ret void 307} 308 309; Test __builtin_frame_address(1). 310 311; CHECK-LABEL: frameaddress_1: 312; CHECK-NEXT: i32.const $push0=, 0{{$}} 313; CHECK-NEXT: call use_i8_star@FUNCTION, $pop0{{$}} 314; CHECK-NEXT: return{{$}} 315define void @frameaddress_1() { 316 %t = call i8* @llvm.frameaddress(i32 1) 317 call void @use_i8_star(i8* %t) 318 ret void 319} 320 321; Test a stack address passed to an inline asm. 322; CHECK-LABEL: inline_asm: 323; CHECK: get_global {{.+}}, __stack_pointer{{$}} 324; CHECK: #APP 325; CHECK-NEXT: # %{{[0-9]+}}{{$}} 326; CHECK-NEXT: #NO_APP 327define void @inline_asm() { 328 %tmp = alloca i8 329 call void asm sideeffect "# %0", "r"(i8* %tmp) 330 ret void 331} 332 333; TODO: test over-aligned alloca 334