1; NOTE: Assertions have been autogenerated by utils/update_test_checks.py 2; RUN: opt < %s -basic-aa -dse -enable-dse-memoryssa=false -S | FileCheck %s 3target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64-S128" 4 5%struct.vec2 = type { <4 x i32>, <4 x i32> } 6%struct.vec2plusi = type { <4 x i32>, <4 x i32>, i32 } 7 8@glob1 = global %struct.vec2 zeroinitializer, align 16 9@glob2 = global %struct.vec2plusi zeroinitializer, align 16 10 11define void @write24to28(i32* nocapture %p) nounwind uwtable ssp { 12; CHECK-LABEL: @write24to28( 13; CHECK-NEXT: entry: 14; CHECK-NEXT: [[ARRAYIDX0:%.*]] = getelementptr inbounds i32, i32* [[P:%.*]], i64 1 15; CHECK-NEXT: [[P3:%.*]] = bitcast i32* [[ARRAYIDX0]] to i8* 16; CHECK-NEXT: call void @llvm.memset.p0i8.i64(i8* align 4 [[P3]], i8 0, i64 24, i1 false) 17; CHECK-NEXT: [[ARRAYIDX1:%.*]] = getelementptr inbounds i32, i32* [[P]], i64 7 18; CHECK-NEXT: store i32 1, i32* [[ARRAYIDX1]], align 4 19; CHECK-NEXT: ret void 20; 21entry: 22 %arrayidx0 = getelementptr inbounds i32, i32* %p, i64 1 23 %p3 = bitcast i32* %arrayidx0 to i8* 24 call void @llvm.memset.p0i8.i64(i8* align 4 %p3, i8 0, i64 28, i1 false) 25 %arrayidx1 = getelementptr inbounds i32, i32* %p, i64 7 26 store i32 1, i32* %arrayidx1, align 4 27 ret void 28} 29 30define void @write24to28_atomic(i32* nocapture %p) nounwind uwtable ssp { 31; CHECK-LABEL: @write24to28_atomic( 32; CHECK-NEXT: entry: 33; CHECK-NEXT: [[ARRAYIDX0:%.*]] = getelementptr inbounds i32, i32* [[P:%.*]], i64 1 34; CHECK-NEXT: [[P3:%.*]] = bitcast i32* [[ARRAYIDX0]] to i8* 35; CHECK-NEXT: call void @llvm.memset.element.unordered.atomic.p0i8.i64(i8* align 4 [[P3]], i8 0, i64 24, i32 4) 36; CHECK-NEXT: [[ARRAYIDX1:%.*]] = getelementptr inbounds i32, i32* [[P]], i64 7 37; CHECK-NEXT: store atomic i32 1, i32* [[ARRAYIDX1]] unordered, align 4 38; CHECK-NEXT: ret void 39; 40entry: 41 %arrayidx0 = getelementptr inbounds i32, i32* %p, i64 1 42 %p3 = bitcast i32* %arrayidx0 to i8* 43 call void @llvm.memset.element.unordered.atomic.p0i8.i64(i8* align 4 %p3, i8 0, i64 28, i32 4) 44 %arrayidx1 = getelementptr inbounds i32, i32* %p, i64 7 45 store atomic i32 1, i32* %arrayidx1 unordered, align 4 46 ret void 47} 48 49; Atomicity of the store is weaker from the memset 50define void @write24to28_atomic_weaker(i32* nocapture %p) nounwind uwtable ssp { 51; CHECK-LABEL: @write24to28_atomic_weaker( 52; CHECK-NEXT: entry: 53; CHECK-NEXT: [[ARRAYIDX0:%.*]] = getelementptr inbounds i32, i32* [[P:%.*]], i64 1 54; CHECK-NEXT: [[P3:%.*]] = bitcast i32* [[ARRAYIDX0]] to i8* 55; CHECK-NEXT: call void @llvm.memset.element.unordered.atomic.p0i8.i64(i8* align 4 [[P3]], i8 0, i64 24, i32 4) 56; CHECK-NEXT: [[ARRAYIDX1:%.*]] = getelementptr inbounds i32, i32* [[P]], i64 7 57; CHECK-NEXT: store i32 1, i32* [[ARRAYIDX1]], align 4 58; CHECK-NEXT: ret void 59; 60entry: 61 %arrayidx0 = getelementptr inbounds i32, i32* %p, i64 1 62 %p3 = bitcast i32* %arrayidx0 to i8* 63 call void @llvm.memset.element.unordered.atomic.p0i8.i64(i8* align 4 %p3, i8 0, i64 28, i32 4) 64 %arrayidx1 = getelementptr inbounds i32, i32* %p, i64 7 65 store i32 1, i32* %arrayidx1, align 4 66 ret void 67} 68 69define void @write28to32(i32* nocapture %p) nounwind uwtable ssp { 70; CHECK-LABEL: @write28to32( 71; CHECK-NEXT: entry: 72; CHECK-NEXT: [[P3:%.*]] = bitcast i32* [[P:%.*]] to i8* 73; CHECK-NEXT: call void @llvm.memset.p0i8.i64(i8* align 4 [[P3]], i8 0, i64 28, i1 false) 74; CHECK-NEXT: [[ARRAYIDX1:%.*]] = getelementptr inbounds i32, i32* [[P]], i64 7 75; CHECK-NEXT: store i32 1, i32* [[ARRAYIDX1]], align 4 76; CHECK-NEXT: ret void 77; 78entry: 79 %p3 = bitcast i32* %p to i8* 80 call void @llvm.memset.p0i8.i64(i8* align 4 %p3, i8 0, i64 32, i1 false) 81 %arrayidx1 = getelementptr inbounds i32, i32* %p, i64 7 82 store i32 1, i32* %arrayidx1, align 4 83 ret void 84} 85 86define void @write28to32_atomic(i32* nocapture %p) nounwind uwtable ssp { 87; CHECK-LABEL: @write28to32_atomic( 88; CHECK-NEXT: entry: 89; CHECK-NEXT: [[P3:%.*]] = bitcast i32* [[P:%.*]] to i8* 90; CHECK-NEXT: call void @llvm.memset.element.unordered.atomic.p0i8.i64(i8* align 4 [[P3]], i8 0, i64 28, i32 4) 91; CHECK-NEXT: [[ARRAYIDX1:%.*]] = getelementptr inbounds i32, i32* [[P]], i64 7 92; CHECK-NEXT: store atomic i32 1, i32* [[ARRAYIDX1]] unordered, align 4 93; CHECK-NEXT: ret void 94; 95entry: 96 %p3 = bitcast i32* %p to i8* 97 call void @llvm.memset.element.unordered.atomic.p0i8.i64(i8* align 4 %p3, i8 0, i64 32, i32 4) 98 %arrayidx1 = getelementptr inbounds i32, i32* %p, i64 7 99 store atomic i32 1, i32* %arrayidx1 unordered, align 4 100 ret void 101} 102 103define void @dontwrite28to32memset(i32* nocapture %p) nounwind uwtable ssp { 104; CHECK-LABEL: @dontwrite28to32memset( 105; CHECK-NEXT: entry: 106; CHECK-NEXT: [[P3:%.*]] = bitcast i32* [[P:%.*]] to i8* 107; CHECK-NEXT: call void @llvm.memset.p0i8.i64(i8* align 16 [[P3]], i8 0, i64 32, i1 false) 108; CHECK-NEXT: [[ARRAYIDX1:%.*]] = getelementptr inbounds i32, i32* [[P]], i64 7 109; CHECK-NEXT: store i32 1, i32* [[ARRAYIDX1]], align 4 110; CHECK-NEXT: ret void 111; 112entry: 113 %p3 = bitcast i32* %p to i8* 114 call void @llvm.memset.p0i8.i64(i8* align 16 %p3, i8 0, i64 32, i1 false) 115 %arrayidx1 = getelementptr inbounds i32, i32* %p, i64 7 116 store i32 1, i32* %arrayidx1, align 4 117 ret void 118} 119 120define void @dontwrite28to32memset_atomic(i32* nocapture %p) nounwind uwtable ssp { 121; CHECK-LABEL: @dontwrite28to32memset_atomic( 122; CHECK-NEXT: entry: 123; CHECK-NEXT: [[P3:%.*]] = bitcast i32* [[P:%.*]] to i8* 124; CHECK-NEXT: call void @llvm.memset.element.unordered.atomic.p0i8.i64(i8* align 16 [[P3]], i8 0, i64 32, i32 4) 125; CHECK-NEXT: [[ARRAYIDX1:%.*]] = getelementptr inbounds i32, i32* [[P]], i64 7 126; CHECK-NEXT: store atomic i32 1, i32* [[ARRAYIDX1]] unordered, align 4 127; CHECK-NEXT: ret void 128; 129entry: 130 %p3 = bitcast i32* %p to i8* 131 call void @llvm.memset.element.unordered.atomic.p0i8.i64(i8* align 16 %p3, i8 0, i64 32, i32 4) 132 %arrayidx1 = getelementptr inbounds i32, i32* %p, i64 7 133 store atomic i32 1, i32* %arrayidx1 unordered, align 4 134 ret void 135} 136 137define void @write32to36(%struct.vec2plusi* nocapture %p) nounwind uwtable ssp { 138; CHECK-LABEL: @write32to36( 139; CHECK-NEXT: entry: 140; CHECK-NEXT: [[TMP0:%.*]] = bitcast %struct.vec2plusi* [[P:%.*]] to i8* 141; CHECK-NEXT: tail call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 16 [[TMP0]], i8* align 16 bitcast (%struct.vec2plusi* @glob2 to i8*), i64 32, i1 false) 142; CHECK-NEXT: [[C:%.*]] = getelementptr inbounds [[STRUCT_VEC2PLUSI:%.*]], %struct.vec2plusi* [[P]], i64 0, i32 2 143; CHECK-NEXT: store i32 1, i32* [[C]], align 4 144; CHECK-NEXT: ret void 145; 146entry: 147 %0 = bitcast %struct.vec2plusi* %p to i8* 148 tail call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 16 %0, i8* align 16 bitcast (%struct.vec2plusi* @glob2 to i8*), i64 36, i1 false) 149 %c = getelementptr inbounds %struct.vec2plusi, %struct.vec2plusi* %p, i64 0, i32 2 150 store i32 1, i32* %c, align 4 151 ret void 152} 153 154define void @write32to36_atomic(%struct.vec2plusi* nocapture %p) nounwind uwtable ssp { 155; CHECK-LABEL: @write32to36_atomic( 156; CHECK-NEXT: entry: 157; CHECK-NEXT: [[TMP0:%.*]] = bitcast %struct.vec2plusi* [[P:%.*]] to i8* 158; CHECK-NEXT: tail call void @llvm.memcpy.element.unordered.atomic.p0i8.p0i8.i64(i8* align 16 [[TMP0]], i8* align 16 bitcast (%struct.vec2plusi* @glob2 to i8*), i64 32, i32 4) 159; CHECK-NEXT: [[C:%.*]] = getelementptr inbounds [[STRUCT_VEC2PLUSI:%.*]], %struct.vec2plusi* [[P]], i64 0, i32 2 160; CHECK-NEXT: store atomic i32 1, i32* [[C]] unordered, align 4 161; CHECK-NEXT: ret void 162; 163entry: 164 %0 = bitcast %struct.vec2plusi* %p to i8* 165 tail call void @llvm.memcpy.element.unordered.atomic.p0i8.p0i8.i64(i8* align 16 %0, i8* align 16 bitcast (%struct.vec2plusi* @glob2 to i8*), i64 36, i32 4) 166 %c = getelementptr inbounds %struct.vec2plusi, %struct.vec2plusi* %p, i64 0, i32 2 167 store atomic i32 1, i32* %c unordered, align 4 168 ret void 169} 170 171; Atomicity of the store is weaker than the memcpy 172define void @write32to36_atomic_weaker(%struct.vec2plusi* nocapture %p) nounwind uwtable ssp { 173; CHECK-LABEL: @write32to36_atomic_weaker( 174; CHECK-NEXT: entry: 175; CHECK-NEXT: [[TMP0:%.*]] = bitcast %struct.vec2plusi* [[P:%.*]] to i8* 176; CHECK-NEXT: tail call void @llvm.memcpy.element.unordered.atomic.p0i8.p0i8.i64(i8* align 16 [[TMP0]], i8* align 16 bitcast (%struct.vec2plusi* @glob2 to i8*), i64 32, i32 4) 177; CHECK-NEXT: [[C:%.*]] = getelementptr inbounds [[STRUCT_VEC2PLUSI:%.*]], %struct.vec2plusi* [[P]], i64 0, i32 2 178; CHECK-NEXT: store i32 1, i32* [[C]], align 4 179; CHECK-NEXT: ret void 180; 181entry: 182 %0 = bitcast %struct.vec2plusi* %p to i8* 183 tail call void @llvm.memcpy.element.unordered.atomic.p0i8.p0i8.i64(i8* align 16 %0, i8* align 16 bitcast (%struct.vec2plusi* @glob2 to i8*), i64 36, i32 4) 184 %c = getelementptr inbounds %struct.vec2plusi, %struct.vec2plusi* %p, i64 0, i32 2 185 store i32 1, i32* %c, align 4 186 ret void 187} 188 189define void @write16to32(%struct.vec2* nocapture %p) nounwind uwtable ssp { 190; CHECK-LABEL: @write16to32( 191; CHECK-NEXT: entry: 192; CHECK-NEXT: [[TMP0:%.*]] = bitcast %struct.vec2* [[P:%.*]] to i8* 193; CHECK-NEXT: tail call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 16 [[TMP0]], i8* align 16 bitcast (%struct.vec2* @glob1 to i8*), i64 16, i1 false) 194; CHECK-NEXT: [[C:%.*]] = getelementptr inbounds [[STRUCT_VEC2:%.*]], %struct.vec2* [[P]], i64 0, i32 1 195; CHECK-NEXT: store <4 x i32> <i32 1, i32 2, i32 3, i32 4>, <4 x i32>* [[C]], align 4 196; CHECK-NEXT: ret void 197; 198entry: 199 %0 = bitcast %struct.vec2* %p to i8* 200 tail call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 16 %0, i8* align 16 bitcast (%struct.vec2* @glob1 to i8*), i64 32, i1 false) 201 %c = getelementptr inbounds %struct.vec2, %struct.vec2* %p, i64 0, i32 1 202 store <4 x i32> <i32 1, i32 2, i32 3, i32 4>, <4 x i32>* %c, align 4 203 ret void 204} 205 206define void @write16to32_atomic(%struct.vec2* nocapture %p) nounwind uwtable ssp { 207; CHECK-LABEL: @write16to32_atomic( 208; CHECK-NEXT: entry: 209; CHECK-NEXT: [[TMP0:%.*]] = bitcast %struct.vec2* [[P:%.*]] to i8* 210; CHECK-NEXT: tail call void @llvm.memcpy.element.unordered.atomic.p0i8.p0i8.i64(i8* align 16 [[TMP0]], i8* align 16 bitcast (%struct.vec2* @glob1 to i8*), i64 16, i32 4) 211; CHECK-NEXT: [[C:%.*]] = getelementptr inbounds [[STRUCT_VEC2:%.*]], %struct.vec2* [[P]], i64 0, i32 1 212; CHECK-NEXT: store <4 x i32> <i32 1, i32 2, i32 3, i32 4>, <4 x i32>* [[C]], align 4 213; CHECK-NEXT: ret void 214; 215entry: 216 %0 = bitcast %struct.vec2* %p to i8* 217 tail call void @llvm.memcpy.element.unordered.atomic.p0i8.p0i8.i64(i8* align 16 %0, i8* align 16 bitcast (%struct.vec2* @glob1 to i8*), i64 32, i32 4) 218 %c = getelementptr inbounds %struct.vec2, %struct.vec2* %p, i64 0, i32 1 219 store <4 x i32> <i32 1, i32 2, i32 3, i32 4>, <4 x i32>* %c, align 4 220 ret void 221} 222 223define void @dontwrite28to32memcpy(%struct.vec2* nocapture %p) nounwind uwtable ssp { 224; CHECK-LABEL: @dontwrite28to32memcpy( 225; CHECK-NEXT: entry: 226; CHECK-NEXT: [[TMP0:%.*]] = bitcast %struct.vec2* [[P:%.*]] to i8* 227; CHECK-NEXT: tail call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 16 [[TMP0]], i8* align 16 bitcast (%struct.vec2* @glob1 to i8*), i64 32, i1 false) 228; CHECK-NEXT: [[ARRAYIDX1:%.*]] = getelementptr inbounds [[STRUCT_VEC2:%.*]], %struct.vec2* [[P]], i64 0, i32 0, i64 7 229; CHECK-NEXT: store i32 1, i32* [[ARRAYIDX1]], align 4 230; CHECK-NEXT: ret void 231; 232entry: 233 %0 = bitcast %struct.vec2* %p to i8* 234 tail call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 16 %0, i8* align 16 bitcast (%struct.vec2* @glob1 to i8*), i64 32, i1 false) 235 %arrayidx1 = getelementptr inbounds %struct.vec2, %struct.vec2* %p, i64 0, i32 0, i64 7 236 store i32 1, i32* %arrayidx1, align 4 237 ret void 238} 239 240define void @dontwrite28to32memcpy_atomic(%struct.vec2* nocapture %p) nounwind uwtable ssp { 241; CHECK-LABEL: @dontwrite28to32memcpy_atomic( 242; CHECK-NEXT: entry: 243; CHECK-NEXT: [[TMP0:%.*]] = bitcast %struct.vec2* [[P:%.*]] to i8* 244; CHECK-NEXT: tail call void @llvm.memcpy.element.unordered.atomic.p0i8.p0i8.i64(i8* align 16 [[TMP0]], i8* align 16 bitcast (%struct.vec2* @glob1 to i8*), i64 32, i32 4) 245; CHECK-NEXT: [[ARRAYIDX1:%.*]] = getelementptr inbounds [[STRUCT_VEC2:%.*]], %struct.vec2* [[P]], i64 0, i32 0, i64 7 246; CHECK-NEXT: store atomic i32 1, i32* [[ARRAYIDX1]] unordered, align 4 247; CHECK-NEXT: ret void 248; 249entry: 250 %0 = bitcast %struct.vec2* %p to i8* 251 tail call void @llvm.memcpy.element.unordered.atomic.p0i8.p0i8.i64(i8* align 16 %0, i8* align 16 bitcast (%struct.vec2* @glob1 to i8*), i64 32, i32 4) 252 %arrayidx1 = getelementptr inbounds %struct.vec2, %struct.vec2* %p, i64 0, i32 0, i64 7 253 store atomic i32 1, i32* %arrayidx1 unordered, align 4 254 ret void 255} 256 257declare void @llvm.memcpy.p0i8.p0i8.i64(i8* nocapture, i8* nocapture, i64, i1) nounwind 258declare void @llvm.memcpy.element.unordered.atomic.p0i8.p0i8.i64(i8* nocapture, i8* nocapture, i64, i32) nounwind 259declare void @llvm.memset.p0i8.i64(i8* nocapture, i8, i64, i1) nounwind 260declare void @llvm.memset.element.unordered.atomic.p0i8.i64(i8* nocapture, i8, i64, i32) nounwind 261 262%struct.trapframe = type { i64, i64, i64 } 263 264; bugzilla 11455 - make sure negative GEP's don't break this optimisation 265define void @cpu_lwp_fork(%struct.trapframe* %md_regs, i64 %pcb_rsp0) nounwind uwtable noinline ssp { 266; CHECK-LABEL: @cpu_lwp_fork( 267; CHECK-NEXT: entry: 268; CHECK-NEXT: [[TMP0:%.*]] = inttoptr i64 [[PCB_RSP0:%.*]] to %struct.trapframe* 269; CHECK-NEXT: [[ADD_PTR:%.*]] = getelementptr inbounds [[STRUCT_TRAPFRAME:%.*]], %struct.trapframe* [[TMP0]], i64 -1 270; CHECK-NEXT: [[TMP1:%.*]] = bitcast %struct.trapframe* [[ADD_PTR]] to i8* 271; CHECK-NEXT: [[TMP2:%.*]] = bitcast %struct.trapframe* [[MD_REGS:%.*]] to i8* 272; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i64(i8* [[TMP1]], i8* [[TMP2]], i64 24, i1 false) 273; CHECK-NEXT: [[TF_TRAPNO:%.*]] = getelementptr inbounds [[STRUCT_TRAPFRAME]], %struct.trapframe* [[TMP0]], i64 -1, i32 1 274; CHECK-NEXT: store i64 3, i64* [[TF_TRAPNO]], align 8 275; CHECK-NEXT: ret void 276; 277entry: 278 %0 = inttoptr i64 %pcb_rsp0 to %struct.trapframe* 279 %add.ptr = getelementptr inbounds %struct.trapframe, %struct.trapframe* %0, i64 -1 280 %1 = bitcast %struct.trapframe* %add.ptr to i8* 281 %2 = bitcast %struct.trapframe* %md_regs to i8* 282 call void @llvm.memcpy.p0i8.p0i8.i64(i8* %1, i8* %2, i64 24, i1 false) 283 %tf_trapno = getelementptr inbounds %struct.trapframe, %struct.trapframe* %0, i64 -1, i32 1 284 store i64 3, i64* %tf_trapno, align 8 285 ret void 286} 287 288define void @write16To23AndThen24To31(i64* nocapture %P, i64 %n64, i32 %n32, i16 %n16, i8 %n8) { 289; CHECK-LABEL: @write16To23AndThen24To31( 290; CHECK-NEXT: entry: 291; CHECK-NEXT: [[BASE0:%.*]] = bitcast i64* [[P:%.*]] to i8* 292; CHECK-NEXT: [[MYBASE0:%.*]] = getelementptr inbounds i8, i8* [[BASE0]], i64 0 293; CHECK-NEXT: tail call void @llvm.memset.p0i8.i64(i8* align 8 [[MYBASE0]], i8 0, i64 16, i1 false) 294; CHECK-NEXT: [[BASE64_2:%.*]] = getelementptr inbounds i64, i64* [[P]], i64 2 295; CHECK-NEXT: [[BASE64_3:%.*]] = getelementptr inbounds i64, i64* [[P]], i64 3 296; CHECK-NEXT: store i64 3, i64* [[BASE64_2]] 297; CHECK-NEXT: store i64 3, i64* [[BASE64_3]] 298; CHECK-NEXT: ret void 299; 300entry: 301 302 %base0 = bitcast i64* %P to i8* 303 %mybase0 = getelementptr inbounds i8, i8* %base0, i64 0 304 tail call void @llvm.memset.p0i8.i64(i8* align 8 %mybase0, i8 0, i64 32, i1 false) 305 306 %base64_2 = getelementptr inbounds i64, i64* %P, i64 2 307 %base64_3 = getelementptr inbounds i64, i64* %P, i64 3 308 309 store i64 3, i64* %base64_2 310 store i64 3, i64* %base64_3 311 ret void 312} 313 314define void @write16To23AndThen24To31_atomic(i64* nocapture %P, i64 %n64, i32 %n32, i16 %n16, i8 %n8) { 315; CHECK-LABEL: @write16To23AndThen24To31_atomic( 316; CHECK-NEXT: entry: 317; CHECK-NEXT: [[BASE0:%.*]] = bitcast i64* [[P:%.*]] to i8* 318; CHECK-NEXT: [[MYBASE0:%.*]] = getelementptr inbounds i8, i8* [[BASE0]], i64 0 319; CHECK-NEXT: tail call void @llvm.memset.element.unordered.atomic.p0i8.i64(i8* align 8 [[MYBASE0]], i8 0, i64 16, i32 8) 320; CHECK-NEXT: [[BASE64_2:%.*]] = getelementptr inbounds i64, i64* [[P]], i64 2 321; CHECK-NEXT: [[BASE64_3:%.*]] = getelementptr inbounds i64, i64* [[P]], i64 3 322; CHECK-NEXT: store atomic i64 3, i64* [[BASE64_2]] unordered, align 8 323; CHECK-NEXT: store atomic i64 3, i64* [[BASE64_3]] unordered, align 8 324; CHECK-NEXT: ret void 325; 326entry: 327 328 %base0 = bitcast i64* %P to i8* 329 %mybase0 = getelementptr inbounds i8, i8* %base0, i64 0 330 tail call void @llvm.memset.element.unordered.atomic.p0i8.i64(i8* align 8 %mybase0, i8 0, i64 32, i32 8) 331 332 %base64_2 = getelementptr inbounds i64, i64* %P, i64 2 333 %base64_3 = getelementptr inbounds i64, i64* %P, i64 3 334 335 store atomic i64 3, i64* %base64_2 unordered, align 8 336 store atomic i64 3, i64* %base64_3 unordered, align 8 337 ret void 338} 339 340define void @write16To23AndThen24To31_atomic_weaker1(i64* nocapture %P, i64 %n64, i32 %n32, i16 %n16, i8 %n8) { 341; CHECK-LABEL: @write16To23AndThen24To31_atomic_weaker1( 342; CHECK-NEXT: entry: 343; CHECK-NEXT: [[BASE0:%.*]] = bitcast i64* [[P:%.*]] to i8* 344; CHECK-NEXT: [[MYBASE0:%.*]] = getelementptr inbounds i8, i8* [[BASE0]], i64 0 345; CHECK-NEXT: tail call void @llvm.memset.element.unordered.atomic.p0i8.i64(i8* align 8 [[MYBASE0]], i8 0, i64 16, i32 8) 346; CHECK-NEXT: [[BASE64_2:%.*]] = getelementptr inbounds i64, i64* [[P]], i64 2 347; CHECK-NEXT: [[BASE64_3:%.*]] = getelementptr inbounds i64, i64* [[P]], i64 3 348; CHECK-NEXT: store i64 3, i64* [[BASE64_2]], align 8 349; CHECK-NEXT: store atomic i64 3, i64* [[BASE64_3]] unordered, align 8 350; CHECK-NEXT: ret void 351; 352entry: 353 354 %base0 = bitcast i64* %P to i8* 355 %mybase0 = getelementptr inbounds i8, i8* %base0, i64 0 356 tail call void @llvm.memset.element.unordered.atomic.p0i8.i64(i8* align 8 %mybase0, i8 0, i64 32, i32 8) 357 358 %base64_2 = getelementptr inbounds i64, i64* %P, i64 2 359 %base64_3 = getelementptr inbounds i64, i64* %P, i64 3 360 361 store i64 3, i64* %base64_2, align 8 362 store atomic i64 3, i64* %base64_3 unordered, align 8 363 ret void 364} 365 366define void @write16To23AndThen24To31_atomic_weaker2(i64* nocapture %P, i64 %n64, i32 %n32, i16 %n16, i8 %n8) { 367; CHECK-LABEL: @write16To23AndThen24To31_atomic_weaker2( 368; CHECK-NEXT: entry: 369; CHECK-NEXT: [[BASE0:%.*]] = bitcast i64* [[P:%.*]] to i8* 370; CHECK-NEXT: [[MYBASE0:%.*]] = getelementptr inbounds i8, i8* [[BASE0]], i64 0 371; CHECK-NEXT: tail call void @llvm.memset.element.unordered.atomic.p0i8.i64(i8* align 8 [[MYBASE0]], i8 0, i64 16, i32 8) 372; CHECK-NEXT: [[BASE64_2:%.*]] = getelementptr inbounds i64, i64* [[P]], i64 2 373; CHECK-NEXT: [[BASE64_3:%.*]] = getelementptr inbounds i64, i64* [[P]], i64 3 374; CHECK-NEXT: store atomic i64 3, i64* [[BASE64_2]] unordered, align 8 375; CHECK-NEXT: store i64 3, i64* [[BASE64_3]], align 8 376; CHECK-NEXT: ret void 377; 378entry: 379 380 %base0 = bitcast i64* %P to i8* 381 %mybase0 = getelementptr inbounds i8, i8* %base0, i64 0 382 tail call void @llvm.memset.element.unordered.atomic.p0i8.i64(i8* align 8 %mybase0, i8 0, i64 32, i32 8) 383 384 %base64_2 = getelementptr inbounds i64, i64* %P, i64 2 385 %base64_3 = getelementptr inbounds i64, i64* %P, i64 3 386 387 store atomic i64 3, i64* %base64_2 unordered, align 8 388 store i64 3, i64* %base64_3, align 8 389 ret void 390} 391