; RUN: llc -march=amdgcn -mcpu=verde -verify-machineinstrs < %s | FileCheck -check-prefix=SI -check-prefix=FUNC %s
; RUN: llc -march=amdgcn -mcpu=tonga -verify-machineinstrs < %s | FileCheck -check-prefix=SI -check-prefix=FUNC %s
; RUN: llc -march=r600 -mcpu=redwood < %s | FileCheck -check-prefix=EG -check-prefix=FUNC %s
; RUN: llc -march=r600 -mcpu=cayman < %s | FileCheck -check-prefix=CM -check-prefix=FUNC %s

; Checks the llc output for stores of assorted scalar and vector types to the
; global (addrspace 1) and local (addrspace 3) address spaces.
; The verde and tonga runs share the SI check lines, the redwood run uses the
; EG check lines, the cayman run uses the CM check lines, and the FUNC check
; lines apply to every run.

;===------------------------------------------------------------------------===;
; Global Address Space
;===------------------------------------------------------------------------===;

; i1 store: the constant true is written through a global pointer.
; FUNC-LABEL: {{^}}store_i1:
; EG: MEM_RAT MSKOR
; SI: buffer_store_byte
define void @store_i1(i1 addrspace(1)* %out) {
entry:
  store i1 true, i1 addrspace(1)* %out
  ret void
}

; i8 store
; FUNC-LABEL: {{^}}store_i8:
; EG: MEM_RAT MSKOR T[[RW_GPR:[0-9]]].XW, T{{[0-9]}}.X

; IG 0: Get the byte index and truncate the value
; EG: AND_INT * T{{[0-9]}}.[[BI_CHAN:[XYZW]]], KC0[2].Y, literal.x
; EG: LSHL T{{[0-9]}}.[[SHIFT_CHAN:[XYZW]]], PV.[[BI_CHAN]], literal.x
; EG: AND_INT * T{{[0-9]}}.[[TRUNC_CHAN:[XYZW]]], KC0[2].Z, literal.y
; EG-NEXT: 3(4.203895e-45), 255(3.573311e-43)


; IG 1: Truncate the calculated shift amount for the mask

; IG 2: Shift the value and the mask
; EG: LSHL T[[RW_GPR]].X, PS, PV.[[SHIFT_CHAN]]
; EG: LSHL * T[[RW_GPR]].W, literal.x, PV.[[SHIFT_CHAN]]
; EG-NEXT: 255
; IG 3: Initialize the Y and Z channels to zero
; XXX: An optimal scheduler should merge this into one of the previous IGs.
; EG: MOV T[[RW_GPR]].Y, 0.0
; EG: MOV * T[[RW_GPR]].Z, 0.0

; SI: buffer_store_byte

define void @store_i8(i8 addrspace(1)* %out, i8 %in) {
entry:
  store i8 %in, i8 addrspace(1)* %out
  ret void
}

; i16 store
; FUNC-LABEL: {{^}}store_i16:
; EG: MEM_RAT MSKOR T[[RW_GPR:[0-9]]].XW, T{{[0-9]}}.X

; IG 0: Get the byte index and truncate the value


; EG: AND_INT * T{{[0-9]}}.[[BI_CHAN:[XYZW]]], KC0[2].Y, literal.x
; EG-NEXT: 3(4.203895e-45),

; EG: LSHL T{{[0-9]}}.[[SHIFT_CHAN:[XYZW]]], PV.[[BI_CHAN]], literal.x
; EG: AND_INT * T{{[0-9]}}.[[TRUNC_CHAN:[XYZW]]], KC0[2].Z, literal.y

; EG-NEXT: 3(4.203895e-45), 65535(9.183409e-41)
; IG 1: Truncate the calculated shift amount for the mask

; IG 2: Shift the value and the mask
; EG: LSHL T[[RW_GPR]].X, PS, PV.[[SHIFT_CHAN]]
; EG: LSHL * T[[RW_GPR]].W, literal.x, PV.[[SHIFT_CHAN]]
; EG-NEXT: 65535
; IG 3: Initialize the Y and Z channels to zero
; XXX: An optimal scheduler should merge this into one of the previous IGs.
; EG: MOV T[[RW_GPR]].Y, 0.0
; EG: MOV * T[[RW_GPR]].Z, 0.0

; SI: buffer_store_short
define void @store_i16(i16 addrspace(1)* %out, i16 %in) {
entry:
  store i16 %in, i16 addrspace(1)* %out
  ret void
}

; i24 store: the SI checks expect a right shift by 16 plus one byte store and
; one short store, matched in either order.
; FUNC-LABEL: {{^}}store_i24:
; SI: s_lshr_b32 s{{[0-9]+}}, s{{[0-9]+}}, 16
; SI-DAG: buffer_store_byte
; SI-DAG: buffer_store_short
define void @store_i24(i24 addrspace(1)* %out, i24 %in) {
entry:
  store i24 %in, i24 addrspace(1)* %out
  ret void
}

; i25 store: the SI checks expect the value to be masked with 0x1ffffff, moved
; to a vector register and written with a dword store.
; FUNC-LABEL: {{^}}store_i25:
; SI: s_and_b32 [[AND:s[0-9]+]], s{{[0-9]+}}, 0x1ffffff{{$}}
; SI: v_mov_b32_e32 [[VAND:v[0-9]+]], [[AND]]
; SI: buffer_store_dword [[VAND]]
define void @store_i25(i25 addrspace(1)* %out, i25 %in) {
entry:
  store i25 %in, i25 addrspace(1)* %out
  ret void
}

; <2 x i8> store of a truncated <2 x i32>; the EG checks allow one MSKOR and
; reject a second one.
; FUNC-LABEL: {{^}}store_v2i8:
; EG: MEM_RAT MSKOR
; EG-NOT: MEM_RAT MSKOR

; SI: buffer_store_short
define void @store_v2i8(<2 x i8> addrspace(1)* %out, <2 x i32> %in) {
entry:
  %0 = trunc <2 x i32> %in to <2 x i8>
  store <2 x i8> %0, <2 x i8> addrspace(1)* %out
  ret void
}


; <2 x i16> store of a truncated <2 x i32>.
; FUNC-LABEL: {{^}}store_v2i16:
; EG: MEM_RAT_CACHELESS STORE_RAW

; CM: MEM_RAT_CACHELESS STORE_DWORD

; SI: buffer_store_dword
define void @store_v2i16(<2 x i16> addrspace(1)* %out, <2 x i32> %in) {
entry:
  %0 = trunc <2 x i32> %in to <2 x i16>
  store <2 x i16> %0, <2 x i16> addrspace(1)* %out
  ret void
}

; <4 x i8> store of a truncated <4 x i32>.
; FUNC-LABEL: {{^}}store_v4i8:
; EG: MEM_RAT_CACHELESS STORE_RAW

; CM: MEM_RAT_CACHELESS STORE_DWORD

; SI: buffer_store_dword
define void @store_v4i8(<4 x i8> addrspace(1)* %out, <4 x i32> %in) {
entry:
  %0 = trunc <4 x i32> %in to <4 x i8>
  store <4 x i8> %0, <4 x i8> addrspace(1)* %out
  ret void
}

; floating-point store
; FUNC-LABEL: {{^}}store_f32:
; EG: MEM_RAT_CACHELESS STORE_RAW T{{[0-9]+\.X, T[0-9]+\.X}}, 1

; CM: MEM_RAT_CACHELESS STORE_DWORD T{{[0-9]+\.X, T[0-9]+\.X}}

; SI: buffer_store_dword

define void @store_f32(float addrspace(1)* %out, float %in) {
  store float %in, float addrspace(1)* %out
  ret void
}

; <4 x i16> store of a truncated <4 x i32> to global memory.
; FUNC-LABEL: {{^}}store_v4i16:
; NOTE(review): the next line carries no check prefix, so FileCheck ignores it.
; Confirm the expected redwood output before turning it into a real check.
; MEM_RAT_CACHELESS STORE_RAW T{{[0-9]+}}.XYZW

; SI: buffer_store_dwordx2
define void @store_v4i16(<4 x i16> addrspace(1)* %out, <4 x i32> %in) {
entry:
  %0 = trunc <4 x i32> %in to <4 x i16>
  store <4 x i16> %0, <4 x i16> addrspace(1)* %out
  ret void
}

; vec2 floating-point stores
; FUNC-LABEL: {{^}}store_v2f32:
; EG: MEM_RAT_CACHELESS STORE_RAW

; CM: MEM_RAT_CACHELESS STORE_DWORD

; SI: buffer_store_dwordx2

define void @store_v2f32(<2 x float> addrspace(1)* %out, float %a, float %b) {
entry:
  %0 = insertelement <2 x float> <float 0.0, float 0.0>, float %a, i32 0
  %1 = insertelement <2 x float> %0, float %b, i32 1
  store <2 x float> %1, <2 x float> addrspace(1)* %out
  ret void
}

; <4 x i32> store; the EG and CM checks each allow one store instruction and
; reject a second one.
; FUNC-LABEL: {{^}}store_v4i32:
; EG: MEM_RAT_CACHELESS STORE_RAW
; EG-NOT: MEM_RAT_CACHELESS STORE_RAW

; CM: MEM_RAT_CACHELESS STORE_DWORD
; CM-NOT: MEM_RAT_CACHELESS STORE_DWORD

; SI: buffer_store_dwordx4
define void @store_v4i32(<4 x i32> addrspace(1)* %out, <4 x i32> %in) {
entry:
  store <4 x i32> %in, <4 x i32> addrspace(1)* %out
  ret void
}

; i8 store of a truncated i64 argument.
; FUNC-LABEL: {{^}}store_i64_i8:
; EG: MEM_RAT MSKOR
; SI: buffer_store_byte
define void @store_i64_i8(i8 addrspace(1)* %out, i64 %in) {
entry:
  %0 = trunc i64 %in to i8
  store i8 %0, i8 addrspace(1)* %out
  ret void
}

; i16 store of a truncated i64 argument.
; FUNC-LABEL: {{^}}store_i64_i16:
; EG: MEM_RAT MSKOR
; SI: buffer_store_short
define void @store_i64_i16(i16 addrspace(1)* %out, i64 %in) {
entry:
  %0 = trunc i64 %in to i16
  store i16 %0, i16 addrspace(1)* %out
  ret void
}

;===------------------------------------------------------------------------===;
; Local Address Space
;===------------------------------------------------------------------------===;

; i1 store: the constant true is written through a local pointer.
; FUNC-LABEL: {{^}}store_local_i1:
; EG: LDS_BYTE_WRITE
; SI: ds_write_b8
define void @store_local_i1(i1 addrspace(3)* %out) {
entry:
  store i1 true, i1 addrspace(3)* %out
  ret void
}

; i8 store to a local pointer.
; FUNC-LABEL: {{^}}store_local_i8:
; EG: LDS_BYTE_WRITE

; SI: ds_write_b8
define void @store_local_i8(i8 addrspace(3)* %out, i8 %in) {
  store i8 %in, i8 addrspace(3)* %out
  ret void
}

; i16 store to a local pointer.
; FUNC-LABEL: {{^}}store_local_i16:
; EG: LDS_SHORT_WRITE

; SI: ds_write_b16
define void @store_local_i16(i16 addrspace(3)* %out, i16 %in) {
  store i16 %in, i16 addrspace(3)* %out
  ret void
}

; <2 x i16> store to a local pointer.
; FUNC-LABEL: {{^}}store_local_v2i16:
; EG: LDS_WRITE

; CM: LDS_WRITE

; SI: ds_write_b32
define void @store_local_v2i16(<2 x i16> addrspace(3)* %out, <2 x i16> %in) {
entry:
  store <2 x i16> %in, <2 x i16> addrspace(3)* %out
  ret void
}

; <4 x i8> store to a local pointer.
; FUNC-LABEL: {{^}}store_local_v4i8:
; EG: LDS_WRITE

; CM: LDS_WRITE

; SI: ds_write_b32
define void @store_local_v4i8(<4 x i8> addrspace(3)* %out, <4 x i8> %in) {
entry:
  store <4 x i8> %in, <4 x i8> addrspace(3)* %out
  ret void
}

; <2 x i32> store to a local pointer; the EG and CM checks expect two writes.
; FUNC-LABEL: {{^}}store_local_v2i32:
; EG: LDS_WRITE
; EG: LDS_WRITE

; CM: LDS_WRITE
; CM: LDS_WRITE

; SI: ds_write_b64
define void @store_local_v2i32(<2 x i32> addrspace(3)* %out, <2 x i32> %in) {
entry:
  store <2 x i32> %in, <2 x i32> addrspace(3)* %out
  ret void
}

; <4 x i32> store to a local pointer with no explicit alignment; the EG and CM
; checks expect four writes.
; FUNC-LABEL: {{^}}store_local_v4i32:
; EG: LDS_WRITE
; EG: LDS_WRITE
; EG: LDS_WRITE
; EG: LDS_WRITE

; CM: LDS_WRITE
; CM: LDS_WRITE
; CM: LDS_WRITE
; CM: LDS_WRITE

; SI: ds_write2_b64
define void @store_local_v4i32(<4 x i32> addrspace(3)* %out, <4 x i32> %in) {
entry:
  store <4 x i32> %in, <4 x i32> addrspace(3)* %out
  ret void
}

; Same <4 x i32> local store, but with "align 4"; the SI checks then expect two
; ds_write2_b32 instructions.
; FUNC-LABEL: {{^}}store_local_v4i32_align4:
; EG: LDS_WRITE
; EG: LDS_WRITE
; EG: LDS_WRITE
; EG: LDS_WRITE

; CM: LDS_WRITE
; CM: LDS_WRITE
; CM: LDS_WRITE
; CM: LDS_WRITE

; SI: ds_write2_b32
; SI: ds_write2_b32
define void @store_local_v4i32_align4(<4 x i32> addrspace(3)* %out, <4 x i32> %in) {
entry:
  store <4 x i32> %in, <4 x i32> addrspace(3)* %out, align 4
  ret void
}

; i8 local store of a truncated i64 argument.
; FUNC-LABEL: {{^}}store_local_i64_i8:
; EG: LDS_BYTE_WRITE
; SI: ds_write_b8
define void @store_local_i64_i8(i8 addrspace(3)* %out, i64 %in) {
entry:
  %0 = trunc i64 %in to i8
  store i8 %0, i8 addrspace(3)* %out
  ret void
}

; i16 local store of a truncated i64 argument.
; FUNC-LABEL: {{^}}store_local_i64_i16:
; EG: LDS_SHORT_WRITE
; SI: ds_write_b16
define void @store_local_i64_i16(i16 addrspace(3)* %out, i64 %in) {
entry:
  %0 = trunc i64 %in to i16
  store i16 %0, i16 addrspace(3)* %out
  ret void
}

; The stores in this function are combined by the optimizer to create a
; 64-bit store with 32-bit alignment. This is legal for SI and the legalizer
; should not try to split the 64-bit store back into 2 32-bit stores.
;
; Evergreen / Northern Islands don't support 64-bit stores yet, so there should
; be two 32-bit stores.

; FUNC-LABEL: {{^}}vecload2:
; EG: MEM_RAT_CACHELESS STORE_RAW

; CM: MEM_RAT_CACHELESS STORE_DWORD

; SI: buffer_store_dwordx2
define void @vecload2(i32 addrspace(1)* nocapture %out, i32 addrspace(2)* nocapture %mem) #0 {
entry:
  %0 = load i32, i32 addrspace(2)* %mem, align 4
  %arrayidx1.i = getelementptr inbounds i32, i32 addrspace(2)* %mem, i64 1
  %1 = load i32, i32 addrspace(2)* %arrayidx1.i, align 4
  store i32 %0, i32 addrspace(1)* %out, align 4
  %arrayidx1 = getelementptr inbounds i32, i32 addrspace(1)* %out, i64 1
  store i32 %1, i32 addrspace(1)* %arrayidx1, align 4
  ret void
}

; When i128 was a legal type this program generated cannot select errors:

; FUNC-LABEL: {{^}}"i128-const-store":
; EG: MEM_RAT_CACHELESS STORE_RAW T{{[0-9]+}}.XYZW, T{{[0-9]+}}.X, 1

; CM: MEM_RAT_CACHELESS STORE_DWORD T{{[0-9]+}}, T{{[0-9]+}}.X

; SI: buffer_store_dwordx4
define void @i128-const-store(i32 addrspace(1)* %out) {
entry:
  store i32 1, i32 addrspace(1)* %out, align 4
  %arrayidx2 = getelementptr inbounds i32, i32 addrspace(1)* %out, i64 1
  store i32 1, i32 addrspace(1)* %arrayidx2, align 4
  %arrayidx4 = getelementptr inbounds i32, i32 addrspace(1)* %out, i64 2
  store i32 2, i32 addrspace(1)* %arrayidx4, align 4
  %arrayidx6 = getelementptr inbounds i32, i32 addrspace(1)* %out, i64 3
  store i32 2, i32 addrspace(1)* %arrayidx6, align 4
  ret void
}
; Attribute group #0, referenced by the definition of @vecload2.
attributes #0 = { nounwind }