; RUN: llc -march=hexagon < %s | FileCheck %s
;
; Testing for these 6 variants of circular load:
;   Q6_circ_load_update_B(inputLR, pDelay, -1, nConvLength, 4);
;   Q6_circ_load_update_D(inputLR, pDelay, -1, nConvLength, 4);
;   Q6_circ_load_update_H(inputLR, pDelay, -1, nConvLength, 4);
;   Q6_circ_load_update_UB(inputLR, pDelay, -1, nConvLength, 4);
;   Q6_circ_load_update_UH(inputLR, pDelay, -1, nConvLength, 4);
;   Q6_circ_load_update_W(inputLR, pDelay, -1, nConvLength, 4);
; producing these:
;   r0 = memb(r1++#-1:circ(m0))
;   r3:2 = memd(r1++#-8:circ(m0))
;   r0 = memh(r1++#-2:circ(m0))
;   r0 = memub(r1++#-1:circ(m0))
;   r0 = memuh(r1++#-2:circ(m0))
;   r0 = memw(r1++#-4:circ(m0))
;
; Every function below follows the same shape:
;   1. compute the address of filtMemLR[filtMemIndex] and cast it to i8*;
;   2. derive the third intrinsic argument from filtMemLen and OR a constant
;      into its upper bits;
;   3. call the circular-load intrinsic, which is handed a pointer to a local
;      stack slot (%inputLR);
;   4. reload the value from that stack slot and return it.
; NOTE(review): the OR-ed constants (0x02000000 .. 0x05000000) presumably
; populate a high bit-field of the Hexagon modifier register -- confirm
; against the Hexagon Programmer's Reference Manual.

target datalayout = "e-p:32:32:32-i64:64:64-i32:32:32-i16:16:16-i1:32:32-f64:64:64-f32:32:32-v64:64:64-v32:32:32-a0:0-n16:32"
target triple = "hexagon"

; Signed byte variant: expects a memb circular load with increment #-1.
; CHECK-LABEL: foo1:
define signext i8 @foo1(i16 zeroext %filtMemLen, i16* %filtMemLR, i16 signext %filtMemIndex) nounwind {
entry:
  %inputLR = alloca i8, align 1
  %conv = zext i16 %filtMemLen to i32
  %shr1 = lshr i32 %conv, 1
  %idxprom = sext i16 %filtMemIndex to i32
  %arrayidx = getelementptr inbounds i16, i16* %filtMemLR, i32 %idxprom
  %0 = bitcast i16* %arrayidx to i8*
  ; 33554432 == 0x02000000
  %or = or i32 %shr1, 33554432
; CHECK: = memb(r{{[0-9]*.}}++{{.}}#-1:circ(m{{[0-1]}}))
  %1 = call i8* @llvm.hexagon.circ.ldb(i8* %0, i8* %inputLR, i32 %or, i32 -1)
  %2 = load i8, i8* %inputLR, align 1, !tbaa !0
  ret i8 %2
}

declare i8* @llvm.hexagon.circ.ldb(i8*, i8*, i32, i32) nounwind

; Doubleword variant: expects a memd circular load with increment #-8.
; CHECK-LABEL: foo2:
define i64 @foo2(i16 zeroext %filtMemLen, i16* %filtMemLR, i16 signext %filtMemIndex) nounwind {
entry:
  %inputLR = alloca i64, align 8
  %conv = zext i16 %filtMemLen to i32
  %shr1 = lshr i32 %conv, 1
  %idxprom = sext i16 %filtMemIndex to i32
  %arrayidx = getelementptr inbounds i16, i16* %filtMemLR, i32 %idxprom
  %0 = bitcast i16* %arrayidx to i8*
  %1 = bitcast i64* %inputLR to i8*
  %shl = shl nuw nsw i32 %shr1, 3
  ; 83886080 == 0x05000000
  %or = or i32 %shl, 83886080
; CHECK: = memd(r{{[0-9]*.}}++{{.}}#-8:circ(m{{[0-1]}}))
  %2 = call i8* @llvm.hexagon.circ.ldd(i8* %0, i8* %1, i32 %or, i32 -8)
  %3 = bitcast i8* %1 to i64*
  %4 = load i64, i64* %3, align 8, !tbaa !0
  ret i64 %4
}

declare i8* @llvm.hexagon.circ.ldd(i8*, i8*, i32, i32) nounwind

; Signed halfword variant: expects a memh circular load with increment #-2.
; CHECK-LABEL: foo3:
define signext i16 @foo3(i16 zeroext %filtMemLen, i16* %filtMemLR, i16 signext %filtMemIndex) nounwind {
entry:
  %inputLR = alloca i16, align 2
  %conv = zext i16 %filtMemLen to i32
  ; Clears bit 0 of the zero-extended length (mask 0xFFFE).
  %shr1 = and i32 %conv, 65534
  %idxprom = sext i16 %filtMemIndex to i32
  %arrayidx = getelementptr inbounds i16, i16* %filtMemLR, i32 %idxprom
  %0 = bitcast i16* %arrayidx to i8*
  %1 = bitcast i16* %inputLR to i8*
  ; 50331648 == 0x03000000
  %or = or i32 %shr1, 50331648
; CHECK: = memh(r{{[0-9]*.}}++{{.}}#-2:circ(m{{[0-1]}}))
  %2 = call i8* @llvm.hexagon.circ.ldh(i8* %0, i8* %1, i32 %or, i32 -2)
  %3 = bitcast i8* %1 to i16*
  %4 = load i16, i16* %3, align 2, !tbaa !2
  ret i16 %4
}

declare i8* @llvm.hexagon.circ.ldh(i8*, i8*, i32, i32) nounwind

; Unsigned byte variant: expects a memub circular load with increment #-1.
; CHECK-LABEL: foo4:
define zeroext i8 @foo4(i16 zeroext %filtMemLen, i16* %filtMemLR, i16 signext %filtMemIndex) nounwind {
entry:
  %inputLR = alloca i8, align 1
  %conv = zext i16 %filtMemLen to i32
  %shr1 = lshr i32 %conv, 1
  %idxprom = sext i16 %filtMemIndex to i32
  %arrayidx = getelementptr inbounds i16, i16* %filtMemLR, i32 %idxprom
  %0 = bitcast i16* %arrayidx to i8*
  ; 33554432 == 0x02000000
  %or = or i32 %shr1, 33554432
; CHECK: = memub(r{{[0-9]*.}}++{{.}}#-1:circ(m{{[0-1]}}))
  %1 = call i8* @llvm.hexagon.circ.ldub(i8* %0, i8* %inputLR, i32 %or, i32 -1)
  %2 = load i8, i8* %inputLR, align 1, !tbaa !0
  ret i8 %2
}

declare i8* @llvm.hexagon.circ.ldub(i8*, i8*, i32, i32) nounwind

; Unsigned halfword variant: expects a memuh circular load with increment #-2.
; CHECK-LABEL: foo5:
define zeroext i16 @foo5(i16 zeroext %filtMemLen, i16* %filtMemLR, i16 signext %filtMemIndex) nounwind {
entry:
  %inputLR = alloca i16, align 2
  %conv = zext i16 %filtMemLen to i32
  ; Clears bit 0 of the zero-extended length (mask 0xFFFE).
  %shr1 = and i32 %conv, 65534
  %idxprom = sext i16 %filtMemIndex to i32
  %arrayidx = getelementptr inbounds i16, i16* %filtMemLR, i32 %idxprom
  %0 = bitcast i16* %arrayidx to i8*
  %1 = bitcast i16* %inputLR to i8*
  ; 50331648 == 0x03000000
  %or = or i32 %shr1, 50331648
; CHECK: = memuh(r{{[0-9]*.}}++{{.}}#-2:circ(m{{[0-1]}}))
  %2 = call i8* @llvm.hexagon.circ.lduh(i8* %0, i8* %1, i32 %or, i32 -2)
  %3 = bitcast i8* %1 to i16*
  %4 = load i16, i16* %3, align 2, !tbaa !2
  ret i16 %4
}

declare i8* @llvm.hexagon.circ.lduh(i8*, i8*, i32, i32) nounwind

; Word variant: expects a memw circular load with increment #-4.
; CHECK-LABEL: foo6:
define i32 @foo6(i16 zeroext %filtMemLen, i16* %filtMemLR, i16 signext %filtMemIndex) nounwind {
entry:
  %inputLR = alloca i32, align 4
  %conv = zext i16 %filtMemLen to i32
  %shr1 = lshr i32 %conv, 1
  %idxprom = sext i16 %filtMemIndex to i32
  %arrayidx = getelementptr inbounds i16, i16* %filtMemLR, i32 %idxprom
  %0 = bitcast i16* %arrayidx to i8*
  %1 = bitcast i32* %inputLR to i8*
  %shl = shl nuw nsw i32 %shr1, 2
  ; 67108864 == 0x04000000
  %or = or i32 %shl, 67108864
; CHECK: = memw(r{{[0-9]*.}}++{{.}}#-4:circ(m{{[0-1]}}))
  %2 = call i8* @llvm.hexagon.circ.ldw(i8* %0, i8* %1, i32 %or, i32 -4)
  %3 = bitcast i8* %1 to i32*
  %4 = load i32, i32* %3, align 4, !tbaa !3
  ret i32 %4
}

declare i8* @llvm.hexagon.circ.ldw(i8*, i8*, i32, i32) nounwind

; TBAA type descriptors referenced by the loads above.
!0 = !{!"omnipotent char", !1}
!1 = !{!"Simple C/C++ TBAA"}
!2 = !{!"short", !0}
!3 = !{!"int", !0}