; RUN: llc < %s -mtriple=arm64-eabi | FileCheck %s
; RUN: llc -O0 --global-isel-abort=1 < %s -mtriple=arm64-eabi | FileCheck %s

; Exercises lowering of @llvm.prefetch on arm64 and verifies the emitted
; prefetch mnemonic and hint for every combination used below. Both llc
; invocations above are verified against the same FileCheck directives.
;
; As paired with the expectations in this file, the three trailing i32
; operands of each call select the hint:
;   2nd operand: 0 -> "pld"/"pli" (see 4th operand), 1 -> "pst"
;   3rd operand: 0 -> "l1strm", 1 -> "l3keep", 2 -> "l2keep", 3 -> "l1keep"
;   4th operand: 1 -> "pld", 0 -> "pli" (when the 2nd operand is 0)

@a = common global ptr null, align 8

define void @test(i32 %i, i32 %j) nounwind ssp {
entry:
  ; CHECK: @test
  %j.addr = alloca i32, align 4
  store i32 %j, ptr %j.addr, align 4, !tbaa !0

  ; Part 1: prefetches of the alloca address; each is expected to be emitted
  ; as "prfum".
  ; CHECK: prfum pldl1strm
  call void @llvm.prefetch(ptr %j.addr, i32 0, i32 0, i32 1)
  ; CHECK: prfum pldl3keep
  call void @llvm.prefetch(ptr %j.addr, i32 0, i32 1, i32 1)
  ; CHECK: prfum pldl2keep
  call void @llvm.prefetch(ptr %j.addr, i32 0, i32 2, i32 1)
  ; CHECK: prfum pldl1keep
  call void @llvm.prefetch(ptr %j.addr, i32 0, i32 3, i32 1)

  ; CHECK: prfum plil1strm
  call void @llvm.prefetch(ptr %j.addr, i32 0, i32 0, i32 0)
  ; CHECK: prfum plil3keep
  call void @llvm.prefetch(ptr %j.addr, i32 0, i32 1, i32 0)
  ; CHECK: prfum plil2keep
  call void @llvm.prefetch(ptr %j.addr, i32 0, i32 2, i32 0)
  ; CHECK: prfum plil1keep
  call void @llvm.prefetch(ptr %j.addr, i32 0, i32 3, i32 0)

  ; CHECK: prfum pstl1strm
  call void @llvm.prefetch(ptr %j.addr, i32 1, i32 0, i32 1)
  ; CHECK: prfum pstl3keep
  call void @llvm.prefetch(ptr %j.addr, i32 1, i32 1, i32 1)
  ; CHECK: prfum pstl2keep
  call void @llvm.prefetch(ptr %j.addr, i32 1, i32 2, i32 1)
  ; CHECK: prfum pstl1keep
  call void @llvm.prefetch(ptr %j.addr, i32 1, i32 3, i32 1)

  ; Part 2: prefetches of an element address computed as
  ; (pointer loaded from @a) + sext(%j + %i) i32 elements; each is expected
  ; to be emitted as "prfm".
  %tmp1 = load i32, ptr %j.addr, align 4, !tbaa !0
  %add = add nsw i32 %tmp1, %i
  %idxprom = sext i32 %add to i64
  %tmp2 = load ptr, ptr @a, align 8, !tbaa !3
  %arrayidx = getelementptr inbounds i32, ptr %tmp2, i64 %idxprom

  ; CHECK: prfm pldl1strm
  call void @llvm.prefetch(ptr %arrayidx, i32 0, i32 0, i32 1)
  %tmp4 = load ptr, ptr @a, align 8, !tbaa !3
  %arrayidx3 = getelementptr inbounds i32, ptr %tmp4, i64 %idxprom

  ; CHECK: prfm pldl3keep
  call void @llvm.prefetch(ptr %arrayidx3, i32 0, i32 1, i32 1)
  %tmp6 = load ptr, ptr @a, align 8, !tbaa !3
  %arrayidx6 = getelementptr inbounds i32, ptr %tmp6, i64 %idxprom

  ; CHECK: prfm pldl2keep
  call void @llvm.prefetch(ptr %arrayidx6, i32 0, i32 2, i32 1)
  %tmp8 = load ptr, ptr @a, align 8, !tbaa !3
  %arrayidx9 = getelementptr inbounds i32, ptr %tmp8, i64 %idxprom

  ; CHECK: prfm pldl1keep
  call void @llvm.prefetch(ptr %arrayidx9, i32 0, i32 3, i32 1)
  %tmp10 = load ptr, ptr @a, align 8, !tbaa !3
  %arrayidx12 = getelementptr inbounds i32, ptr %tmp10, i64 %idxprom

  ; CHECK: prfm plil1strm
  call void @llvm.prefetch(ptr %arrayidx12, i32 0, i32 0, i32 0)

  ; NOTE(review): from here on each call prefetches a GEP result produced for
  ; an earlier case (%arrayidx3, %arrayidx6, ...) rather than the one computed
  ; immediately before it, and %arrayidx24/27/30/33 are never used. The
  ; expectations only match the mnemonic and hint, so what is verified is
  ; unaffected; confirm whether the reuse is intentional before changing it.
  %tmp12 = load ptr, ptr @a, align 8, !tbaa !3
  %arrayidx15 = getelementptr inbounds i32, ptr %tmp12, i64 %idxprom

  ; CHECK: prfm plil3keep
  call void @llvm.prefetch(ptr %arrayidx3, i32 0, i32 1, i32 0)
  %tmp14 = load ptr, ptr @a, align 8, !tbaa !3
  %arrayidx18 = getelementptr inbounds i32, ptr %tmp14, i64 %idxprom

  ; CHECK: prfm plil2keep
  call void @llvm.prefetch(ptr %arrayidx6, i32 0, i32 2, i32 0)
  %tmp16 = load ptr, ptr @a, align 8, !tbaa !3
  %arrayidx21 = getelementptr inbounds i32, ptr %tmp16, i64 %idxprom

  ; CHECK: prfm plil1keep
  call void @llvm.prefetch(ptr %arrayidx9, i32 0, i32 3, i32 0)
  %tmp18 = load ptr, ptr @a, align 8, !tbaa !3
  %arrayidx24 = getelementptr inbounds i32, ptr %tmp18, i64 %idxprom

  ; CHECK: prfm pstl1strm
  call void @llvm.prefetch(ptr %arrayidx12, i32 1, i32 0, i32 1)
  %tmp20 = load ptr, ptr @a, align 8, !tbaa !3
  %arrayidx27 = getelementptr inbounds i32, ptr %tmp20, i64 %idxprom

  ; CHECK: prfm pstl3keep
  call void @llvm.prefetch(ptr %arrayidx15, i32 1, i32 1, i32 1)
  %tmp22 = load ptr, ptr @a, align 8, !tbaa !3
  %arrayidx30 = getelementptr inbounds i32, ptr %tmp22, i64 %idxprom

  ; CHECK: prfm pstl2keep
  call void @llvm.prefetch(ptr %arrayidx18, i32 1, i32 2, i32 1)
  %tmp24 = load ptr, ptr @a, align 8, !tbaa !3
  %arrayidx33 = getelementptr inbounds i32, ptr %tmp24, i64 %idxprom

  ; CHECK: prfm pstl1keep
  call void @llvm.prefetch(ptr %arrayidx21, i32 1, i32 3, i32 1)
  ret void
}

declare void @llvm.prefetch(ptr nocapture, i32, i32, i32) nounwind

; TBAA metadata referenced by the loads and the store above.
!0 = !{!"int", !1}
!1 = !{!"omnipotent char", !2}
!2 = !{!"Simple C/C++ TBAA"}
!3 = !{!"any pointer", !1}