; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py ; RUN: llc -mtriple=riscv32 -mattr=+d -mattr=+xtheadmemidx -mattr=+m -verify-machineinstrs < %s \ ; RUN: | FileCheck %s -check-prefix=RV32XTHEADMEMIDX ; RUN: llc -mtriple=riscv64 -mattr=+d -mattr=+xtheadmemidx -mattr=+m -verify-machineinstrs < %s \ ; RUN: | FileCheck %s -check-prefix=RV64XTHEADMEMIDX define i8* @lbia(i8* %base, i8* %addr.2, i8 %a) { ; RV32XTHEADMEMIDX-LABEL: lbia: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: th.lbia a3, (a0), -1, 0 ; RV32XTHEADMEMIDX-NEXT: add a2, a3, a2 ; RV32XTHEADMEMIDX-NEXT: sb a2, 0(a1) ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lbia: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.lbia a3, (a0), -1, 0 ; RV64XTHEADMEMIDX-NEXT: add a2, a3, a2 ; RV64XTHEADMEMIDX-NEXT: sb a2, 0(a1) ; RV64XTHEADMEMIDX-NEXT: ret %addr = getelementptr i8, i8* %base, i8 0 %ld = load i8, i8* %addr %addr.1 = getelementptr i8, i8* %base, i8 -1 %res = add i8 %ld, %a store i8 %res, i8* %addr.2 ret i8* %addr.1 } define i8* @lbib(i8* %base, i8 %a) { ; RV32XTHEADMEMIDX-LABEL: lbib: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: th.lbib a2, (a0), 1, 0 ; RV32XTHEADMEMIDX-NEXT: add a1, a2, a1 ; RV32XTHEADMEMIDX-NEXT: sb a1, 1(a0) ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lbib: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.lbib a2, (a0), 1, 0 ; RV64XTHEADMEMIDX-NEXT: add a1, a2, a1 ; RV64XTHEADMEMIDX-NEXT: sb a1, 1(a0) ; RV64XTHEADMEMIDX-NEXT: ret %addr = getelementptr i8, i8* %base, i8 1 %ld = load i8, i8* %addr %addr.1 = getelementptr i8, i8* %base, i8 2 %res = add i8 %ld, %a store i8 %res, i8* %addr.1 ret i8* %addr } define i8* @lbuia(i8* %base, i64* %addr.2, i64 %a) { ; RV32XTHEADMEMIDX-LABEL: lbuia: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: th.lbuia a4, (a0), -1, 0 ; RV32XTHEADMEMIDX-NEXT: add a2, a4, a2 ; RV32XTHEADMEMIDX-NEXT: sltu a4, a2, a4 ; RV32XTHEADMEMIDX-NEXT: add a3, a3, a4 ; RV32XTHEADMEMIDX-NEXT: sw a2, 0(a1) ; RV32XTHEADMEMIDX-NEXT: sw a3, 4(a1) ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lbuia: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.lbuia a3, (a0), -1, 0 ; RV64XTHEADMEMIDX-NEXT: add a2, a3, a2 ; RV64XTHEADMEMIDX-NEXT: sd a2, 0(a1) ; RV64XTHEADMEMIDX-NEXT: ret %addr = getelementptr i8, i8* %base, i8 0 %ld = load i8, i8* %addr %zext = zext i8 %ld to i64 %addr.1 = getelementptr i8, i8* %base, i8 -1 %res = add i64 %zext, %a store i64 %res, i64* %addr.2 ret i8* %addr.1 } define i8* @lbuib(i8* %base, i64 %a, i64* %addr.1) { ; RV32XTHEADMEMIDX-LABEL: lbuib: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: th.lbuib a4, (a0), 1, 0 ; RV32XTHEADMEMIDX-NEXT: add a1, a4, a1 ; RV32XTHEADMEMIDX-NEXT: sltu a4, a1, a4 ; RV32XTHEADMEMIDX-NEXT: add a2, a2, a4 ; RV32XTHEADMEMIDX-NEXT: sw a1, 0(a3) ; RV32XTHEADMEMIDX-NEXT: sw a2, 4(a3) ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lbuib: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.lbuib a3, (a0), 1, 0 ; RV64XTHEADMEMIDX-NEXT: add a1, a3, a1 ; RV64XTHEADMEMIDX-NEXT: sd a1, 0(a2) ; RV64XTHEADMEMIDX-NEXT: ret %addr = getelementptr i8, i8* %base, i8 1 %ld = load i8, i8* %addr %zext = zext i8 %ld to i64 %res = add i64 %zext, %a store i64 %res, i64* %addr.1 ret i8* %addr } define i16* @lhia(i16* %base, i16* %addr.2, i16 %a) { ; RV32XTHEADMEMIDX-LABEL: lhia: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: th.lhia a3, (a0), -16, 1 ; RV32XTHEADMEMIDX-NEXT: add a2, a3, a2 ; RV32XTHEADMEMIDX-NEXT: sh a2, 0(a1) ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lhia: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.lhia a3, (a0), -16, 1 ; RV64XTHEADMEMIDX-NEXT: add a2, a3, a2 ; RV64XTHEADMEMIDX-NEXT: sh a2, 0(a1) ; RV64XTHEADMEMIDX-NEXT: ret %addr = getelementptr i16, i16* %base, i16 0 %ld = load i16, i16* %addr %addr.1 = getelementptr i16, i16* %base, i16 -16 %res = add i16 %ld, %a store i16 %res, i16* %addr.2 ret i16* %addr.1 } define i16* @lhib(i16* %base, i16 %a) { ; RV32XTHEADMEMIDX-LABEL: lhib: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: th.lhib a2, (a0), 2, 0 ; RV32XTHEADMEMIDX-NEXT: add a1, a2, a1 ; RV32XTHEADMEMIDX-NEXT: sh a1, 2(a0) ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lhib: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.lhib a2, (a0), 2, 0 ; RV64XTHEADMEMIDX-NEXT: add a1, a2, a1 ; RV64XTHEADMEMIDX-NEXT: sh a1, 2(a0) ; RV64XTHEADMEMIDX-NEXT: ret %addr = getelementptr i16, i16* %base, i16 1 %ld = load i16, i16* %addr %addr.1 = getelementptr i16, i16* %base, i16 2 %res = add i16 %ld, %a store i16 %res, i16* %addr.1 ret i16* %addr } define i16* @lhuia(i16* %base, i64* %addr.2, i64 %a) { ; RV32XTHEADMEMIDX-LABEL: lhuia: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: th.lhuia a4, (a0), -16, 1 ; RV32XTHEADMEMIDX-NEXT: add a2, a4, a2 ; RV32XTHEADMEMIDX-NEXT: sltu a4, a2, a4 ; RV32XTHEADMEMIDX-NEXT: add a3, a3, a4 ; RV32XTHEADMEMIDX-NEXT: sw a2, 0(a1) ; RV32XTHEADMEMIDX-NEXT: sw a3, 4(a1) ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lhuia: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.lhuia a3, (a0), -16, 1 ; RV64XTHEADMEMIDX-NEXT: add a2, a3, a2 ; RV64XTHEADMEMIDX-NEXT: sd a2, 0(a1) ; RV64XTHEADMEMIDX-NEXT: ret %addr = getelementptr i16, i16* %base, i16 0 %ld = load i16, i16* %addr %zext = zext i16 %ld to i64 %addr.1 = getelementptr i16, i16* %base, i16 -16 %res = add i64 %zext, %a store i64 %res, i64* %addr.2 ret i16* %addr.1 } define i16* @lhuib(i16* %base, i64 %a, i64* %addr.1) { ; RV32XTHEADMEMIDX-LABEL: lhuib: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: th.lhuib a4, (a0), 2, 0 ; RV32XTHEADMEMIDX-NEXT: add a1, a4, a1 ; RV32XTHEADMEMIDX-NEXT: sltu a4, a1, a4 ; RV32XTHEADMEMIDX-NEXT: add a2, a2, a4 ; RV32XTHEADMEMIDX-NEXT: sw a1, 0(a3) ; RV32XTHEADMEMIDX-NEXT: sw a2, 4(a3) ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lhuib: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.lhuib a3, (a0), 2, 0 ; RV64XTHEADMEMIDX-NEXT: add a1, a3, a1 ; RV64XTHEADMEMIDX-NEXT: sd a1, 0(a2) ; RV64XTHEADMEMIDX-NEXT: ret %addr = getelementptr i16, i16* %base, i16 1 %ld = load i16, i16* %addr %zext = zext i16 %ld to i64 %res = add i64 %zext, %a store i64 %res, i64* %addr.1 ret i16* %addr } define i32* @lwia(i32* %base, i32* %addr.2, i32 %a) { ; RV32XTHEADMEMIDX-LABEL: lwia: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: th.lwia a3, (a0), -16, 2 ; RV32XTHEADMEMIDX-NEXT: add a2, a3, a2 ; RV32XTHEADMEMIDX-NEXT: sw a2, 0(a1) ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lwia: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.lwia a3, (a0), -16, 2 ; RV64XTHEADMEMIDX-NEXT: add a2, a3, a2 ; RV64XTHEADMEMIDX-NEXT: sw a2, 0(a1) ; RV64XTHEADMEMIDX-NEXT: ret %addr = getelementptr i32, i32* %base, i32 0 %ld = load i32, i32* %addr %addr.1 = getelementptr i32, i32* %base, i32 -16 %res = add i32 %ld, %a store i32 %res, i32* %addr.2 ret i32* %addr.1 } define i32* @lwib(i32* %base, i32 %a) { ; RV32XTHEADMEMIDX-LABEL: lwib: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: th.lwib a2, (a0), 4, 0 ; RV32XTHEADMEMIDX-NEXT: add a1, a2, a1 ; RV32XTHEADMEMIDX-NEXT: sw a1, 4(a0) ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lwib: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.lwib a2, (a0), 4, 0 ; RV64XTHEADMEMIDX-NEXT: add a1, a2, a1 ; RV64XTHEADMEMIDX-NEXT: sw a1, 4(a0) ; RV64XTHEADMEMIDX-NEXT: ret %addr = getelementptr i32, i32* %base, i32 1 %ld = load i32, i32* %addr %addr.1 = getelementptr i32, i32* %base, i32 2 %res = add i32 %ld, %a store i32 %res, i32* %addr.1 ret i32* %addr } define i32* @lwuia(i32* %base, i64* %addr.2, i64 %a) { ; RV32XTHEADMEMIDX-LABEL: lwuia: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: th.lwia a4, (a0), -16, 2 ; RV32XTHEADMEMIDX-NEXT: add a2, a4, a2 ; RV32XTHEADMEMIDX-NEXT: sltu a4, a2, a4 ; RV32XTHEADMEMIDX-NEXT: add a3, a3, a4 ; RV32XTHEADMEMIDX-NEXT: sw a2, 0(a1) ; RV32XTHEADMEMIDX-NEXT: sw a3, 4(a1) ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lwuia: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.lwuia a3, (a0), -16, 2 ; RV64XTHEADMEMIDX-NEXT: add a2, a3, a2 ; RV64XTHEADMEMIDX-NEXT: sd a2, 0(a1) ; RV64XTHEADMEMIDX-NEXT: ret %addr = getelementptr i32, i32* %base, i32 0 %ld = load i32, i32* %addr %zext = zext i32 %ld to i64 %addr.1 = getelementptr i32, i32* %base, i32 -16 %res = add i64 %zext, %a store i64 %res, i64* %addr.2 ret i32* %addr.1 } define i32* @lwuib(i32* %base, i64 %a, i64* %addr.1) { ; RV32XTHEADMEMIDX-LABEL: lwuib: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: th.lwib a4, (a0), 4, 0 ; RV32XTHEADMEMIDX-NEXT: add a1, a4, a1 ; RV32XTHEADMEMIDX-NEXT: sltu a4, a1, a4 ; RV32XTHEADMEMIDX-NEXT: add a2, a2, a4 ; RV32XTHEADMEMIDX-NEXT: sw a1, 0(a3) ; RV32XTHEADMEMIDX-NEXT: sw a2, 4(a3) ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lwuib: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.lwuib a3, (a0), 4, 0 ; RV64XTHEADMEMIDX-NEXT: add a1, a3, a1 ; RV64XTHEADMEMIDX-NEXT: sd a1, 0(a2) ; RV64XTHEADMEMIDX-NEXT: ret %addr = getelementptr i32, i32* %base, i32 1 %ld = load i32, i32* %addr %zext = zext i32 %ld to i64 %res = add i64 %zext, %a store i64 %res, i64* %addr.1 ret i32* %addr } define i64* @ldia(i64* %base, i64* %addr.2, i64 %a) { ; RV32XTHEADMEMIDX-LABEL: ldia: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: lw a4, 4(a0) ; RV32XTHEADMEMIDX-NEXT: lw a5, 0(a0) ; RV32XTHEADMEMIDX-NEXT: addi a0, a0, -128 ; RV32XTHEADMEMIDX-NEXT: add a3, a4, a3 ; RV32XTHEADMEMIDX-NEXT: add a2, a5, a2 ; RV32XTHEADMEMIDX-NEXT: sltu a4, a2, a5 ; RV32XTHEADMEMIDX-NEXT: add a3, a3, a4 ; RV32XTHEADMEMIDX-NEXT: sw a2, 0(a1) ; RV32XTHEADMEMIDX-NEXT: sw a3, 4(a1) ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: ldia: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.ldia a3, (a0), -16, 3 ; RV64XTHEADMEMIDX-NEXT: add a2, a3, a2 ; RV64XTHEADMEMIDX-NEXT: sd a2, 0(a1) ; RV64XTHEADMEMIDX-NEXT: ret %addr = getelementptr i64, i64* %base, i64 0 %ld = load i64, i64* %addr %addr.1 = getelementptr i64, i64* %base, i64 -16 %res = add i64 %ld, %a store i64 %res, i64* %addr.2 ret i64* %addr.1 } define i64* @ldib(i64* %base, i64 %a) { ; RV32XTHEADMEMIDX-LABEL: ldib: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: th.lwib a3, (a0), 8, 0 ; RV32XTHEADMEMIDX-NEXT: lw a4, 4(a0) ; RV32XTHEADMEMIDX-NEXT: add a1, a3, a1 ; RV32XTHEADMEMIDX-NEXT: sltu a3, a1, a3 ; RV32XTHEADMEMIDX-NEXT: add a2, a2, a3 ; RV32XTHEADMEMIDX-NEXT: add a2, a4, a2 ; RV32XTHEADMEMIDX-NEXT: sw a1, 8(a0) ; RV32XTHEADMEMIDX-NEXT: sw a2, 12(a0) ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: ldib: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.ldib a2, (a0), 8, 0 ; RV64XTHEADMEMIDX-NEXT: add a1, a2, a1 ; RV64XTHEADMEMIDX-NEXT: sd a1, 8(a0) ; RV64XTHEADMEMIDX-NEXT: ret %addr = getelementptr i64, i64* %base, i64 1 %ld = load i64, i64* %addr %addr.1 = getelementptr i64, i64* %base, i64 2 %res = add i64 %ld, %a store i64 %res, i64* %addr.1 ret i64* %addr } define i8* @sbia(i8* %base, i8 %a, i8 %b) { ; RV32XTHEADMEMIDX-LABEL: sbia: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: add a1, a1, a2 ; RV32XTHEADMEMIDX-NEXT: th.sbia a1, (a0), 1, 0 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: sbia: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: add a1, a1, a2 ; RV64XTHEADMEMIDX-NEXT: th.sbia a1, (a0), 1, 0 ; RV64XTHEADMEMIDX-NEXT: ret %addr.1 = getelementptr i8, i8* %base, i8 1 %res = add i8 %a, %b store i8 %res, i8* %base ret i8* %addr.1 } define i8* @sbib(i8* %base, i8 %a, i8 %b) { ; RV32XTHEADMEMIDX-LABEL: sbib: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: add a1, a1, a2 ; RV32XTHEADMEMIDX-NEXT: th.sbib a1, (a0), 1, 0 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: sbib: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: add a1, a1, a2 ; RV64XTHEADMEMIDX-NEXT: th.sbib a1, (a0), 1, 0 ; RV64XTHEADMEMIDX-NEXT: ret %addr.1 = getelementptr i8, i8* %base, i8 1 %res = add i8 %a, %b store i8 %res, i8* %addr.1 ret i8* %addr.1 } define i16* @shia(i16* %base, i16 %a, i16 %b) { ; RV32XTHEADMEMIDX-LABEL: shia: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: add a1, a1, a2 ; RV32XTHEADMEMIDX-NEXT: th.shia a1, (a0), -9, 1 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: shia: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: add a1, a1, a2 ; RV64XTHEADMEMIDX-NEXT: th.shia a1, (a0), -9, 1 ; RV64XTHEADMEMIDX-NEXT: ret %addr.1 = getelementptr i16, i16* %base, i16 -9 %res = add i16 %a, %b store i16 %res, i16* %base ret i16* %addr.1 } define i16* @shib(i16* %base, i16 %a, i16 %b) { ; RV32XTHEADMEMIDX-LABEL: shib: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: add a1, a1, a2 ; RV32XTHEADMEMIDX-NEXT: th.shib a1, (a0), 2, 0 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: shib: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: add a1, a1, a2 ; RV64XTHEADMEMIDX-NEXT: th.shib a1, (a0), 2, 0 ; RV64XTHEADMEMIDX-NEXT: ret %addr.1 = getelementptr i16, i16* %base, i16 1 %res = add i16 %a, %b store i16 %res, i16* %addr.1 ret i16* %addr.1 } define i32* @swia(i32* %base, i32 %a, i32 %b) { ; RV32XTHEADMEMIDX-LABEL: swia: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: add a1, a1, a2 ; RV32XTHEADMEMIDX-NEXT: th.swia a1, (a0), 8, 2 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: swia: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: add a1, a1, a2 ; RV64XTHEADMEMIDX-NEXT: th.swia a1, (a0), 8, 2 ; RV64XTHEADMEMIDX-NEXT: ret %addr.1 = getelementptr i32, i32* %base, i32 8 %res = add i32 %a, %b store i32 %res, i32* %base ret i32* %addr.1 } define i32* @swib(i32* %base, i32 %a, i32 %b) { ; RV32XTHEADMEMIDX-LABEL: swib: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: add a1, a1, a2 ; RV32XTHEADMEMIDX-NEXT: th.swib a1, (a0), -13, 3 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: swib: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: add a1, a1, a2 ; RV64XTHEADMEMIDX-NEXT: th.swib a1, (a0), -13, 3 ; RV64XTHEADMEMIDX-NEXT: ret %addr.1 = getelementptr i32, i32* %base, i32 -26 %res = add i32 %a, %b store i32 %res, i32* %addr.1 ret i32* %addr.1 } define i64* @sdia(i64* %base, i64 %a, i64 %b) { ; RV32XTHEADMEMIDX-LABEL: sdia: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: addi a5, a0, 64 ; RV32XTHEADMEMIDX-NEXT: add a2, a2, a4 ; RV32XTHEADMEMIDX-NEXT: add a3, a1, a3 ; RV32XTHEADMEMIDX-NEXT: sltu a1, a3, a1 ; RV32XTHEADMEMIDX-NEXT: add a1, a2, a1 ; RV32XTHEADMEMIDX-NEXT: sw a3, 0(a0) ; RV32XTHEADMEMIDX-NEXT: sw a1, 4(a0) ; RV32XTHEADMEMIDX-NEXT: mv a0, a5 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: sdia: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: add a1, a1, a2 ; RV64XTHEADMEMIDX-NEXT: th.sdia a1, (a0), 8, 3 ; RV64XTHEADMEMIDX-NEXT: ret %addr.1 = getelementptr i64, i64* %base, i64 8 %res = add i64 %a, %b store i64 %res, i64* %base ret i64* %addr.1 } define i64* @sdib(i64* %base, i64 %a, i64 %b) { ; RV32XTHEADMEMIDX-LABEL: sdib: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: add a2, a2, a4 ; RV32XTHEADMEMIDX-NEXT: add a3, a1, a3 ; RV32XTHEADMEMIDX-NEXT: sltu a1, a3, a1 ; RV32XTHEADMEMIDX-NEXT: add a1, a2, a1 ; RV32XTHEADMEMIDX-NEXT: th.swib a3, (a0), 8, 0 ; RV32XTHEADMEMIDX-NEXT: sw a1, 4(a0) ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: sdib: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: add a1, a1, a2 ; RV64XTHEADMEMIDX-NEXT: th.sdib a1, (a0), 8, 0 ; RV64XTHEADMEMIDX-NEXT: ret %addr.1 = getelementptr i64, i64* %base, i64 1 %res = add i64 %a, %b store i64 %res, i64* %addr.1 ret i64* %addr.1 } define i64 @lrb(i8* %a, i64 %b) { ; RV32XTHEADMEMIDX-LABEL: lrb: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: th.lrb a1, a0, a1, 0 ; RV32XTHEADMEMIDX-NEXT: srai a2, a1, 31 ; RV32XTHEADMEMIDX-NEXT: add a0, a1, a1 ; RV32XTHEADMEMIDX-NEXT: sltu a1, a0, a1 ; RV32XTHEADMEMIDX-NEXT: add a2, a2, a2 ; RV32XTHEADMEMIDX-NEXT: add a1, a2, a1 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lrb: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.lrb a0, a0, a1, 0 ; RV64XTHEADMEMIDX-NEXT: add a0, a0, a0 ; RV64XTHEADMEMIDX-NEXT: ret %1 = getelementptr i8, i8* %a, i64 %b %2 = load i8, i8* %1, align 1 %3 = sext i8 %2 to i64 %4 = add i64 %3, %3 ret i64 %4 } define i64 @lurb(i8* %a, i32 %b) { ; RV32XTHEADMEMIDX-LABEL: lurb: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: th.lrb a1, a0, a1, 0 ; RV32XTHEADMEMIDX-NEXT: srai a2, a1, 31 ; RV32XTHEADMEMIDX-NEXT: add a0, a1, a1 ; RV32XTHEADMEMIDX-NEXT: sltu a1, a0, a1 ; RV32XTHEADMEMIDX-NEXT: add a2, a2, a2 ; RV32XTHEADMEMIDX-NEXT: add a1, a2, a1 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lurb: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.lurb a0, a0, a1, 0 ; RV64XTHEADMEMIDX-NEXT: add a0, a0, a0 ; RV64XTHEADMEMIDX-NEXT: ret %1 = zext i32 %b to i64 %2 = getelementptr i8, i8* %a, i64 %1 %3 = load i8, i8* %2, align 1 %4 = sext i8 %3 to i64 %5 = add i64 %4, %4 ret i64 %5 } define i64 @lrbu(i8* %a, i64 %b) { ; RV32XTHEADMEMIDX-LABEL: lrbu: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: th.lrbu a1, a0, a1, 0 ; RV32XTHEADMEMIDX-NEXT: add a0, a1, a1 ; RV32XTHEADMEMIDX-NEXT: sltu a1, a0, a1 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lrbu: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.lrbu a0, a0, a1, 0 ; RV64XTHEADMEMIDX-NEXT: add a0, a0, a0 ; RV64XTHEADMEMIDX-NEXT: ret %1 = getelementptr i8, i8* %a, i64 %b %2 = load i8, i8* %1, align 1 %3 = zext i8 %2 to i64 %4 = add i64 %3, %3 ret i64 %4 } define i64 @lurbu(i8* %a, i32 %b) { ; RV32XTHEADMEMIDX-LABEL: lurbu: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: th.lrbu a1, a0, a1, 0 ; RV32XTHEADMEMIDX-NEXT: add a0, a1, a1 ; RV32XTHEADMEMIDX-NEXT: sltu a1, a0, a1 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lurbu: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.lurbu a0, a0, a1, 0 ; RV64XTHEADMEMIDX-NEXT: add a0, a0, a0 ; RV64XTHEADMEMIDX-NEXT: ret %1 = zext i32 %b to i64 %2 = getelementptr i8, i8* %a, i64 %1 %3 = load i8, i8* %2, align 1 %4 = zext i8 %3 to i64 %5 = add i64 %4, %4 ret i64 %5 } define i64 @lrh(i16* %a, i64 %b) { ; RV32XTHEADMEMIDX-LABEL: lrh: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: th.lrh a1, a0, a1, 1 ; RV32XTHEADMEMIDX-NEXT: srai a2, a1, 31 ; RV32XTHEADMEMIDX-NEXT: add a0, a1, a1 ; RV32XTHEADMEMIDX-NEXT: sltu a1, a0, a1 ; RV32XTHEADMEMIDX-NEXT: add a2, a2, a2 ; RV32XTHEADMEMIDX-NEXT: add a1, a2, a1 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lrh: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.lrh a0, a0, a1, 1 ; RV64XTHEADMEMIDX-NEXT: add a0, a0, a0 ; RV64XTHEADMEMIDX-NEXT: ret %1 = getelementptr i16, i16* %a, i64 %b %2 = load i16, i16* %1, align 4 %3 = sext i16 %2 to i64 %4 = add i64 %3, %3 ret i64 %4 } define i64 @lurh(i16* %a, i32 %b) { ; RV32XTHEADMEMIDX-LABEL: lurh: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: th.lrh a1, a0, a1, 1 ; RV32XTHEADMEMIDX-NEXT: srai a2, a1, 31 ; RV32XTHEADMEMIDX-NEXT: add a0, a1, a1 ; RV32XTHEADMEMIDX-NEXT: sltu a1, a0, a1 ; RV32XTHEADMEMIDX-NEXT: add a2, a2, a2 ; RV32XTHEADMEMIDX-NEXT: add a1, a2, a1 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lurh: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.lurh a0, a0, a1, 1 ; RV64XTHEADMEMIDX-NEXT: add a0, a0, a0 ; RV64XTHEADMEMIDX-NEXT: ret %1 = zext i32 %b to i64 %2 = getelementptr i16, i16* %a, i64 %1 %3 = load i16, i16* %2, align 4 %4 = sext i16 %3 to i64 %5 = add i64 %4, %4 ret i64 %5 } define i64 @lrhu(i16* %a, i64 %b) { ; RV32XTHEADMEMIDX-LABEL: lrhu: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: th.lrhu a1, a0, a1, 1 ; RV32XTHEADMEMIDX-NEXT: add a0, a1, a1 ; RV32XTHEADMEMIDX-NEXT: sltu a1, a0, a1 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lrhu: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.lrhu a0, a0, a1, 1 ; RV64XTHEADMEMIDX-NEXT: add a0, a0, a0 ; RV64XTHEADMEMIDX-NEXT: ret %1 = getelementptr i16, i16* %a, i64 %b %2 = load i16, i16* %1, align 4 %3 = zext i16 %2 to i64 %4 = add i64 %3, %3 ret i64 %4 } define i64 @lurhu(i16* %a, i32 %b) { ; RV32XTHEADMEMIDX-LABEL: lurhu: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: th.lrhu a1, a0, a1, 1 ; RV32XTHEADMEMIDX-NEXT: add a0, a1, a1 ; RV32XTHEADMEMIDX-NEXT: sltu a1, a0, a1 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lurhu: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.lurhu a0, a0, a1, 1 ; RV64XTHEADMEMIDX-NEXT: add a0, a0, a0 ; RV64XTHEADMEMIDX-NEXT: ret %1 = zext i32 %b to i64 %2 = getelementptr i16, i16* %a, i64 %1 %3 = load i16, i16* %2, align 4 %4 = zext i16 %3 to i64 %5 = add i64 %4, %4 ret i64 %5 } define i64 @lrw(i32* %a, i64 %b) { ; RV32XTHEADMEMIDX-LABEL: lrw: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: th.lrw a1, a0, a1, 2 ; RV32XTHEADMEMIDX-NEXT: srai a2, a1, 31 ; RV32XTHEADMEMIDX-NEXT: add a0, a1, a1 ; RV32XTHEADMEMIDX-NEXT: sltu a1, a0, a1 ; RV32XTHEADMEMIDX-NEXT: add a2, a2, a2 ; RV32XTHEADMEMIDX-NEXT: add a1, a2, a1 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lrw: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.lrw a0, a0, a1, 2 ; RV64XTHEADMEMIDX-NEXT: add a0, a0, a0 ; RV64XTHEADMEMIDX-NEXT: ret %1 = getelementptr i32, i32* %a, i64 %b %2 = load i32, i32* %1, align 4 %3 = sext i32 %2 to i64 %4 = add i64 %3, %3 ret i64 %4 } define i64 @lurw(i32* %a, i32 %b) { ; RV32XTHEADMEMIDX-LABEL: lurw: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: th.lrw a1, a0, a1, 2 ; RV32XTHEADMEMIDX-NEXT: srai a2, a1, 31 ; RV32XTHEADMEMIDX-NEXT: add a0, a1, a1 ; RV32XTHEADMEMIDX-NEXT: sltu a1, a0, a1 ; RV32XTHEADMEMIDX-NEXT: add a2, a2, a2 ; RV32XTHEADMEMIDX-NEXT: add a1, a2, a1 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lurw: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.lurw a0, a0, a1, 2 ; RV64XTHEADMEMIDX-NEXT: add a0, a0, a0 ; RV64XTHEADMEMIDX-NEXT: ret %1 = zext i32 %b to i64 %2 = getelementptr i32, i32* %a, i64 %1 %3 = load i32, i32* %2, align 4 %4 = sext i32 %3 to i64 %5 = add i64 %4, %4 ret i64 %5 } define i64 @lrwu(i32* %a, i64 %b) { ; RV32XTHEADMEMIDX-LABEL: lrwu: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: th.lrw a1, a0, a1, 2 ; RV32XTHEADMEMIDX-NEXT: add a0, a1, a1 ; RV32XTHEADMEMIDX-NEXT: sltu a1, a0, a1 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lrwu: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.lrwu a0, a0, a1, 2 ; RV64XTHEADMEMIDX-NEXT: add a0, a0, a0 ; RV64XTHEADMEMIDX-NEXT: ret %1 = getelementptr i32, i32* %a, i64 %b %2 = load i32, i32* %1, align 4 %3 = zext i32 %2 to i64 %4 = add i64 %3, %3 ret i64 %4 } define i64 @lurwu(i32* %a, i32 %b) { ; RV32XTHEADMEMIDX-LABEL: lurwu: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: th.lrw a1, a0, a1, 2 ; RV32XTHEADMEMIDX-NEXT: add a0, a1, a1 ; RV32XTHEADMEMIDX-NEXT: sltu a1, a0, a1 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lurwu: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.lurwu a0, a0, a1, 2 ; RV64XTHEADMEMIDX-NEXT: add a0, a0, a0 ; RV64XTHEADMEMIDX-NEXT: ret %1 = zext i32 %b to i64 %2 = getelementptr i32, i32* %a, i64 %1 %3 = load i32, i32* %2, align 4 %4 = zext i32 %3 to i64 %5 = add i64 %4, %4 ret i64 %5 } define i64 @lrd(i64* %a, i64 %b) { ; RV32XTHEADMEMIDX-LABEL: lrd: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: slli a2, a1, 3 ; RV32XTHEADMEMIDX-NEXT: th.lrw a1, a0, a1, 3 ; RV32XTHEADMEMIDX-NEXT: add a0, a0, a2 ; RV32XTHEADMEMIDX-NEXT: lw a2, 4(a0) ; RV32XTHEADMEMIDX-NEXT: add a0, a1, a1 ; RV32XTHEADMEMIDX-NEXT: sltu a1, a0, a1 ; RV32XTHEADMEMIDX-NEXT: add a2, a2, a2 ; RV32XTHEADMEMIDX-NEXT: add a1, a2, a1 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lrd: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.lrd a0, a0, a1, 3 ; RV64XTHEADMEMIDX-NEXT: add a0, a0, a0 ; RV64XTHEADMEMIDX-NEXT: ret %1 = getelementptr i64, i64* %a, i64 %b %2 = load i64, i64* %1, align 8 %3 = add i64 %2, %2 ret i64 %3 } define i64 @lrd_2(i64* %a, i64 %b) { ; RV32XTHEADMEMIDX-LABEL: lrd_2: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: addi a2, a0, 96 ; RV32XTHEADMEMIDX-NEXT: th.lrw a2, a2, a1, 3 ; RV32XTHEADMEMIDX-NEXT: addi a0, a0, 100 ; RV32XTHEADMEMIDX-NEXT: th.lrw a1, a0, a1, 3 ; RV32XTHEADMEMIDX-NEXT: add a0, a2, a2 ; RV32XTHEADMEMIDX-NEXT: sltu a2, a0, a2 ; RV32XTHEADMEMIDX-NEXT: add a1, a1, a1 ; RV32XTHEADMEMIDX-NEXT: add a1, a1, a2 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lrd_2: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: addi a0, a0, 96 ; RV64XTHEADMEMIDX-NEXT: th.lrd a0, a0, a1, 3 ; RV64XTHEADMEMIDX-NEXT: add a0, a0, a0 ; RV64XTHEADMEMIDX-NEXT: ret %1 = add i64 %b, 12 %2 = getelementptr i64, i64* %a, i64 %1 %3 = load i64, i64* %2, align 8 %4 = add i64 %3, %3 ret i64 %4 } define i64 @lurd(i64* %a, i32 %b) { ; RV32XTHEADMEMIDX-LABEL: lurd: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: slli a2, a1, 3 ; RV32XTHEADMEMIDX-NEXT: th.lrw a1, a0, a1, 3 ; RV32XTHEADMEMIDX-NEXT: add a0, a0, a2 ; RV32XTHEADMEMIDX-NEXT: lw a2, 4(a0) ; RV32XTHEADMEMIDX-NEXT: add a0, a1, a1 ; RV32XTHEADMEMIDX-NEXT: sltu a1, a0, a1 ; RV32XTHEADMEMIDX-NEXT: add a2, a2, a2 ; RV32XTHEADMEMIDX-NEXT: add a1, a2, a1 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lurd: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: th.lurd a0, a0, a1, 3 ; RV64XTHEADMEMIDX-NEXT: add a0, a0, a0 ; RV64XTHEADMEMIDX-NEXT: ret %1 = zext i32 %b to i64 %2 = getelementptr i64, i64* %a, i64 %1 %3 = load i64, i64* %2, align 8 %4 = add i64 %3, %3 ret i64 %4 } define void @srb(i8* %a, i64 %b, i8 %c) { ; RV32XTHEADMEMIDX-LABEL: srb: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: add a3, a3, a3 ; RV32XTHEADMEMIDX-NEXT: th.srb a3, a0, a1, 0 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: srb: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: add a2, a2, a2 ; RV64XTHEADMEMIDX-NEXT: th.srb a2, a0, a1, 0 ; RV64XTHEADMEMIDX-NEXT: ret %1 = add i8 %c, %c %2 = getelementptr i8, i8* %a, i64 %b store i8 %1, i8* %2, align 8 ret void } define void @surb(i8* %a, i32 %b, i8 %c) { ; RV32XTHEADMEMIDX-LABEL: surb: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: add a2, a2, a2 ; RV32XTHEADMEMIDX-NEXT: th.srb a2, a0, a1, 0 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: surb: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: add a2, a2, a2 ; RV64XTHEADMEMIDX-NEXT: th.surb a2, a0, a1, 0 ; RV64XTHEADMEMIDX-NEXT: ret %1 = zext i32 %b to i64 %2 = add i8 %c, %c %3 = getelementptr i8, i8* %a, i64 %1 store i8 %2, i8* %3, align 8 ret void } define void @srh(i16* %a, i64 %b, i16 %c) { ; RV32XTHEADMEMIDX-LABEL: srh: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: add a3, a3, a3 ; RV32XTHEADMEMIDX-NEXT: th.srh a3, a0, a1, 1 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: srh: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: add a2, a2, a2 ; RV64XTHEADMEMIDX-NEXT: th.srh a2, a0, a1, 1 ; RV64XTHEADMEMIDX-NEXT: ret %1 = add i16 %c, %c %2 = getelementptr i16, i16* %a, i64 %b store i16 %1, i16* %2, align 8 ret void } define void @surh(i16* %a, i32 %b, i16 %c) { ; RV32XTHEADMEMIDX-LABEL: surh: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: add a2, a2, a2 ; RV32XTHEADMEMIDX-NEXT: th.srh a2, a0, a1, 1 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: surh: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: add a2, a2, a2 ; RV64XTHEADMEMIDX-NEXT: th.surh a2, a0, a1, 1 ; RV64XTHEADMEMIDX-NEXT: ret %1 = zext i32 %b to i64 %2 = add i16 %c, %c %3 = getelementptr i16, i16* %a, i64 %1 store i16 %2, i16* %3, align 8 ret void } define void @srw(i32* %a, i64 %b, i32 %c) { ; RV32XTHEADMEMIDX-LABEL: srw: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: add a3, a3, a3 ; RV32XTHEADMEMIDX-NEXT: th.srw a3, a0, a1, 2 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: srw: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: add a2, a2, a2 ; RV64XTHEADMEMIDX-NEXT: th.srw a2, a0, a1, 2 ; RV64XTHEADMEMIDX-NEXT: ret %1 = add i32 %c, %c %2 = getelementptr i32, i32* %a, i64 %b store i32 %1, i32* %2, align 8 ret void } define void @surw(i32* %a, i32 %b, i32 %c) { ; RV32XTHEADMEMIDX-LABEL: surw: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: add a2, a2, a2 ; RV32XTHEADMEMIDX-NEXT: th.srw a2, a0, a1, 2 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: surw: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: add a2, a2, a2 ; RV64XTHEADMEMIDX-NEXT: th.surw a2, a0, a1, 2 ; RV64XTHEADMEMIDX-NEXT: ret %1 = zext i32 %b to i64 %2 = add i32 %c, %c %3 = getelementptr i32, i32* %a, i64 %1 store i32 %2, i32* %3, align 8 ret void } define void @srd(i64* %a, i64 %b, i64 %c) { ; RV32XTHEADMEMIDX-LABEL: srd: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: add a2, a3, a3 ; RV32XTHEADMEMIDX-NEXT: sltu a3, a2, a3 ; RV32XTHEADMEMIDX-NEXT: add a4, a4, a4 ; RV32XTHEADMEMIDX-NEXT: add a3, a4, a3 ; RV32XTHEADMEMIDX-NEXT: slli a4, a1, 3 ; RV32XTHEADMEMIDX-NEXT: add a4, a0, a4 ; RV32XTHEADMEMIDX-NEXT: th.srw a2, a0, a1, 3 ; RV32XTHEADMEMIDX-NEXT: sw a3, 4(a4) ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: srd: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: add a2, a2, a2 ; RV64XTHEADMEMIDX-NEXT: th.srd a2, a0, a1, 3 ; RV64XTHEADMEMIDX-NEXT: ret %1 = add i64 %c, %c %2 = getelementptr i64, i64* %a, i64 %b store i64 %1, i64* %2, align 8 ret void } define void @surd(i64* %a, i32 %b, i64 %c) { ; RV32XTHEADMEMIDX-LABEL: surd: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: add a4, a2, a2 ; RV32XTHEADMEMIDX-NEXT: sltu a2, a4, a2 ; RV32XTHEADMEMIDX-NEXT: add a3, a3, a3 ; RV32XTHEADMEMIDX-NEXT: add a2, a3, a2 ; RV32XTHEADMEMIDX-NEXT: slli a3, a1, 3 ; RV32XTHEADMEMIDX-NEXT: add a3, a0, a3 ; RV32XTHEADMEMIDX-NEXT: th.srw a4, a0, a1, 3 ; RV32XTHEADMEMIDX-NEXT: sw a2, 4(a3) ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: surd: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: add a2, a2, a2 ; RV64XTHEADMEMIDX-NEXT: th.surd a2, a0, a1, 3 ; RV64XTHEADMEMIDX-NEXT: ret %1 = zext i32 %b to i64 %2 = add i64 %c, %c %3 = getelementptr i64, i64* %a, i64 %1 store i64 %2, i64* %3, align 8 ret void } define i32* @test_simm5(i32* %base, i32 %a, i32 %b) { ; RV32XTHEADMEMIDX-LABEL: test_simm5: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: add a1, a1, a2 ; RV32XTHEADMEMIDX-NEXT: th.swia a1, (a0), -12, 2 ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: test_simm5: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: add a1, a1, a2 ; RV64XTHEADMEMIDX-NEXT: th.swia a1, (a0), -12, 2 ; RV64XTHEADMEMIDX-NEXT: ret %addr.1 = getelementptr i32, i32* %base, i32 -12 %res = add i32 %a, %b store i32 %res, i32* %base ret i32* %addr.1 } define i64 @lrd_large_shift(i64* %a, i64 %b) { ; RV32XTHEADMEMIDX-LABEL: lrd_large_shift: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: slli a1, a1, 5 ; RV32XTHEADMEMIDX-NEXT: add a1, a1, a0 ; RV32XTHEADMEMIDX-NEXT: lw a0, 384(a1) ; RV32XTHEADMEMIDX-NEXT: lw a1, 388(a1) ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lrd_large_shift: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: slli a1, a1, 5 ; RV64XTHEADMEMIDX-NEXT: add a0, a1, a0 ; RV64XTHEADMEMIDX-NEXT: ld a0, 384(a0) ; RV64XTHEADMEMIDX-NEXT: ret %1 = add i64 %b, 12 %2 = shl i64 %1, 2 %3 = getelementptr i64, i64* %a, i64 %2 %4 = load i64, i64* %3, align 8 ret i64 %4 } define i64 @lrd_large_offset(i64* %a, i64 %b) { ; RV32XTHEADMEMIDX-LABEL: lrd_large_offset: ; RV32XTHEADMEMIDX: # %bb.0: ; RV32XTHEADMEMIDX-NEXT: slli a1, a1, 3 ; RV32XTHEADMEMIDX-NEXT: add a0, a1, a0 ; RV32XTHEADMEMIDX-NEXT: lui a1, 23 ; RV32XTHEADMEMIDX-NEXT: addi a1, a1, 1792 ; RV32XTHEADMEMIDX-NEXT: add a1, a0, a1 ; RV32XTHEADMEMIDX-NEXT: lw a0, 0(a1) ; RV32XTHEADMEMIDX-NEXT: lw a1, 4(a1) ; RV32XTHEADMEMIDX-NEXT: ret ; ; RV64XTHEADMEMIDX-LABEL: lrd_large_offset: ; RV64XTHEADMEMIDX: # %bb.0: ; RV64XTHEADMEMIDX-NEXT: slli a1, a1, 3 ; RV64XTHEADMEMIDX-NEXT: add a0, a1, a0 ; RV64XTHEADMEMIDX-NEXT: lui a1, 23 ; RV64XTHEADMEMIDX-NEXT: add a0, a0, a1 ; RV64XTHEADMEMIDX-NEXT: ld a0, 1792(a0) ; RV64XTHEADMEMIDX-NEXT: ret %1 = add i64 %b, 12000 %2 = getelementptr i64, i64* %a, i64 %1 %3 = load i64, i64* %2, align 8 ret i64 %3 }