285 lines
10 KiB
YAML
285 lines
10 KiB
YAML
# NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
|
# RUN: llc -mtriple riscv32 -mattr=+zve64x -start-before=prologepilog -o - \
|
|
# RUN: -verify-machineinstrs %s | FileCheck %s --check-prefix=RV32
|
|
# RUN: llc -mtriple riscv32 -mattr=+v -start-before=prologepilog -o - \
|
|
# RUN: -verify-machineinstrs %s | FileCheck %s --check-prefix=RV32
|
|
# RUN: llc -mtriple riscv64 -mattr=+zve64x -start-before=prologepilog -o - \
|
|
# RUN: -verify-machineinstrs %s | FileCheck %s --check-prefix=RV64
|
|
# RUN: llc -mtriple riscv64 -mattr=+v -start-before=prologepilog -o - \
|
|
# RUN: -verify-machineinstrs %s | FileCheck %s --check-prefix=RV64
|
|
--- |
|
|
target datalayout = "e-m:e-p:64:64-i64:64-i128:128-n64-S128"
|
|
target triple = "riscv64"
|
|
|
|
declare void @extern(<vscale x 4 x i32>*)
|
|
|
|
define void @rvv_stack_align8() #0 {
|
|
; RV32-LABEL: rvv_stack_align8:
|
|
; RV32: # %bb.0:
|
|
; RV32-NEXT: addi sp, sp, -48
|
|
; RV32-NEXT: sw ra, 44(sp) # 4-byte Folded Spill
|
|
; RV32-NEXT: csrr a0, vlenb
|
|
; RV32-NEXT: slli a0, a0, 1
|
|
; RV32-NEXT: sub sp, sp, a0
|
|
; RV32-NEXT: addi a0, sp, 32
|
|
; RV32-NEXT: addi a1, sp, 16
|
|
; RV32-NEXT: addi a2, sp, 8
|
|
; RV32-NEXT: call extern
|
|
; RV32-NEXT: csrr a0, vlenb
|
|
; RV32-NEXT: slli a0, a0, 1
|
|
; RV32-NEXT: add sp, sp, a0
|
|
; RV32-NEXT: lw ra, 44(sp) # 4-byte Folded Reload
|
|
; RV32-NEXT: addi sp, sp, 48
|
|
; RV32-NEXT: ret
|
|
;
|
|
; RV64-LABEL: rvv_stack_align8:
|
|
; RV64: # %bb.0:
|
|
; RV64-NEXT: addi sp, sp, -48
|
|
; RV64-NEXT: sd ra, 40(sp) # 8-byte Folded Spill
|
|
; RV64-NEXT: csrr a0, vlenb
|
|
; RV64-NEXT: slli a0, a0, 1
|
|
; RV64-NEXT: sub sp, sp, a0
|
|
; RV64-NEXT: addi a0, sp, 32
|
|
; RV64-NEXT: addi a1, sp, 16
|
|
; RV64-NEXT: addi a2, sp, 8
|
|
; RV64-NEXT: call extern
|
|
; RV64-NEXT: csrr a0, vlenb
|
|
; RV64-NEXT: slli a0, a0, 1
|
|
; RV64-NEXT: add sp, sp, a0
|
|
; RV64-NEXT: ld ra, 40(sp) # 8-byte Folded Reload
|
|
; RV64-NEXT: addi sp, sp, 48
|
|
; RV64-NEXT: ret
|
|
%a = alloca <vscale x 4 x i32>, align 8
|
|
%b = alloca i64
|
|
%c = alloca i64
|
|
call void @extern(<vscale x 4 x i32>* %a)
|
|
ret void
|
|
}
|
|
|
|
define void @rvv_stack_align16() #0 {
|
|
; RV32-LABEL: rvv_stack_align16:
|
|
; RV32: # %bb.0:
|
|
; RV32-NEXT: addi sp, sp, -48
|
|
; RV32-NEXT: sw ra, 44(sp) # 4-byte Folded Spill
|
|
; RV32-NEXT: csrr a0, vlenb
|
|
; RV32-NEXT: slli a0, a0, 1
|
|
; RV32-NEXT: sub sp, sp, a0
|
|
; RV32-NEXT: addi a0, sp, 32
|
|
; RV32-NEXT: addi a1, sp, 16
|
|
; RV32-NEXT: addi a2, sp, 8
|
|
; RV32-NEXT: call extern
|
|
; RV32-NEXT: csrr a0, vlenb
|
|
; RV32-NEXT: slli a0, a0, 1
|
|
; RV32-NEXT: add sp, sp, a0
|
|
; RV32-NEXT: lw ra, 44(sp) # 4-byte Folded Reload
|
|
; RV32-NEXT: addi sp, sp, 48
|
|
; RV32-NEXT: ret
|
|
;
|
|
; RV64-LABEL: rvv_stack_align16:
|
|
; RV64: # %bb.0:
|
|
; RV64-NEXT: addi sp, sp, -48
|
|
; RV64-NEXT: sd ra, 40(sp) # 8-byte Folded Spill
|
|
; RV64-NEXT: csrr a0, vlenb
|
|
; RV64-NEXT: slli a0, a0, 1
|
|
; RV64-NEXT: sub sp, sp, a0
|
|
; RV64-NEXT: addi a0, sp, 32
|
|
; RV64-NEXT: addi a1, sp, 16
|
|
; RV64-NEXT: addi a2, sp, 8
|
|
; RV64-NEXT: call extern
|
|
; RV64-NEXT: csrr a0, vlenb
|
|
; RV64-NEXT: slli a0, a0, 1
|
|
; RV64-NEXT: add sp, sp, a0
|
|
; RV64-NEXT: ld ra, 40(sp) # 8-byte Folded Reload
|
|
; RV64-NEXT: addi sp, sp, 48
|
|
; RV64-NEXT: ret
|
|
%a = alloca <vscale x 4 x i32>, align 16
|
|
%b = alloca i64
|
|
%c = alloca i64
|
|
call void @extern(<vscale x 4 x i32>* %a)
|
|
ret void
|
|
}
|
|
|
|
define void @rvv_stack_align32() #0 {
|
|
; RV32-LABEL: rvv_stack_align32:
|
|
; RV32: # %bb.0:
|
|
; RV32-NEXT: addi sp, sp, -48
|
|
; RV32-NEXT: sw ra, 44(sp) # 4-byte Folded Spill
|
|
; RV32-NEXT: sw s0, 40(sp) # 4-byte Folded Spill
|
|
; RV32-NEXT: addi s0, sp, 48
|
|
; RV32-NEXT: csrr a0, vlenb
|
|
; RV32-NEXT: slli a0, a0, 2
|
|
; RV32-NEXT: sub sp, sp, a0
|
|
; RV32-NEXT: andi sp, sp, -32
|
|
; RV32-NEXT: addi a0, sp, 32
|
|
; RV32-NEXT: addi a1, sp, 16
|
|
; RV32-NEXT: addi a2, sp, 8
|
|
; RV32-NEXT: call extern
|
|
; RV32-NEXT: addi sp, s0, -48
|
|
; RV32-NEXT: lw ra, 44(sp) # 4-byte Folded Reload
|
|
; RV32-NEXT: lw s0, 40(sp) # 4-byte Folded Reload
|
|
; RV32-NEXT: addi sp, sp, 48
|
|
; RV32-NEXT: ret
|
|
;
|
|
; RV64-LABEL: rvv_stack_align32:
|
|
; RV64: # %bb.0:
|
|
; RV64-NEXT: addi sp, sp, -80
|
|
; RV64-NEXT: sd ra, 72(sp) # 8-byte Folded Spill
|
|
; RV64-NEXT: sd s0, 64(sp) # 8-byte Folded Spill
|
|
; RV64-NEXT: addi s0, sp, 80
|
|
; RV64-NEXT: csrr a0, vlenb
|
|
; RV64-NEXT: slli a0, a0, 2
|
|
; RV64-NEXT: sub sp, sp, a0
|
|
; RV64-NEXT: andi sp, sp, -32
|
|
; RV64-NEXT: addi a0, sp, 64
|
|
; RV64-NEXT: addi a1, sp, 40
|
|
; RV64-NEXT: addi a2, sp, 32
|
|
; RV64-NEXT: call extern
|
|
; RV64-NEXT: addi sp, s0, -80
|
|
; RV64-NEXT: ld ra, 72(sp) # 8-byte Folded Reload
|
|
; RV64-NEXT: ld s0, 64(sp) # 8-byte Folded Reload
|
|
; RV64-NEXT: addi sp, sp, 80
|
|
; RV64-NEXT: ret
|
|
%a = alloca <vscale x 4 x i32>, align 32
|
|
%b = alloca i64
|
|
%c = alloca i64
|
|
call void @extern(<vscale x 4 x i32>* %a)
|
|
ret void
|
|
}
|
|
|
|
attributes #0 = { nounwind nofree nosync }
|
|
...
|
|
---
|
|
name: rvv_stack_align8
|
|
alignment: 4
|
|
frameInfo:
|
|
isFrameAddressTaken: false
|
|
isReturnAddressTaken: false
|
|
hasStackMap: false
|
|
hasPatchPoint: false
|
|
stackSize: 0
|
|
offsetAdjustment: 0
|
|
maxAlignment: 8
|
|
adjustsStack: false
|
|
hasCalls: true
|
|
stackProtector: ''
|
|
maxCallFrameSize: 4294967295
|
|
cvBytesOfCalleeSavedRegisters: 0
|
|
hasOpaqueSPAdjustment: false
|
|
hasVAStart: false
|
|
hasMustTailInVarArgFunc: false
|
|
hasTailCall: false
|
|
localFrameSize: 0
|
|
savePoint: ''
|
|
restorePoint: ''
|
|
fixedStack: []
|
|
stack:
|
|
- { id: 0, name: a, type: default, offset: 0, size: 16, alignment: 8,
|
|
stack-id: scalable-vector, callee-saved-register: '', callee-saved-restored: true,
|
|
debug-info-variable: '', debug-info-expression: '', debug-info-location: '' }
|
|
- { id: 1, name: b, type: default, offset: 0, size: 8, alignment: 8,
|
|
stack-id: default, callee-saved-register: '', callee-saved-restored: true,
|
|
debug-info-variable: '', debug-info-expression: '', debug-info-location: '' }
|
|
- { id: 2, name: c, type: default, offset: 0, size: 8, alignment: 8,
|
|
stack-id: default, callee-saved-register: '', callee-saved-restored: true,
|
|
debug-info-variable: '', debug-info-expression: '', debug-info-location: '' }
|
|
body: |
|
|
bb.0 (%ir-block.0):
|
|
ADJCALLSTACKDOWN 0, 0, implicit-def dead $x2, implicit $x2
|
|
$x10 = ADDI %stack.0.a, 0
|
|
$x11 = ADDI %stack.1.b, 0
|
|
$x12 = ADDI %stack.2.c, 0
|
|
PseudoCALL target-flags(riscv-call) @extern, csr_ilp32d_lp64d, implicit-def dead $x1, implicit killed $x10, implicit-def $x2
|
|
ADJCALLSTACKUP 0, 0, implicit-def dead $x2, implicit $x2
|
|
PseudoRET
|
|
|
|
...
|
|
---
|
|
name: rvv_stack_align16
|
|
alignment: 4
|
|
frameInfo:
|
|
isFrameAddressTaken: false
|
|
isReturnAddressTaken: false
|
|
hasStackMap: false
|
|
hasPatchPoint: false
|
|
stackSize: 0
|
|
offsetAdjustment: 0
|
|
maxAlignment: 16
|
|
adjustsStack: false
|
|
hasCalls: true
|
|
stackProtector: ''
|
|
maxCallFrameSize: 4294967295
|
|
cvBytesOfCalleeSavedRegisters: 0
|
|
hasOpaqueSPAdjustment: false
|
|
hasVAStart: false
|
|
hasMustTailInVarArgFunc: false
|
|
hasTailCall: false
|
|
localFrameSize: 0
|
|
savePoint: ''
|
|
restorePoint: ''
|
|
fixedStack: []
|
|
stack:
|
|
- { id: 0, name: a, type: default, offset: 0, size: 16, alignment: 16,
|
|
stack-id: scalable-vector, callee-saved-register: '', callee-saved-restored: true,
|
|
debug-info-variable: '', debug-info-expression: '', debug-info-location: '' }
|
|
- { id: 1, name: b, type: default, offset: 0, size: 8, alignment: 8,
|
|
stack-id: default, callee-saved-register: '', callee-saved-restored: true,
|
|
debug-info-variable: '', debug-info-expression: '', debug-info-location: '' }
|
|
- { id: 2, name: c, type: default, offset: 0, size: 8, alignment: 8,
|
|
stack-id: default, callee-saved-register: '', callee-saved-restored: true,
|
|
debug-info-variable: '', debug-info-expression: '', debug-info-location: '' }
|
|
body: |
|
|
bb.0 (%ir-block.0):
|
|
ADJCALLSTACKDOWN 0, 0, implicit-def dead $x2, implicit $x2
|
|
$x10 = ADDI %stack.0.a, 0
|
|
$x11 = ADDI %stack.1.b, 0
|
|
$x12 = ADDI %stack.2.c, 0
|
|
PseudoCALL target-flags(riscv-call) @extern, csr_ilp32d_lp64d, implicit-def dead $x1, implicit killed $x10, implicit-def $x2
|
|
ADJCALLSTACKUP 0, 0, implicit-def dead $x2, implicit $x2
|
|
PseudoRET
|
|
|
|
...
|
|
---
|
|
name: rvv_stack_align32
|
|
alignment: 4
|
|
frameInfo:
|
|
isFrameAddressTaken: false
|
|
isReturnAddressTaken: false
|
|
hasStackMap: false
|
|
hasPatchPoint: false
|
|
stackSize: 0
|
|
offsetAdjustment: 0
|
|
maxAlignment: 32
|
|
adjustsStack: false
|
|
hasCalls: true
|
|
stackProtector: ''
|
|
maxCallFrameSize: 4294967295
|
|
cvBytesOfCalleeSavedRegisters: 0
|
|
hasOpaqueSPAdjustment: false
|
|
hasVAStart: false
|
|
hasMustTailInVarArgFunc: false
|
|
hasTailCall: false
|
|
localFrameSize: 0
|
|
savePoint: ''
|
|
restorePoint: ''
|
|
fixedStack: []
|
|
stack:
|
|
- { id: 0, name: a, type: default, offset: 0, size: 16, alignment: 32,
|
|
stack-id: scalable-vector, callee-saved-register: '', callee-saved-restored: true,
|
|
debug-info-variable: '', debug-info-expression: '', debug-info-location: '' }
|
|
- { id: 1, name: b, type: default, offset: 0, size: 8, alignment: 8,
|
|
stack-id: default, callee-saved-register: '', callee-saved-restored: true,
|
|
debug-info-variable: '', debug-info-expression: '', debug-info-location: '' }
|
|
- { id: 2, name: c, type: default, offset: 0, size: 8, alignment: 8,
|
|
stack-id: default, callee-saved-register: '', callee-saved-restored: true,
|
|
debug-info-variable: '', debug-info-expression: '', debug-info-location: '' }
|
|
body: |
|
|
bb.0 (%ir-block.0):
|
|
ADJCALLSTACKDOWN 0, 0, implicit-def dead $x2, implicit $x2
|
|
$x10 = ADDI %stack.0.a, 0
|
|
$x11 = ADDI %stack.1.b, 0
|
|
$x12 = ADDI %stack.2.c, 0
|
|
PseudoCALL target-flags(riscv-call) @extern, csr_ilp32d_lp64d, implicit-def dead $x1, implicit killed $x10, implicit-def $x2
|
|
ADJCALLSTACKUP 0, 0, implicit-def dead $x2, implicit $x2
|
|
PseudoRET
|
|
|
|
...
|