199 lines
8.3 KiB
YAML
199 lines
8.3 KiB
YAML
# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
|
|
# RUN: llc %s -verify-machineinstrs -mtriple=aarch64-unknown-unknown -run-pass=legalizer -simplify-mir -aarch64-neon-syntax=apple -mattr=-fullfp16 -o - | FileCheck %s --check-prefix=NO-FP16
|
|
# RUN: llc %s -verify-machineinstrs -mtriple=aarch64-unknown-unknown -run-pass=legalizer -simplify-mir -aarch64-neon-syntax=apple -mattr=+fullfp16 -o - | FileCheck %s --check-prefix=FP16
|
|
...
|
|
---
|
|
name: test_v4f16.fma
|
|
alignment: 4
|
|
tracksRegLiveness: true
|
|
machineFunctionInfo: {}
|
|
body: |
|
|
bb.0:
|
|
liveins: $d0, $d1, $d2
|
|
|
|
; NO-FP16-LABEL: name: test_v4f16.fma
|
|
; NO-FP16: liveins: $d0, $d1, $d2
|
|
; NO-FP16-NEXT: {{ $}}
|
|
; NO-FP16-NEXT: [[COPY:%[0-9]+]]:_(<4 x s16>) = COPY $d0
|
|
; NO-FP16-NEXT: [[COPY1:%[0-9]+]]:_(<4 x s16>) = COPY $d1
|
|
; NO-FP16-NEXT: [[COPY2:%[0-9]+]]:_(<4 x s16>) = COPY $d2
|
|
; NO-FP16-NEXT: [[FPEXT:%[0-9]+]]:_(<4 x s32>) = G_FPEXT [[COPY]](<4 x s16>)
|
|
; NO-FP16-NEXT: [[FPEXT1:%[0-9]+]]:_(<4 x s32>) = G_FPEXT [[COPY1]](<4 x s16>)
|
|
; NO-FP16-NEXT: [[FPEXT2:%[0-9]+]]:_(<4 x s32>) = G_FPEXT [[COPY2]](<4 x s16>)
|
|
; NO-FP16-NEXT: [[FMA:%[0-9]+]]:_(<4 x s32>) = G_FMA [[FPEXT]], [[FPEXT1]], [[FPEXT2]]
|
|
; NO-FP16-NEXT: [[FPTRUNC:%[0-9]+]]:_(<4 x s16>) = G_FPTRUNC [[FMA]](<4 x s32>)
|
|
; NO-FP16-NEXT: $d0 = COPY [[FPTRUNC]](<4 x s16>)
|
|
; NO-FP16-NEXT: RET_ReallyLR implicit $d0
|
|
;
|
|
; FP16-LABEL: name: test_v4f16.fma
|
|
; FP16: liveins: $d0, $d1, $d2
|
|
; FP16-NEXT: {{ $}}
|
|
; FP16-NEXT: [[COPY:%[0-9]+]]:_(<4 x s16>) = COPY $d0
|
|
; FP16-NEXT: [[COPY1:%[0-9]+]]:_(<4 x s16>) = COPY $d1
|
|
; FP16-NEXT: [[COPY2:%[0-9]+]]:_(<4 x s16>) = COPY $d2
|
|
; FP16-NEXT: [[FMA:%[0-9]+]]:_(<4 x s16>) = G_FMA [[COPY]], [[COPY1]], [[COPY2]]
|
|
; FP16-NEXT: $d0 = COPY [[FMA]](<4 x s16>)
|
|
; FP16-NEXT: RET_ReallyLR implicit $d0
|
|
%0:_(<4 x s16>) = COPY $d0
|
|
%1:_(<4 x s16>) = COPY $d1
|
|
%2:_(<4 x s16>) = COPY $d2
|
|
%3:_(<4 x s16>) = G_FMA %0, %1, %2
|
|
$d0 = COPY %3(<4 x s16>)
|
|
RET_ReallyLR implicit $d0
|
|
|
|
...
|
|
---
|
|
name: test_v8f16.fma
|
|
alignment: 4
|
|
tracksRegLiveness: true
|
|
machineFunctionInfo: {}
|
|
body: |
|
|
bb.0:
|
|
liveins: $q0, $q1, $q2
|
|
|
|
; NO-FP16-LABEL: name: test_v8f16.fma
|
|
; NO-FP16: liveins: $q0, $q1, $q2
|
|
; NO-FP16-NEXT: {{ $}}
|
|
; NO-FP16-NEXT: [[COPY:%[0-9]+]]:_(<8 x s16>) = COPY $q0
|
|
; NO-FP16-NEXT: [[COPY1:%[0-9]+]]:_(<8 x s16>) = COPY $q1
|
|
; NO-FP16-NEXT: [[COPY2:%[0-9]+]]:_(<8 x s16>) = COPY $q2
|
|
; NO-FP16-NEXT: [[UV:%[0-9]+]]:_(<4 x s16>), [[UV1:%[0-9]+]]:_(<4 x s16>) = G_UNMERGE_VALUES [[COPY]](<8 x s16>)
|
|
; NO-FP16-NEXT: [[FPEXT:%[0-9]+]]:_(<4 x s32>) = G_FPEXT [[UV]](<4 x s16>)
|
|
; NO-FP16-NEXT: [[FPEXT1:%[0-9]+]]:_(<4 x s32>) = G_FPEXT [[UV1]](<4 x s16>)
|
|
; NO-FP16-NEXT: [[UV2:%[0-9]+]]:_(<4 x s16>), [[UV3:%[0-9]+]]:_(<4 x s16>) = G_UNMERGE_VALUES [[COPY1]](<8 x s16>)
|
|
; NO-FP16-NEXT: [[FPEXT2:%[0-9]+]]:_(<4 x s32>) = G_FPEXT [[UV2]](<4 x s16>)
|
|
; NO-FP16-NEXT: [[FPEXT3:%[0-9]+]]:_(<4 x s32>) = G_FPEXT [[UV3]](<4 x s16>)
|
|
; NO-FP16-NEXT: [[UV4:%[0-9]+]]:_(<4 x s16>), [[UV5:%[0-9]+]]:_(<4 x s16>) = G_UNMERGE_VALUES [[COPY2]](<8 x s16>)
|
|
; NO-FP16-NEXT: [[FPEXT4:%[0-9]+]]:_(<4 x s32>) = G_FPEXT [[UV4]](<4 x s16>)
|
|
; NO-FP16-NEXT: [[FPEXT5:%[0-9]+]]:_(<4 x s32>) = G_FPEXT [[UV5]](<4 x s16>)
|
|
; NO-FP16-NEXT: [[FMA:%[0-9]+]]:_(<4 x s32>) = G_FMA [[FPEXT]], [[FPEXT2]], [[FPEXT4]]
|
|
; NO-FP16-NEXT: [[FMA1:%[0-9]+]]:_(<4 x s32>) = G_FMA [[FPEXT1]], [[FPEXT3]], [[FPEXT5]]
|
|
; NO-FP16-NEXT: [[FPTRUNC:%[0-9]+]]:_(<4 x s16>) = G_FPTRUNC [[FMA]](<4 x s32>)
|
|
; NO-FP16-NEXT: [[FPTRUNC1:%[0-9]+]]:_(<4 x s16>) = G_FPTRUNC [[FMA1]](<4 x s32>)
|
|
; NO-FP16-NEXT: [[CONCAT_VECTORS:%[0-9]+]]:_(<8 x s16>) = G_CONCAT_VECTORS [[FPTRUNC]](<4 x s16>), [[FPTRUNC1]](<4 x s16>)
|
|
; NO-FP16-NEXT: $q0 = COPY [[CONCAT_VECTORS]](<8 x s16>)
|
|
; NO-FP16-NEXT: RET_ReallyLR implicit $q0
|
|
;
|
|
; FP16-LABEL: name: test_v8f16.fma
|
|
; FP16: liveins: $q0, $q1, $q2
|
|
; FP16-NEXT: {{ $}}
|
|
; FP16-NEXT: [[COPY:%[0-9]+]]:_(<8 x s16>) = COPY $q0
|
|
; FP16-NEXT: [[COPY1:%[0-9]+]]:_(<8 x s16>) = COPY $q1
|
|
; FP16-NEXT: [[COPY2:%[0-9]+]]:_(<8 x s16>) = COPY $q2
|
|
; FP16-NEXT: [[FMA:%[0-9]+]]:_(<8 x s16>) = G_FMA [[COPY]], [[COPY1]], [[COPY2]]
|
|
; FP16-NEXT: $q0 = COPY [[FMA]](<8 x s16>)
|
|
; FP16-NEXT: RET_ReallyLR implicit $q0
|
|
%0:_(<8 x s16>) = COPY $q0
|
|
%1:_(<8 x s16>) = COPY $q1
|
|
%2:_(<8 x s16>) = COPY $q2
|
|
%3:_(<8 x s16>) = G_FMA %0, %1, %2
|
|
$q0 = COPY %3(<8 x s16>)
|
|
RET_ReallyLR implicit $q0
|
|
|
|
...
|
|
---
|
|
name: test_v2f32.fma
|
|
alignment: 4
|
|
tracksRegLiveness: true
|
|
machineFunctionInfo: {}
|
|
body: |
|
|
bb.0:
|
|
liveins: $d0, $d1, $d2
|
|
|
|
; NO-FP16-LABEL: name: test_v2f32.fma
|
|
; NO-FP16: liveins: $d0, $d1, $d2
|
|
; NO-FP16-NEXT: {{ $}}
|
|
; NO-FP16-NEXT: [[COPY:%[0-9]+]]:_(<2 x s32>) = COPY $d0
|
|
; NO-FP16-NEXT: [[COPY1:%[0-9]+]]:_(<2 x s32>) = COPY $d1
|
|
; NO-FP16-NEXT: [[COPY2:%[0-9]+]]:_(<2 x s32>) = COPY $d2
|
|
; NO-FP16-NEXT: [[FMA:%[0-9]+]]:_(<2 x s32>) = G_FMA [[COPY]], [[COPY1]], [[COPY2]]
|
|
; NO-FP16-NEXT: $d0 = COPY [[FMA]](<2 x s32>)
|
|
; NO-FP16-NEXT: RET_ReallyLR implicit $d0
|
|
;
|
|
; FP16-LABEL: name: test_v2f32.fma
|
|
; FP16: liveins: $d0, $d1, $d2
|
|
; FP16-NEXT: {{ $}}
|
|
; FP16-NEXT: [[COPY:%[0-9]+]]:_(<2 x s32>) = COPY $d0
|
|
; FP16-NEXT: [[COPY1:%[0-9]+]]:_(<2 x s32>) = COPY $d1
|
|
; FP16-NEXT: [[COPY2:%[0-9]+]]:_(<2 x s32>) = COPY $d2
|
|
; FP16-NEXT: [[FMA:%[0-9]+]]:_(<2 x s32>) = G_FMA [[COPY]], [[COPY1]], [[COPY2]]
|
|
; FP16-NEXT: $d0 = COPY [[FMA]](<2 x s32>)
|
|
; FP16-NEXT: RET_ReallyLR implicit $d0
|
|
%0:_(<2 x s32>) = COPY $d0
|
|
%1:_(<2 x s32>) = COPY $d1
|
|
%2:_(<2 x s32>) = COPY $d2
|
|
%3:_(<2 x s32>) = G_FMA %0, %1, %2
|
|
$d0 = COPY %3(<2 x s32>)
|
|
RET_ReallyLR implicit $d0
|
|
|
|
...
|
|
---
|
|
name: test_v4f32.fma
|
|
alignment: 4
|
|
tracksRegLiveness: true
|
|
machineFunctionInfo: {}
|
|
body: |
|
|
bb.0:
|
|
liveins: $q0, $q1, $q2
|
|
|
|
; NO-FP16-LABEL: name: test_v4f32.fma
|
|
; NO-FP16: liveins: $q0, $q1, $q2
|
|
; NO-FP16-NEXT: {{ $}}
|
|
; NO-FP16-NEXT: [[COPY:%[0-9]+]]:_(<4 x s32>) = COPY $q0
|
|
; NO-FP16-NEXT: [[COPY1:%[0-9]+]]:_(<4 x s32>) = COPY $q1
|
|
; NO-FP16-NEXT: [[COPY2:%[0-9]+]]:_(<4 x s32>) = COPY $q2
|
|
; NO-FP16-NEXT: [[FMA:%[0-9]+]]:_(<4 x s32>) = G_FMA [[COPY]], [[COPY1]], [[COPY2]]
|
|
; NO-FP16-NEXT: $q0 = COPY [[FMA]](<4 x s32>)
|
|
; NO-FP16-NEXT: RET_ReallyLR implicit $q0
|
|
;
|
|
; FP16-LABEL: name: test_v4f32.fma
|
|
; FP16: liveins: $q0, $q1, $q2
|
|
; FP16-NEXT: {{ $}}
|
|
; FP16-NEXT: [[COPY:%[0-9]+]]:_(<4 x s32>) = COPY $q0
|
|
; FP16-NEXT: [[COPY1:%[0-9]+]]:_(<4 x s32>) = COPY $q1
|
|
; FP16-NEXT: [[COPY2:%[0-9]+]]:_(<4 x s32>) = COPY $q2
|
|
; FP16-NEXT: [[FMA:%[0-9]+]]:_(<4 x s32>) = G_FMA [[COPY]], [[COPY1]], [[COPY2]]
|
|
; FP16-NEXT: $q0 = COPY [[FMA]](<4 x s32>)
|
|
; FP16-NEXT: RET_ReallyLR implicit $q0
|
|
%0:_(<4 x s32>) = COPY $q0
|
|
%1:_(<4 x s32>) = COPY $q1
|
|
%2:_(<4 x s32>) = COPY $q2
|
|
%3:_(<4 x s32>) = G_FMA %0, %1, %2
|
|
$q0 = COPY %3(<4 x s32>)
|
|
RET_ReallyLR implicit $q0
|
|
|
|
...
|
|
---
|
|
name: test_v2f64.fma
|
|
alignment: 4
|
|
tracksRegLiveness: true
|
|
machineFunctionInfo: {}
|
|
body: |
|
|
bb.0:
|
|
liveins: $q0, $q1, $q2
|
|
|
|
; NO-FP16-LABEL: name: test_v2f64.fma
|
|
; NO-FP16: liveins: $q0, $q1, $q2
|
|
; NO-FP16-NEXT: {{ $}}
|
|
; NO-FP16-NEXT: [[COPY:%[0-9]+]]:_(<2 x s64>) = COPY $q0
|
|
; NO-FP16-NEXT: [[COPY1:%[0-9]+]]:_(<2 x s64>) = COPY $q1
|
|
; NO-FP16-NEXT: [[COPY2:%[0-9]+]]:_(<2 x s64>) = COPY $q2
|
|
; NO-FP16-NEXT: [[FMA:%[0-9]+]]:_(<2 x s64>) = G_FMA [[COPY]], [[COPY1]], [[COPY2]]
|
|
; NO-FP16-NEXT: $q0 = COPY [[FMA]](<2 x s64>)
|
|
; NO-FP16-NEXT: RET_ReallyLR implicit $q0
|
|
;
|
|
; FP16-LABEL: name: test_v2f64.fma
|
|
; FP16: liveins: $q0, $q1, $q2
|
|
; FP16-NEXT: {{ $}}
|
|
; FP16-NEXT: [[COPY:%[0-9]+]]:_(<2 x s64>) = COPY $q0
|
|
; FP16-NEXT: [[COPY1:%[0-9]+]]:_(<2 x s64>) = COPY $q1
|
|
; FP16-NEXT: [[COPY2:%[0-9]+]]:_(<2 x s64>) = COPY $q2
|
|
; FP16-NEXT: [[FMA:%[0-9]+]]:_(<2 x s64>) = G_FMA [[COPY]], [[COPY1]], [[COPY2]]
|
|
; FP16-NEXT: $q0 = COPY [[FMA]](<2 x s64>)
|
|
; FP16-NEXT: RET_ReallyLR implicit $q0
|
|
%0:_(<2 x s64>) = COPY $q0
|
|
%1:_(<2 x s64>) = COPY $q1
|
|
%2:_(<2 x s64>) = COPY $q2
|
|
%3:_(<2 x s64>) = G_FMA %0, %1, %2
|
|
$q0 = COPY %3(<2 x s64>)
|
|
RET_ReallyLR implicit $q0
|