; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py
; RUN: opt -passes="print<cost-model>" 2>&1 -disable-output -mtriple=riscv64 -mattr=+v,+f,+d,+zfh,+zvfh < %s | FileCheck %s --check-prefixes=CHECK,GENERIC
; RUN: opt -passes="print<cost-model>" 2>&1 -disable-output -mtriple=riscv64 -mattr=+v,+f,+d,+zfh,+zvfh -riscv-v-vector-bits-max=256 < %s | FileCheck %s --check-prefixes=CHECK,MAX256
; RUN: opt -passes="print<cost-model>" 2>&1 -disable-output -mtriple=riscv64 < %s | FileCheck %s --check-prefixes=CHECK,UNSUPPORTED

; Cost-model queries for llvm.masked.gather on scalable vectors.
; The first two opt invocations above enable +v,+f,+d,+zfh,+zvfh (the second
; additionally passes -riscv-v-vector-bits-max=256); the third one uses plain
; riscv64 with no extra target features.

; Gathers whose alignment operand equals the element size in bytes
; (8 for double/i64/ptr, 4 for float/i32, 2 for half/i16, 1 for i8).
; With the vector features enabled the expected cost is twice the minimum
; element count of the result type; without them every gather is expected to
; be reported with an invalid cost.
define void @masked_gather_aligned() {
; GENERIC-LABEL: 'masked_gather_aligned'
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 16 for instruction: %V8F64 = call <vscale x 8 x double> @llvm.masked.gather.nxv8f64.nxv8p0(<vscale x 8 x ptr> undef, i32 8, <vscale x 8 x i1> undef, <vscale x 8 x double> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 8 for instruction: %V4F64 = call <vscale x 4 x double> @llvm.masked.gather.nxv4f64.nxv4p0(<vscale x 4 x ptr> undef, i32 8, <vscale x 4 x i1> undef, <vscale x 4 x double> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 4 for instruction: %V2F64 = call <vscale x 2 x double> @llvm.masked.gather.nxv2f64.nxv2p0(<vscale x 2 x ptr> undef, i32 8, <vscale x 2 x i1> undef, <vscale x 2 x double> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 2 for instruction: %V1F64 = call <vscale x 1 x double> @llvm.masked.gather.nxv1f64.nxv1p0(<vscale x 1 x ptr> undef, i32 8, <vscale x 1 x i1> undef, <vscale x 1 x double> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 32 for instruction: %V16F32 = call <vscale x 16 x float> @llvm.masked.gather.nxv16f32.nxv16p0(<vscale x 16 x ptr> undef, i32 4, <vscale x 16 x i1> undef, <vscale x 16 x float> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 16 for instruction: %V8F32 = call <vscale x 8 x float> @llvm.masked.gather.nxv8f32.nxv8p0(<vscale x 8 x ptr> undef, i32 4, <vscale x 8 x i1> undef, <vscale x 8 x float> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 8 for instruction: %V4F32 = call <vscale x 4 x float> @llvm.masked.gather.nxv4f32.nxv4p0(<vscale x 4 x ptr> undef, i32 4, <vscale x 4 x i1> undef, <vscale x 4 x float> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 4 for instruction: %V2F32 = call <vscale x 2 x float> @llvm.masked.gather.nxv2f32.nxv2p0(<vscale x 2 x ptr> undef, i32 4, <vscale x 2 x i1> undef, <vscale x 2 x float> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 2 for instruction: %V1F32 = call <vscale x 1 x float> @llvm.masked.gather.nxv1f32.nxv1p0(<vscale x 1 x ptr> undef, i32 4, <vscale x 1 x i1> undef, <vscale x 1 x float> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 64 for instruction: %V32F16 = call <vscale x 32 x half> @llvm.masked.gather.nxv32f16.nxv32p0(<vscale x 32 x ptr> undef, i32 2, <vscale x 32 x i1> undef, <vscale x 32 x half> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 32 for instruction: %V16F16 = call <vscale x 16 x half> @llvm.masked.gather.nxv16f16.nxv16p0(<vscale x 16 x ptr> undef, i32 2, <vscale x 16 x i1> undef, <vscale x 16 x half> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 16 for instruction: %V8F16 = call <vscale x 8 x half> @llvm.masked.gather.nxv8f16.nxv8p0(<vscale x 8 x ptr> undef, i32 2, <vscale x 8 x i1> undef, <vscale x 8 x half> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 8 for instruction: %V4F16 = call <vscale x 4 x half> @llvm.masked.gather.nxv4f16.nxv4p0(<vscale x 4 x ptr> undef, i32 2, <vscale x 4 x i1> undef, <vscale x 4 x half> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 4 for instruction: %V2F16 = call <vscale x 2 x half> @llvm.masked.gather.nxv2f16.nxv2p0(<vscale x 2 x ptr> undef, i32 2, <vscale x 2 x i1> undef, <vscale x 2 x half> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 2 for instruction: %V1F16 = call <vscale x 1 x half> @llvm.masked.gather.nxv1f16.nxv1p0(<vscale x 1 x ptr> undef, i32 2, <vscale x 1 x i1> undef, <vscale x 1 x half> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 16 for instruction: %V8I64 = call <vscale x 8 x i64> @llvm.masked.gather.nxv8i64.nxv8p0(<vscale x 8 x ptr> undef, i32 8, <vscale x 8 x i1> undef, <vscale x 8 x i64> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 8 for instruction: %V4I64 = call <vscale x 4 x i64> @llvm.masked.gather.nxv4i64.nxv4p0(<vscale x 4 x ptr> undef, i32 8, <vscale x 4 x i1> undef, <vscale x 4 x i64> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 4 for instruction: %V2I64 = call <vscale x 2 x i64> @llvm.masked.gather.nxv2i64.nxv2p0(<vscale x 2 x ptr> undef, i32 8, <vscale x 2 x i1> undef, <vscale x 2 x i64> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 2 for instruction: %V1I64 = call <vscale x 1 x i64> @llvm.masked.gather.nxv1i64.nxv1p0(<vscale x 1 x ptr> undef, i32 8, <vscale x 1 x i1> undef, <vscale x 1 x i64> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 32 for instruction: %V16I32 = call <vscale x 16 x i32> @llvm.masked.gather.nxv16i32.nxv16p0(<vscale x 16 x ptr> undef, i32 4, <vscale x 16 x i1> undef, <vscale x 16 x i32> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 16 for instruction: %V8I32 = call <vscale x 8 x i32> @llvm.masked.gather.nxv8i32.nxv8p0(<vscale x 8 x ptr> undef, i32 4, <vscale x 8 x i1> undef, <vscale x 8 x i32> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 8 for instruction: %V4I32 = call <vscale x 4 x i32> @llvm.masked.gather.nxv4i32.nxv4p0(<vscale x 4 x ptr> undef, i32 4, <vscale x 4 x i1> undef, <vscale x 4 x i32> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 4 for instruction: %V2I32 = call <vscale x 2 x i32> @llvm.masked.gather.nxv2i32.nxv2p0(<vscale x 2 x ptr> undef, i32 4, <vscale x 2 x i1> undef, <vscale x 2 x i32> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 2 for instruction: %V1I32 = call <vscale x 1 x i32> @llvm.masked.gather.nxv1i32.nxv1p0(<vscale x 1 x ptr> undef, i32 4, <vscale x 1 x i1> undef, <vscale x 1 x i32> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 64 for instruction: %V32I16 = call <vscale x 32 x i16> @llvm.masked.gather.nxv32i16.nxv32p0(<vscale x 32 x ptr> undef, i32 2, <vscale x 32 x i1> undef, <vscale x 32 x i16> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 32 for instruction: %V16I16 = call <vscale x 16 x i16> @llvm.masked.gather.nxv16i16.nxv16p0(<vscale x 16 x ptr> undef, i32 2, <vscale x 16 x i1> undef, <vscale x 16 x i16> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 16 for instruction: %V8I16 = call <vscale x 8 x i16> @llvm.masked.gather.nxv8i16.nxv8p0(<vscale x 8 x ptr> undef, i32 2, <vscale x 8 x i1> undef, <vscale x 8 x i16> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 8 for instruction: %V4I16 = call <vscale x 4 x i16> @llvm.masked.gather.nxv4i16.nxv4p0(<vscale x 4 x ptr> undef, i32 2, <vscale x 4 x i1> undef, <vscale x 4 x i16> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 4 for instruction: %V2I16 = call <vscale x 2 x i16> @llvm.masked.gather.nxv2i16.nxv2p0(<vscale x 2 x ptr> undef, i32 2, <vscale x 2 x i1> undef, <vscale x 2 x i16> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 2 for instruction: %V1I16 = call <vscale x 1 x i16> @llvm.masked.gather.nxv1i16.nxv1p0(<vscale x 1 x ptr> undef, i32 2, <vscale x 1 x i1> undef, <vscale x 1 x i16> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 128 for instruction: %V64I8 = call <vscale x 64 x i8> @llvm.masked.gather.nxv64i8.nxv64p0(<vscale x 64 x ptr> undef, i32 1, <vscale x 64 x i1> undef, <vscale x 64 x i8> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 64 for instruction: %V32I8 = call <vscale x 32 x i8> @llvm.masked.gather.nxv32i8.nxv32p0(<vscale x 32 x ptr> undef, i32 1, <vscale x 32 x i1> undef, <vscale x 32 x i8> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 32 for instruction: %V16I8 = call <vscale x 16 x i8> @llvm.masked.gather.nxv16i8.nxv16p0(<vscale x 16 x ptr> undef, i32 1, <vscale x 16 x i1> undef, <vscale x 16 x i8> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 16 for instruction: %V8I8 = call <vscale x 8 x i8> @llvm.masked.gather.nxv8i8.nxv8p0(<vscale x 8 x ptr> undef, i32 1, <vscale x 8 x i1> undef, <vscale x 8 x i8> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 8 for instruction: %V4I8 = call <vscale x 4 x i8> @llvm.masked.gather.nxv4i8.nxv4p0(<vscale x 4 x ptr> undef, i32 1, <vscale x 4 x i1> undef, <vscale x 4 x i8> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 4 for instruction: %V2I8 = call <vscale x 2 x i8> @llvm.masked.gather.nxv2i8.nxv2p0(<vscale x 2 x ptr> undef, i32 1, <vscale x 2 x i1> undef, <vscale x 2 x i8> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 2 for instruction: %V1I8 = call <vscale x 1 x i8> @llvm.masked.gather.nxv1i8.nxv1p0(<vscale x 1 x ptr> undef, i32 1, <vscale x 1 x i1> undef, <vscale x 1 x i8> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 16 for instruction: %V8PTR = call <vscale x 8 x ptr> @llvm.masked.gather.nxv8p0.nxv8p0(<vscale x 8 x ptr> undef, i32 8, <vscale x 8 x i1> undef, <vscale x 8 x ptr> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 8 for instruction: %V4PTR = call <vscale x 4 x ptr> @llvm.masked.gather.nxv4p0.nxv4p0(<vscale x 4 x ptr> undef, i32 8, <vscale x 4 x i1> undef, <vscale x 4 x ptr> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 4 for instruction: %V2PTR = call <vscale x 2 x ptr> @llvm.masked.gather.nxv2p0.nxv2p0(<vscale x 2 x ptr> undef, i32 8, <vscale x 2 x i1> undef, <vscale x 2 x ptr> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 2 for instruction: %V1PTR = call <vscale x 1 x ptr> @llvm.masked.gather.nxv1p0.nxv1p0(<vscale x 1 x ptr> undef, i32 8, <vscale x 1 x i1> undef, <vscale x 1 x ptr> undef)
; GENERIC-NEXT:  Cost Model: Found an estimated cost of 0 for instruction: ret void
;
; MAX256-LABEL: 'masked_gather_aligned'
; MAX256-NEXT:  Cost Model: Found an estimated cost of 16 for instruction: %V8F64 = call <vscale x 8 x double> @llvm.masked.gather.nxv8f64.nxv8p0(<vscale x 8 x ptr> undef, i32 8, <vscale x 8 x i1> undef, <vscale x 8 x double> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 8 for instruction: %V4F64 = call <vscale x 4 x double> @llvm.masked.gather.nxv4f64.nxv4p0(<vscale x 4 x ptr> undef, i32 8, <vscale x 4 x i1> undef, <vscale x 4 x double> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 4 for instruction: %V2F64 = call <vscale x 2 x double> @llvm.masked.gather.nxv2f64.nxv2p0(<vscale x 2 x ptr> undef, i32 8, <vscale x 2 x i1> undef, <vscale x 2 x double> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 2 for instruction: %V1F64 = call <vscale x 1 x double> @llvm.masked.gather.nxv1f64.nxv1p0(<vscale x 1 x ptr> undef, i32 8, <vscale x 1 x i1> undef, <vscale x 1 x double> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 32 for instruction: %V16F32 = call <vscale x 16 x float> @llvm.masked.gather.nxv16f32.nxv16p0(<vscale x 16 x ptr> undef, i32 4, <vscale x 16 x i1> undef, <vscale x 16 x float> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 16 for instruction: %V8F32 = call <vscale x 8 x float> @llvm.masked.gather.nxv8f32.nxv8p0(<vscale x 8 x ptr> undef, i32 4, <vscale x 8 x i1> undef, <vscale x 8 x float> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 8 for instruction: %V4F32 = call <vscale x 4 x float> @llvm.masked.gather.nxv4f32.nxv4p0(<vscale x 4 x ptr> undef, i32 4, <vscale x 4 x i1> undef, <vscale x 4 x float> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 4 for instruction: %V2F32 = call <vscale x 2 x float> @llvm.masked.gather.nxv2f32.nxv2p0(<vscale x 2 x ptr> undef, i32 4, <vscale x 2 x i1> undef, <vscale x 2 x float> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 2 for instruction: %V1F32 = call <vscale x 1 x float> @llvm.masked.gather.nxv1f32.nxv1p0(<vscale x 1 x ptr> undef, i32 4, <vscale x 1 x i1> undef, <vscale x 1 x float> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 64 for instruction: %V32F16 = call <vscale x 32 x half> @llvm.masked.gather.nxv32f16.nxv32p0(<vscale x 32 x ptr> undef, i32 2, <vscale x 32 x i1> undef, <vscale x 32 x half> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 32 for instruction: %V16F16 = call <vscale x 16 x half> @llvm.masked.gather.nxv16f16.nxv16p0(<vscale x 16 x ptr> undef, i32 2, <vscale x 16 x i1> undef, <vscale x 16 x half> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 16 for instruction: %V8F16 = call <vscale x 8 x half> @llvm.masked.gather.nxv8f16.nxv8p0(<vscale x 8 x ptr> undef, i32 2, <vscale x 8 x i1> undef, <vscale x 8 x half> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 8 for instruction: %V4F16 = call <vscale x 4 x half> @llvm.masked.gather.nxv4f16.nxv4p0(<vscale x 4 x ptr> undef, i32 2, <vscale x 4 x i1> undef, <vscale x 4 x half> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 4 for instruction: %V2F16 = call <vscale x 2 x half> @llvm.masked.gather.nxv2f16.nxv2p0(<vscale x 2 x ptr> undef, i32 2, <vscale x 2 x i1> undef, <vscale x 2 x half> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 2 for instruction: %V1F16 = call <vscale x 1 x half> @llvm.masked.gather.nxv1f16.nxv1p0(<vscale x 1 x ptr> undef, i32 2, <vscale x 1 x i1> undef, <vscale x 1 x half> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 16 for instruction: %V8I64 = call <vscale x 8 x i64> @llvm.masked.gather.nxv8i64.nxv8p0(<vscale x 8 x ptr> undef, i32 8, <vscale x 8 x i1> undef, <vscale x 8 x i64> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 8 for instruction: %V4I64 = call <vscale x 4 x i64> @llvm.masked.gather.nxv4i64.nxv4p0(<vscale x 4 x ptr> undef, i32 8, <vscale x 4 x i1> undef, <vscale x 4 x i64> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 4 for instruction: %V2I64 = call <vscale x 2 x i64> @llvm.masked.gather.nxv2i64.nxv2p0(<vscale x 2 x ptr> undef, i32 8, <vscale x 2 x i1> undef, <vscale x 2 x i64> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 2 for instruction: %V1I64 = call <vscale x 1 x i64> @llvm.masked.gather.nxv1i64.nxv1p0(<vscale x 1 x ptr> undef, i32 8, <vscale x 1 x i1> undef, <vscale x 1 x i64> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 32 for instruction: %V16I32 = call <vscale x 16 x i32> @llvm.masked.gather.nxv16i32.nxv16p0(<vscale x 16 x ptr> undef, i32 4, <vscale x 16 x i1> undef, <vscale x 16 x i32> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 16 for instruction: %V8I32 = call <vscale x 8 x i32> @llvm.masked.gather.nxv8i32.nxv8p0(<vscale x 8 x ptr> undef, i32 4, <vscale x 8 x i1> undef, <vscale x 8 x i32> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 8 for instruction: %V4I32 = call <vscale x 4 x i32> @llvm.masked.gather.nxv4i32.nxv4p0(<vscale x 4 x ptr> undef, i32 4, <vscale x 4 x i1> undef, <vscale x 4 x i32> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 4 for instruction: %V2I32 = call <vscale x 2 x i32> @llvm.masked.gather.nxv2i32.nxv2p0(<vscale x 2 x ptr> undef, i32 4, <vscale x 2 x i1> undef, <vscale x 2 x i32> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 2 for instruction: %V1I32 = call <vscale x 1 x i32> @llvm.masked.gather.nxv1i32.nxv1p0(<vscale x 1 x ptr> undef, i32 4, <vscale x 1 x i1> undef, <vscale x 1 x i32> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 64 for instruction: %V32I16 = call <vscale x 32 x i16> @llvm.masked.gather.nxv32i16.nxv32p0(<vscale x 32 x ptr> undef, i32 2, <vscale x 32 x i1> undef, <vscale x 32 x i16> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 32 for instruction: %V16I16 = call <vscale x 16 x i16> @llvm.masked.gather.nxv16i16.nxv16p0(<vscale x 16 x ptr> undef, i32 2, <vscale x 16 x i1> undef, <vscale x 16 x i16> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 16 for instruction: %V8I16 = call <vscale x 8 x i16> @llvm.masked.gather.nxv8i16.nxv8p0(<vscale x 8 x ptr> undef, i32 2, <vscale x 8 x i1> undef, <vscale x 8 x i16> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 8 for instruction: %V4I16 = call <vscale x 4 x i16> @llvm.masked.gather.nxv4i16.nxv4p0(<vscale x 4 x ptr> undef, i32 2, <vscale x 4 x i1> undef, <vscale x 4 x i16> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 4 for instruction: %V2I16 = call <vscale x 2 x i16> @llvm.masked.gather.nxv2i16.nxv2p0(<vscale x 2 x ptr> undef, i32 2, <vscale x 2 x i1> undef, <vscale x 2 x i16> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 2 for instruction: %V1I16 = call <vscale x 1 x i16> @llvm.masked.gather.nxv1i16.nxv1p0(<vscale x 1 x ptr> undef, i32 2, <vscale x 1 x i1> undef, <vscale x 1 x i16> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 128 for instruction: %V64I8 = call <vscale x 64 x i8> @llvm.masked.gather.nxv64i8.nxv64p0(<vscale x 64 x ptr> undef, i32 1, <vscale x 64 x i1> undef, <vscale x 64 x i8> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 64 for instruction: %V32I8 = call <vscale x 32 x i8> @llvm.masked.gather.nxv32i8.nxv32p0(<vscale x 32 x ptr> undef, i32 1, <vscale x 32 x i1> undef, <vscale x 32 x i8> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 32 for instruction: %V16I8 = call <vscale x 16 x i8> @llvm.masked.gather.nxv16i8.nxv16p0(<vscale x 16 x ptr> undef, i32 1, <vscale x 16 x i1> undef, <vscale x 16 x i8> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 16 for instruction: %V8I8 = call <vscale x 8 x i8> @llvm.masked.gather.nxv8i8.nxv8p0(<vscale x 8 x ptr> undef, i32 1, <vscale x 8 x i1> undef, <vscale x 8 x i8> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 8 for instruction: %V4I8 = call <vscale x 4 x i8> @llvm.masked.gather.nxv4i8.nxv4p0(<vscale x 4 x ptr> undef, i32 1, <vscale x 4 x i1> undef, <vscale x 4 x i8> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 4 for instruction: %V2I8 = call <vscale x 2 x i8> @llvm.masked.gather.nxv2i8.nxv2p0(<vscale x 2 x ptr> undef, i32 1, <vscale x 2 x i1> undef, <vscale x 2 x i8> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 2 for instruction: %V1I8 = call <vscale x 1 x i8> @llvm.masked.gather.nxv1i8.nxv1p0(<vscale x 1 x ptr> undef, i32 1, <vscale x 1 x i1> undef, <vscale x 1 x i8> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 16 for instruction: %V8PTR = call <vscale x 8 x ptr> @llvm.masked.gather.nxv8p0.nxv8p0(<vscale x 8 x ptr> undef, i32 8, <vscale x 8 x i1> undef, <vscale x 8 x ptr> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 8 for instruction: %V4PTR = call <vscale x 4 x ptr> @llvm.masked.gather.nxv4p0.nxv4p0(<vscale x 4 x ptr> undef, i32 8, <vscale x 4 x i1> undef, <vscale x 4 x ptr> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 4 for instruction: %V2PTR = call <vscale x 2 x ptr> @llvm.masked.gather.nxv2p0.nxv2p0(<vscale x 2 x ptr> undef, i32 8, <vscale x 2 x i1> undef, <vscale x 2 x ptr> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 2 for instruction: %V1PTR = call <vscale x 1 x ptr> @llvm.masked.gather.nxv1p0.nxv1p0(<vscale x 1 x ptr> undef, i32 8, <vscale x 1 x i1> undef, <vscale x 1 x ptr> undef)
; MAX256-NEXT:  Cost Model: Found an estimated cost of 0 for instruction: ret void
;
; UNSUPPORTED-LABEL: 'masked_gather_aligned'
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V8F64 = call <vscale x 8 x double> @llvm.masked.gather.nxv8f64.nxv8p0(<vscale x 8 x ptr> undef, i32 8, <vscale x 8 x i1> undef, <vscale x 8 x double> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V4F64 = call <vscale x 4 x double> @llvm.masked.gather.nxv4f64.nxv4p0(<vscale x 4 x ptr> undef, i32 8, <vscale x 4 x i1> undef, <vscale x 4 x double> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V2F64 = call <vscale x 2 x double> @llvm.masked.gather.nxv2f64.nxv2p0(<vscale x 2 x ptr> undef, i32 8, <vscale x 2 x i1> undef, <vscale x 2 x double> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V1F64 = call <vscale x 1 x double> @llvm.masked.gather.nxv1f64.nxv1p0(<vscale x 1 x ptr> undef, i32 8, <vscale x 1 x i1> undef, <vscale x 1 x double> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V16F32 = call <vscale x 16 x float> @llvm.masked.gather.nxv16f32.nxv16p0(<vscale x 16 x ptr> undef, i32 4, <vscale x 16 x i1> undef, <vscale x 16 x float> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V8F32 = call <vscale x 8 x float> @llvm.masked.gather.nxv8f32.nxv8p0(<vscale x 8 x ptr> undef, i32 4, <vscale x 8 x i1> undef, <vscale x 8 x float> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V4F32 = call <vscale x 4 x float> @llvm.masked.gather.nxv4f32.nxv4p0(<vscale x 4 x ptr> undef, i32 4, <vscale x 4 x i1> undef, <vscale x 4 x float> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V2F32 = call <vscale x 2 x float> @llvm.masked.gather.nxv2f32.nxv2p0(<vscale x 2 x ptr> undef, i32 4, <vscale x 2 x i1> undef, <vscale x 2 x float> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V1F32 = call <vscale x 1 x float> @llvm.masked.gather.nxv1f32.nxv1p0(<vscale x 1 x ptr> undef, i32 4, <vscale x 1 x i1> undef, <vscale x 1 x float> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V32F16 = call <vscale x 32 x half> @llvm.masked.gather.nxv32f16.nxv32p0(<vscale x 32 x ptr> undef, i32 2, <vscale x 32 x i1> undef, <vscale x 32 x half> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V16F16 = call <vscale x 16 x half> @llvm.masked.gather.nxv16f16.nxv16p0(<vscale x 16 x ptr> undef, i32 2, <vscale x 16 x i1> undef, <vscale x 16 x half> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V8F16 = call <vscale x 8 x half> @llvm.masked.gather.nxv8f16.nxv8p0(<vscale x 8 x ptr> undef, i32 2, <vscale x 8 x i1> undef, <vscale x 8 x half> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V4F16 = call <vscale x 4 x half> @llvm.masked.gather.nxv4f16.nxv4p0(<vscale x 4 x ptr> undef, i32 2, <vscale x 4 x i1> undef, <vscale x 4 x half> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V2F16 = call <vscale x 2 x half> @llvm.masked.gather.nxv2f16.nxv2p0(<vscale x 2 x ptr> undef, i32 2, <vscale x 2 x i1> undef, <vscale x 2 x half> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V1F16 = call <vscale x 1 x half> @llvm.masked.gather.nxv1f16.nxv1p0(<vscale x 1 x ptr> undef, i32 2, <vscale x 1 x i1> undef, <vscale x 1 x half> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V8I64 = call <vscale x 8 x i64> @llvm.masked.gather.nxv8i64.nxv8p0(<vscale x 8 x ptr> undef, i32 8, <vscale x 8 x i1> undef, <vscale x 8 x i64> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V4I64 = call <vscale x 4 x i64> @llvm.masked.gather.nxv4i64.nxv4p0(<vscale x 4 x ptr> undef, i32 8, <vscale x 4 x i1> undef, <vscale x 4 x i64> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V2I64 = call <vscale x 2 x i64> @llvm.masked.gather.nxv2i64.nxv2p0(<vscale x 2 x ptr> undef, i32 8, <vscale x 2 x i1> undef, <vscale x 2 x i64> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V1I64 = call <vscale x 1 x i64> @llvm.masked.gather.nxv1i64.nxv1p0(<vscale x 1 x ptr> undef, i32 8, <vscale x 1 x i1> undef, <vscale x 1 x i64> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V16I32 = call <vscale x 16 x i32> @llvm.masked.gather.nxv16i32.nxv16p0(<vscale x 16 x ptr> undef, i32 4, <vscale x 16 x i1> undef, <vscale x 16 x i32> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V8I32 = call <vscale x 8 x i32> @llvm.masked.gather.nxv8i32.nxv8p0(<vscale x 8 x ptr> undef, i32 4, <vscale x 8 x i1> undef, <vscale x 8 x i32> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V4I32 = call <vscale x 4 x i32> @llvm.masked.gather.nxv4i32.nxv4p0(<vscale x 4 x ptr> undef, i32 4, <vscale x 4 x i1> undef, <vscale x 4 x i32> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V2I32 = call <vscale x 2 x i32> @llvm.masked.gather.nxv2i32.nxv2p0(<vscale x 2 x ptr> undef, i32 4, <vscale x 2 x i1> undef, <vscale x 2 x i32> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V1I32 = call <vscale x 1 x i32> @llvm.masked.gather.nxv1i32.nxv1p0(<vscale x 1 x ptr> undef, i32 4, <vscale x 1 x i1> undef, <vscale x 1 x i32> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V32I16 = call <vscale x 32 x i16> @llvm.masked.gather.nxv32i16.nxv32p0(<vscale x 32 x ptr> undef, i32 2, <vscale x 32 x i1> undef, <vscale x 32 x i16> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V16I16 = call <vscale x 16 x i16> @llvm.masked.gather.nxv16i16.nxv16p0(<vscale x 16 x ptr> undef, i32 2, <vscale x 16 x i1> undef, <vscale x 16 x i16> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V8I16 = call <vscale x 8 x i16> @llvm.masked.gather.nxv8i16.nxv8p0(<vscale x 8 x ptr> undef, i32 2, <vscale x 8 x i1> undef, <vscale x 8 x i16> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V4I16 = call <vscale x 4 x i16> @llvm.masked.gather.nxv4i16.nxv4p0(<vscale x 4 x ptr> undef, i32 2, <vscale x 4 x i1> undef, <vscale x 4 x i16> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V2I16 = call <vscale x 2 x i16> @llvm.masked.gather.nxv2i16.nxv2p0(<vscale x 2 x ptr> undef, i32 2, <vscale x 2 x i1> undef, <vscale x 2 x i16> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V1I16 = call <vscale x 1 x i16> @llvm.masked.gather.nxv1i16.nxv1p0(<vscale x 1 x ptr> undef, i32 2, <vscale x 1 x i1> undef, <vscale x 1 x i16> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V64I8 = call <vscale x 64 x i8> @llvm.masked.gather.nxv64i8.nxv64p0(<vscale x 64 x ptr> undef, i32 1, <vscale x 64 x i1> undef, <vscale x 64 x i8> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V32I8 = call <vscale x 32 x i8> @llvm.masked.gather.nxv32i8.nxv32p0(<vscale x 32 x ptr> undef, i32 1, <vscale x 32 x i1> undef, <vscale x 32 x i8> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V16I8 = call <vscale x 16 x i8> @llvm.masked.gather.nxv16i8.nxv16p0(<vscale x 16 x ptr> undef, i32 1, <vscale x 16 x i1> undef, <vscale x 16 x i8> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V8I8 = call <vscale x 8 x i8> @llvm.masked.gather.nxv8i8.nxv8p0(<vscale x 8 x ptr> undef, i32 1, <vscale x 8 x i1> undef, <vscale x 8 x i8> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V4I8 = call <vscale x 4 x i8> @llvm.masked.gather.nxv4i8.nxv4p0(<vscale x 4 x ptr> undef, i32 1, <vscale x 4 x i1> undef, <vscale x 4 x i8> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V2I8 = call <vscale x 2 x i8> @llvm.masked.gather.nxv2i8.nxv2p0(<vscale x 2 x ptr> undef, i32 1, <vscale x 2 x i1> undef, <vscale x 2 x i8> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V1I8 = call <vscale x 1 x i8> @llvm.masked.gather.nxv1i8.nxv1p0(<vscale x 1 x ptr> undef, i32 1, <vscale x 1 x i1> undef, <vscale x 1 x i8> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V8PTR = call <vscale x 8 x ptr> @llvm.masked.gather.nxv8p0.nxv8p0(<vscale x 8 x ptr> undef, i32 8, <vscale x 8 x i1> undef, <vscale x 8 x ptr> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V4PTR = call <vscale x 4 x ptr> @llvm.masked.gather.nxv4p0.nxv4p0(<vscale x 4 x ptr> undef, i32 8, <vscale x 4 x i1> undef, <vscale x 4 x ptr> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V2PTR = call <vscale x 2 x ptr> @llvm.masked.gather.nxv2p0.nxv2p0(<vscale x 2 x ptr> undef, i32 8, <vscale x 2 x i1> undef, <vscale x 2 x ptr> undef)
; UNSUPPORTED-NEXT:  Cost Model: Invalid cost for instruction: %V1PTR = call <vscale x 1 x ptr> @llvm.masked.gather.nxv1p0.nxv1p0(<vscale x 1 x ptr> undef, i32 8, <vscale x 1 x i1> undef, <vscale x 1 x ptr> undef)
; UNSUPPORTED-NEXT:  Cost Model: Found an estimated cost of 0 for instruction: ret void
;
  %V8F64 = call <vscale x 8 x double> @llvm.masked.gather.nxv8f64.nxv8p0(<vscale x 8 x ptr> undef, i32 8, <vscale x 8 x i1> undef, <vscale x 8 x double> undef)
  %V4F64 = call <vscale x 4 x double> @llvm.masked.gather.nxv4f64.nxv4p0(<vscale x 4 x ptr> undef, i32 8, <vscale x 4 x i1> undef, <vscale x 4 x double> undef)
  %V2F64 = call <vscale x 2 x double> @llvm.masked.gather.nxv2f64.nxv2p0(<vscale x 2 x ptr> undef, i32 8, <vscale x 2 x i1> undef, <vscale x 2 x double> undef)
  %V1F64 = call <vscale x 1 x double> @llvm.masked.gather.nxv1f64.nxv1p0(<vscale x 1 x ptr> undef, i32 8, <vscale x 1 x i1> undef, <vscale x 1 x double> undef)

  %V16F32 = call <vscale x 16 x float> @llvm.masked.gather.nxv16f32.nxv16p0(<vscale x 16 x ptr> undef, i32 4, <vscale x 16 x i1> undef, <vscale x 16 x float> undef)
  %V8F32 = call <vscale x 8 x float> @llvm.masked.gather.nxv8f32.nxv8p0(<vscale x 8 x ptr> undef, i32 4, <vscale x 8 x i1> undef, <vscale x 8 x float> undef)
  %V4F32 = call <vscale x 4 x float> @llvm.masked.gather.nxv4f32.nxv4p0(<vscale x 4 x ptr> undef, i32 4, <vscale x 4 x i1> undef, <vscale x 4 x float> undef)
  %V2F32 = call <vscale x 2 x float> @llvm.masked.gather.nxv2f32.nxv2p0(<vscale x 2 x ptr> undef, i32 4, <vscale x 2 x i1> undef, <vscale x 2 x float> undef)
  %V1F32 = call <vscale x 1 x float> @llvm.masked.gather.nxv1f32.nxv1p0(<vscale x 1 x ptr> undef, i32 4, <vscale x 1 x i1> undef, <vscale x 1 x float> undef)

  %V32F16 = call <vscale x 32 x half> @llvm.masked.gather.nxv32f16.nxv32p0(<vscale x 32 x ptr> undef, i32 2, <vscale x 32 x i1> undef, <vscale x 32 x half> undef)
  %V16F16 = call <vscale x 16 x half> @llvm.masked.gather.nxv16f16.nxv16p0(<vscale x 16 x ptr> undef, i32 2, <vscale x 16 x i1> undef, <vscale x 16 x half> undef)
  %V8F16 = call <vscale x 8 x half> @llvm.masked.gather.nxv8f16.nxv8p0(<vscale x 8 x ptr> undef, i32 2, <vscale x 8 x i1> undef, <vscale x 8 x half> undef)
  %V4F16 = call <vscale x 4 x half> @llvm.masked.gather.nxv4f16.nxv4p0(<vscale x 4 x ptr> undef, i32 2, <vscale x 4 x i1> undef, <vscale x 4 x half> undef)
  %V2F16 = call <vscale x 2 x half> @llvm.masked.gather.nxv2f16.nxv2p0(<vscale x 2 x ptr> undef, i32 2, <vscale x 2 x i1> undef, <vscale x 2 x half> undef)
  %V1F16 = call <vscale x 1 x half> @llvm.masked.gather.nxv1f16.nxv1p0(<vscale x 1 x ptr> undef, i32 2, <vscale x 1 x i1> undef, <vscale x 1 x half> undef)

  %V8I64 = call <vscale x 8 x i64> @llvm.masked.gather.nxv8i64.nxv8p0(<vscale x 8 x ptr> undef, i32 8, <vscale x 8 x i1> undef, <vscale x 8 x i64> undef)
  %V4I64 = call <vscale x 4 x i64> @llvm.masked.gather.nxv4i64.nxv4p0(<vscale x 4 x ptr> undef, i32 8, <vscale x 4 x i1> undef, <vscale x 4 x i64> undef)
  %V2I64 = call <vscale x 2 x i64> @llvm.masked.gather.nxv2i64.nxv2p0(<vscale x 2 x ptr> undef, i32 8, <vscale x 2 x i1> undef, <vscale x 2 x i64> undef)
  %V1I64 = call <vscale x 1 x i64> @llvm.masked.gather.nxv1i64.nxv1p0(<vscale x 1 x ptr> undef, i32 8, <vscale x 1 x i1> undef, <vscale x 1 x i64> undef)

  %V16I32 = call <vscale x 16 x i32> @llvm.masked.gather.nxv16i32.nxv16p0(<vscale x 16 x ptr> undef, i32 4, <vscale x 16 x i1> undef, <vscale x 16 x i32> undef)
  %V8I32 = call <vscale x 8 x i32> @llvm.masked.gather.nxv8i32.nxv8p0(<vscale x 8 x ptr> undef, i32 4, <vscale x 8 x i1> undef, <vscale x 8 x i32> undef)
  %V4I32 = call <vscale x 4 x i32> @llvm.masked.gather.nxv4i32.nxv4p0(<vscale x 4 x ptr> undef, i32 4, <vscale x 4 x i1> undef, <vscale x 4 x i32> undef)
  %V2I32 = call <vscale x 2 x i32> @llvm.masked.gather.nxv2i32.nxv2p0(<vscale x 2 x ptr> undef, i32 4, <vscale x 2 x i1> undef, <vscale x 2 x i32> undef)
  %V1I32 = call <vscale x 1 x i32> @llvm.masked.gather.nxv1i32.nxv1p0(<vscale x 1 x ptr> undef, i32 4, <vscale x 1 x i1> undef, <vscale x 1 x i32> undef)

  %V32I16 = call <vscale x 32 x i16> @llvm.masked.gather.nxv32i16.nxv32p0(<vscale x 32 x ptr> undef, i32 2, <vscale x 32 x i1> undef, <vscale x 32 x i16> undef)
  %V16I16 = call <vscale x 16 x i16> @llvm.masked.gather.nxv16i16.nxv16p0(<vscale x 16 x ptr> undef, i32 2, <vscale x 16 x i1> undef, <vscale x 16 x i16> undef)
  %V8I16 = call <vscale x 8 x i16> @llvm.masked.gather.nxv8i16.nxv8p0(<vscale x 8 x ptr> undef, i32 2, <vscale x 8 x i1> undef, <vscale x 8 x i16> undef)
  %V4I16 = call <vscale x 4 x i16> @llvm.masked.gather.nxv4i16.nxv4p0(<vscale x 4 x ptr> undef, i32 2, <vscale x 4 x i1> undef, <vscale x 4 x i16> undef)
  %V2I16 = call <vscale x 2 x i16> @llvm.masked.gather.nxv2i16.nxv2p0(<vscale x 2 x ptr> undef, i32 2, <vscale x 2 x i1> undef, <vscale x 2 x i16> undef)
  %V1I16 = call <vscale x 1 x i16> @llvm.masked.gather.nxv1i16.nxv1p0(<vscale x 1 x ptr> undef, i32 2, <vscale x 1 x i1> undef, <vscale x 1 x i16> undef)

  %V64I8 = call <vscale x 64 x i8> @llvm.masked.gather.nxv64i8.nxv64p0(<vscale x 64 x ptr> undef, i32 1, <vscale x 64 x i1> undef, <vscale x 64 x i8> undef)
  %V32I8 = call <vscale x 32 x i8> @llvm.masked.gather.nxv32i8.nxv32p0(<vscale x 32 x ptr> undef, i32 1, <vscale x 32 x i1> undef, <vscale x 32 x i8> undef)
  %V16I8 = call <vscale x 16 x i8> @llvm.masked.gather.nxv16i8.nxv16p0(<vscale x 16 x ptr> undef, i32 1, <vscale x 16 x i1> undef, <vscale x 16 x i8> undef)
  %V8I8 = call <vscale x 8 x i8> @llvm.masked.gather.nxv8i8.nxv8p0(<vscale x 8 x ptr> undef, i32 1, <vscale x 8 x i1> undef, <vscale x 8 x i8> undef)
  %V4I8 = call <vscale x 4 x i8> @llvm.masked.gather.nxv4i8.nxv4p0(<vscale x 4 x ptr> undef, i32 1, <vscale x 4 x i1> undef, <vscale x 4 x i8> undef)
  %V2I8 = call <vscale x 2 x i8> @llvm.masked.gather.nxv2i8.nxv2p0(<vscale x 2 x ptr> undef, i32 1, <vscale x 2 x i1> undef, <vscale x 2 x i8> undef)
  %V1I8 = call <vscale x 1 x i8> @llvm.masked.gather.nxv1i8.nxv1p0(<vscale x 1 x ptr> undef, i32 1, <vscale x 1 x i1> undef, <vscale x 1 x i8> undef)

  %V8PTR = call <vscale x 8 x ptr> @llvm.masked.gather.nxv8p0.nxv8p0(<vscale x 8 x ptr> undef, i32 8, <vscale x 8 x i1> undef, <vscale x 8 x ptr> undef)
  %V4PTR = call <vscale x 4 x ptr> @llvm.masked.gather.nxv4p0.nxv4p0(<vscale x 4 x ptr> undef, i32 8, <vscale x 4 x i1> undef, <vscale x 4 x ptr> undef)
  %V2PTR = call <vscale x 2 x ptr> @llvm.masked.gather.nxv2p0.nxv2p0(<vscale x 2 x ptr> undef, i32 8, <vscale x 2 x i1> undef, <vscale x 2 x ptr> undef)
  %V1PTR = call <vscale x 1 x ptr> @llvm.masked.gather.nxv1p0.nxv1p0(<vscale x 1 x ptr> undef, i32 8, <vscale x 1 x i1> undef, <vscale x 1 x ptr> undef)

  ret void
}

; Gathers whose alignment operand is smaller than the element size in bytes.
; All three configurations are expected to report an invalid cost for every
; gather. There are no i8 cases here (presumably because an alignment of 1 is
; already the natural alignment for i8).
define void @masked_gather_unaligned() {
; CHECK-LABEL: 'masked_gather_unaligned'
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V8F64.u = call <vscale x 8 x double> @llvm.masked.gather.nxv8f64.nxv8p0(<vscale x 8 x ptr> undef, i32 2, <vscale x 8 x i1> undef, <vscale x 8 x double> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V4F64.u = call <vscale x 4 x double> @llvm.masked.gather.nxv4f64.nxv4p0(<vscale x 4 x ptr> undef, i32 2, <vscale x 4 x i1> undef, <vscale x 4 x double> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V2F64.u = call <vscale x 2 x double> @llvm.masked.gather.nxv2f64.nxv2p0(<vscale x 2 x ptr> undef, i32 2, <vscale x 2 x i1> undef, <vscale x 2 x double> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V1F64.u = call <vscale x 1 x double> @llvm.masked.gather.nxv1f64.nxv1p0(<vscale x 1 x ptr> undef, i32 2, <vscale x 1 x i1> undef, <vscale x 1 x double> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V16F32.u = call <vscale x 16 x float> @llvm.masked.gather.nxv16f32.nxv16p0(<vscale x 16 x ptr> undef, i32 2, <vscale x 16 x i1> undef, <vscale x 16 x float> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V8F32.u = call <vscale x 8 x float> @llvm.masked.gather.nxv8f32.nxv8p0(<vscale x 8 x ptr> undef, i32 2, <vscale x 8 x i1> undef, <vscale x 8 x float> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V4F32.u = call <vscale x 4 x float> @llvm.masked.gather.nxv4f32.nxv4p0(<vscale x 4 x ptr> undef, i32 2, <vscale x 4 x i1> undef, <vscale x 4 x float> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V2F32.u = call <vscale x 2 x float> @llvm.masked.gather.nxv2f32.nxv2p0(<vscale x 2 x ptr> undef, i32 2, <vscale x 2 x i1> undef, <vscale x 2 x float> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V1F32.u = call <vscale x 1 x float> @llvm.masked.gather.nxv1f32.nxv1p0(<vscale x 1 x ptr> undef, i32 2, <vscale x 1 x i1> undef, <vscale x 1 x float> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V32F16.u = call <vscale x 32 x half> @llvm.masked.gather.nxv32f16.nxv32p0(<vscale x 32 x ptr> undef, i32 1, <vscale x 32 x i1> undef, <vscale x 32 x half> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V16F16.u = call <vscale x 16 x half> @llvm.masked.gather.nxv16f16.nxv16p0(<vscale x 16 x ptr> undef, i32 1, <vscale x 16 x i1> undef, <vscale x 16 x half> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V8F16.u = call <vscale x 8 x half> @llvm.masked.gather.nxv8f16.nxv8p0(<vscale x 8 x ptr> undef, i32 1, <vscale x 8 x i1> undef, <vscale x 8 x half> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V4F16.u = call <vscale x 4 x half> @llvm.masked.gather.nxv4f16.nxv4p0(<vscale x 4 x ptr> undef, i32 1, <vscale x 4 x i1> undef, <vscale x 4 x half> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V2F16.u = call <vscale x 2 x half> @llvm.masked.gather.nxv2f16.nxv2p0(<vscale x 2 x ptr> undef, i32 1, <vscale x 2 x i1> undef, <vscale x 2 x half> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V1F16.u = call <vscale x 1 x half> @llvm.masked.gather.nxv1f16.nxv1p0(<vscale x 1 x ptr> undef, i32 1, <vscale x 1 x i1> undef, <vscale x 1 x half> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V8I64.u = call <vscale x 8 x i64> @llvm.masked.gather.nxv8i64.nxv8p0(<vscale x 8 x ptr> undef, i32 4, <vscale x 8 x i1> undef, <vscale x 8 x i64> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V4I64.u = call <vscale x 4 x i64> @llvm.masked.gather.nxv4i64.nxv4p0(<vscale x 4 x ptr> undef, i32 4, <vscale x 4 x i1> undef, <vscale x 4 x i64> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V2I64.u = call <vscale x 2 x i64> @llvm.masked.gather.nxv2i64.nxv2p0(<vscale x 2 x ptr> undef, i32 4, <vscale x 2 x i1> undef, <vscale x 2 x i64> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V1I64.u = call <vscale x 1 x i64> @llvm.masked.gather.nxv1i64.nxv1p0(<vscale x 1 x ptr> undef, i32 4, <vscale x 1 x i1> undef, <vscale x 1 x i64> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V16I32.u = call <vscale x 16 x i32> @llvm.masked.gather.nxv16i32.nxv16p0(<vscale x 16 x ptr> undef, i32 1, <vscale x 16 x i1> undef, <vscale x 16 x i32> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V8I32.u = call <vscale x 8 x i32> @llvm.masked.gather.nxv8i32.nxv8p0(<vscale x 8 x ptr> undef, i32 1, <vscale x 8 x i1> undef, <vscale x 8 x i32> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V4I32.u = call <vscale x 4 x i32> @llvm.masked.gather.nxv4i32.nxv4p0(<vscale x 4 x ptr> undef, i32 1, <vscale x 4 x i1> undef, <vscale x 4 x i32> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V2I32.u = call <vscale x 2 x i32> @llvm.masked.gather.nxv2i32.nxv2p0(<vscale x 2 x ptr> undef, i32 1, <vscale x 2 x i1> undef, <vscale x 2 x i32> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V1I32.u = call <vscale x 1 x i32> @llvm.masked.gather.nxv1i32.nxv1p0(<vscale x 1 x ptr> undef, i32 1, <vscale x 1 x i1> undef, <vscale x 1 x i32> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V32I16.u = call <vscale x 32 x i16> @llvm.masked.gather.nxv32i16.nxv32p0(<vscale x 32 x ptr> undef, i32 1, <vscale x 32 x i1> undef, <vscale x 32 x i16> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V16I16.u = call <vscale x 16 x i16> @llvm.masked.gather.nxv16i16.nxv16p0(<vscale x 16 x ptr> undef, i32 1, <vscale x 16 x i1> undef, <vscale x 16 x i16> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V8I16.u = call <vscale x 8 x i16> @llvm.masked.gather.nxv8i16.nxv8p0(<vscale x 8 x ptr> undef, i32 1, <vscale x 8 x i1> undef, <vscale x 8 x i16> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V4I16.u = call <vscale x 4 x i16> @llvm.masked.gather.nxv4i16.nxv4p0(<vscale x 4 x ptr> undef, i32 1, <vscale x 4 x i1> undef, <vscale x 4 x i16> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V2I16.u = call <vscale x 2 x i16> @llvm.masked.gather.nxv2i16.nxv2p0(<vscale x 2 x ptr> undef, i32 1, <vscale x 2 x i1> undef, <vscale x 2 x i16> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V1I16.u = call <vscale x 1 x i16> @llvm.masked.gather.nxv1i16.nxv1p0(<vscale x 1 x ptr> undef, i32 1, <vscale x 1 x i1> undef, <vscale x 1 x i16> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V8PTR.u = call <vscale x 8 x ptr> @llvm.masked.gather.nxv8p0.nxv8p0(<vscale x 8 x ptr> undef, i32 1, <vscale x 8 x i1> undef, <vscale x 8 x ptr> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V4PTR.u = call <vscale x 4 x ptr> @llvm.masked.gather.nxv4p0.nxv4p0(<vscale x 4 x ptr> undef, i32 1, <vscale x 4 x i1> undef, <vscale x 4 x ptr> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V2PTR.u = call <vscale x 2 x ptr> @llvm.masked.gather.nxv2p0.nxv2p0(<vscale x 2 x ptr> undef, i32 1, <vscale x 2 x i1> undef, <vscale x 2 x ptr> undef)
; CHECK-NEXT:  Cost Model: Invalid cost for instruction: %V1PTR.u = call <vscale x 1 x ptr> @llvm.masked.gather.nxv1p0.nxv1p0(<vscale x 1 x ptr> undef, i32 1, <vscale x 1 x i1> undef, <vscale x 1 x ptr> undef)
; CHECK-NEXT:  Cost Model: Found an estimated cost of 0 for instruction: ret void
;
  %V8F64.u = call <vscale x 8 x double> @llvm.masked.gather.nxv8f64.nxv8p0(<vscale x 8 x ptr> undef, i32 2, <vscale x 8 x i1> undef, <vscale x 8 x double> undef)
  %V4F64.u = call <vscale x 4 x double> @llvm.masked.gather.nxv4f64.nxv4p0(<vscale x 4 x ptr> undef, i32 2, <vscale x 4 x i1> undef, <vscale x 4 x double> undef)
  %V2F64.u = call <vscale x 2 x double> @llvm.masked.gather.nxv2f64.nxv2p0(<vscale x 2 x ptr> undef, i32 2, <vscale x 2 x i1> undef, <vscale x 2 x double> undef)
  %V1F64.u = call <vscale x 1 x double> @llvm.masked.gather.nxv1f64.nxv1p0(<vscale x 1 x ptr> undef, i32 2, <vscale x 1 x i1> undef, <vscale x 1 x double> undef)

  %V16F32.u = call <vscale x 16 x float> @llvm.masked.gather.nxv16f32.nxv16p0(<vscale x 16 x ptr> undef, i32 2, <vscale x 16 x i1> undef, <vscale x 16 x float> undef)
  %V8F32.u = call <vscale x 8 x float> @llvm.masked.gather.nxv8f32.nxv8p0(<vscale x 8 x ptr> undef, i32 2, <vscale x 8 x i1> undef, <vscale x 8 x float> undef)
  %V4F32.u = call <vscale x 4 x float> @llvm.masked.gather.nxv4f32.nxv4p0(<vscale x 4 x ptr> undef, i32 2, <vscale x 4 x i1> undef, <vscale x 4 x float> undef)
  %V2F32.u = call <vscale x 2 x float> @llvm.masked.gather.nxv2f32.nxv2p0(<vscale x 2 x ptr> undef, i32 2, <vscale x 2 x i1> undef, <vscale x 2 x float> undef)
  %V1F32.u = call <vscale x 1 x float> @llvm.masked.gather.nxv1f32.nxv1p0(<vscale x 1 x ptr> undef, i32 2, <vscale x 1 x i1> undef, <vscale x 1 x float> undef)

  %V32F16.u = call <vscale x 32 x half> @llvm.masked.gather.nxv32f16.nxv32p0(<vscale x 32 x ptr> undef, i32 1, <vscale x 32 x i1> undef, <vscale x 32 x half> undef)
  %V16F16.u = call <vscale x 16 x half> @llvm.masked.gather.nxv16f16.nxv16p0(<vscale x 16 x ptr> undef, i32 1, <vscale x 16 x i1> undef, <vscale x 16 x half> undef)
  %V8F16.u = call <vscale x 8 x half> @llvm.masked.gather.nxv8f16.nxv8p0(<vscale x 8 x ptr> undef, i32 1, <vscale x 8 x i1> undef, <vscale x 8 x half> undef)
  %V4F16.u = call <vscale x 4 x half> @llvm.masked.gather.nxv4f16.nxv4p0(<vscale x 4 x ptr> undef, i32 1, <vscale x 4 x i1> undef, <vscale x 4 x half> undef)
  %V2F16.u = call <vscale x 2 x half> @llvm.masked.gather.nxv2f16.nxv2p0(<vscale x 2 x ptr> undef, i32 1, <vscale x 2 x i1> undef, <vscale x 2 x half> undef)
  %V1F16.u = call <vscale x 1 x half> @llvm.masked.gather.nxv1f16.nxv1p0(<vscale x 1 x ptr> undef, i32 1, <vscale x 1 x i1> undef, <vscale x 1 x half> undef)

  %V8I64.u = call <vscale x 8 x i64> @llvm.masked.gather.nxv8i64.nxv8p0(<vscale x 8 x ptr> undef, i32 4, <vscale x 8 x i1> undef, <vscale x 8 x i64> undef)
  %V4I64.u = call <vscale x 4 x i64> @llvm.masked.gather.nxv4i64.nxv4p0(<vscale x 4 x ptr> undef, i32 4, <vscale x 4 x i1> undef, <vscale x 4 x i64> undef)
  %V2I64.u = call <vscale x 2 x i64> @llvm.masked.gather.nxv2i64.nxv2p0(<vscale x 2 x ptr> undef, i32 4, <vscale x 2 x i1> undef, <vscale x 2 x i64> undef)
  %V1I64.u = call <vscale x 1 x i64> @llvm.masked.gather.nxv1i64.nxv1p0(<vscale x 1 x ptr> undef, i32 4, <vscale x 1 x i1> undef, <vscale x 1 x i64> undef)

  %V16I32.u = call <vscale x 16 x i32> @llvm.masked.gather.nxv16i32.nxv16p0(<vscale x 16 x ptr> undef, i32 1, <vscale x 16 x i1> undef, <vscale x 16 x i32> undef)
  %V8I32.u = call <vscale x 8 x i32> @llvm.masked.gather.nxv8i32.nxv8p0(<vscale x 8 x ptr> undef, i32 1, <vscale x 8 x i1> undef, <vscale x 8 x i32> undef)
  %V4I32.u = call <vscale x 4 x i32> @llvm.masked.gather.nxv4i32.nxv4p0(<vscale x 4 x ptr> undef, i32 1, <vscale x 4 x i1> undef, <vscale x 4 x i32> undef)
  %V2I32.u = call <vscale x 2 x i32> @llvm.masked.gather.nxv2i32.nxv2p0(<vscale x 2 x ptr> undef, i32 1, <vscale x 2 x i1> undef, <vscale x 2 x i32> undef)
  %V1I32.u = call <vscale x 1 x i32> @llvm.masked.gather.nxv1i32.nxv1p0(<vscale x 1 x ptr> undef, i32 1, <vscale x 1 x i1> undef, <vscale x 1 x i32> undef)

  %V32I16.u = call <vscale x 32 x i16> @llvm.masked.gather.nxv32i16.nxv32p0(<vscale x 32 x ptr> undef, i32 1, <vscale x 32 x i1> undef, <vscale x 32 x i16> undef)
  %V16I16.u = call <vscale x 16 x i16> @llvm.masked.gather.nxv16i16.nxv16p0(<vscale x 16 x ptr> undef, i32 1, <vscale x 16 x i1> undef, <vscale x 16 x i16> undef)
  %V8I16.u = call <vscale x 8 x i16> @llvm.masked.gather.nxv8i16.nxv8p0(<vscale x 8 x ptr> undef, i32 1, <vscale x 8 x i1> undef, <vscale x 8 x i16> undef)
  %V4I16.u = call <vscale x 4 x i16> @llvm.masked.gather.nxv4i16.nxv4p0(<vscale x 4 x ptr> undef, i32 1, <vscale x 4 x i1> undef, <vscale x 4 x i16> undef)
  %V2I16.u = call <vscale x 2 x i16> @llvm.masked.gather.nxv2i16.nxv2p0(<vscale x 2 x ptr> undef, i32 1, <vscale x 2 x i1> undef, <vscale x 2 x i16> undef)
  %V1I16.u = call <vscale x 1 x i16> @llvm.masked.gather.nxv1i16.nxv1p0(<vscale x 1 x ptr> undef, i32 1, <vscale x 1 x i1> undef, <vscale x 1 x i16> undef)

  %V8PTR.u = call <vscale x 8 x ptr> @llvm.masked.gather.nxv8p0.nxv8p0(<vscale x 8 x ptr> undef, i32 1, <vscale x 8 x i1> undef, <vscale x 8 x ptr> undef)
  %V4PTR.u = call <vscale x 4 x ptr> @llvm.masked.gather.nxv4p0.nxv4p0(<vscale x 4 x ptr> undef, i32 1, <vscale x 4 x i1> undef, <vscale x 4 x ptr> undef)
  %V2PTR.u = call <vscale x 2 x ptr> @llvm.masked.gather.nxv2p0.nxv2p0(<vscale x 2 x ptr> undef, i32 1, <vscale x 2 x i1> undef, <vscale x 2 x ptr> undef)
  %V1PTR.u = call <vscale x 1 x ptr> @llvm.masked.gather.nxv1p0.nxv1p0(<vscale x 1 x ptr> undef, i32 1, <vscale x 1 x i1> undef, <vscale x 1 x ptr> undef)

  ret void
}

; Intrinsic declarations: result type, vector of pointers, alignment, mask,
; passthru.
declare <vscale x 8 x double> @llvm.masked.gather.nxv8f64.nxv8p0(<vscale x 8 x ptr>, i32, <vscale x 8 x i1>, <vscale x 8 x double>)
declare <vscale x 4 x double> @llvm.masked.gather.nxv4f64.nxv4p0(<vscale x 4 x ptr>, i32, <vscale x 4 x i1>, <vscale x 4 x double>)
declare <vscale x 2 x double> @llvm.masked.gather.nxv2f64.nxv2p0(<vscale x 2 x ptr>, i32, <vscale x 2 x i1>, <vscale x 2 x double>)
declare <vscale x 1 x double> @llvm.masked.gather.nxv1f64.nxv1p0(<vscale x 1 x ptr>, i32, <vscale x 1 x i1>, <vscale x 1 x double>)
declare <vscale x 16 x float> @llvm.masked.gather.nxv16f32.nxv16p0(<vscale x 16 x ptr>, i32, <vscale x 16 x i1>, <vscale x 16 x float>)
declare <vscale x 8 x float> @llvm.masked.gather.nxv8f32.nxv8p0(<vscale x 8 x ptr>, i32, <vscale x 8 x i1>, <vscale x 8 x float>)
declare <vscale x 4 x float> @llvm.masked.gather.nxv4f32.nxv4p0(<vscale x 4 x ptr>, i32, <vscale x 4 x i1>, <vscale x 4 x float>)
declare <vscale x 2 x float> @llvm.masked.gather.nxv2f32.nxv2p0(<vscale x 2 x ptr>, i32, <vscale x 2 x i1>, <vscale x 2 x float>)
declare <vscale x 1 x float> @llvm.masked.gather.nxv1f32.nxv1p0(<vscale x 1 x ptr>, i32, <vscale x 1 x i1>, <vscale x 1 x float>)
declare <vscale x 32 x half> @llvm.masked.gather.nxv32f16.nxv32p0(<vscale x 32 x ptr>, i32, <vscale x 32 x i1>, <vscale x 32 x half>)
declare <vscale x 16 x half> @llvm.masked.gather.nxv16f16.nxv16p0(<vscale x 16 x ptr>, i32, <vscale x 16 x i1>, <vscale x 16 x half>)
declare <vscale x 8 x half> @llvm.masked.gather.nxv8f16.nxv8p0(<vscale x 8 x ptr>, i32, <vscale x 8 x i1>, <vscale x 8 x half>)
declare <vscale x 4 x half> @llvm.masked.gather.nxv4f16.nxv4p0(<vscale x 4 x ptr>, i32, <vscale x 4 x i1>, <vscale x 4 x half>)
declare <vscale x 2 x half> @llvm.masked.gather.nxv2f16.nxv2p0(<vscale x 2 x ptr>, i32, <vscale x 2 x i1>, <vscale x 2 x half>)
declare <vscale x 1 x half> @llvm.masked.gather.nxv1f16.nxv1p0(<vscale x 1 x ptr>, i32, <vscale x 1 x i1>, <vscale x 1 x half>)
declare <vscale x 8 x i64> @llvm.masked.gather.nxv8i64.nxv8p0(<vscale x 8 x ptr>, i32, <vscale x 8 x i1>, <vscale x 8 x i64>)
declare <vscale x 4 x i64> @llvm.masked.gather.nxv4i64.nxv4p0(<vscale x 4 x ptr>, i32, <vscale x 4 x i1>, <vscale x 4 x i64>)
declare <vscale x 2 x i64> @llvm.masked.gather.nxv2i64.nxv2p0(<vscale x 2 x ptr>, i32, <vscale x 2 x i1>, <vscale x 2 x i64>)
declare <vscale x 1 x i64> @llvm.masked.gather.nxv1i64.nxv1p0(<vscale x 1 x ptr>, i32, <vscale x 1 x i1>, <vscale x 1 x i64>)
declare <vscale x 16 x i32> @llvm.masked.gather.nxv16i32.nxv16p0(<vscale x 16 x ptr>, i32, <vscale x 16 x i1>, <vscale x 16 x i32>)
declare <vscale x 8 x i32> @llvm.masked.gather.nxv8i32.nxv8p0(<vscale x 8 x ptr>, i32, <vscale x 8 x i1>, <vscale x 8 x i32>)
declare <vscale x 4 x i32> @llvm.masked.gather.nxv4i32.nxv4p0(<vscale x 4 x ptr>, i32, <vscale x 4 x i1>, <vscale x 4 x i32>)
declare <vscale x 2 x i32> @llvm.masked.gather.nxv2i32.nxv2p0(<vscale x 2 x ptr>, i32, <vscale x 2 x i1>, <vscale x 2 x i32>)
declare <vscale x 1 x i32> @llvm.masked.gather.nxv1i32.nxv1p0(<vscale x 1 x ptr>, i32, <vscale x 1 x i1>, <vscale x 1 x i32>)
declare <vscale x 32 x i16> @llvm.masked.gather.nxv32i16.nxv32p0(<vscale x 32 x ptr>, i32, <vscale x 32 x i1>, <vscale x 32 x i16>)
declare <vscale x 16 x i16> @llvm.masked.gather.nxv16i16.nxv16p0(<vscale x 16 x ptr>, i32, <vscale x 16 x i1>, <vscale x 16 x i16>)
declare <vscale x 8 x i16> @llvm.masked.gather.nxv8i16.nxv8p0(<vscale x 8 x ptr>, i32, <vscale x 8 x i1>, <vscale x 8 x i16>)
declare <vscale x 4 x i16> @llvm.masked.gather.nxv4i16.nxv4p0(<vscale x 4 x ptr>, i32, <vscale x 4 x i1>, <vscale x 4 x i16>)
declare <vscale x 2 x i16> @llvm.masked.gather.nxv2i16.nxv2p0(<vscale x 2 x ptr>, i32, <vscale x 2 x i1>, <vscale x 2 x i16>)
declare <vscale x 1 x i16> @llvm.masked.gather.nxv1i16.nxv1p0(<vscale x 1 x ptr>, i32, <vscale x 1 x i1>, <vscale x 1 x i16>)
declare <vscale x 64 x i8> @llvm.masked.gather.nxv64i8.nxv64p0(<vscale x 64 x ptr>, i32, <vscale x 64 x i1>, <vscale x 64 x i8>)
declare <vscale x 32 x i8> @llvm.masked.gather.nxv32i8.nxv32p0(<vscale x 32 x ptr>, i32, <vscale x 32 x i1>, <vscale x 32 x i8>)
declare <vscale x 16 x i8> @llvm.masked.gather.nxv16i8.nxv16p0(<vscale x 16 x ptr>, i32, <vscale x 16 x i1>, <vscale x 16 x i8>)
declare <vscale x 8 x i8> @llvm.masked.gather.nxv8i8.nxv8p0(<vscale x 8 x ptr>, i32, <vscale x 8 x i1>, <vscale x 8 x i8>)
declare <vscale x 4 x i8> @llvm.masked.gather.nxv4i8.nxv4p0(<vscale x 4 x ptr>, i32, <vscale x 4 x i1>, <vscale x 4 x i8>)
declare <vscale x 2 x i8> @llvm.masked.gather.nxv2i8.nxv2p0(<vscale x 2 x ptr>, i32, <vscale x 2 x i1>, <vscale x 2 x i8>)
declare <vscale x 1 x i8> @llvm.masked.gather.nxv1i8.nxv1p0(<vscale x 1 x ptr>, i32, <vscale x 1 x i1>, <vscale x 1 x i8>)
declare <vscale x 8 x ptr> @llvm.masked.gather.nxv8p0.nxv8p0(<vscale x 8 x ptr>, i32, <vscale x 8 x i1>, <vscale x 8 x ptr>)
declare <vscale x 4 x ptr> @llvm.masked.gather.nxv4p0.nxv4p0(<vscale x 4 x ptr>, i32, <vscale x 4 x i1>, <vscale x 4 x ptr>)
declare <vscale x 2 x ptr> @llvm.masked.gather.nxv2p0.nxv2p0(<vscale x 2 x ptr>, i32, <vscale x 2 x i1>, <vscale x 2 x ptr>)
declare <vscale x 1 x ptr> @llvm.masked.gather.nxv1p0.nxv1p0(<vscale x 1 x ptr>, i32, <vscale x 1 x i1>, <vscale x 1 x ptr>)