; NOTE: Assertions have been autogenerated by utils/update_test_checks.py ; RUN: opt -passes=instcombine -S < %s | FileCheck --check-prefix OPT %s target triple = "aarch64" ; Most of the testing is covered by the lastb cases, but here we ensure that ; lasta with a predicate having no active lanes is treated as an alias to ; extracting the first vector element. define i8 @lasta_extractelement_0( %v) #0 { ; OPT-LABEL: @lasta_extractelement_0( ; OPT-NEXT: [[E0:%.*]] = extractelement [[V:%.*]], i64 0 ; OPT-NEXT: ret i8 [[E0]] ; %e0 = tail call i8 @llvm.aarch64.sve.lasta.nxv16i8( zeroinitializer, %v) ret i8 %e0 } ; Most of the testing is covered by the lastb cases, but here we check the ; resulting extraction index is one more than the lastb case because lasta ; extracts the element after the last active. define i8 @lasta_extractelement_8( %v) #0 { ; OPT-LABEL: @lasta_extractelement_8( ; OPT-NEXT: [[E1:%.*]] = extractelement [[V:%.*]], i64 8 ; OPT-NEXT: ret i8 [[E1]] ; %pg = tail call @llvm.aarch64.sve.ptrue.nxv16i1(i32 8) %e1 = tail call i8 @llvm.aarch64.sve.lasta.nxv16i8( %pg, %v) ret i8 %e1 } define i8 @lastb_extractelement_0( %v) #0 { ; OPT-LABEL: @lastb_extractelement_0( ; OPT-NEXT: [[E0:%.*]] = extractelement [[V:%.*]], i64 0 ; OPT-NEXT: ret i8 [[E0]] ; %pg = tail call @llvm.aarch64.sve.ptrue.nxv16i1(i32 1) %e0 = tail call i8 @llvm.aarch64.sve.lastb.nxv16i8( %pg, %v) ret i8 %e0 } define i8 @lastb_extractelement_1( %v) #0 { ; OPT-LABEL: @lastb_extractelement_1( ; OPT-NEXT: [[E1:%.*]] = extractelement [[V:%.*]], i64 1 ; OPT-NEXT: ret i8 [[E1]] ; %pg = tail call @llvm.aarch64.sve.ptrue.nxv16i1(i32 2) %e1 = tail call i8 @llvm.aarch64.sve.lastb.nxv16i8( %pg, %v) ret i8 %e1 } define i8 @lastb_extractelement_2( %v) #0 { ; OPT-LABEL: @lastb_extractelement_2( ; OPT-NEXT: [[E2:%.*]] = extractelement [[V:%.*]], i64 2 ; OPT-NEXT: ret i8 [[E2]] ; %pg = tail call @llvm.aarch64.sve.ptrue.nxv16i1(i32 3) %e2 = tail call i8 @llvm.aarch64.sve.lastb.nxv16i8( %pg, %v) ret i8 %e2 } define i8 @lastb_extractelement_3( %v) #0 { ; OPT-LABEL: @lastb_extractelement_3( ; OPT-NEXT: [[E3:%.*]] = extractelement [[V:%.*]], i64 3 ; OPT-NEXT: ret i8 [[E3]] ; %pg = tail call @llvm.aarch64.sve.ptrue.nxv16i1(i32 4) %e3 = tail call i8 @llvm.aarch64.sve.lastb.nxv16i8( %pg, %v) ret i8 %e3 } define i8 @lastb_extractelement_4( %v) #0 { ; OPT-LABEL: @lastb_extractelement_4( ; OPT-NEXT: [[E4:%.*]] = extractelement [[V:%.*]], i64 4 ; OPT-NEXT: ret i8 [[E4]] ; %pg = tail call @llvm.aarch64.sve.ptrue.nxv16i1(i32 5) %e4 = tail call i8 @llvm.aarch64.sve.lastb.nxv16i8( %pg, %v) ret i8 %e4 } define i8 @lastb_extractelement_5( %v) #0 { ; OPT-LABEL: @lastb_extractelement_5( ; OPT-NEXT: [[E5:%.*]] = extractelement [[V:%.*]], i64 5 ; OPT-NEXT: ret i8 [[E5]] ; %pg = tail call @llvm.aarch64.sve.ptrue.nxv16i1(i32 6) %e5 = tail call i8 @llvm.aarch64.sve.lastb.nxv16i8( %pg, %v) ret i8 %e5 } define i8 @lastb_extractelement_6( %v) #0 { ; OPT-LABEL: @lastb_extractelement_6( ; OPT-NEXT: [[E6:%.*]] = extractelement [[V:%.*]], i64 6 ; OPT-NEXT: ret i8 [[E6]] ; %pg = tail call @llvm.aarch64.sve.ptrue.nxv16i1(i32 7) %e6 = tail call i8 @llvm.aarch64.sve.lastb.nxv16i8( %pg, %v) ret i8 %e6 } define i8 @lastb_extractelement_7( %v) #0 { ; OPT-LABEL: @lastb_extractelement_7( ; OPT-NEXT: [[E7:%.*]] = extractelement [[V:%.*]], i64 7 ; OPT-NEXT: ret i8 [[E7]] ; %pg = tail call @llvm.aarch64.sve.ptrue.nxv16i1(i32 8) %e7 = tail call i8 @llvm.aarch64.sve.lastb.nxv16i8( %pg, %v) ret i8 %e7 } define i8 @lastb_extractelement_15( %v) #0 { ; OPT-LABEL: @lastb_extractelement_15( ; OPT-NEXT: [[E15:%.*]] = extractelement [[V:%.*]], i64 15 ; OPT-NEXT: ret i8 [[E15]] ; %pg = tail call @llvm.aarch64.sve.ptrue.nxv16i1(i32 9) %e15 = tail call i8 @llvm.aarch64.sve.lastb.nxv16i8( %pg, %v) ret i8 %e15 } ; No transformation because the requested element is beyond the range of the ; known minimum element count so we maintain the user's intentions. define i8 @lastb_extractelement_31( %v) #0 { ; OPT-LABEL: @lastb_extractelement_31( ; OPT-NEXT: [[PG:%.*]] = tail call @llvm.aarch64.sve.ptrue.nxv16i1(i32 10) ; OPT-NEXT: [[E31:%.*]] = tail call i8 @llvm.aarch64.sve.lastb.nxv16i8( [[PG]], [[V:%.*]]) ; OPT-NEXT: ret i8 [[E31]] ; %pg = tail call @llvm.aarch64.sve.ptrue.nxv16i1(i32 10) %e31 = tail call i8 @llvm.aarch64.sve.lastb.nxv16i8( %pg, %v) ret i8 %e31 } ; No transformation because the ptrue's predicate pattern is bogus and thus ; nothing can be inferred about the result. define i8 @lastb_extractelement_invalid_predicate_pattern( %v) #0 { ; OPT-LABEL: @lastb_extractelement_invalid_predicate_pattern( ; OPT-NEXT: [[PG:%.*]] = tail call @llvm.aarch64.sve.ptrue.nxv16i1(i32 15) ; OPT-NEXT: [[E:%.*]] = tail call i8 @llvm.aarch64.sve.lastb.nxv16i8( [[PG]], [[V:%.*]]) ; OPT-NEXT: ret i8 [[E]] ; %pg = tail call @llvm.aarch64.sve.ptrue.nxv16i1(i32 15) %e = tail call i8 @llvm.aarch64.sve.lastb.nxv16i8( %pg, %v) ret i8 %e } ; Return the splatted value irrespective of the predicate. define i8 @lasta_splat( %pg, i8 %a) #0 { ; OPT-LABEL: @lasta_splat( ; OPT-NEXT: ret i8 [[A:%.*]] ; %splat_insert = insertelement poison, i8 %a, i32 0 %splat = shufflevector %splat_insert, poison, zeroinitializer %last = tail call i8 @llvm.aarch64.sve.lasta.nxv16i8( %pg, %splat) ret i8 %last } define i8 @lastb_splat( %pg, i8 %a) #0 { ; OPT-LABEL: @lastb_splat( ; OPT-NEXT: ret i8 [[A:%.*]] ; %splat_insert = insertelement poison, i8 %a, i32 0 %splat = shufflevector %splat_insert, poison, zeroinitializer %last = tail call i8 @llvm.aarch64.sve.lastb.nxv16i8( %pg, %splat) ret i8 %last } ; Check that we move the lastb before the binary operation so that the new binary op is scalar. define i8 @lastb_binop_RHS_splat_sdiv( %pg, i8 %scalar, %vector) #0 { ; OPT-LABEL: @lastb_binop_RHS_splat_sdiv( ; OPT-NEXT: [[TMP1:%.*]] = call i8 @llvm.aarch64.sve.lastb.nxv16i8( [[PG:%.*]], [[VECTOR:%.*]]) ; OPT-NEXT: [[BINOP1:%.*]] = sdiv i8 [[TMP1]], [[SCALAR:%.*]] ; OPT-NEXT: ret i8 [[BINOP1]] ; %splat_insert = insertelement poison, i8 %scalar, i32 0 %splat = shufflevector %splat_insert, poison, zeroinitializer %binop = sdiv %vector, %splat %last = tail call i8 @llvm.aarch64.sve.lastb.nxv16i8( %pg, %binop) ret i8 %last } define i8 @lastb_binop_RHS_splat_sdiv_exact( %pg, i8 %scalar, %vector) #0 { ; OPT-LABEL: @lastb_binop_RHS_splat_sdiv_exact( ; OPT-NEXT: [[TMP1:%.*]] = call i8 @llvm.aarch64.sve.lastb.nxv16i8( [[PG:%.*]], [[VECTOR:%.*]]) ; OPT-NEXT: [[BINOP1:%.*]] = sdiv exact i8 [[TMP1]], [[SCALAR:%.*]] ; OPT-NEXT: ret i8 [[BINOP1]] ; %splat_insert = insertelement poison, i8 %scalar, i32 0 %splat = shufflevector %splat_insert, poison, zeroinitializer %binop = sdiv exact %vector, %splat %last = tail call i8 @llvm.aarch64.sve.lastb.nxv16i8( %pg, %binop) ret i8 %last } define float @lastb_binop_RHS_splat_fdiv_float_fast( %pg, float %scalar, %vector) #0 { ; OPT-LABEL: @lastb_binop_RHS_splat_fdiv_float_fast( ; OPT-NEXT: [[TMP1:%.*]] = call float @llvm.aarch64.sve.lastb.nxv4f32( [[PG:%.*]], [[VECTOR:%.*]]) ; OPT-NEXT: [[BINOP1:%.*]] = fdiv fast float [[TMP1]], [[SCALAR:%.*]] ; OPT-NEXT: ret float [[BINOP1]] ; %splat_insert = insertelement poison, float %scalar, i32 0 %splat = shufflevector %splat_insert, poison, zeroinitializer %binop = fdiv fast %vector, %splat %last = tail call float @llvm.aarch64.sve.lastb.nxv4f32( %pg, %binop) ret float %last } define float @lastb_binop_RHS_splat_fdiv_float( %pg, float %scalar, %vector) #0 { ; OPT-LABEL: @lastb_binop_RHS_splat_fdiv_float( ; OPT-NEXT: [[TMP1:%.*]] = call float @llvm.aarch64.sve.lastb.nxv4f32( [[PG:%.*]], [[VECTOR:%.*]]) ; OPT-NEXT: [[BINOP1:%.*]] = fdiv float [[TMP1]], [[SCALAR:%.*]] ; OPT-NEXT: ret float [[BINOP1]] ; %splat_insert = insertelement poison, float %scalar, i32 0 %splat = shufflevector %splat_insert, poison, zeroinitializer %binop = fdiv %vector, %splat %last = tail call float @llvm.aarch64.sve.lastb.nxv4f32( %pg, %binop) ret float %last } define i8 @lastb_binop_LHS_splat_sdiv( %pg, i8 %scalar, %vector) #0 { ; OPT-LABEL: @lastb_binop_LHS_splat_sdiv( ; OPT-NEXT: [[TMP1:%.*]] = call i8 @llvm.aarch64.sve.lastb.nxv16i8( [[PG:%.*]], [[VECTOR:%.*]]) ; OPT-NEXT: [[BINOP1:%.*]] = sdiv i8 [[SCALAR:%.*]], [[TMP1]] ; OPT-NEXT: ret i8 [[BINOP1]] ; %splat_insert = insertelement poison, i8 %scalar, i32 0 %splat = shufflevector %splat_insert, poison, zeroinitializer %binop = sdiv %splat, %vector %last = tail call i8 @llvm.aarch64.sve.lastb.nxv16i8( %pg, %binop) ret i8 %last } define i8 @lastb_binop_LHS_splat_sdiv_exact( %pg, i8 %scalar, %vector) #0 { ; OPT-LABEL: @lastb_binop_LHS_splat_sdiv_exact( ; OPT-NEXT: [[TMP1:%.*]] = call i8 @llvm.aarch64.sve.lastb.nxv16i8( [[PG:%.*]], [[VECTOR:%.*]]) ; OPT-NEXT: [[BINOP1:%.*]] = sdiv exact i8 [[SCALAR:%.*]], [[TMP1]] ; OPT-NEXT: ret i8 [[BINOP1]] ; %splat_insert = insertelement poison, i8 %scalar, i32 0 %splat = shufflevector %splat_insert, poison, zeroinitializer %binop = sdiv exact %splat, %vector %last = tail call i8 @llvm.aarch64.sve.lastb.nxv16i8( %pg, %binop) ret i8 %last } define float @lastb_binop_LHS_splat_fdiv_float_fast( %pg, float %scalar, %vector) #0 { ; OPT-LABEL: @lastb_binop_LHS_splat_fdiv_float_fast( ; OPT-NEXT: [[TMP1:%.*]] = call float @llvm.aarch64.sve.lastb.nxv4f32( [[PG:%.*]], [[VECTOR:%.*]]) ; OPT-NEXT: [[BINOP1:%.*]] = fdiv fast float [[SCALAR:%.*]], [[TMP1]] ; OPT-NEXT: ret float [[BINOP1]] ; %splat_insert = insertelement poison, float %scalar, i32 0 %splat = shufflevector %splat_insert, poison, zeroinitializer %binop = fdiv fast %splat, %vector %last = tail call float @llvm.aarch64.sve.lastb.nxv4f32( %pg, %binop) ret float %last } define float @lastb_binop_LHS_splat_fdiv_float( %pg, float %scalar, %vector) #0 { ; OPT-LABEL: @lastb_binop_LHS_splat_fdiv_float( ; OPT-NEXT: [[TMP1:%.*]] = call float @llvm.aarch64.sve.lastb.nxv4f32( [[PG:%.*]], [[VECTOR:%.*]]) ; OPT-NEXT: [[BINOP1:%.*]] = fdiv float [[SCALAR:%.*]], [[TMP1]] ; OPT-NEXT: ret float [[BINOP1]] ; %splat_insert = insertelement poison, float %scalar, i32 0 %splat = shufflevector %splat_insert, poison, zeroinitializer %binop = fdiv %splat, %vector %last = tail call float @llvm.aarch64.sve.lastb.nxv4f32( %pg, %binop) ret float %last } define i8 @lastb_binop_LHS_RHS_splat_sdiv( %pg, i8 %scalar1, i8 %scalar2) #0 { ; OPT-LABEL: @lastb_binop_LHS_RHS_splat_sdiv( ; OPT-NEXT: [[BINOP1:%.*]] = sdiv i8 [[SCALAR1:%.*]], [[SCALAR2:%.*]] ; OPT-NEXT: ret i8 [[BINOP1]] ; %splat_insert = insertelement poison, i8 %scalar1, i8 0 %splat = shufflevector %splat_insert, poison, zeroinitializer %splat_insert2 = insertelement poison, i8 %scalar2, i8 0 %splat2 = shufflevector %splat_insert2, poison, zeroinitializer %binop = sdiv %splat, %splat2 %last = tail call i8 @llvm.aarch64.sve.lastb.nxv16i8( %pg, %binop) ret i8 %last } ; Check that we don't do anything as the binary op has multiple uses. define i8 @lastb_binop_nochange( %pg, i8 %scalar, %vector) #0 { ; OPT-LABEL: @lastb_binop_nochange( ; OPT-NEXT: [[SPLAT_INSERT:%.*]] = insertelement poison, i8 [[SCALAR:%.*]], i64 0 ; OPT-NEXT: [[SPLAT:%.*]] = shufflevector [[SPLAT_INSERT]], poison, zeroinitializer ; OPT-NEXT: [[BINOP:%.*]] = sdiv [[VECTOR:%.*]], [[SPLAT]] ; OPT-NEXT: [[LAST:%.*]] = tail call i8 @llvm.aarch64.sve.lastb.nxv16i8( [[PG:%.*]], [[BINOP]]) ; OPT-NEXT: call void @use( [[BINOP]]) ; OPT-NEXT: ret i8 [[LAST]] ; %splat_insert = insertelement poison, i8 %scalar, i32 0 %splat = shufflevector %splat_insert, poison, zeroinitializer %binop = sdiv %vector, %splat %last = tail call i8 @llvm.aarch64.sve.lastb.nxv16i8( %pg, %binop) call void @use( %binop) ret i8 %last } declare void @use() declare @llvm.aarch64.sve.ptrue.nxv16i1(i32) declare i8 @llvm.aarch64.sve.lasta.nxv16i8(, ) declare i8 @llvm.aarch64.sve.lastb.nxv16i8(, ) declare float @llvm.aarch64.sve.lastb.nxv4f32(, ) attributes #0 = { "target-features"="+sve" }