diff --git a/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp b/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp index fb8bd81c033af..0d388fc3c787d 100644 --- a/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp +++ b/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp @@ -25523,6 +25523,9 @@ static SDValue performVSelectCombine(SDNode *N, SelectionDAG &DAG) { return SwapResult; SDValue N0 = N->getOperand(0); + SDValue IfTrue = N->getOperand(1); + SDValue IfFalse = N->getOperand(2); + EVT ResVT = N->getValueType(0); EVT CCVT = N0.getValueType(); if (isAllActivePredicate(DAG, N0)) @@ -25531,6 +25534,22 @@ static SDValue performVSelectCombine(SDNode *N, SelectionDAG &DAG) { if (isAllInactivePredicate(N0)) return N->getOperand(2); + if (isMergePassthruOpcode(IfTrue.getOpcode()) && IfTrue.hasOneUse()) { + // vselect A, (merge_pasthru_op all_active, B,{Bn,} -), C + // vselect A, (merge_pasthru_op -, B,{Bn,} undef), C + // vselect A, (merge_pasthru_op A, B,{Bn,} -), C + // -> merge_pasthru_op A, B,{Bn,} C + if (isAllActivePredicate(DAG, IfTrue->getOperand(0)) || + IfTrue->getOperand(IfTrue.getNumOperands() - 1).isUndef() || + IfTrue->getOperand(0) == N0) { + SmallVector Ops(IfTrue->op_values()); + Ops[0] = N0; + Ops[IfTrue.getNumOperands() - 1] = IfFalse; + + return DAG.getNode(IfTrue.getOpcode(), SDLoc(N), ResVT, Ops); + } + } + // Check for sign pattern (VSELECT setgt, iN lhs, -1, 1, -1) and transform // into (OR (ASR lhs, N-1), 1), which requires less instructions for the // supported types. @@ -25570,14 +25589,11 @@ static SDValue performVSelectCombine(SDNode *N, SelectionDAG &DAG) { CmpVT.getVectorElementType().isFloatingPoint()) return SDValue(); - EVT ResVT = N->getValueType(0); // Only combine when the result type is of the same size as the compared // operands. if (ResVT.getSizeInBits() != CmpVT.getSizeInBits()) return SDValue(); - SDValue IfTrue = N->getOperand(1); - SDValue IfFalse = N->getOperand(2); SetCC = DAG.getSetCC(SDLoc(N), CmpVT.changeVectorElementTypeToInteger(), N0.getOperand(0), N0.getOperand(1), cast(N0.getOperand(2))->get()); diff --git a/llvm/lib/Target/AArch64/AArch64SVEInstrInfo.td b/llvm/lib/Target/AArch64/AArch64SVEInstrInfo.td index 91a9d21fa7b2c..261df563bb2a9 100644 --- a/llvm/lib/Target/AArch64/AArch64SVEInstrInfo.td +++ b/llvm/lib/Target/AArch64/AArch64SVEInstrInfo.td @@ -2445,14 +2445,23 @@ let Predicates = [HasSVE_or_SME] in { defm FCVTZU_ZPmZ_DtoD : sve_fp_2op_p_zd< 0b1111111, "fcvtzu", ZPR64, ZPR64, null_frag, AArch64fcvtzu_mt, nxv2i64, nxv2i1, nxv2f64, ElementSizeD>; //These patterns exist to improve the code quality of conversions on unpacked types. + def : Pat<(nxv2f32 (AArch64fcvte_mt nxv2i1:$Pg, nxv2f16:$Zs, nxv2f32:$Zd)), + (FCVT_ZPmZ_HtoS ZPR:$Zd, PPR:$Pg, ZPR:$Zs)>; def : Pat<(nxv2f32 (AArch64fcvte_mt (nxv2i1 (SVEAllActive:$Pg)), nxv2f16:$Zs, nxv2f32:$Zd)), (FCVT_ZPmZ_HtoS_UNDEF ZPR:$Zd, PPR:$Pg, ZPR:$Zs)>; // FP_ROUND has an additional 'precise' flag which indicates the type of rounding. // This is ignored by the pattern below where it is matched by (i64 timm0_1) + def : Pat<(nxv2f16 (AArch64fcvtr_mt nxv2i1:$Pg, nxv2f32:$Zs, (i64 timm0_1), nxv2f16:$Zd)), + (FCVT_ZPmZ_StoH ZPR:$Zd, PPR:$Pg, ZPR:$Zs)>; def : Pat<(nxv2f16 (AArch64fcvtr_mt (nxv2i1 (SVEAllActive:$Pg)), nxv2f32:$Zs, (i64 timm0_1), nxv2f16:$Zd)), (FCVT_ZPmZ_StoH_UNDEF ZPR:$Zd, PPR:$Pg, ZPR:$Zs)>; + def : Pat<(nxv4f32 (AArch64fcvte_mt nxv4i1:$Pg, nxv4bf16:$Zs, nxv4f32:$Zd)), + (SEL_ZPZZ_S $Pg, (LSL_ZZI_S $Zs, (i32 16)), $Zd)>; + def : Pat<(nxv2f32 (AArch64fcvte_mt nxv2i1:$Pg, nxv2bf16:$Zs, nxv2f32:$Zd)), + (SEL_ZPZZ_D $Pg, (LSL_ZZI_S $Zs, (i32 16)), $Zd)>; + def : Pat<(nxv4f32 (AArch64fcvte_mt (SVEAnyPredicate), nxv4bf16:$op, undef)), (LSL_ZZI_S $op, (i32 16))>; def : Pat<(nxv2f32 (AArch64fcvte_mt (SVEAnyPredicate), nxv2bf16:$op, undef)), diff --git a/llvm/test/CodeGen/AArch64/sve-merging-unary.ll b/llvm/test/CodeGen/AArch64/sve-merging-unary.ll index 9e331a69bcf7c..07f75c866d3d0 100644 --- a/llvm/test/CodeGen/AArch64/sve-merging-unary.ll +++ b/llvm/test/CodeGen/AArch64/sve-merging-unary.ll @@ -7,9 +7,7 @@ target triple = "aarch64-unknown-linux-gnu" define @abs_nxv16i8( %pg, %a, %b) { ; CHECK-LABEL: abs_nxv16i8: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.b -; CHECK-NEXT: abs z1.b, p1/m, z1.b -; CHECK-NEXT: mov z0.b, p0/m, z1.b +; CHECK-NEXT: abs z0.b, p0/m, z1.b ; CHECK-NEXT: ret %b.op = call @llvm.abs.nxv16i8( %b, i1 0) %res = select %pg, %b.op, %a @@ -19,9 +17,7 @@ define @abs_nxv16i8( %pg, @abs_nxv8i16( %pg, %a, %b) { ; CHECK-LABEL: abs_nxv8i16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.h -; CHECK-NEXT: abs z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.h, p0/m, z1.h +; CHECK-NEXT: abs z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.abs.nxv8i16( %b, i1 0) %res = select %pg, %b.op, %a @@ -31,9 +27,7 @@ define @abs_nxv8i16( %pg, define @abs_nxv4i32( %pg, %a, %b) { ; CHECK-LABEL: abs_nxv4i32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: abs z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: abs z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = call @llvm.abs.nxv4i32( %b, i1 0) %res = select %pg, %b.op, %a @@ -43,9 +37,7 @@ define @abs_nxv4i32( %pg, define @abs_nxv2i64( %pg, %a, %b) { ; CHECK-LABEL: abs_nxv2i64: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: abs z1.d, p1/m, z1.d -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: abs z0.d, p0/m, z1.d ; CHECK-NEXT: ret %b.op = call @llvm.abs.nxv2i64( %b, i1 0) %res = select %pg, %b.op, %a @@ -55,9 +47,7 @@ define @abs_nxv2i64( %pg, define @clz_nxv16i8( %pg, %a, %b) { ; CHECK-LABEL: clz_nxv16i8: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.b -; CHECK-NEXT: clz z1.b, p1/m, z1.b -; CHECK-NEXT: mov z0.b, p0/m, z1.b +; CHECK-NEXT: clz z0.b, p0/m, z1.b ; CHECK-NEXT: ret %b.op = call @llvm.ctlz.nxv16i8( %b) %res = select %pg, %b.op, %a @@ -67,9 +57,7 @@ define @clz_nxv16i8( %pg, @clz_nxv8i16( %pg, %a, %b) { ; CHECK-LABEL: clz_nxv8i16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.h -; CHECK-NEXT: clz z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.h, p0/m, z1.h +; CHECK-NEXT: clz z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.ctlz.nxv8i16( %b) %res = select %pg, %b.op, %a @@ -79,9 +67,7 @@ define @clz_nxv8i16( %pg, define @clz_nxv4i32( %pg, %a, %b) { ; CHECK-LABEL: clz_nxv4i32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: clz z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: clz z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = call @llvm.ctlz.nxv4i32( %b) %res = select %pg, %b.op, %a @@ -91,9 +77,7 @@ define @clz_nxv4i32( %pg, define @clz_nxv2i64( %pg, %a, %b) { ; CHECK-LABEL: clz_nxv2i64: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: clz z1.d, p1/m, z1.d -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: clz z0.d, p0/m, z1.d ; CHECK-NEXT: ret %b.op = call @llvm.ctlz.nxv2i64( %b) %res = select %pg, %b.op, %a @@ -103,9 +87,7 @@ define @clz_nxv2i64( %pg, define @cnt_nxv16i8( %pg, %a, %b) { ; CHECK-LABEL: cnt_nxv16i8: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.b -; CHECK-NEXT: cnt z1.b, p1/m, z1.b -; CHECK-NEXT: mov z0.b, p0/m, z1.b +; CHECK-NEXT: cnt z0.b, p0/m, z1.b ; CHECK-NEXT: ret %b.op = call @llvm.ctpop.nxv16i8( %b) %res = select %pg, %b.op, %a @@ -115,9 +97,7 @@ define @cnt_nxv16i8( %pg, @cnt_nxv8i16( %pg, %a, %b) { ; CHECK-LABEL: cnt_nxv8i16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.h -; CHECK-NEXT: cnt z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.h, p0/m, z1.h +; CHECK-NEXT: cnt z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.ctpop.nxv8i16( %b) %res = select %pg, %b.op, %a @@ -127,9 +107,7 @@ define @cnt_nxv8i16( %pg, define @cnt_nxv4i32( %pg, %a, %b) { ; CHECK-LABEL: cnt_nxv4i32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: cnt z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: cnt z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = call @llvm.ctpop.nxv4i32( %b) %res = select %pg, %b.op, %a @@ -139,9 +117,7 @@ define @cnt_nxv4i32( %pg, define @cnt_nxv2i64( %pg, %a, %b) { ; CHECK-LABEL: cnt_nxv2i64: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: cnt z1.d, p1/m, z1.d -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: cnt z0.d, p0/m, z1.d ; CHECK-NEXT: ret %b.op = call @llvm.ctpop.nxv2i64( %b) %res = select %pg, %b.op, %a @@ -151,9 +127,7 @@ define @cnt_nxv2i64( %pg, define @fabs_nxv2f16( %pg, %a, %b) { ; CHECK-LABEL: fabs_nxv2f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: fabs z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: fabs z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.fabs.nxv2f16( %b) %res = select %pg, %b.op, %a @@ -163,9 +137,7 @@ define @fabs_nxv2f16( %pg, @fabs_nxv4f16( %pg, %a, %b) { ; CHECK-LABEL: fabs_nxv4f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: fabs z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: fabs z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.fabs.nxv4f16( %b) %res = select %pg, %b.op, %a @@ -175,9 +147,7 @@ define @fabs_nxv4f16( %pg, @fabs_nxv8f16( %pg, %a, %b) { ; CHECK-LABEL: fabs_nxv8f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.h -; CHECK-NEXT: fabs z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.h, p0/m, z1.h +; CHECK-NEXT: fabs z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.fabs.nxv8f16( %b) %res = select %pg, %b.op, %a @@ -187,9 +157,7 @@ define @fabs_nxv8f16( %pg, @fabs_nxv2f32( %pg, %a, %b) { ; CHECK-LABEL: fabs_nxv2f32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: fabs z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: fabs z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = call @llvm.fabs.nxv2f32( %b) %res = select %pg, %b.op, %a @@ -199,9 +167,7 @@ define @fabs_nxv2f32( %pg, @fabs_nxv4f32( %pg, %a, %b) { ; CHECK-LABEL: fabs_nxv4f32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: fabs z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: fabs z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = call @llvm.fabs.nxv4f32( %b) %res = select %pg, %b.op, %a @@ -211,9 +177,7 @@ define @fabs_nxv4f32( %pg, @fabs_nxv2f64( %pg, %a, %b) { ; CHECK-LABEL: fabs_nxv2f64: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: fabs z1.d, p1/m, z1.d -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: fabs z0.d, p0/m, z1.d ; CHECK-NEXT: ret %b.op = call @llvm.fabs.nxv2f64( %b) %res = select %pg, %b.op, %a @@ -256,9 +220,7 @@ define @fabs_nxv8bf16( %pg, @fcvt_nxv2f16_to_nxv2f32( %pg, %a, %b) { ; CHECK-LABEL: fcvt_nxv2f16_to_nxv2f32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: fcvt z1.s, p1/m, z1.h -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: fcvt z0.s, p0/m, z1.h ; CHECK-NEXT: ret %b.op = fpext %b to %res = select %pg, %b.op, %a @@ -268,9 +230,7 @@ define @fcvt_nxv2f16_to_nxv2f32( %pg, @fcvt_nxv2f16_to_nxv2f64( %pg, %a, %b) { ; CHECK-LABEL: fcvt_nxv2f16_to_nxv2f64: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: fcvt z1.d, p1/m, z1.h -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: fcvt z0.d, p0/m, z1.h ; CHECK-NEXT: ret %b.op = fpext %b to %res = select %pg, %b.op, %a @@ -280,9 +240,7 @@ define @fcvt_nxv2f16_to_nxv2f64( %pg, @fcvt_nxv4f16_to_nxv4f32( %pg, %a, %b) { ; CHECK-LABEL: fcvt_nxv4f16_to_nxv4f32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: fcvt z1.s, p1/m, z1.h -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: fcvt z0.s, p0/m, z1.h ; CHECK-NEXT: ret %b.op = fpext %b to %res = select %pg, %b.op, %a @@ -292,9 +250,7 @@ define @fcvt_nxv4f16_to_nxv4f32( %pg, @fcvt_nxv2f32_to_nxv2f16( %pg, %a, %b) { ; CHECK-LABEL: fcvt_nxv2f32_to_nxv2f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: fcvt z1.h, p1/m, z1.s -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: fcvt z0.h, p0/m, z1.s ; CHECK-NEXT: ret %b.op = fptrunc %b to %res = select %pg, %b.op, %a @@ -304,9 +260,7 @@ define @fcvt_nxv2f32_to_nxv2f16( %pg, @fcvt_nxv2f32_to_nxv2f64( %pg, %a, %b) { ; CHECK-LABEL: fcvt_nxv2f32_to_nxv2f64: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: fcvt z1.d, p1/m, z1.s -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: fcvt z0.d, p0/m, z1.s ; CHECK-NEXT: ret %b.op = fpext %b to %res = select %pg, %b.op, %a @@ -316,9 +270,7 @@ define @fcvt_nxv2f32_to_nxv2f64( %pg, @fcvt_nxv2f32_to_nxv2bf16( %pg, %a, %b) { ; CHECK-LABEL: fcvt_nxv2f32_to_nxv2bf16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: bfcvt z1.h, p1/m, z1.s -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: bfcvt z0.h, p0/m, z1.s ; CHECK-NEXT: ret %b.op = fptrunc %b to %res = select %pg, %b.op, %a @@ -328,9 +280,7 @@ define @fcvt_nxv2f32_to_nxv2bf16( %pg, @fcvt_nxv4f32_to_nxv4f16( %pg, %a, %b) { ; CHECK-LABEL: fcvt_nxv4f32_to_nxv4f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: fcvt z1.h, p1/m, z1.s -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: fcvt z0.h, p0/m, z1.s ; CHECK-NEXT: ret %b.op = fptrunc %b to %res = select %pg, %b.op, %a @@ -340,9 +290,7 @@ define @fcvt_nxv4f32_to_nxv4f16( %pg, @fcvt_nxv4f32_to_nxv4bf16( %pg, %a, %b) { ; CHECK-LABEL: fcvt_nxv4f32_to_nxv4bf16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: bfcvt z1.h, p1/m, z1.s -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: bfcvt z0.h, p0/m, z1.s ; CHECK-NEXT: ret %b.op = fptrunc %b to %res = select %pg, %b.op, %a @@ -352,9 +300,7 @@ define @fcvt_nxv4f32_to_nxv4bf16( %pg, @fcvt_nxv2f64_to_nxv2f16( %pg, %a, %b) { ; CHECK-LABEL: fcvt_nxv2f64_to_nxv2f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: fcvt z1.h, p1/m, z1.d -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: fcvt z0.h, p0/m, z1.d ; CHECK-NEXT: ret %b.op = fptrunc %b to %res = select %pg, %b.op, %a @@ -364,9 +310,7 @@ define @fcvt_nxv2f64_to_nxv2f16( %pg, @fcvt_nxv2f64_to_nxv2f32( %pg, %a, %b) { ; CHECK-LABEL: fcvt_nxv2f64_to_nxv2f32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: fcvt z1.h, p1/m, z1.s -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: fcvt z0.h, p0/m, z1.s ; CHECK-NEXT: ret %b.op = fptrunc %b to %res = select %pg, %b.op, %a @@ -378,8 +322,7 @@ define @fcvt_nxv2f64_to_nxv2bf16( %pg, %b to %res = select %pg, %b.op, %a @@ -401,9 +344,7 @@ define @fcvt_nxv2bf16_to_nxv2f64( %pg, %b to %res = select %pg, %b.op, %a @@ -424,9 +365,7 @@ define @fcvt_nxv4bf16_to_nxv4f32( %pg, @fcvtsu_nxv2f16_to_nxv2i64( %pg, %a, %b) { ; CHECK-LABEL: fcvtsu_nxv2f16_to_nxv2i64: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: fcvtzs z1.d, p1/m, z1.h -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: fcvtzs z0.d, p0/m, z1.h ; CHECK-NEXT: ret %b.op = fptosi %b to %res = select %pg, %b.op, %a @@ -436,9 +375,7 @@ define @fcvtsu_nxv2f16_to_nxv2i64( %pg, @fcvtsu_nxv4f16_to_nxv4i32( %pg, %a, %b) { ; CHECK-LABEL: fcvtsu_nxv4f16_to_nxv4i32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: fcvtzs z1.s, p1/m, z1.h -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: fcvtzs z0.s, p0/m, z1.h ; CHECK-NEXT: ret %b.op = fptosi %b to %res = select %pg, %b.op, %a @@ -448,9 +385,7 @@ define @fcvtsu_nxv4f16_to_nxv4i32( %pg, @fcvtsu_nxv8f16_to_nxv8i16( %pg, %a, %b) { ; CHECK-LABEL: fcvtsu_nxv8f16_to_nxv8i16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.h -; CHECK-NEXT: fcvtzs z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.h, p0/m, z1.h +; CHECK-NEXT: fcvtzs z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = fptosi %b to %res = select %pg, %b.op, %a @@ -460,9 +395,7 @@ define @fcvtsu_nxv8f16_to_nxv8i16( %pg, @fcvtsu_nxv2f32_to_nxv2i64( %pg, %a, %b) { ; CHECK-LABEL: fcvtsu_nxv2f32_to_nxv2i64: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: fcvtzs z1.d, p1/m, z1.s -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: fcvtzs z0.d, p0/m, z1.s ; CHECK-NEXT: ret %b.op = fptosi %b to %res = select %pg, %b.op, %a @@ -472,9 +405,7 @@ define @fcvtsu_nxv2f32_to_nxv2i64( %pg, @fcvtsu_nxv4f32_to_nxv4i32( %pg, %a, %b) { ; CHECK-LABEL: fcvtsu_nxv4f32_to_nxv4i32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: fcvtzs z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: fcvtzs z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = fptosi %b to %res = select %pg, %b.op, %a @@ -484,9 +415,7 @@ define @fcvtsu_nxv4f32_to_nxv4i32( %pg, @fcvtsu_nxv2f64_to_nxv2i64( %pg, %a, %b) { ; CHECK-LABEL: fcvtsu_nxv2f64_to_nxv2i64: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: fcvtzs z1.d, p1/m, z1.d -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: fcvtzs z0.d, p0/m, z1.d ; CHECK-NEXT: ret %b.op = fptosi %b to %res = select %pg, %b.op, %a @@ -496,9 +425,7 @@ define @fcvtsu_nxv2f64_to_nxv2i64( %pg, @fcvtzu_nxv2f16_to_nxv2i64( %pg, %a, %b) { ; CHECK-LABEL: fcvtzu_nxv2f16_to_nxv2i64: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: fcvtzu z1.d, p1/m, z1.h -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: fcvtzu z0.d, p0/m, z1.h ; CHECK-NEXT: ret %b.op = fptoui %b to %res = select %pg, %b.op, %a @@ -508,9 +435,7 @@ define @fcvtzu_nxv2f16_to_nxv2i64( %pg, @fcvtzu_nxv4f16_to_nxv4i32( %pg, %a, %b) { ; CHECK-LABEL: fcvtzu_nxv4f16_to_nxv4i32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: fcvtzu z1.s, p1/m, z1.h -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: fcvtzu z0.s, p0/m, z1.h ; CHECK-NEXT: ret %b.op = fptoui %b to %res = select %pg, %b.op, %a @@ -520,9 +445,7 @@ define @fcvtzu_nxv4f16_to_nxv4i32( %pg, @fcvtzu_nxv8f16_to_nxv8i16( %pg, %a, %b) { ; CHECK-LABEL: fcvtzu_nxv8f16_to_nxv8i16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.h -; CHECK-NEXT: fcvtzu z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.h, p0/m, z1.h +; CHECK-NEXT: fcvtzu z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = fptoui %b to %res = select %pg, %b.op, %a @@ -532,9 +455,7 @@ define @fcvtzu_nxv8f16_to_nxv8i16( %pg, @fcvtzu_nxv2f32_to_nxv2i64( %pg, %a, %b) { ; CHECK-LABEL: fcvtzu_nxv2f32_to_nxv2i64: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: fcvtzu z1.d, p1/m, z1.s -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: fcvtzu z0.d, p0/m, z1.s ; CHECK-NEXT: ret %b.op = fptoui %b to %res = select %pg, %b.op, %a @@ -544,9 +465,7 @@ define @fcvtzu_nxv2f32_to_nxv2i64( %pg, @fcvtzu_nxv4f32_to_nxv4i32( %pg, %a, %b) { ; CHECK-LABEL: fcvtzu_nxv4f32_to_nxv4i32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: fcvtzu z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: fcvtzu z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = fptoui %b to %res = select %pg, %b.op, %a @@ -556,9 +475,7 @@ define @fcvtzu_nxv4f32_to_nxv4i32( %pg, @fcvtzu_nxv2f64_to_nxv2i64( %pg, %a, %b) { ; CHECK-LABEL: fcvtzu_nxv2f64_to_nxv2i64: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: fcvtzu z1.d, p1/m, z1.d -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: fcvtzu z0.d, p0/m, z1.d ; CHECK-NEXT: ret %b.op = fptoui %b to %res = select %pg, %b.op, %a @@ -568,9 +485,7 @@ define @fcvtzu_nxv2f64_to_nxv2i64( %pg, @fneg_nxv2f16( %pg, %a, %b) { ; CHECK-LABEL: fneg_nxv2f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: fneg z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: fneg z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = fneg %b %res = select %pg, %b.op, %a @@ -580,9 +495,7 @@ define @fneg_nxv2f16( %pg, @fneg_nxv4f16( %pg, %a, %b) { ; CHECK-LABEL: fneg_nxv4f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: fneg z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: fneg z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = fneg %b %res = select %pg, %b.op, %a @@ -592,9 +505,7 @@ define @fneg_nxv4f16( %pg, @fneg_nxv8f16( %pg, %a, %b) { ; CHECK-LABEL: fneg_nxv8f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.h -; CHECK-NEXT: fneg z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.h, p0/m, z1.h +; CHECK-NEXT: fneg z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = fneg %b %res = select %pg, %b.op, %a @@ -604,9 +515,7 @@ define @fneg_nxv8f16( %pg, @fneg_nxv2f32( %pg, %a, %b) { ; CHECK-LABEL: fneg_nxv2f32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: fneg z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: fneg z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = fneg %b %res = select %pg, %b.op, %a @@ -616,9 +525,7 @@ define @fneg_nxv2f32( %pg, @fneg_nxv4f32( %pg, %a, %b) { ; CHECK-LABEL: fneg_nxv4f32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: fneg z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: fneg z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = fneg %b %res = select %pg, %b.op, %a @@ -628,9 +535,7 @@ define @fneg_nxv4f32( %pg, @fneg_nxv2f64( %pg, %a, %b) { ; CHECK-LABEL: fneg_nxv2f64: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: fneg z1.d, p1/m, z1.d -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: fneg z0.d, p0/m, z1.d ; CHECK-NEXT: ret %b.op = fneg %b %res = select %pg, %b.op, %a @@ -673,9 +578,7 @@ define @fneg_nxv8bf16( %pg, @frinta_nxv2f16( %pg, %a, %b) { ; CHECK-LABEL: frinta_nxv2f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: frinta z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: frinta z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.round.nxv2f16( %b) %res = select %pg, %b.op, %a @@ -685,9 +588,7 @@ define @frinta_nxv2f16( %pg, @frinta_nxv4f16( %pg, %a, %b) { ; CHECK-LABEL: frinta_nxv4f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: frinta z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: frinta z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.round.nxv4f16( %b) %res = select %pg, %b.op, %a @@ -697,9 +598,7 @@ define @frinta_nxv4f16( %pg, @frinta_nxv8f16( %pg, %a, %b) { ; CHECK-LABEL: frinta_nxv8f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.h -; CHECK-NEXT: frinta z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.h, p0/m, z1.h +; CHECK-NEXT: frinta z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.round.nxv8f16( %b) %res = select %pg, %b.op, %a @@ -709,9 +608,7 @@ define @frinta_nxv8f16( %pg, @frinta_nxv2f32( %pg, %a, %b) { ; CHECK-LABEL: frinta_nxv2f32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: frinta z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: frinta z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = call @llvm.round.nxv2f32( %b) %res = select %pg, %b.op, %a @@ -721,9 +618,7 @@ define @frinta_nxv2f32( %pg, @frinta_nxv4f32( %pg, %a, %b) { ; CHECK-LABEL: frinta_nxv4f32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: frinta z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: frinta z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = call @llvm.round.nxv4f32( %b) %res = select %pg, %b.op, %a @@ -733,9 +628,7 @@ define @frinta_nxv4f32( %pg, @frinta_nxv2f64( %pg, %a, %b) { ; CHECK-LABEL: frinta_nxv2f64: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: frinta z1.d, p1/m, z1.d -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: frinta z0.d, p0/m, z1.d ; CHECK-NEXT: ret %b.op = call @llvm.round.nxv2f64( %b) %res = select %pg, %b.op, %a @@ -745,9 +638,7 @@ define @frinta_nxv2f64( %pg, @frinti_nxv2f16( %pg, %a, %b) { ; CHECK-LABEL: frinti_nxv2f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: frinti z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: frinti z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.nearbyint.nxv2f16( %b) %res = select %pg, %b.op, %a @@ -757,9 +648,7 @@ define @frinti_nxv2f16( %pg, @frinti_nxv4f16( %pg, %a, %b) { ; CHECK-LABEL: frinti_nxv4f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: frinti z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: frinti z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.nearbyint.nxv4f16( %b) %res = select %pg, %b.op, %a @@ -769,9 +658,7 @@ define @frinti_nxv4f16( %pg, @frinti_nxv8f16( %pg, %a, %b) { ; CHECK-LABEL: frinti_nxv8f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.h -; CHECK-NEXT: frinti z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.h, p0/m, z1.h +; CHECK-NEXT: frinti z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.nearbyint.nxv8f16( %b) %res = select %pg, %b.op, %a @@ -781,9 +668,7 @@ define @frinti_nxv8f16( %pg, @frinti_nxv2f32( %pg, %a, %b) { ; CHECK-LABEL: frinti_nxv2f32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: frinti z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: frinti z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = call @llvm.nearbyint.nxv2f32( %b) %res = select %pg, %b.op, %a @@ -793,9 +678,7 @@ define @frinti_nxv2f32( %pg, @frinti_nxv4f32( %pg, %a, %b) { ; CHECK-LABEL: frinti_nxv4f32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: frinti z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: frinti z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = call @llvm.nearbyint.nxv4f32( %b) %res = select %pg, %b.op, %a @@ -805,9 +688,7 @@ define @frinti_nxv4f32( %pg, @frinti_nxv2f64( %pg, %a, %b) { ; CHECK-LABEL: frinti_nxv2f64: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: frinti z1.d, p1/m, z1.d -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: frinti z0.d, p0/m, z1.d ; CHECK-NEXT: ret %b.op = call @llvm.nearbyint.nxv2f64( %b) %res = select %pg, %b.op, %a @@ -817,9 +698,7 @@ define @frinti_nxv2f64( %pg, @frintm_nxv2f16( %pg, %a, %b) { ; CHECK-LABEL: frintm_nxv2f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: frintm z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: frintm z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.floor.nxv2f16( %b) %res = select %pg, %b.op, %a @@ -829,9 +708,7 @@ define @frintm_nxv2f16( %pg, @frintm_nxv4f16( %pg, %a, %b) { ; CHECK-LABEL: frintm_nxv4f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: frintm z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: frintm z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.floor.nxv4f16( %b) %res = select %pg, %b.op, %a @@ -841,9 +718,7 @@ define @frintm_nxv4f16( %pg, @frintm_nxv8f16( %pg, %a, %b) { ; CHECK-LABEL: frintm_nxv8f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.h -; CHECK-NEXT: frintm z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.h, p0/m, z1.h +; CHECK-NEXT: frintm z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.floor.nxv8f16( %b) %res = select %pg, %b.op, %a @@ -853,9 +728,7 @@ define @frintm_nxv8f16( %pg, @frintm_nxv2f32( %pg, %a, %b) { ; CHECK-LABEL: frintm_nxv2f32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: frintm z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: frintm z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = call @llvm.floor.nxv2f32( %b) %res = select %pg, %b.op, %a @@ -865,9 +738,7 @@ define @frintm_nxv2f32( %pg, @frintm_nxv4f32( %pg, %a, %b) { ; CHECK-LABEL: frintm_nxv4f32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: frintm z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: frintm z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = call @llvm.floor.nxv4f32( %b) %res = select %pg, %b.op, %a @@ -877,9 +748,7 @@ define @frintm_nxv4f32( %pg, @frintm_nxv2f64( %pg, %a, %b) { ; CHECK-LABEL: frintm_nxv2f64: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: frintm z1.d, p1/m, z1.d -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: frintm z0.d, p0/m, z1.d ; CHECK-NEXT: ret %b.op = call @llvm.floor.nxv2f64( %b) %res = select %pg, %b.op, %a @@ -889,9 +758,7 @@ define @frintm_nxv2f64( %pg, @frintn_nxv2f16( %pg, %a, %b) { ; CHECK-LABEL: frintn_nxv2f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: frintn z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: frintn z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.roundeven.nxv2f16( %b) %res = select %pg, %b.op, %a @@ -901,9 +768,7 @@ define @frintn_nxv2f16( %pg, @frintn_nxv4f16( %pg, %a, %b) { ; CHECK-LABEL: frintn_nxv4f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: frintn z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: frintn z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.roundeven.nxv4f16( %b) %res = select %pg, %b.op, %a @@ -913,9 +778,7 @@ define @frintn_nxv4f16( %pg, @frintn_nxv8f16( %pg, %a, %b) { ; CHECK-LABEL: frintn_nxv8f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.h -; CHECK-NEXT: frintn z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.h, p0/m, z1.h +; CHECK-NEXT: frintn z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.roundeven.nxv8f16( %b) %res = select %pg, %b.op, %a @@ -925,9 +788,7 @@ define @frintn_nxv8f16( %pg, @frintn_nxv2f32( %pg, %a, %b) { ; CHECK-LABEL: frintn_nxv2f32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: frintn z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: frintn z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = call @llvm.roundeven.nxv2f32( %b) %res = select %pg, %b.op, %a @@ -937,9 +798,7 @@ define @frintn_nxv2f32( %pg, @frintn_nxv4f32( %pg, %a, %b) { ; CHECK-LABEL: frintn_nxv4f32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: frintn z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: frintn z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = call @llvm.roundeven.nxv4f32( %b) %res = select %pg, %b.op, %a @@ -949,9 +808,7 @@ define @frintn_nxv4f32( %pg, @frintn_nxv2f64( %pg, %a, %b) { ; CHECK-LABEL: frintn_nxv2f64: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: frintn z1.d, p1/m, z1.d -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: frintn z0.d, p0/m, z1.d ; CHECK-NEXT: ret %b.op = call @llvm.roundeven.nxv2f64( %b) %res = select %pg, %b.op, %a @@ -961,9 +818,7 @@ define @frintn_nxv2f64( %pg, @frintp_nxv2f16( %pg, %a, %b) { ; CHECK-LABEL: frintp_nxv2f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: frintp z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: frintp z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.ceil.nxv2f16( %b) %res = select %pg, %b.op, %a @@ -973,9 +828,7 @@ define @frintp_nxv2f16( %pg, @frintp_nxv4f16( %pg, %a, %b) { ; CHECK-LABEL: frintp_nxv4f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: frintp z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: frintp z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.ceil.nxv4f16( %b) %res = select %pg, %b.op, %a @@ -985,9 +838,7 @@ define @frintp_nxv4f16( %pg, @frintp_nxv8f16( %pg, %a, %b) { ; CHECK-LABEL: frintp_nxv8f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.h -; CHECK-NEXT: frintp z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.h, p0/m, z1.h +; CHECK-NEXT: frintp z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.ceil.nxv8f16( %b) %res = select %pg, %b.op, %a @@ -997,9 +848,7 @@ define @frintp_nxv8f16( %pg, @frintp_nxv2f32( %pg, %a, %b) { ; CHECK-LABEL: frintp_nxv2f32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: frintp z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: frintp z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = call @llvm.ceil.nxv2f32( %b) %res = select %pg, %b.op, %a @@ -1009,9 +858,7 @@ define @frintp_nxv2f32( %pg, @frintp_nxv4f32( %pg, %a, %b) { ; CHECK-LABEL: frintp_nxv4f32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: frintp z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: frintp z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = call @llvm.ceil.nxv4f32( %b) %res = select %pg, %b.op, %a @@ -1021,9 +868,7 @@ define @frintp_nxv4f32( %pg, @frintp_nxv2f64( %pg, %a, %b) { ; CHECK-LABEL: frintp_nxv2f64: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: frintp z1.d, p1/m, z1.d -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: frintp z0.d, p0/m, z1.d ; CHECK-NEXT: ret %b.op = call @llvm.ceil.nxv2f64( %b) %res = select %pg, %b.op, %a @@ -1033,9 +878,7 @@ define @frintp_nxv2f64( %pg, @frintx_nxv2f16( %pg, %a, %b) { ; CHECK-LABEL: frintx_nxv2f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: frintx z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: frintx z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.rint.nxv2f16( %b) %res = select %pg, %b.op, %a @@ -1045,9 +888,7 @@ define @frintx_nxv2f16( %pg, @frintx_nxv4f16( %pg, %a, %b) { ; CHECK-LABEL: frintx_nxv4f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: frintx z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: frintx z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.rint.nxv4f16( %b) %res = select %pg, %b.op, %a @@ -1057,9 +898,7 @@ define @frintx_nxv4f16( %pg, @frintx_nxv8f16( %pg, %a, %b) { ; CHECK-LABEL: frintx_nxv8f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.h -; CHECK-NEXT: frintx z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.h, p0/m, z1.h +; CHECK-NEXT: frintx z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.rint.nxv8f16( %b) %res = select %pg, %b.op, %a @@ -1069,9 +908,7 @@ define @frintx_nxv8f16( %pg, @frintx_nxv2f32( %pg, %a, %b) { ; CHECK-LABEL: frintx_nxv2f32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: frintx z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: frintx z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = call @llvm.rint.nxv2f32( %b) %res = select %pg, %b.op, %a @@ -1081,9 +918,7 @@ define @frintx_nxv2f32( %pg, @frintx_nxv4f32( %pg, %a, %b) { ; CHECK-LABEL: frintx_nxv4f32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: frintx z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: frintx z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = call @llvm.rint.nxv4f32( %b) %res = select %pg, %b.op, %a @@ -1093,9 +928,7 @@ define @frintx_nxv4f32( %pg, @frintx_nxv2f64( %pg, %a, %b) { ; CHECK-LABEL: frintx_nxv2f64: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: frintx z1.d, p1/m, z1.d -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: frintx z0.d, p0/m, z1.d ; CHECK-NEXT: ret %b.op = call @llvm.rint.nxv2f64( %b) %res = select %pg, %b.op, %a @@ -1105,9 +938,7 @@ define @frintx_nxv2f64( %pg, @frintz_nxv2f16( %pg, %a, %b) { ; CHECK-LABEL: frintz_nxv2f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: frintz z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: frintz z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.trunc.nxv2f16( %b) %res = select %pg, %b.op, %a @@ -1117,9 +948,7 @@ define @frintz_nxv2f16( %pg, @frintz_nxv4f16( %pg, %a, %b) { ; CHECK-LABEL: frintz_nxv4f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: frintz z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: frintz z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.trunc.nxv4f16( %b) %res = select %pg, %b.op, %a @@ -1129,9 +958,7 @@ define @frintz_nxv4f16( %pg, @frintz_nxv8f16( %pg, %a, %b) { ; CHECK-LABEL: frintz_nxv8f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.h -; CHECK-NEXT: frintz z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.h, p0/m, z1.h +; CHECK-NEXT: frintz z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.trunc.nxv8f16( %b) %res = select %pg, %b.op, %a @@ -1141,9 +968,7 @@ define @frintz_nxv8f16( %pg, @frintz_nxv2f32( %pg, %a, %b) { ; CHECK-LABEL: frintz_nxv2f32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: frintz z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: frintz z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = call @llvm.trunc.nxv2f32( %b) %res = select %pg, %b.op, %a @@ -1153,9 +978,7 @@ define @frintz_nxv2f32( %pg, @frintz_nxv4f32( %pg, %a, %b) { ; CHECK-LABEL: frintz_nxv4f32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: frintz z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: frintz z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = call @llvm.trunc.nxv4f32( %b) %res = select %pg, %b.op, %a @@ -1165,9 +988,7 @@ define @frintz_nxv4f32( %pg, @frintz_nxv2f64( %pg, %a, %b) { ; CHECK-LABEL: frintz_nxv2f64: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: frintz z1.d, p1/m, z1.d -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: frintz z0.d, p0/m, z1.d ; CHECK-NEXT: ret %b.op = call @llvm.trunc.nxv2f64( %b) %res = select %pg, %b.op, %a @@ -1177,9 +998,7 @@ define @frintz_nxv2f64( %pg, @fsqrt_nxv2f16( %pg, %a, %b) { ; CHECK-LABEL: fsqrt_nxv2f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: fsqrt z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: fsqrt z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.sqrt.nxv2f16( %b) %res = select %pg, %b.op, %a @@ -1189,9 +1008,7 @@ define @fsqrt_nxv2f16( %pg, @fsqrt_nxv4f16( %pg, %a, %b) { ; CHECK-LABEL: fsqrt_nxv4f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: fsqrt z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: fsqrt z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.sqrt.nxv4f16( %b) %res = select %pg, %b.op, %a @@ -1201,9 +1018,7 @@ define @fsqrt_nxv4f16( %pg, @fsqrt_nxv8f16( %pg, %a, %b) { ; CHECK-LABEL: fsqrt_nxv8f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.h -; CHECK-NEXT: fsqrt z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.h, p0/m, z1.h +; CHECK-NEXT: fsqrt z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.sqrt.nxv8f16( %b) %res = select %pg, %b.op, %a @@ -1213,9 +1028,7 @@ define @fsqrt_nxv8f16( %pg, @fsqrt_nxv2f32( %pg, %a, %b) { ; CHECK-LABEL: fsqrt_nxv2f32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: fsqrt z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: fsqrt z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = call @llvm.sqrt.nxv2f32( %b) %res = select %pg, %b.op, %a @@ -1225,9 +1038,7 @@ define @fsqrt_nxv2f32( %pg, @fsqrt_nxv4f32( %pg, %a, %b) { ; CHECK-LABEL: fsqrt_nxv4f32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: fsqrt z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: fsqrt z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = call @llvm.sqrt.nxv4f32( %b) %res = select %pg, %b.op, %a @@ -1237,9 +1048,7 @@ define @fsqrt_nxv4f32( %pg, @fsqrt_nxv2f64( %pg, %a, %b) { ; CHECK-LABEL: fsqrt_nxv2f64: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: fsqrt z1.d, p1/m, z1.d -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: fsqrt z0.d, p0/m, z1.d ; CHECK-NEXT: ret %b.op = call @llvm.sqrt.nxv2f64( %b) %res = select %pg, %b.op, %a @@ -1293,9 +1102,7 @@ define @neg_nxv2i64( %pg, define @rbit_nxv16i8( %pg, %a, %b) { ; CHECK-LABEL: rbit_nxv16i8: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.b -; CHECK-NEXT: rbit z1.b, p1/m, z1.b -; CHECK-NEXT: mov z0.b, p0/m, z1.b +; CHECK-NEXT: rbit z0.b, p0/m, z1.b ; CHECK-NEXT: ret %b.op = call @llvm.bitreverse.nxv16i8( %b) %res = select %pg, %b.op, %a @@ -1305,9 +1112,7 @@ define @rbit_nxv16i8( %pg, @rbit_nxv8i16( %pg, %a, %b) { ; CHECK-LABEL: rbit_nxv8i16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.h -; CHECK-NEXT: rbit z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.h, p0/m, z1.h +; CHECK-NEXT: rbit z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.bitreverse.nxv8i16( %b) %res = select %pg, %b.op, %a @@ -1317,9 +1122,7 @@ define @rbit_nxv8i16( %pg, @rbit_nxv4i32( %pg, %a, %b) { ; CHECK-LABEL: rbit_nxv4i32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: rbit z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: rbit z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = call @llvm.bitreverse.nxv4i32( %b) %res = select %pg, %b.op, %a @@ -1329,9 +1132,7 @@ define @rbit_nxv4i32( %pg, @rbit_nxv2i64( %pg, %a, %b) { ; CHECK-LABEL: rbit_nxv2i64: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: rbit z1.d, p1/m, z1.d -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: rbit z0.d, p0/m, z1.d ; CHECK-NEXT: ret %b.op = call @llvm.bitreverse.nxv2i64( %b) %res = select %pg, %b.op, %a @@ -1341,9 +1142,7 @@ define @rbit_nxv2i64( %pg, @revb_nxv8i16( %pg, %a, %b) { ; CHECK-LABEL: revb_nxv8i16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.h -; CHECK-NEXT: revb z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.h, p0/m, z1.h +; CHECK-NEXT: revb z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = call @llvm.bswap.nxv8i16( %b) %res = select %pg, %b.op, %a @@ -1353,9 +1152,7 @@ define @revb_nxv8i16( %pg, @revb_nxv4i32( %pg, %a, %b) { ; CHECK-LABEL: revb_nxv4i32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: revb z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: revb z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = call @llvm.bswap.nxv4i32( %b) %res = select %pg, %b.op, %a @@ -1365,9 +1162,7 @@ define @revb_nxv4i32( %pg, @revb_nxv2i64( %pg, %a, %b) { ; CHECK-LABEL: revb_nxv2i64: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: revb z1.d, p1/m, z1.d -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: revb z0.d, p0/m, z1.d ; CHECK-NEXT: ret %b.op = call @llvm.bswap.nxv2i64( %b) %res = select %pg, %b.op, %a @@ -1377,9 +1172,7 @@ define @revb_nxv2i64( %pg, @scvtf_nxv8i16_to_nxv8f16( %pg, %a, %b) { ; CHECK-LABEL: scvtf_nxv8i16_to_nxv8f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.h -; CHECK-NEXT: scvtf z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.h, p0/m, z1.h +; CHECK-NEXT: scvtf z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = sitofp %b to %res = select %pg, %b.op, %a @@ -1389,9 +1182,7 @@ define @scvtf_nxv8i16_to_nxv8f16( %pg, @scvtf_nxv4i32_to_nxv4f16( %pg, %a, %b) { ; CHECK-LABEL: scvtf_nxv4i32_to_nxv4f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: scvtf z1.h, p1/m, z1.s -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: scvtf z0.h, p0/m, z1.s ; CHECK-NEXT: ret %b.op = sitofp %b to %res = select %pg, %b.op, %a @@ -1401,9 +1192,7 @@ define @scvtf_nxv4i32_to_nxv4f16( %pg, @scvtf_nxv4i32_to_nxv4f32( %pg, %a, %b) { ; CHECK-LABEL: scvtf_nxv4i32_to_nxv4f32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: scvtf z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: scvtf z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = sitofp %b to %res = select %pg, %b.op, %a @@ -1413,9 +1202,7 @@ define @scvtf_nxv4i32_to_nxv4f32( %pg, @scvtf_nxv2i64_to_nxv2f16( %pg, %a, %b) { ; CHECK-LABEL: scvtf_nxv2i64_to_nxv2f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: scvtf z1.h, p1/m, z1.d -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: scvtf z0.h, p0/m, z1.d ; CHECK-NEXT: ret %b.op = sitofp %b to %res = select %pg, %b.op, %a @@ -1425,9 +1212,7 @@ define @scvtf_nxv2i64_to_nxv2f16( %pg, @scvtf_nxv2i64_to_nxv2f32( %pg, %a, %b) { ; CHECK-LABEL: scvtf_nxv2i64_to_nxv2f32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: scvtf z1.s, p1/m, z1.d -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: scvtf z0.s, p0/m, z1.d ; CHECK-NEXT: ret %b.op = sitofp %b to %res = select %pg, %b.op, %a @@ -1437,9 +1222,7 @@ define @scvtf_nxv2i64_to_nxv2f32( %pg, @scvtf_nxv2i64_to_nxv2f64( %pg, %a, %b) { ; CHECK-LABEL: scvtf_nxv2i64_to_nxv2f64: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: scvtf z1.d, p1/m, z1.d -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: scvtf z0.d, p0/m, z1.d ; CHECK-NEXT: ret %b.op = sitofp %b to %res = select %pg, %b.op, %a @@ -1521,9 +1304,7 @@ define @sxtw_nxv2i64( %pg, @ucvtf_nxv8i16_to_nxv8f16( %pg, %a, %b) { ; CHECK-LABEL: ucvtf_nxv8i16_to_nxv8f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.h -; CHECK-NEXT: ucvtf z1.h, p1/m, z1.h -; CHECK-NEXT: mov z0.h, p0/m, z1.h +; CHECK-NEXT: ucvtf z0.h, p0/m, z1.h ; CHECK-NEXT: ret %b.op = uitofp %b to %res = select %pg, %b.op, %a @@ -1533,9 +1314,7 @@ define @ucvtf_nxv8i16_to_nxv8f16( %pg, @ucvtf_nxv4i32_to_nxv4f16( %pg, %a, %b) { ; CHECK-LABEL: ucvtf_nxv4i32_to_nxv4f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: ucvtf z1.h, p1/m, z1.s -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: ucvtf z0.h, p0/m, z1.s ; CHECK-NEXT: ret %b.op = uitofp %b to %res = select %pg, %b.op, %a @@ -1545,9 +1324,7 @@ define @ucvtf_nxv4i32_to_nxv4f16( %pg, @ucvtf_nxv4i32_to_nxv4f32( %pg, %a, %b) { ; CHECK-LABEL: ucvtf_nxv4i32_to_nxv4f32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.s -; CHECK-NEXT: ucvtf z1.s, p1/m, z1.s -; CHECK-NEXT: mov z0.s, p0/m, z1.s +; CHECK-NEXT: ucvtf z0.s, p0/m, z1.s ; CHECK-NEXT: ret %b.op = uitofp %b to %res = select %pg, %b.op, %a @@ -1557,9 +1334,7 @@ define @ucvtf_nxv4i32_to_nxv4f32( %pg, @ucvtf_nxv2i64_to_nxv2f16( %pg, %a, %b) { ; CHECK-LABEL: ucvtf_nxv2i64_to_nxv2f16: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: ucvtf z1.h, p1/m, z1.d -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: ucvtf z0.h, p0/m, z1.d ; CHECK-NEXT: ret %b.op = uitofp %b to %res = select %pg, %b.op, %a @@ -1569,9 +1344,7 @@ define @ucvtf_nxv2i64_to_nxv2f16( %pg, @ucvtf_nxv2i64_to_nxv2f32( %pg, %a, %b) { ; CHECK-LABEL: ucvtf_nxv2i64_to_nxv2f32: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: ucvtf z1.s, p1/m, z1.d -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: ucvtf z0.s, p0/m, z1.d ; CHECK-NEXT: ret %b.op = uitofp %b to %res = select %pg, %b.op, %a @@ -1581,9 +1354,7 @@ define @ucvtf_nxv2i64_to_nxv2f32( %pg, @ucvtf_nxv2i64_to_nxv2f64( %pg, %a, %b) { ; CHECK-LABEL: ucvtf_nxv2i64_to_nxv2f64: ; CHECK: // %bb.0: -; CHECK-NEXT: ptrue p1.d -; CHECK-NEXT: ucvtf z1.d, p1/m, z1.d -; CHECK-NEXT: mov z0.d, p0/m, z1.d +; CHECK-NEXT: ucvtf z0.d, p0/m, z1.d ; CHECK-NEXT: ret %b.op = uitofp %b to %res = select %pg, %b.op, %a @@ -1656,6 +1427,62 @@ define @uxtw_nxv2i64( %pg, %res } +define @abs_nxv16i8_all_active_predicate( %pg, %a, %b, %c) { +; CHECK-LABEL: abs_nxv16i8_all_active_predicate: +; CHECK: // %bb.0: +; CHECK-NEXT: abs z0.b, p0/m, z1.b +; CHECK-NEXT: ret + %b.op = call @llvm.aarch64.sve.abs.nxv16i8( %c, splat(i1 true), %b) + %res = select %pg, %b.op, %a + ret %res +} + +define @abs_nxv16i8_same_predicate( %pg, %a, %b, %c) { +; CHECK-LABEL: abs_nxv16i8_same_predicate: +; CHECK: // %bb.0: +; CHECK-NEXT: abs z0.b, p0/m, z1.b +; CHECK-NEXT: ret + %b.op = call @llvm.aarch64.sve.abs.nxv16i8( %c, %pg, %b) + %res = select %pg, %b.op, %a + ret %res +} + +define @abs_nxv16i8_inactive_lanes_are_not_defined( %sel_pg, %op_pg, %a, %b) { +; CHECK-LABEL: abs_nxv16i8_inactive_lanes_are_not_defined: +; CHECK: // %bb.0: +; CHECK-NEXT: abs z0.b, p0/m, z1.b +; CHECK-NEXT: ret + %b.op = call @llvm.aarch64.sve.abs.nxv16i8( poison, %op_pg, %b) + %res = select %sel_pg, %b.op, %a + ret %res +} + +; Merging op has multiple users. +declare void @use(,) +define void @abs_nxv16i8_multi_use( %pg, %a, %b) { +; CHECK-LABEL: abs_nxv16i8_multi_use: +; CHECK: // %bb.0: +; CHECK-NEXT: ptrue p1.b +; CHECK-NEXT: abs z1.b, p1/m, z1.b +; CHECK-NEXT: mov z0.b, p0/m, z1.b +; CHECK-NEXT: b use + %b.op = tail call @llvm.abs.nxv16i8( %b, i1 0) + %res = select %pg, %b.op, %a + tail call void @use( %res, %b.op) + ret void +} + +; Inactive lanes of the merging op remain live after the select. +define @abs_nxv16i8_predicate_mismatch( %sel_pg, %op_pg, %a, %b, %c) { +; CHECK-LABEL: abs_nxv16i8_predicate_mismatch: +; CHECK: // %bb.0: +; CHECK-NEXT: abs z2.b, p1/m, z1.b +; CHECK-NEXT: mov z0.b, p0/m, z2.b +; CHECK-NEXT: ret + %b.op = call @llvm.aarch64.sve.abs.nxv16i8( %c, %op_pg, %b) + %res = select %sel_pg, %b.op, %a + ret %res +} declare @llvm.abs.nxv16i8(, i1) declare @llvm.abs.nxv8i16(, i1)