target/arm: Rearrange Floating-point data-processing (2 regs)

There are lots of special cases within these insns. Split the major argument decode/loading/saving into no_output (compares), rd_is_dp, and rm_is_dp. We still need to special case argument load for compare (rd as input, rm as zero) and vcvt fixed (rd as input+output), but lots of special cases do disappear. Now that we have a full switch at the beginning, hoist the ISA checks from the code generation. Backports commit e80941bd64cc388554770fd72334e9e7d459a1ef from qemu
2025-09-19 05:57:21 +00:00 · 2019-02-22 18:57:20 -05:00 · 2019-02-22 18:57:20 -05:00 · f16dcbe226
parent dbe623dacc
commit f16dcbe226
1 changed files with 111 additions and 116 deletions
--- a/qemu/target/arm/translate.c
+++ b/qemu/target/arm/translate.c
@ -3761,52 +3761,108 @@ static int disas_vfp_insn(DisasContext *s, uint32_t insn)
            }
        } else {
            /* data processing */
+            bool rd_is_dp = dp;
+            bool rm_is_dp = dp;
+            bool no_output = false;
+
            /* The opcode is in bits 23, 21, 20 and 6.  */
            op = ((insn >> 20) & 8) | ((insn >> 19) & 6) | ((insn >> 6) & 1);
-            if (dp) {
+            rn = VFP_SREG_N(insn);
+
            if (op == 15) {
-                    /* rn is opcode */
-                    rn = ((insn >> 15) & 0x1e) | ((insn >> 7) & 1);
-                } else {
+                /* rn is opcode, encoded as per VFP_SREG_N. */
+                switch (rn) {
+                case 0x00: /* vmov */
+                case 0x01: /* vabs */
+                case 0x02: /* vneg */
+                case 0x03: /* vsqrt */
+                    break;
+
+                case 0x04: /* vcvtb.f64.f16, vcvtb.f32.f16 */
+                case 0x05: /* vcvtt.f64.f16, vcvtt.f32.f16 */
+                    /*
+                     * VCVTB, VCVTT: only present with the halfprec extension
+                     * UNPREDICTABLE if bit 8 is set prior to ARMv8
+                     * (we choose to UNDEF)
+                     */
+                    if ((dp && !arm_dc_feature(s, ARM_FEATURE_V8)) ||
+                        !arm_dc_feature(s, ARM_FEATURE_VFP_FP16)) {
+                        return 1;
+                    }
+                    rm_is_dp = false;
+                    break;
+                case 0x06: /* vcvtb.f16.f32, vcvtb.f16.f64 */
+                case 0x07: /* vcvtt.f16.f32, vcvtt.f16.f64 */
+                    if ((dp && !arm_dc_feature(s, ARM_FEATURE_V8)) ||
+                        !arm_dc_feature(s, ARM_FEATURE_VFP_FP16)) {
+                        return 1;
+                    }
+                    rd_is_dp = false;
+                    break;
+
+                case 0x08: case 0x0a: /* vcmp, vcmpz */
+                case 0x09: case 0x0b: /* vcmpe, vcmpez */
+                    no_output = true;
+                    break;
+
+                case 0x0c: /* vrintr */
+                case 0x0d: /* vrintz */
+                case 0x0e: /* vrintx */
+                    break;
+
+                case 0x0f: /* vcvt double<->single */
+                    rd_is_dp = !dp;
+                    break;
+
+                case 0x10: /* vcvt.fxx.u32 */
+                case 0x11: /* vcvt.fxx.s32 */
+                    rm_is_dp = false;
+                    break;
+                case 0x18: /* vcvtr.u32.fxx */
+                case 0x19: /* vcvtz.u32.fxx */
+                case 0x1a: /* vcvtr.s32.fxx */
+                case 0x1b: /* vcvtz.s32.fxx */
+                    rd_is_dp = false;
+                    break;
+
+                case 0x14: /* vcvt fp <-> fixed */
+                case 0x15:
+                case 0x16:
+                case 0x17:
+                case 0x1c:
+                case 0x1d:
+                case 0x1e:
+                case 0x1f:
+                    if (!arm_dc_feature(s, ARM_FEATURE_VFP3)) {
+                        return 1;
+                    }
+                    /* Immediate frac_bits has same format as SREG_M.  */
+                    rm_is_dp = false;
+                    break;
+
+                default:
+                    return 1;
+                }
+            } else if (dp) {
                /* rn is register number */
                VFP_DREG_N(rn, insn);
            }

-                if (op == 15 && (rn == 15 || ((rn & 0x1c) == 0x18) ||
-                                 ((rn & 0x1e) == 0x6))) {
-                    /* Integer or single/half precision destination.  */
-                    rd = VFP_SREG_D(insn);
-                } else {
+            if (rd_is_dp) {
                VFP_DREG_D(rd, insn);
-                }
-                if (op == 15 &&
-                    (((rn & 0x1c) == 0x10) || ((rn & 0x14) == 0x14) ||
-                     ((rn & 0x1e) == 0x4))) {
-                    /* VCVT from int or half precision is always from S reg
-                     * regardless of dp bit. VCVT with immediate frac_bits
-                     * has same format as SREG_M.
-                     */
-                    rm = VFP_SREG_M(insn);
            } else {
+                rd = VFP_SREG_D(insn);
+            }
+            if (rm_is_dp) {
                VFP_DREG_M(rm, insn);
-                }
            } else {
-                rn = VFP_SREG_N(insn);
-                if (op == 15 && rn == 15) {
-                    /* Double precision destination.  */
-                    VFP_DREG_D(rd, insn);
-                } else {
-                    rd = VFP_SREG_D(insn);
-                }
-                /* NB that we implicitly rely on the encoding for the frac_bits
-                 * in VCVT of fixed to float being the same as that of an SREG_M
-                 */
                rm = VFP_SREG_M(insn);
            }

            veclen = s->vec_len;
-            if (op == 15 && rn > 3)
+            if (op == 15 && rn > 3) {
                veclen = 0;
+            }

            /* Shut up compiler warnings.  */
            delta_m = 0;
@ -3842,55 +3898,28 @@ static int disas_vfp_insn(DisasContext *s, uint32_t insn)
            /* Load the initial operands.  */
            if (op == 15) {
                switch (rn) {
-                case 16:
-                case 17:
-                    /* Integer source */
-                    gen_mov_F0_vreg(s, 0, rm);
-                    break;
-                case 8:
-                case 9:
-                    /* Compare */
+                case 0x08: case 0x09: /* Compare */
                    gen_mov_F0_vreg(s, dp, rd);
                    gen_mov_F1_vreg(s, dp, rm);
                    break;
-                case 10:
-                case 11:
-                    /* Compare with zero */
+                case 0x0a: case 0x0b: /* Compare with zero */
                    gen_mov_F0_vreg(s, dp, rd);
                    gen_vfp_F1_ld0(s, dp);
                    break;
-                case 20:
-                case 21:
-                case 22:
-                case 23:
-                case 28:
-                case 29:
-                case 30:
-                case 31:
+                case 0x14: /* vcvt fp <-> fixed */
+                case 0x15:
+                case 0x16:
+                case 0x17:
+                case 0x1c:
+                case 0x1d:
+                case 0x1e:
+                case 0x1f:
                    /* Source and destination the same.  */
                    gen_mov_F0_vreg(s, dp, rd);
                    break;
-                case 4:
-                case 5:
-                case 6:
-                case 7:
-                    /* VCVTB, VCVTT: only present with the halfprec extension
-                     * UNPREDICTABLE if bit 8 is set prior to ARMv8
-                     * (we choose to UNDEF)
-                     */
-                    if ((dp && !arm_dc_feature(s, ARM_FEATURE_V8)) ||
-                        !arm_dc_feature(s, ARM_FEATURE_VFP_FP16)) {
-                        return 1;
-                    }
-                    if (!extract32(rn, 1, 1)) {
-                        /* Half precision source.  */
-                        gen_mov_F0_vreg(s, 0, rm);
-                        break;
-                    }
-                    /* Otherwise fall through */
                default:
                    /* One source operand.  */
-                    gen_mov_F0_vreg(s, dp, rm);
+                    gen_mov_F0_vreg(s, rm_is_dp, rm);
                    break;
                }
            } else {
@ -4169,10 +4198,11 @@ static int disas_vfp_insn(DisasContext *s, uint32_t insn)
                        break;
                    }
                    case 15: /* single<->double conversion */
-                        if (dp)
+                        if (dp) {
                            gen_helper_vfp_fcvtsd(tcg_ctx, s->F0s, s->F0d, tcg_ctx->cpu_env);
-                        else
+                        } else {
                            gen_helper_vfp_fcvtds(tcg_ctx, s->F0d, s->F0s, tcg_ctx->cpu_env);
+                        }
                        break;
                    case 16: /* fuito */
                        gen_vfp_uito(s, dp, 0);
@ -4181,27 +4211,15 @@ static int disas_vfp_insn(DisasContext *s, uint32_t insn)
                        gen_vfp_sito(s, dp, 0);
                        break;
                    case 20: /* fshto */
-                        if (!arm_dc_feature(s, ARM_FEATURE_VFP3)) {
-                            return 1;
-                        }
                        gen_vfp_shto(s, dp, 16 - rm, 0);
                        break;
                    case 21: /* fslto */
-                        if (!arm_dc_feature(s, ARM_FEATURE_VFP3)) {
-                            return 1;
-                        }
                        gen_vfp_slto(s, dp, 32 - rm, 0);
                        break;
                    case 22: /* fuhto */
-                        if (!arm_dc_feature(s, ARM_FEATURE_VFP3)) {
-                            return 1;
-                        }
                        gen_vfp_uhto(s, dp, 16 - rm, 0);
                        break;
                    case 23: /* fulto */
-                        if (!arm_dc_feature(s, ARM_FEATURE_VFP3)) {
-                            return 1;
-                        }
                        gen_vfp_ulto(s, dp, 32 - rm, 0);
                        break;
                    case 24: /* ftoui */
@ -4217,57 +4235,34 @@ static int disas_vfp_insn(DisasContext *s, uint32_t insn)
                        gen_vfp_tosiz(s, dp, 0);
                        break;
                    case 28: /* ftosh */
-                        if (!arm_dc_feature(s, ARM_FEATURE_VFP3)) {
-                            return 1;
-                        }
                        gen_vfp_tosh(s, dp, 16 - rm, 0);
                        break;
                    case 29: /* ftosl */
-                        if (!arm_dc_feature(s, ARM_FEATURE_VFP3)) {
-                            return 1;
-                        }
                        gen_vfp_tosl(s, dp, 32 - rm, 0);
                        break;
                    case 30: /* ftouh */
-                        if (!arm_dc_feature(s, ARM_FEATURE_VFP3)) {
-                            return 1;
-                        }
                        gen_vfp_touh(s, dp, 16 - rm, 0);
                        break;
                    case 31: /* ftoul */
-                        if (!arm_dc_feature(s, ARM_FEATURE_VFP3)) {
-                            return 1;
-                        }
                        gen_vfp_toul(s, dp, 32 - rm, 0);
                        break;
                    default: /* undefined */
-                        return 1;
+                        g_assert_not_reached();
                    }
                    break;
                default: /* undefined */
                    return 1;
                }

-                /* Write back the result.  */
-                if (op == 15 && (rn >= 8 && rn <= 11)) {
-                    /* Comparison, do nothing.  */
-                } else if (op == 15 && dp && ((rn & 0x1c) == 0x18 ||
-                                              (rn & 0x1e) == 0x6)) {
-                    /* VCVT double to int: always integer result.
-                     * VCVT double to half precision is always a single
-                     * precision result.
-                     */
-                    gen_mov_vreg_F0(s, 0, rd);
-                } else if (op == 15 && rn == 15) {
-                    /* conversion */
-                    gen_mov_vreg_F0(s, !dp, rd);
-                } else {
-                    gen_mov_vreg_F0(s, dp, rd);
+                /* Write back the result, if any.  */
+                if (!no_output) {
+                    gen_mov_vreg_F0(s, rd_is_dp, rd);
                }

                /* break out of the loop if we have finished  */
-                if (veclen == 0)
+                if (veclen == 0) {
                    break;
+                }

                if (op == 15 && delta_m == 0) {
                    /* single source one-many */