target/arm: Convert "double-precision" register moves to decodetree (9851ed92) · Commits · SUMMER2020 / students / proj-2021291

target/arm/translate-vfp.inc.c

+147 −0

Original line number	Diff line number	Diff line
		@@ -475,3 +475,150 @@ static bool trans_VCVT(DisasContext s, arg_VCVT a)

		return true;
		}

		static bool trans_VMOV_to_gp(DisasContext s, arg_VMOV_to_gp a)
		{
		/* VMOV scalar to general purpose register */
		TCGv_i32 tmp;
		int pass;
		uint32_t offset;

		/* UNDEF accesses to D16-D31 if they don't exist */
		if (!dc_isar_feature(aa32_fp_d32, s) && (a->vn & 0x10)) {
		return false;
		}

		offset = a->index << a->size;
		pass = extract32(offset, 2, 1);
		offset = extract32(offset, 0, 2) * 8;

		if (a->size != 2 && !arm_dc_feature(s, ARM_FEATURE_NEON)) {
		return false;
		}

		if (!vfp_access_check(s)) {
		return true;
		}

		tmp = neon_load_reg(a->vn, pass);
		switch (a->size) {
		case 0:
		if (offset) {
		tcg_gen_shri_i32(tmp, tmp, offset);
		}
		if (a->u) {
		gen_uxtb(tmp);
		} else {
		gen_sxtb(tmp);
		}
		break;
		case 1:
		if (a->u) {
		if (offset) {
		tcg_gen_shri_i32(tmp, tmp, 16);
		} else {
		gen_uxth(tmp);
		}
		} else {
		if (offset) {
		tcg_gen_sari_i32(tmp, tmp, 16);
		} else {
		gen_sxth(tmp);
		}
		}
		break;
		case 2:
		break;
		}
		store_reg(s, a->rt, tmp);

		return true;
		}

		static bool trans_VMOV_from_gp(DisasContext s, arg_VMOV_from_gp a)
		{
		/* VMOV general purpose register to scalar */
		TCGv_i32 tmp, tmp2;
		int pass;
		uint32_t offset;

		/* UNDEF accesses to D16-D31 if they don't exist */
		if (!dc_isar_feature(aa32_fp_d32, s) && (a->vn & 0x10)) {
		return false;
		}

		offset = a->index << a->size;
		pass = extract32(offset, 2, 1);
		offset = extract32(offset, 0, 2) * 8;

		if (a->size != 2 && !arm_dc_feature(s, ARM_FEATURE_NEON)) {
		return false;
		}

		if (!vfp_access_check(s)) {
		return true;
		}

		tmp = load_reg(s, a->rt);
		switch (a->size) {
		case 0:
		tmp2 = neon_load_reg(a->vn, pass);
		tcg_gen_deposit_i32(tmp, tmp2, tmp, offset, 8);
		tcg_temp_free_i32(tmp2);
		break;
		case 1:
		tmp2 = neon_load_reg(a->vn, pass);
		tcg_gen_deposit_i32(tmp, tmp2, tmp, offset, 16);
		tcg_temp_free_i32(tmp2);
		break;
		case 2:
		break;
		}
		neon_store_reg(a->vn, pass, tmp);

		return true;
		}

		static bool trans_VDUP(DisasContext s, arg_VDUP a)
		{
		/* VDUP (general purpose register) */
		TCGv_i32 tmp;
		int size, vec_size;

		if (!arm_dc_feature(s, ARM_FEATURE_NEON)) {
		return false;
		}

		/* UNDEF accesses to D16-D31 if they don't exist */
		if (!dc_isar_feature(aa32_fp_d32, s) && (a->vn & 0x10)) {
		return false;
		}

		if (a->b && a->e) {
		return false;
		}

		if (a->q && (a->vn & 1)) {
		return false;
		}

		vec_size = a->q ? 16 : 8;
		if (a->b) {
		size = 0;
		} else if (a->e) {
		size = 1;
		} else {
		size = 2;
		}

		if (!vfp_access_check(s)) {
		return true;
		}

		tmp = load_reg(s, a->rt);
		tcg_gen_gvec_dup_i32(size, neon_reg_offset(a->vn, 0),
		vec_size, vec_size, tmp);
		tcg_temp_free_i32(tmp);

		return true;
		}

target/arm/translate.c

+2 −81

Original line number	Diff line number	Diff line
		@@ -3151,87 +3151,8 @@ static int disas_vfp_insn(DisasContext *s, uint32_t insn)
		/* single register transfer */
		rd = (insn >> 12) & 0xf;
		if (dp) {
		int size;
		int pass;

		VFP_DREG_N(rn, insn);
		if (insn & 0xf)
		return 1;
		if (insn & 0x00c00060
		&& !arm_dc_feature(s, ARM_FEATURE_NEON)) {
		/* already handled by decodetree */
		return 1;
		}

		pass = (insn >> 21) & 1;
		if (insn & (1 << 22)) {
		size = 0;
		offset = ((insn >> 5) & 3) * 8;
		} else if (insn & (1 << 5)) {
		size = 1;
		offset = (insn & (1 << 6)) ? 16 : 0;
		} else {
		size = 2;
		offset = 0;
		}
		if (insn & ARM_CP_RW_BIT) {
		/* vfp->arm */
		tmp = neon_load_reg(rn, pass);
		switch (size) {
		case 0:
		if (offset)
		tcg_gen_shri_i32(tmp, tmp, offset);
		if (insn & (1 << 23))
		gen_uxtb(tmp);
		else
		gen_sxtb(tmp);
		break;
		case 1:
		if (insn & (1 << 23)) {
		if (offset) {
		tcg_gen_shri_i32(tmp, tmp, 16);
		} else {
		gen_uxth(tmp);
		}
		} else {
		if (offset) {
		tcg_gen_sari_i32(tmp, tmp, 16);
		} else {
		gen_sxth(tmp);
		}
		}
		break;
		case 2:
		break;
		}
		store_reg(s, rd, tmp);
		} else {
		/* arm->vfp */
		tmp = load_reg(s, rd);
		if (insn & (1 << 23)) {
		/* VDUP */
		int vec_size = pass ? 16 : 8;
		tcg_gen_gvec_dup_i32(size, neon_reg_offset(rn, 0),
		vec_size, vec_size, tmp);
		tcg_temp_free_i32(tmp);
		} else {
		/* VMOV */
		switch (size) {
		case 0:
		tmp2 = neon_load_reg(rn, pass);
		tcg_gen_deposit_i32(tmp, tmp2, tmp, offset, 8);
		tcg_temp_free_i32(tmp2);
		break;
		case 1:
		tmp2 = neon_load_reg(rn, pass);
		tcg_gen_deposit_i32(tmp, tmp2, tmp, offset, 16);
		tcg_temp_free_i32(tmp2);
		break;
		case 2:
		break;
		}
		neon_store_reg(rn, pass, tmp);
		}
		}
		} else { /* !dp */
		bool is_sysreg;

target/arm/vfp.decode

+36 −0

Original line number	Diff line number	Diff line
		@@ -26,3 +26,39 @@
		# 1110 1110 .... .... .... 101. .... ....
		# (but those patterns might also cover some Neon instructions,
		# which do not live in this file.)

		# VFP registers have an odd encoding with a four-bit field
		# and a one-bit field which are assembled in different orders
		# depending on whether the register is double or single precision.
		# Each individual instruction function must do the checks for
		# "double register selected but CPU does not have double support"
		# and "double register number has bit 4 set but CPU does not
		# support D16-D31" (which should UNDEF).
		%vm_dp 5:1 0:4
		%vm_sp 0:4 5:1
		%vn_dp 7:1 16:4
		%vn_sp 16:4 7:1
		%vd_dp 22:1 12:4
		%vd_sp 12:4 22:1

		%vmov_idx_b 21:1 5:2
		%vmov_idx_h 21:1 6:1

		# VMOV scalar to general-purpose register; note that this does
		# include some Neon cases.
		VMOV_to_gp ---- 1110 u:1 1. 1 .... rt:4 1011 ... 1 0000 \
		vn=%vn_dp size=0 index=%vmov_idx_b
		VMOV_to_gp ---- 1110 u:1 0. 1 .... rt:4 1011 ..1 1 0000 \
		vn=%vn_dp size=1 index=%vmov_idx_h
		VMOV_to_gp ---- 1110 0 0 index:1 1 .... rt:4 1011 .00 1 0000 \
		vn=%vn_dp size=2 u=0

		VMOV_from_gp ---- 1110 0 1. 0 .... rt:4 1011 ... 1 0000 \
		vn=%vn_dp size=0 index=%vmov_idx_b
		VMOV_from_gp ---- 1110 0 0. 0 .... rt:4 1011 ..1 1 0000 \
		vn=%vn_dp size=1 index=%vmov_idx_h
		VMOV_from_gp ---- 1110 0 0 index:1 0 .... rt:4 1011 .00 1 0000 \
		vn=%vn_dp size=2

		VDUP ---- 1110 1 b:1 q:1 0 .... rt:4 1011 . 0 e:1 1 0000 \
		vn=%vn_dp