提交 92cdfaeb 编写于 作者: P Peter Maydell 提交者: Aurelien Jarno

target-arm: Fix shift by immediate and narrow where src, dest overlap

For Neon shifts by immediate and narrow, correctly handle the case
where the source registers and the destination registers overlap
(the second pass should use the original register contents, not the
results of the first pass).

This includes a refactoring to pull the size check outside the
loop rather than inside, since there is now very little common
code between the size == 3 and size != 3 case.
Signed-off-by: NPeter Maydell <peter.maydell@linaro.org>
Signed-off-by: NAurelien Jarno <aurelien@aurel32.net>
上级 c33171c7
...@@ -4804,64 +4804,68 @@ static int disas_neon_data_insn(CPUState * env, DisasContext *s, uint32_t insn) ...@@ -4804,64 +4804,68 @@ static int disas_neon_data_insn(CPUState * env, DisasContext *s, uint32_t insn)
shift = shift - (1 << (size + 3)); shift = shift - (1 << (size + 3));
size++; size++;
switch (size) { if (size == 3) {
case 1:
imm = (uint16_t)shift;
imm |= imm << 16;
tmp2 = tcg_const_i32(imm);
TCGV_UNUSED_I64(tmp64);
break;
case 2:
imm = (uint32_t)shift;
tmp2 = tcg_const_i32(imm);
TCGV_UNUSED_I64(tmp64);
break;
case 3:
tmp64 = tcg_const_i64(shift); tmp64 = tcg_const_i64(shift);
TCGV_UNUSED(tmp2); neon_load_reg64(cpu_V0, rm);
break; neon_load_reg64(cpu_V1, rm + 1);
default: for (pass = 0; pass < 2; pass++) {
abort(); TCGv_i64 in;
} if (pass == 0) {
in = cpu_V0;
for (pass = 0; pass < 2; pass++) { } else {
if (size == 3) { in = cpu_V1;
neon_load_reg64(cpu_V0, rm + pass); }
if (q) { if (q) {
if (input_unsigned) { if (input_unsigned) {
gen_helper_neon_rshl_u64(cpu_V0, cpu_V0, gen_helper_neon_rshl_u64(cpu_V0, in, tmp64);
tmp64);
} else { } else {
gen_helper_neon_rshl_s64(cpu_V0, cpu_V0, gen_helper_neon_rshl_s64(cpu_V0, in, tmp64);
tmp64);
} }
} else { } else {
if (input_unsigned) { if (input_unsigned) {
gen_helper_neon_shl_u64(cpu_V0, cpu_V0, gen_helper_neon_shl_u64(cpu_V0, in, tmp64);
tmp64);
} else { } else {
gen_helper_neon_shl_s64(cpu_V0, cpu_V0, gen_helper_neon_shl_s64(cpu_V0, in, tmp64);
tmp64);
} }
} }
tmp = new_tmp();
gen_neon_narrow_op(op == 8, u, size - 1, tmp, cpu_V0);
neon_store_reg(rd, pass, tmp);
} /* for pass */
tcg_temp_free_i64(tmp64);
} else {
if (size == 1) {
imm = (uint16_t)shift;
imm |= imm << 16;
} else { } else {
tmp = neon_load_reg(rm + pass, 0); /* size == 2 */
imm = (uint32_t)shift;
}
tmp2 = tcg_const_i32(imm);
tmp4 = neon_load_reg(rm + 1, 0);
tmp5 = neon_load_reg(rm + 1, 1);
for (pass = 0; pass < 2; pass++) {
if (pass == 0) {
tmp = neon_load_reg(rm, 0);
} else {
tmp = tmp4;
}
gen_neon_shift_narrow(size, tmp, tmp2, q, gen_neon_shift_narrow(size, tmp, tmp2, q,
input_unsigned); input_unsigned);
tmp3 = neon_load_reg(rm + pass, 1); if (pass == 0) {
tmp3 = neon_load_reg(rm, 1);
} else {
tmp3 = tmp5;
}
gen_neon_shift_narrow(size, tmp3, tmp2, q, gen_neon_shift_narrow(size, tmp3, tmp2, q,
input_unsigned); input_unsigned);
tcg_gen_concat_i32_i64(cpu_V0, tmp, tmp3); tcg_gen_concat_i32_i64(cpu_V0, tmp, tmp3);
dead_tmp(tmp); dead_tmp(tmp);
dead_tmp(tmp3); dead_tmp(tmp3);
} tmp = new_tmp();
tmp = new_tmp(); gen_neon_narrow_op(op == 8, u, size - 1, tmp, cpu_V0);
gen_neon_narrow_op(op == 8, u, size - 1, tmp, cpu_V0); neon_store_reg(rd, pass, tmp);
neon_store_reg(rd, pass, tmp); } /* for pass */
} /* for pass */
if (size == 3) {
tcg_temp_free_i64(tmp64);
} else {
tcg_temp_free_i32(tmp2); tcg_temp_free_i32(tmp2);
} }
} else if (op == 10) { } else if (op == 10) {
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册