提交 f34001ec 编写于 作者: N Nikunj A Dadhania 提交者: David Gibson

target-ppc: improve lxvw4x implementation

Load 8byte at a time and manipulate.

Big-Endian Storage
+-------------+-------------+-------------+-------------+
| 00 11 22 33 | 44 55 66 77 | 88 99 AA BB | CC DD EE FF |
+-------------+-------------+-------------+-------------+

Little-Endian Storage
+-------------+-------------+-------------+-------------+
| 33 22 11 00 | 77 66 55 44 | BB AA 99 88 | FF EE DD CC |
+-------------+-------------+-------------+-------------+

Vector load results in (32-bit elements):
+----------+----------+----------+----------+
| 00112233 | 44556677 | 8899AABB | CCDDEEFF |
+----------+----------+----------+----------+
Signed-off-by: NNikunj A Dadhania <nikunj@linux.vnet.ibm.com>
Reviewed-by: NRichard Henderson <rth@twiddle.net>
[dwg: Slight tweak to commit description]
Signed-off-by: NDavid Gibson <david@gibson.dropbear.id.au>
上级 b9731075
...@@ -75,7 +75,6 @@ static void gen_lxvdsx(DisasContext *ctx) ...@@ -75,7 +75,6 @@ static void gen_lxvdsx(DisasContext *ctx)
static void gen_lxvw4x(DisasContext *ctx) static void gen_lxvw4x(DisasContext *ctx)
{ {
TCGv EA; TCGv EA;
TCGv_i64 tmp;
TCGv_i64 xth = cpu_vsrh(xT(ctx->opcode)); TCGv_i64 xth = cpu_vsrh(xT(ctx->opcode));
TCGv_i64 xtl = cpu_vsrl(xT(ctx->opcode)); TCGv_i64 xtl = cpu_vsrl(xT(ctx->opcode));
if (unlikely(!ctx->vsx_enabled)) { if (unlikely(!ctx->vsx_enabled)) {
...@@ -84,22 +83,27 @@ static void gen_lxvw4x(DisasContext *ctx) ...@@ -84,22 +83,27 @@ static void gen_lxvw4x(DisasContext *ctx)
} }
gen_set_access_type(ctx, ACCESS_INT); gen_set_access_type(ctx, ACCESS_INT);
EA = tcg_temp_new(); EA = tcg_temp_new();
tmp = tcg_temp_new_i64();
gen_addr_reg_index(ctx, EA); gen_addr_reg_index(ctx, EA);
gen_qemu_ld32u_i64(ctx, tmp, EA); if (ctx->le_mode) {
tcg_gen_addi_tl(EA, EA, 4); TCGv_i64 t0 = tcg_temp_new_i64();
gen_qemu_ld32u_i64(ctx, xth, EA); TCGv_i64 t1 = tcg_temp_new_i64();
tcg_gen_deposit_i64(xth, xth, tmp, 32, 32);
tcg_gen_qemu_ld_i64(t0, EA, ctx->mem_idx, MO_LEQ);
tcg_gen_addi_tl(EA, EA, 4); tcg_gen_shri_i64(t1, t0, 32);
gen_qemu_ld32u_i64(ctx, tmp, EA); tcg_gen_deposit_i64(xth, t1, t0, 32, 32);
tcg_gen_addi_tl(EA, EA, 4); tcg_gen_addi_tl(EA, EA, 8);
gen_qemu_ld32u_i64(ctx, xtl, EA); tcg_gen_qemu_ld_i64(t0, EA, ctx->mem_idx, MO_LEQ);
tcg_gen_deposit_i64(xtl, xtl, tmp, 32, 32); tcg_gen_shri_i64(t1, t0, 32);
tcg_gen_deposit_i64(xtl, t1, t0, 32, 32);
tcg_temp_free_i64(t0);
tcg_temp_free_i64(t1);
} else {
tcg_gen_qemu_ld_i64(xth, EA, ctx->mem_idx, MO_BEQ);
tcg_gen_addi_tl(EA, EA, 8);
tcg_gen_qemu_ld_i64(xtl, EA, ctx->mem_idx, MO_BEQ);
}
tcg_temp_free(EA); tcg_temp_free(EA);
tcg_temp_free_i64(tmp);
} }
#define VSX_STORE_SCALAR(name, operation) \ #define VSX_STORE_SCALAR(name, operation) \
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册