tcg: Use per-temp state data in optimize

While we're touching many of the lines anyway, adjust the naming
of the functions to better distinguish when "TCGArg" vs "TCGTemp"
should be used.

Backports commit 6349039d0b06eda59820629b934944246b14a1c1 from qemu
This commit is contained in:
Richard Henderson 2018-03-05 08:19:33 -05:00 committed by Lioncash
parent 387060ccf5
commit 9f8c6a456b
No known key found for this signature in database
GPG key ID: 4E3C3CC1031BA9C7
2 changed files with 242 additions and 194 deletions

View file

@ -32,31 +32,49 @@
glue(glue(case INDEX_op_, x), _i32): \ glue(glue(case INDEX_op_, x), _i32): \
glue(glue(case INDEX_op_, x), _i64) glue(glue(case INDEX_op_, x), _i64)
static inline bool temp_is_const(TCGContext *s, TCGArg arg) static inline struct tcg_temp_info *ts_info(TCGTemp *ts)
{ {
struct tcg_temp_info *temps = s->temps2; return ts->state_ptr;
return temps[arg].is_const;
} }
static inline bool temp_is_copy(TCGContext *s, TCGArg arg) static inline struct tcg_temp_info *arg_info(TCGContext *s, TCGArg arg)
{ {
struct tcg_temp_info *temps = s->temps2; return ts_info(arg_temp(s, arg));
}
return temps[arg].next_copy != arg; static inline bool ts_is_const(TCGTemp *ts)
{
return ts_info(ts)->is_const;
}
static inline bool arg_is_const(TCGContext *s, TCGArg arg)
{
return ts_is_const(arg_temp(s, arg));
}
static inline bool ts_is_copy(TCGTemp *ts)
{
return ts_info(ts)->next_copy != ts;
} }
/* Reset TEMP's state, possibly removing the temp for the list of copies. */ /* Reset TEMP's state, possibly removing the temp for the list of copies. */
static void reset_temp(TCGContext *s, TCGArg temp) static void reset_ts(TCGTemp *ts)
{ {
struct tcg_temp_info *temps = s->temps2; struct tcg_temp_info *ti = ts_info(ts);
struct tcg_temp_info *pi = ts_info(ti->prev_copy);
struct tcg_temp_info *ni = ts_info(ti->next_copy);
temps[temps[temp].next_copy].prev_copy = temps[temp].prev_copy; ni->prev_copy = ti->prev_copy;
temps[temps[temp].prev_copy].next_copy = temps[temp].next_copy; pi->next_copy = ti->next_copy;
temps[temp].next_copy = temp; ti->next_copy = ts;
temps[temp].prev_copy = temp; ti->prev_copy = ts;
temps[temp].is_const = false; ti->is_const = false;
temps[temp].mask = -1; ti->mask = -1;
}
static void reset_temp(TCGContext *s, TCGArg arg)
{
reset_ts(arg_temp(s, arg));
} }
/* Reset all temporaries, given that there are NB_TEMPS of them. */ /* Reset all temporaries, given that there are NB_TEMPS of them. */
@ -67,20 +85,29 @@ static void reset_all_temps(TCGContext *s, int nb_temps)
} }
/* Initialize and activate a temporary. */ /* Initialize and activate a temporary. */
static void init_temp_info(TCGContext *s, TCGArg temp) static void init_ts_info(TCGContext *s, TCGTemp *ts)
{ {
struct tcg_temp_info *temps = s->temps2; struct tcg_temp_info *temps = s->temps2;
TCGTempSet *temps_used = &s->temps2_used; TCGTempSet *temps_used = &s->temps2_used;
if (!test_bit(temp, temps_used->l)) { size_t idx = temp_idx(s, ts);
temps[temp].next_copy = temp; if (!test_bit(idx, temps_used->l)) {
temps[temp].prev_copy = temp; struct tcg_temp_info *ti = &temps[idx];
temps[temp].is_const = false;
temps[temp].mask = -1; ts->state_ptr = ti;
set_bit(temp, temps_used->l); ti->next_copy = ts;
ti->prev_copy = ts;
ti->is_const = false;
ti->mask = -1;
set_bit(idx, temps_used->l);
} }
} }
static void init_arg_info(TCGContext *s, TCGArg arg)
{
init_ts_info(s, arg_temp(s, arg));
}
static int op_bits(TCGContext *s, TCGOpcode op) static int op_bits(TCGContext *s, TCGOpcode op)
{ {
const TCGOpDef *def = &s->tcg_op_defs[op]; const TCGOpDef *def = &s->tcg_op_defs[op];
@ -115,52 +142,49 @@ static TCGOpcode op_to_movi(TCGContext *s, TCGOpcode op)
} }
} }
static TCGArg find_better_copy(TCGContext *s, TCGArg arg) static TCGTemp *find_better_copy(TCGTemp *ts)
{ {
struct tcg_temp_info *temps = s->temps2; TCGTemp *i;
TCGTemp *ts = arg_temp(s, arg);
TCGArg i;
/* If this is already a global, we can't do better. */ /* If this is already a global, we can't do better. */
if (ts->temp_global) { if (ts->temp_global) {
return arg; return ts;
} }
/* Search for a global first. */ /* Search for a global first. */
for (i = temps[arg].next_copy ; i != arg; i = temps[i].next_copy) { for (i = ts_info(ts)->next_copy; i != ts; i = ts_info(i)->next_copy) {
if (i < (unsigned int)s->nb_globals) { if (i->temp_global) {
return i; return i;
} }
} }
/* If it is a temp, search for a temp local. */ /* If it is a temp, search for a temp local. */
if (!ts->temp_local) { if (!ts->temp_local) {
for (i = temps[arg].next_copy ; i != arg; i = temps[i].next_copy) { for (i = ts_info(ts)->next_copy; i != ts; i = ts_info(i)->next_copy) {
if (s->temps[i].temp_local) { if (ts->temp_local) {
return i; return i;
} }
} }
} }
/* Failure to find a better representation, return the same temp. */ /* Failure to find a better representation, return the same temp. */
return arg; return ts;
} }
static bool temps_are_copies(TCGContext *s, TCGArg arg1, TCGArg arg2) static bool ts_are_copies(TCGTemp *ts1, TCGTemp *ts2)
{ {
struct tcg_temp_info *temps = s->temps2; TCGTemp *i;
TCGArg i;
if (arg1 == arg2) { if (ts1 == ts2) {
return true; return true;
} }
if (!temp_is_copy(s, arg1) || !temp_is_copy(s, arg2)) { if (!ts_is_copy(ts1) || !ts_is_copy(ts2)) {
return false; return false;
} }
for (i = temps[arg1].next_copy ; i != arg1 ; i = temps[i].next_copy) { for (i = ts_info(ts1)->next_copy; i != ts1; i = ts_info(i)->next_copy) {
if (i == arg2) { if (i == ts2) {
return true; return true;
} }
} }
@ -168,24 +192,29 @@ static bool temps_are_copies(TCGContext *s, TCGArg arg1, TCGArg arg2)
return false; return false;
} }
static bool args_are_copies(TCGContext *s, TCGArg arg1, TCGArg arg2)
{
return ts_are_copies(arg_temp(s, arg1), arg_temp(s, arg2));
}
static void tcg_opt_gen_movi(TCGContext *s, TCGOp *op, TCGArg dst, TCGArg val) static void tcg_opt_gen_movi(TCGContext *s, TCGOp *op, TCGArg dst, TCGArg val)
{ {
struct tcg_temp_info *temps = s->temps2;
TCGOpcode new_op = op_to_movi(s, op->opc); TCGOpcode new_op = op_to_movi(s, op->opc);
tcg_target_ulong mask; tcg_target_ulong mask;
struct tcg_temp_info *di = arg_info(s, dst);
op->opc = new_op; op->opc = new_op;
reset_temp(s, dst); reset_temp(s, dst);
temps[dst].is_const = true; di->is_const = true;
temps[dst].val = val; di->val = val;
mask = val; mask = val;
if (TCG_TARGET_REG_BITS > 32 && new_op == INDEX_op_movi_i32) { if (TCG_TARGET_REG_BITS > 32 && new_op == INDEX_op_movi_i32) {
/* High bits of the destination are now garbage. */ /* High bits of the destination are now garbage. */
mask |= ~0xffffffffull; mask |= ~0xffffffffull;
} }
temps[dst].mask = mask; di->mask = mask;
op->args[0] = dst; op->args[0] = dst;
op->args[1] = val; op->args[1] = val;
@ -193,36 +222,44 @@ static void tcg_opt_gen_movi(TCGContext *s, TCGOp *op, TCGArg dst, TCGArg val)
static void tcg_opt_gen_mov(TCGContext *s, TCGOp *op, TCGArg dst, TCGArg src) static void tcg_opt_gen_mov(TCGContext *s, TCGOp *op, TCGArg dst, TCGArg src)
{ {
if (temps_are_copies(s, dst, src)) { TCGTemp *dst_ts = arg_temp(s, dst);
TCGTemp *src_ts = arg_temp(s, src);
struct tcg_temp_info *di;
struct tcg_temp_info *si;
tcg_target_ulong mask;
TCGOpcode new_op;
if (ts_are_copies(dst_ts, src_ts)) {
tcg_op_remove(s, op); tcg_op_remove(s, op);
return; return;
} }
struct tcg_temp_info *temps = s->temps2; reset_ts(dst_ts);
TCGOpcode new_op = op_to_mov(s, op->opc); di = ts_info(dst_ts);
tcg_target_ulong mask; si = ts_info(src_ts);
new_op = op_to_mov(s, op->opc);
op->opc = new_op; op->opc = new_op;
op->args[0] = dst;
op->args[1] = src;
reset_temp(s, dst); mask = si->mask;
mask = temps[src].mask;
if (TCG_TARGET_REG_BITS > 32 && new_op == INDEX_op_mov_i32) { if (TCG_TARGET_REG_BITS > 32 && new_op == INDEX_op_mov_i32) {
/* High bits of the destination are now garbage. */ /* High bits of the destination are now garbage. */
mask |= ~0xffffffffull; mask |= ~0xffffffffull;
} }
temps[dst].mask = mask; di->mask = mask;
if (arg_temp(s, src)->type == arg_temp(s, dst)->type) { if (src_ts->type == dst_ts->type) {
temps[dst].next_copy = temps[src].next_copy; struct tcg_temp_info *ni = ts_info(si->next_copy);
temps[dst].prev_copy = src;
temps[temps[dst].next_copy].prev_copy = dst; di->next_copy = si->next_copy;
temps[src].next_copy = dst; di->prev_copy = src_ts;
temps[dst].is_const = temps[src].is_const; ni->prev_copy = dst_ts;
temps[dst].val = temps[src].val; si->next_copy = dst_ts;
di->is_const = si->is_const;
di->val = si->val;
} }
op->args[0] = dst;
op->args[1] = src;
} }
static TCGArg do_constant_folding_2(TCGOpcode op, TCGArg x, TCGArg y) static TCGArg do_constant_folding_2(TCGOpcode op, TCGArg x, TCGArg y)
@ -469,20 +506,21 @@ static bool do_constant_folding_cond_eq(TCGCond c)
static TCGArg do_constant_folding_cond(TCGContext *s, TCGOpcode op, TCGArg x, static TCGArg do_constant_folding_cond(TCGContext *s, TCGOpcode op, TCGArg x,
TCGArg y, TCGCond c) TCGArg y, TCGCond c)
{ {
struct tcg_temp_info *temps = s->temps2; tcg_target_ulong xv = arg_info(s, x)->val;
tcg_target_ulong yv = arg_info(s, y)->val;
if (temp_is_const(s, x) && temp_is_const(s, y)) { if (arg_is_const(s, x) && arg_is_const(s, y)) {
switch (op_bits(s, op)) { switch (op_bits(s, op)) {
case 32: case 32:
return do_constant_folding_cond_32(temps[x].val, temps[y].val, c); return do_constant_folding_cond_32(xv, yv, c);
case 64: case 64:
return do_constant_folding_cond_64(temps[x].val, temps[y].val, c); return do_constant_folding_cond_64(xv, yv, c);
default: default:
tcg_abort(); tcg_abort();
} }
} else if (temps_are_copies(s, x, y)) { } else if (args_are_copies(s, x, y)) {
return do_constant_folding_cond_eq(c); return do_constant_folding_cond_eq(c);
} else if (temp_is_const(s, y) && temps[y].val == 0) { } else if (arg_is_const(s, y) && yv == 0) {
switch (c) { switch (c) {
case TCG_COND_LTU: case TCG_COND_LTU:
return 0; return 0;
@ -499,17 +537,18 @@ static TCGArg do_constant_folding_cond(TCGContext *s, TCGOpcode op, TCGArg x,
of the condition (0 or 1) if it can */ of the condition (0 or 1) if it can */
static TCGArg do_constant_folding_cond2(TCGContext *s, TCGArg *p1, TCGArg *p2, TCGCond c) static TCGArg do_constant_folding_cond2(TCGContext *s, TCGArg *p1, TCGArg *p2, TCGCond c)
{ {
struct tcg_temp_info *temps = s->temps2;
TCGArg al = p1[0], ah = p1[1]; TCGArg al = p1[0], ah = p1[1];
TCGArg bl = p2[0], bh = p2[1]; TCGArg bl = p2[0], bh = p2[1];
if (temp_is_const(s, bl) && temp_is_const(s, bh)) { if (arg_is_const(s, bl) && arg_is_const(s, bh)) {
uint64_t b = ((uint64_t)temps[bh].val << 32) | (uint32_t)temps[bl].val; tcg_target_ulong blv = arg_info(s, bl)->val;
tcg_target_ulong bhv = arg_info(s, bh)->val;
uint64_t b = deposit64(blv, 32, 32, bhv);
if (temp_is_const(s, al) && temp_is_const(s, ah)) { if (arg_is_const(s, al) && arg_is_const(s, ah)) {
uint64_t a; tcg_target_ulong alv = arg_info(s, al)->val;
a = ((uint64_t)temps[ah].val << 32) | (uint32_t)temps[al].val; tcg_target_ulong ahv = arg_info(s, ah)->val;
uint64_t a = deposit64(alv, 32, 32, ahv);
return do_constant_folding_cond_64(a, b, c); return do_constant_folding_cond_64(a, b, c);
} }
if (b == 0) { if (b == 0) {
@ -523,7 +562,7 @@ static TCGArg do_constant_folding_cond2(TCGContext *s, TCGArg *p1, TCGArg *p2, T
} }
} }
} }
if (temps_are_copies(s, al, bl) && temps_are_copies(s, ah, bh)) { if (args_are_copies(s, al, bl) && args_are_copies(s, ah, bh)) {
return do_constant_folding_cond_eq(c); return do_constant_folding_cond_eq(c);
} }
return 2; return 2;
@ -533,9 +572,8 @@ static bool swap_commutative(TCGContext *s, TCGArg dest, TCGArg *p1, TCGArg *p2)
{ {
TCGArg a1 = *p1, a2 = *p2; TCGArg a1 = *p1, a2 = *p2;
int sum = 0; int sum = 0;
sum += arg_is_const(s, a1);
sum += temp_is_const(s, a1); sum -= arg_is_const(s, a2);
sum -= temp_is_const(s, a2);
/* Prefer the constant in second argument, and then the form /* Prefer the constant in second argument, and then the form
op a, a, b, which is better handled on non-RISC hosts. */ op a, a, b, which is better handled on non-RISC hosts. */
@ -550,11 +588,10 @@ static bool swap_commutative(TCGContext *s, TCGArg dest, TCGArg *p1, TCGArg *p2)
static bool swap_commutative2(TCGContext *s, TCGArg *p1, TCGArg *p2) static bool swap_commutative2(TCGContext *s, TCGArg *p1, TCGArg *p2)
{ {
int sum = 0; int sum = 0;
sum += arg_is_const(s, p1[0]);
sum += temp_is_const(s, p1[0]); sum += arg_is_const(s, p1[1]);
sum += temp_is_const(s, p1[1]); sum -= arg_is_const(s, p2[0]);
sum -= temp_is_const(s, p2[0]); sum -= arg_is_const(s, p2[1]);
sum -= temp_is_const(s, p2[1]);
if (sum > 0) { if (sum > 0) {
TCGArg t; TCGArg t;
t = p1[0], p1[0] = p2[0], p2[0] = t; t = p1[0], p1[0] = p2[0], p2[0] = t;
@ -567,7 +604,6 @@ static bool swap_commutative2(TCGContext *s, TCGArg *p1, TCGArg *p2)
/* Propagate constants and copies, fold constant expressions. */ /* Propagate constants and copies, fold constant expressions. */
void tcg_optimize(TCGContext *s) void tcg_optimize(TCGContext *s)
{ {
struct tcg_temp_info *temps = s->temps2;
int oi, oi_next, nb_temps, nb_globals; int oi, oi_next, nb_temps, nb_globals;
TCGOp *prev_mb = NULL; TCGOp *prev_mb = NULL;
@ -597,23 +633,24 @@ void tcg_optimize(TCGContext *s)
nb_oargs = op->callo; nb_oargs = op->callo;
nb_iargs = op->calli; nb_iargs = op->calli;
for (i = 0; i < nb_oargs + nb_iargs; i++) { for (i = 0; i < nb_oargs + nb_iargs; i++) {
tmp = op->args[i]; TCGTemp *ts = arg_temp(s, op->args[i]);
if (tmp != TCG_CALL_DUMMY_ARG) { if (ts) {
init_temp_info(s, tmp); init_ts_info(s, ts);
} }
} }
} else { } else {
nb_oargs = def->nb_oargs; nb_oargs = def->nb_oargs;
nb_iargs = def->nb_iargs; nb_iargs = def->nb_iargs;
for (i = 0; i < nb_oargs + nb_iargs; i++) { for (i = 0; i < nb_oargs + nb_iargs; i++) {
init_temp_info(s, op->args[i]); init_arg_info(s, op->args[i]);
} }
} }
/* Do copy propagation */ /* Do copy propagation */
for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) { for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) {
if (temp_is_copy(s, op->args[i])) { TCGTemp *ts = arg_temp(s, op->args[i]);
op->args[i] = find_better_copy(s, op->args[i]); if (ts && ts_is_copy(ts)) {
op->args[i] = temp_arg(s, find_better_copy(ts));
} }
} }
@ -682,7 +719,8 @@ void tcg_optimize(TCGContext *s)
CASE_OP_32_64(sar): CASE_OP_32_64(sar):
CASE_OP_32_64(rotl): CASE_OP_32_64(rotl):
CASE_OP_32_64(rotr): CASE_OP_32_64(rotr):
if (temp_is_const(s, op->args[1]) && temps[op->args[1]].val == 0) { if (arg_is_const(s, op->args[1])
&& arg_info(s, op->args[1])->val == 0) {
tcg_opt_gen_movi(s, op, op->args[0], 0); tcg_opt_gen_movi(s, op, op->args[0], 0);
continue; continue;
} }
@ -692,7 +730,7 @@ void tcg_optimize(TCGContext *s)
TCGOpcode neg_op; TCGOpcode neg_op;
bool have_neg; bool have_neg;
if (temp_is_const(s, op->args[2])) { if (arg_is_const(s, op->args[2])) {
/* Proceed with possible constant folding. */ /* Proceed with possible constant folding. */
break; break;
} }
@ -706,8 +744,8 @@ void tcg_optimize(TCGContext *s)
if (!have_neg) { if (!have_neg) {
break; break;
} }
if (temp_is_const(s, op->args[1]) if (arg_is_const(s, op->args[1])
&& temps[op->args[1]].val == 0) { && arg_info(s, op->args[1])->val == 0) {
op->opc = neg_op; op->opc = neg_op;
reset_temp(s, op->args[0]); reset_temp(s, op->args[0]);
op->args[1] = op->args[2]; op->args[1] = op->args[2];
@ -717,34 +755,34 @@ void tcg_optimize(TCGContext *s)
break; break;
CASE_OP_32_64(xor): CASE_OP_32_64(xor):
CASE_OP_32_64(nand): CASE_OP_32_64(nand):
if (!temp_is_const(s, op->args[1]) if (!arg_is_const(s, op->args[1])
&& temp_is_const(s, op->args[2]) && arg_is_const(s, op->args[2])
&& temps[op->args[2]].val == -1) { && arg_info(s, op->args[2])->val == -1) {
i = 1; i = 1;
goto try_not; goto try_not;
} }
break; break;
CASE_OP_32_64(nor): CASE_OP_32_64(nor):
if (!temp_is_const(s, op->args[1]) if (!arg_is_const(s, op->args[1])
&& temp_is_const(s, op->args[2]) && arg_is_const(s, op->args[2])
&& temps[op->args[2]].val == 0) { && arg_info(s, op->args[2])->val == 0) {
i = 1; i = 1;
goto try_not; goto try_not;
} }
break; break;
CASE_OP_32_64(andc): CASE_OP_32_64(andc):
if (!temp_is_const(s, op->args[2]) if (!arg_is_const(s, op->args[2])
&& temp_is_const(s, op->args[1]) && arg_is_const(s, op->args[1])
&& temps[op->args[1]].val == -1) { && arg_info(s, op->args[1])->val == -1) {
i = 2; i = 2;
goto try_not; goto try_not;
} }
break; break;
CASE_OP_32_64(orc): CASE_OP_32_64(orc):
CASE_OP_32_64(eqv): CASE_OP_32_64(eqv):
if (!temp_is_const(s, op->args[2]) if (!arg_is_const(s, op->args[2])
&& temp_is_const(s, op->args[1]) && arg_is_const(s, op->args[1])
&& temps[op->args[1]].val == 0) { && arg_info(s, op->args[1])->val == 0) {
i = 2; i = 2;
goto try_not; goto try_not;
} }
@ -785,9 +823,9 @@ void tcg_optimize(TCGContext *s)
CASE_OP_32_64(or): CASE_OP_32_64(or):
CASE_OP_32_64(xor): CASE_OP_32_64(xor):
CASE_OP_32_64(andc): CASE_OP_32_64(andc):
if (!temp_is_const(s, op->args[1]) if (!arg_is_const(s, op->args[1])
&& temp_is_const(s, op->args[2]) && arg_is_const(s, op->args[2])
&& temps[op->args[2]].val == 0) { && arg_info(s, op->args[2])->val == 0) {
tcg_opt_gen_mov(s, op, op->args[0], op->args[1]); tcg_opt_gen_mov(s, op, op->args[0], op->args[1]);
continue; continue;
} }
@ -795,9 +833,9 @@ void tcg_optimize(TCGContext *s)
CASE_OP_32_64(and): CASE_OP_32_64(and):
CASE_OP_32_64(orc): CASE_OP_32_64(orc):
CASE_OP_32_64(eqv): CASE_OP_32_64(eqv):
if (!temp_is_const(s, op->args[1]) if (!arg_is_const(s, op->args[1])
&& temp_is_const(s, op->args[2]) && arg_is_const(s, op->args[2])
&& temps[op->args[2]].val == -1) { && arg_info(s, op->args[2])->val == -1) {
tcg_opt_gen_mov(s, op, op->args[0], op->args[1]); tcg_opt_gen_mov(s, op, op->args[0], op->args[1]);
continue; continue;
} }
@ -812,21 +850,21 @@ void tcg_optimize(TCGContext *s)
affected = -1; affected = -1;
switch (opc) { switch (opc) {
CASE_OP_32_64(ext8s): CASE_OP_32_64(ext8s):
if ((temps[op->args[1]].mask & 0x80) != 0) { if ((arg_info(s, op->args[1])->mask & 0x80) != 0) {
break; break;
} }
CASE_OP_32_64(ext8u): CASE_OP_32_64(ext8u):
mask = 0xff; mask = 0xff;
goto and_const; goto and_const;
CASE_OP_32_64(ext16s): CASE_OP_32_64(ext16s):
if ((temps[op->args[1]].mask & 0x8000) != 0) { if ((arg_info(s, op->args[1])->mask & 0x8000) != 0) {
break; break;
} }
CASE_OP_32_64(ext16u): CASE_OP_32_64(ext16u):
mask = 0xffff; mask = 0xffff;
goto and_const; goto and_const;
case INDEX_op_ext32s_i64: case INDEX_op_ext32s_i64:
if ((temps[op->args[1]].mask & 0x80000000) != 0) { if ((arg_info(s, op->args[1])->mask & 0x80000000) != 0) {
break; break;
} }
case INDEX_op_ext32u_i64: case INDEX_op_ext32u_i64:
@ -834,111 +872,114 @@ void tcg_optimize(TCGContext *s)
goto and_const; goto and_const;
CASE_OP_32_64(and): CASE_OP_32_64(and):
mask = temps[op->args[2]].mask; mask = arg_info(s, op->args[2])->mask;
if (temp_is_const(s, op->args[2])) { if (arg_is_const(s, op->args[2])) {
and_const: and_const:
affected = temps[op->args[1]].mask & ~mask; affected = arg_info(s, op->args[1])->mask & ~mask;
} }
mask = temps[op->args[1]].mask & mask; mask = arg_info(s, op->args[1])->mask & mask;
break; break;
case INDEX_op_ext_i32_i64: case INDEX_op_ext_i32_i64:
if ((temps[op->args[1]].mask & 0x80000000) != 0) { if ((arg_info(s, op->args[1])->mask & 0x80000000) != 0) {
break; break;
} }
case INDEX_op_extu_i32_i64: case INDEX_op_extu_i32_i64:
/* We do not compute affected as it is a size changing op. */ /* We do not compute affected as it is a size changing op. */
mask = (uint32_t)temps[op->args[1]].mask; mask = (uint32_t)arg_info(s, op->args[1])->mask;
break; break;
CASE_OP_32_64(andc): CASE_OP_32_64(andc):
/* Known-zeros does not imply known-ones. Therefore unless /* Known-zeros does not imply known-ones. Therefore unless
args[2] is constant, we can't infer anything from it. */ args[2] is constant, we can't infer anything from it. */
if (temp_is_const(s, op->args[2])) { if (arg_is_const(s, op->args[2])) {
mask = ~temps[op->args[2]].mask; mask = ~arg_info(s, op->args[2])->mask;
goto and_const; goto and_const;
} }
/* But we certainly know nothing outside args[1] may be set. */ /* But we certainly know nothing outside args[1] may be set. */
mask = temps[op->args[1]].mask; mask = arg_info(s, op->args[1])->mask;
break; break;
case INDEX_op_sar_i32: case INDEX_op_sar_i32:
if (temp_is_const(s, op->args[2])) { if (arg_is_const(s, op->args[2])) {
tmp = temps[op->args[2]].val & 31; tmp = arg_info(s, op->args[2])->val & 31;
mask = (int32_t)temps[op->args[1]].mask >> tmp; mask = (int32_t)arg_info(s, op->args[1])->mask >> tmp;
} }
break; break;
case INDEX_op_sar_i64: case INDEX_op_sar_i64:
if (temp_is_const(s, op->args[2])) { if (arg_is_const(s, op->args[2])) {
tmp = temps[op->args[2]].val & 63; tmp = arg_info(s, op->args[2])->val & 63;
mask = (int64_t)temps[op->args[1]].mask >> tmp; mask = (int64_t)arg_info(s, op->args[1])->mask >> tmp;
} }
break; break;
case INDEX_op_shr_i32: case INDEX_op_shr_i32:
if (temp_is_const(s, op->args[2])) { if (arg_is_const(s, op->args[2])) {
tmp = temps[op->args[2]].val & 31; tmp = arg_info(s, op->args[2])->val & 31;
mask = (uint32_t)temps[op->args[1]].mask >> tmp; mask = (uint32_t)arg_info(s, op->args[1])->mask >> tmp;
} }
break; break;
case INDEX_op_shr_i64: case INDEX_op_shr_i64:
if (temp_is_const(s, op->args[2])) { if (arg_is_const(s, op->args[2])) {
tmp = temps[op->args[2]].val & 63; tmp = arg_info(s, op->args[2])->val & 63;
mask = (uint64_t)temps[op->args[1]].mask >> tmp; mask = (uint64_t)arg_info(s, op->args[1])->mask >> tmp;
} }
break; break;
case INDEX_op_extrl_i64_i32: case INDEX_op_extrl_i64_i32:
mask = (uint32_t)temps[op->args[1]].mask; mask = (uint32_t)arg_info(s, op->args[1])->mask;
break; break;
case INDEX_op_extrh_i64_i32: case INDEX_op_extrh_i64_i32:
mask = (uint64_t)temps[op->args[1]].mask >> 32; mask = (uint64_t)arg_info(s, op->args[1])->mask >> 32;
break; break;
CASE_OP_32_64(shl): CASE_OP_32_64(shl):
if (temp_is_const(s, op->args[2])) { if (arg_is_const(s, op->args[2])) {
tmp = temps[op->args[2]].val & (TCG_TARGET_REG_BITS - 1); tmp = arg_info(s, op->args[2])->val & (TCG_TARGET_REG_BITS - 1);
mask = temps[op->args[1]].mask << tmp; mask = arg_info(s, op->args[1])->mask << tmp;
} }
break; break;
CASE_OP_32_64(neg): CASE_OP_32_64(neg):
/* Set to 1 all bits to the left of the rightmost. */ /* Set to 1 all bits to the left of the rightmost. */
mask = 0-(temps[op->args[1]].mask & (0-temps[op->args[1]].mask)); mask = -(arg_info(s, op->args[1])->mask
& -arg_info(s, op->args[1])->mask);
break; break;
CASE_OP_32_64(deposit): CASE_OP_32_64(deposit):
mask = deposit64(temps[op->args[1]].mask, op->args[3], mask = deposit64(arg_info(s, op->args[1])->mask,
op->args[4], temps[op->args[2]].mask); op->args[3], op->args[4],
arg_info(s, op->args[2])->mask);
break; break;
CASE_OP_32_64(extract): CASE_OP_32_64(extract):
mask = extract64(temps[op->args[1]].mask, op->args[2], op->args[3]); mask = extract64(arg_info(s, op->args[1])->mask,
op->args[2], op->args[3]);
if (op->args[2] == 0) { if (op->args[2] == 0) {
affected = temps[op->args[1]].mask & ~mask; affected = arg_info(s, op->args[1])->mask & ~mask;
} }
break; break;
CASE_OP_32_64(sextract): CASE_OP_32_64(sextract):
mask = sextract64(temps[op->args[1]].mask, mask = sextract64(arg_info(s, op->args[1])->mask,
op->args[2], op->args[3]); op->args[2], op->args[3]);
if (op->args[2] == 0 && (tcg_target_long)mask >= 0) { if (op->args[2] == 0 && (tcg_target_long)mask >= 0) {
affected = temps[op->args[1]].mask & ~mask; affected = arg_info(s, op->args[1])->mask & ~mask;
} }
break; break;
CASE_OP_32_64(or): CASE_OP_32_64(or):
CASE_OP_32_64(xor): CASE_OP_32_64(xor):
mask = temps[op->args[1]].mask | temps[op->args[2]].mask; mask = arg_info(s, op->args[1])->mask | arg_info(s, op->args[2])->mask;
break; break;
case INDEX_op_clz_i32: case INDEX_op_clz_i32:
case INDEX_op_ctz_i32: case INDEX_op_ctz_i32:
mask = temps[op->args[2]].mask | 31; mask = arg_info(s, op->args[2])->mask | 31;
break; break;
case INDEX_op_clz_i64: case INDEX_op_clz_i64:
case INDEX_op_ctz_i64: case INDEX_op_ctz_i64:
mask = temps[op->args[2]].mask | 63; mask = arg_info(s, op->args[2])->mask | 63;
break; break;
case INDEX_op_ctpop_i32: case INDEX_op_ctpop_i32:
@ -954,7 +995,7 @@ void tcg_optimize(TCGContext *s)
break; break;
CASE_OP_32_64(movcond): CASE_OP_32_64(movcond):
mask = temps[op->args[3]].mask | temps[op->args[4]].mask; mask = arg_info(s, op->args[3])->mask | arg_info(s, op->args[4])->mask;
break; break;
CASE_OP_32_64(ld8u): CASE_OP_32_64(ld8u):
@ -1008,7 +1049,8 @@ void tcg_optimize(TCGContext *s)
CASE_OP_32_64(mul): CASE_OP_32_64(mul):
CASE_OP_32_64(muluh): CASE_OP_32_64(muluh):
CASE_OP_32_64(mulsh): CASE_OP_32_64(mulsh):
if ((temp_is_const(s, op->args[2]) && temps[op->args[2]].val == 0)) { if (arg_is_const(s, op->args[2])
&& arg_info(s, op->args[2])->val == 0) {
tcg_opt_gen_movi(s, op, op->args[0], 0); tcg_opt_gen_movi(s, op, op->args[0], 0);
continue; continue;
} }
@ -1021,7 +1063,7 @@ void tcg_optimize(TCGContext *s)
switch (opc) { switch (opc) {
CASE_OP_32_64(or): CASE_OP_32_64(or):
CASE_OP_32_64(and): CASE_OP_32_64(and):
if (temps_are_copies(s, op->args[1], op->args[2])) { if (args_are_copies(s, op->args[1], op->args[2])) {
tcg_opt_gen_mov(s, op, op->args[0], op->args[1]); tcg_opt_gen_mov(s, op, op->args[0], op->args[1]);
continue; continue;
} }
@ -1035,7 +1077,7 @@ void tcg_optimize(TCGContext *s)
CASE_OP_32_64(andc): CASE_OP_32_64(andc):
CASE_OP_32_64(sub): CASE_OP_32_64(sub):
CASE_OP_32_64(xor): CASE_OP_32_64(xor):
if (temps_are_copies(s, op->args[1], op->args[2])) { if (args_are_copies(s, op->args[1], op->args[2])) {
tcg_opt_gen_movi(s, op, op->args[0], 0); tcg_opt_gen_movi(s, op, op->args[0], 0);
continue; continue;
} }
@ -1068,8 +1110,8 @@ void tcg_optimize(TCGContext *s)
case INDEX_op_extu_i32_i64: case INDEX_op_extu_i32_i64:
case INDEX_op_extrl_i64_i32: case INDEX_op_extrl_i64_i32:
case INDEX_op_extrh_i64_i32: case INDEX_op_extrh_i64_i32:
if (temp_is_const(s, op->args[1])) { if (arg_is_const(s, op->args[1])) {
tmp = do_constant_folding(s, opc, temps[op->args[1]].val, 0); tmp = do_constant_folding(s, opc, arg_info(s, op->args[1])->val, 0);
tcg_opt_gen_movi(s, op, op->args[0], tmp); tcg_opt_gen_movi(s, op, op->args[0], tmp);
break; break;
} }
@ -1097,9 +1139,9 @@ void tcg_optimize(TCGContext *s)
CASE_OP_32_64(divu): CASE_OP_32_64(divu):
CASE_OP_32_64(rem): CASE_OP_32_64(rem):
CASE_OP_32_64(remu): CASE_OP_32_64(remu):
if (temp_is_const(s, op->args[1]) && temp_is_const(s, op->args[2])) { if (arg_is_const(s, op->args[1]) && arg_is_const(s, op->args[2])) {
tmp = do_constant_folding(s, opc, temps[op->args[1]].val, tmp = do_constant_folding(s, opc, arg_info(s, op->args[1])->val,
temps[op->args[2]].val); arg_info(s, op->args[2])->val);
tcg_opt_gen_movi(s, op, op->args[0], tmp); tcg_opt_gen_movi(s, op, op->args[0], tmp);
break; break;
} }
@ -1107,8 +1149,8 @@ void tcg_optimize(TCGContext *s)
CASE_OP_32_64(clz): CASE_OP_32_64(clz):
CASE_OP_32_64(ctz): CASE_OP_32_64(ctz):
if (temp_is_const(s, op->args[1])) { if (arg_is_const(s, op->args[1])) {
TCGArg v = temps[op->args[1]].val; TCGArg v = arg_info(s, op->args[1])->val;
if (v != 0) { if (v != 0) {
tmp = do_constant_folding(s, opc, v, 0); tmp = do_constant_folding(s, opc, v, 0);
tcg_opt_gen_movi(s, op, op->args[0], tmp); tcg_opt_gen_movi(s, op, op->args[0], tmp);
@ -1120,17 +1162,18 @@ void tcg_optimize(TCGContext *s)
goto do_default; goto do_default;
CASE_OP_32_64(deposit): CASE_OP_32_64(deposit):
if (temp_is_const(s, op->args[1]) && temp_is_const(s, op->args[2])) { if (arg_is_const(s, op->args[1]) && arg_is_const(s, op->args[2])) {
tmp = deposit64(temps[op->args[1]].val, op->args[3], tmp = deposit64(arg_info(s, op->args[1])->val,
op->args[4], temps[op->args[2]].val); op->args[3], op->args[4],
arg_info(s, op->args[2])->val);
tcg_opt_gen_movi(s, op, op->args[0], tmp); tcg_opt_gen_movi(s, op, op->args[0], tmp);
break; break;
} }
goto do_default; goto do_default;
CASE_OP_32_64(extract): CASE_OP_32_64(extract):
if (temp_is_const(s, op->args[1])) { if (arg_is_const(s, op->args[1])) {
tmp = extract64(temps[op->args[1]].val, tmp = extract64(arg_info(s, op->args[1])->val,
op->args[2], op->args[3]); op->args[2], op->args[3]);
tcg_opt_gen_movi(s, op, op->args[0], tmp); tcg_opt_gen_movi(s, op, op->args[0], tmp);
break; break;
@ -1138,8 +1181,8 @@ void tcg_optimize(TCGContext *s)
goto do_default; goto do_default;
CASE_OP_32_64(sextract): CASE_OP_32_64(sextract):
if (temp_is_const(s, op->args[1])) { if (arg_is_const(s, op->args[1])) {
tmp = sextract64(temps[op->args[1]].val, tmp = sextract64(arg_info(s, op->args[1])->val,
op->args[2], op->args[3]); op->args[2], op->args[3]);
tcg_opt_gen_movi(s, op, op->args[0], tmp); tcg_opt_gen_movi(s, op, op->args[0], tmp);
break; break;
@ -1177,9 +1220,9 @@ void tcg_optimize(TCGContext *s)
tcg_opt_gen_mov(s, op, op->args[0], op->args[4-tmp]); tcg_opt_gen_mov(s, op, op->args[0], op->args[4-tmp]);
break; break;
} }
if (temp_is_const(s, op->args[3]) && temp_is_const(s, op->args[4])) { if (arg_is_const(s, op->args[3]) && arg_is_const(s, op->args[4])) {
tcg_target_ulong tv = temps[op->args[3]].val; tcg_target_ulong tv = arg_info(s, op->args[3])->val;
tcg_target_ulong fv = temps[op->args[4]].val; tcg_target_ulong fv = arg_info(s, op->args[4])->val;
TCGCond cond = op->args[5]; TCGCond cond = op->args[5];
if (fv == 1 && tv == 0) { if (fv == 1 && tv == 0) {
cond = tcg_invert_cond(cond); cond = tcg_invert_cond(cond);
@ -1196,12 +1239,12 @@ void tcg_optimize(TCGContext *s)
case INDEX_op_add2_i32: case INDEX_op_add2_i32:
case INDEX_op_sub2_i32: case INDEX_op_sub2_i32:
if (temp_is_const(s, op->args[2]) && temp_is_const(s, op->args[3]) if (arg_is_const(s, op->args[2]) && arg_is_const(s, op->args[3])
&& temp_is_const(s, op->args[4]) && temp_is_const(s, op->args[5])) { && arg_is_const(s, op->args[4]) && arg_is_const(s, op->args[5])) {
uint32_t al = temps[op->args[2]].val; uint32_t al = arg_info(s, op->args[2])->val;
uint32_t ah = temps[op->args[3]].val; uint32_t ah = arg_info(s, op->args[3])->val;
uint32_t bl = temps[op->args[4]].val; uint32_t bl = arg_info(s, op->args[4])->val;
uint32_t bh = temps[op->args[5]].val; uint32_t bh = arg_info(s, op->args[5])->val;
uint64_t a = ((uint64_t)ah << 32) | al; uint64_t a = ((uint64_t)ah << 32) | al;
uint64_t b = ((uint64_t)bh << 32) | bl; uint64_t b = ((uint64_t)bh << 32) | bl;
TCGArg rl, rh; TCGArg rl, rh;
@ -1225,9 +1268,9 @@ void tcg_optimize(TCGContext *s)
goto do_default; goto do_default;
case INDEX_op_mulu2_i32: case INDEX_op_mulu2_i32:
if (temp_is_const(s, op->args[2]) && temp_is_const(s, op->args[3])) { if (arg_is_const(s, op->args[2]) && arg_is_const(s, op->args[3])) {
uint32_t a = temps[op->args[2]].val; uint32_t a = arg_info(s, op->args[2])->val;
uint32_t b = temps[op->args[3]].val; uint32_t b = arg_info(s, op->args[3])->val;
uint64_t r = (uint64_t)a * b; uint64_t r = (uint64_t)a * b;
TCGArg rl, rh; TCGArg rl, rh;
TCGOp *op2 = tcg_op_insert_before(s, op, INDEX_op_movi_i32, 2); TCGOp *op2 = tcg_op_insert_before(s, op, INDEX_op_movi_i32, 2);
@ -1258,10 +1301,10 @@ void tcg_optimize(TCGContext *s)
} }
} else if ((op->args[4] == TCG_COND_LT } else if ((op->args[4] == TCG_COND_LT
|| op->args[4] == TCG_COND_GE) || op->args[4] == TCG_COND_GE)
&& temp_is_const(s, op->args[2]) && arg_is_const(s, op->args[2])
&& temps[op->args[2]].val == 0 && arg_info(s, op->args[2])->val == 0
&& temp_is_const(s, op->args[3]) && arg_is_const(s, op->args[3])
&& temps[op->args[3]].val == 0) { && arg_info(s, op->args[3])->val == 0) {
/* Simplify LT/GE comparisons vs zero to a single compare /* Simplify LT/GE comparisons vs zero to a single compare
vs the high word of the input. */ vs the high word of the input. */
do_brcond_high: do_brcond_high:
@ -1329,15 +1372,15 @@ void tcg_optimize(TCGContext *s)
tcg_opt_gen_movi(s, op, op->args[0], tmp); tcg_opt_gen_movi(s, op, op->args[0], tmp);
} else if ((op->args[5] == TCG_COND_LT } else if ((op->args[5] == TCG_COND_LT
|| op->args[5] == TCG_COND_GE) || op->args[5] == TCG_COND_GE)
&& temp_is_const(s, op->args[3]) && arg_is_const(s, op->args[3])
&& temps[op->args[3]].val == 0 && arg_info(s, op->args[3])->val == 0
&& temp_is_const(s, op->args[4]) && arg_is_const(s, op->args[4])
&& temps[op->args[4]].val == 0) { && arg_info(s, op->args[4])->val == 0) {
/* Simplify LT/GE comparisons vs zero to a single compare /* Simplify LT/GE comparisons vs zero to a single compare
vs the high word of the input. */ vs the high word of the input. */
do_setcond_high: do_setcond_high:
reset_temp(s, op->args[0]); reset_temp(s, op->args[0]);
temps[op->args[0]].mask = 1; arg_info(s, op->args[0])->mask = 1;
op->opc = INDEX_op_setcond_i32; op->opc = INDEX_op_setcond_i32;
op->args[1] = op->args[2]; op->args[1] = op->args[2];
op->args[2] = op->args[4]; op->args[2] = op->args[4];
@ -1363,7 +1406,7 @@ void tcg_optimize(TCGContext *s)
} }
do_setcond_low: do_setcond_low:
reset_temp(s, op->args[0]); reset_temp(s, op->args[0]);
temps[op->args[0]].mask = 1; arg_info(s, op->args[0])->mask = 1;
op->opc = INDEX_op_setcond_i32; op->opc = INDEX_op_setcond_i32;
op->args[2] = op->args[3]; op->args[2] = op->args[3];
op->args[3] = op->args[5]; op->args[3] = op->args[5];
@ -1397,7 +1440,7 @@ void tcg_optimize(TCGContext *s)
& (TCG_CALL_NO_READ_GLOBALS | TCG_CALL_NO_WRITE_GLOBALS))) { & (TCG_CALL_NO_READ_GLOBALS | TCG_CALL_NO_WRITE_GLOBALS))) {
for (i = 0; i < nb_globals; i++) { for (i = 0; i < nb_globals; i++) {
if (test_bit(i, s->temps2_used.l)) { if (test_bit(i, s->temps2_used.l)) {
reset_temp(s, i); reset_ts(&s->temps[i]);
} }
} }
} }
@ -1419,7 +1462,7 @@ void tcg_optimize(TCGContext *s)
/* Save the corresponding known-zero bits mask for the /* Save the corresponding known-zero bits mask for the
first output argument (only one supported so far). */ first output argument (only one supported so far). */
if (i == 0) { if (i == 0) {
temps[op->args[i]].mask = mask; arg_info(s, op->args[i])->mask = mask;
} }
} }
} }

View file

@ -765,8 +765,8 @@ typedef struct TCGOpDef {
struct tcg_temp_info { struct tcg_temp_info {
bool is_const; bool is_const;
uint16_t prev_copy; TCGTemp *prev_copy;
uint16_t next_copy; TCGTemp *next_copy;
tcg_target_ulong val; tcg_target_ulong val;
tcg_target_ulong mask; tcg_target_ulong mask;
}; };
@ -1009,6 +1009,11 @@ static inline TCGTemp *arg_temp(TCGContext *tcg_ctx, TCGArg a)
return a == TCG_CALL_DUMMY_ARG ? NULL : &tcg_ctx->temps[a]; return a == TCG_CALL_DUMMY_ARG ? NULL : &tcg_ctx->temps[a];
} }
static inline size_t arg_index(TCGArg a)
{
return a;
}
static inline void tcg_set_insn_param(TCGContext *tcg_ctx, int op_idx, int arg, TCGArg v) static inline void tcg_set_insn_param(TCGContext *tcg_ctx, int op_idx, int arg, TCGArg v)
{ {
tcg_ctx->gen_op_buf[op_idx].args[arg] = v; tcg_ctx->gen_op_buf[op_idx].args[arg] = v;