tcg: Optimize spills of constants

While we can store constants via constraints on INDEX_op_st_i32 et al,
we weren't able to spill constants to backing store.

Add a new backend interface, tcg_out_sti, which may store the constant
(and is allowed to fail). Rearrange the temp_* helpers so that we only
attempt to directly store a constant when the temp is becoming dead/free.

Backports commit 59d7c14eeff8d2ad7f61aed86ce5a176113bc153 from qemu
This commit is contained in:
Richard Henderson 2018-02-25 01:41:28 -05:00 committed by Lioncash
parent 64fda683b1
commit 23586e2674
No known key found for this signature in database
GPG key ID: 4E3C3CC1031BA9C7
8 changed files with 152 additions and 82 deletions

View file

@ -720,6 +720,16 @@ static inline void tcg_out_st(TCGContext *s, TCGType type, TCGReg arg,
arg, arg1, arg2); arg, arg1, arg2);
} }
/* Try to store the constant 'val' of type 'type' to the memory location
   described by 'base' and 'ofs' without first placing it in an
   allocated register.  Only zero is handled, by storing TCG_REG_XZR
   (presumably the always-zero register) through tcg_out_st.
   Returns true if the store was emitted; returns false, having emitted
   nothing, for any other value.  */
static inline bool tcg_out_sti(TCGContext *s, TCGType type, TCGArg val,
                               TCGReg base, intptr_t ofs)
{
    /* Any non-zero constant is declined. */
    if (val != 0) {
        return false;
    }

    tcg_out_st(s, type, TCG_REG_XZR, base, ofs);
    return true;
}
static inline void tcg_out_bfm(TCGContext *s, TCGType ext, TCGReg rd, static inline void tcg_out_bfm(TCGContext *s, TCGType ext, TCGReg rd,
TCGReg rn, unsigned int a, unsigned int b) TCGReg rn, unsigned int a, unsigned int b)
{ {

View file

@ -2046,6 +2046,12 @@ static inline void tcg_out_st(TCGContext *s, TCGType type, TCGReg arg,
tcg_out_st32(s, COND_AL, arg, arg1, arg2); tcg_out_st32(s, COND_AL, arg, arg1, arg2);
} }
/* Backend hook for storing the constant 'val' directly to the memory
   location described by 'base' and 'ofs'.  This implementation never
   does so: it emits nothing and always returns false.  */
static inline bool tcg_out_sti(TCGContext *s, TCGType type, TCGArg val,
TCGReg base, intptr_t ofs)
{
return false;
}
static inline void tcg_out_mov(TCGContext *s, TCGType type, static inline void tcg_out_mov(TCGContext *s, TCGType type,
TCGReg ret, TCGReg arg) TCGReg ret, TCGReg arg)
{ {

View file

@ -736,12 +736,19 @@ static inline void tcg_out_st(TCGContext *s, TCGType type, TCGReg arg,
tcg_out_modrm_offset(s, opc, arg, arg1, arg2); tcg_out_modrm_offset(s, opc, arg, arg1, arg2);
} }
static inline void tcg_out_sti(TCGContext *s, TCGType type, TCGReg base, static bool tcg_out_sti(TCGContext *s, TCGType type, TCGArg val,
tcg_target_long ofs, tcg_target_long val) TCGReg base, intptr_t ofs)
{ {
int opc = OPC_MOVL_EvIz + (type == TCG_TYPE_I64 ? P_REXW : 0); int rexw = 0;
tcg_out_modrm_offset(s, opc, 0, base, ofs); if (TCG_TARGET_REG_BITS == 64 && type == TCG_TYPE_I64) {
if (val != (int32_t)val) {
return false;
}
rexw = P_REXW;
}
tcg_out_modrm_offset(s, OPC_MOVL_EvIz | rexw, 0, base, ofs);
tcg_out32(s, val); tcg_out32(s, val);
return true;
} }
static void tcg_out_shifti(TCGContext *s, int subopc, int reg, int count) static void tcg_out_shifti(TCGContext *s, int subopc, int reg, int count)
@ -1423,10 +1430,10 @@ static void tcg_out_qemu_ld_slow_path(TCGContext *s, TCGLabelQemuLdst *l)
ofs += 4; ofs += 4;
} }
tcg_out_sti(s, TCG_TYPE_I32, TCG_REG_ESP, ofs, oi); tcg_out_sti(s, TCG_TYPE_I32, oi, TCG_REG_ESP, ofs);
ofs += 4; ofs += 4;
tcg_out_sti(s, TCG_TYPE_I32, TCG_REG_ESP, ofs, (uintptr_t)l->raddr); tcg_out_sti(s, TCG_TYPE_PTR, (uintptr_t)l->raddr, TCG_REG_ESP, ofs);
} else { } else {
tcg_out_mov(s, TCG_TYPE_PTR, tcg_target_call_iarg_regs[0], TCG_AREG0); tcg_out_mov(s, TCG_TYPE_PTR, tcg_target_call_iarg_regs[0], TCG_AREG0);
/* The second argument is already loaded with addrlo. */ /* The second argument is already loaded with addrlo. */
@ -1515,7 +1522,7 @@ static void tcg_out_qemu_st_slow_path(TCGContext *s, TCGLabelQemuLdst *l)
ofs += 4; ofs += 4;
} }
tcg_out_sti(s, TCG_TYPE_I32, TCG_REG_ESP, ofs, oi); tcg_out_sti(s, TCG_TYPE_I32, oi, TCG_REG_ESP, ofs);
ofs += 4; ofs += 4;
retaddr = TCG_REG_EAX; retaddr = TCG_REG_EAX;

View file

@ -576,6 +576,16 @@ static inline void tcg_out_st(TCGContext *s, TCGType type, TCGReg arg,
tcg_out_ldst(s, OPC_SW, arg, arg1, arg2); tcg_out_ldst(s, OPC_SW, arg, arg1, arg2);
} }
/* Try to store the constant 'val' of type 'type' to the memory location
   described by 'base' and 'ofs' without first placing it in an
   allocated register.  Only zero is handled, by storing TCG_REG_ZERO
   (presumably the always-zero register) through tcg_out_st.
   Returns true if the store was emitted; returns false, having emitted
   nothing, for any other value.  */
static inline bool tcg_out_sti(TCGContext *s, TCGType type, TCGArg val,
                               TCGReg base, intptr_t ofs)
{
    /* Any non-zero constant is declined. */
    if (val != 0) {
        return false;
    }

    tcg_out_st(s, type, TCG_REG_ZERO, base, ofs);
    return true;
}
static inline void tcg_out_addi(TCGContext *s, TCGReg reg, TCGArg val) static inline void tcg_out_addi(TCGContext *s, TCGReg reg, TCGArg val)
{ {
if (val == (int16_t)val) { if (val == (int16_t)val) {

View file

@ -863,6 +863,12 @@ static inline void tcg_out_st(TCGContext *s, TCGType type, TCGReg arg,
tcg_out_mem_long(s, opi, opx, arg, arg1, arg2); tcg_out_mem_long(s, opi, opx, arg, arg1, arg2);
} }
/* Backend hook for storing the constant 'val' directly to the memory
   location described by 'base' and 'ofs'.  This implementation never
   does so: it emits nothing and always returns false.  */
static inline bool tcg_out_sti(TCGContext *s, TCGType type, TCGArg val,
TCGReg base, intptr_t ofs)
{
return false;
}
static void tcg_out_cmp(TCGContext *s, int cond, TCGArg arg1, TCGArg arg2, static void tcg_out_cmp(TCGContext *s, int cond, TCGArg arg1, TCGArg arg2,
int const_arg2, int cr, TCGType type) int const_arg2, int cr, TCGType type)
{ {

View file

@ -803,6 +803,12 @@ static inline void tcg_out_st(TCGContext *s, TCGType type, TCGReg data,
} }
} }
/* Backend hook for storing the constant 'val' directly to the memory
   location described by 'base' and 'ofs'.  This implementation never
   does so: it emits nothing and always returns false.  */
static inline bool tcg_out_sti(TCGContext *s, TCGType type, TCGArg val,
TCGReg base, intptr_t ofs)
{
return false;
}
/* load data from an absolute host address */ /* load data from an absolute host address */
static void tcg_out_ld_abs(TCGContext *s, TCGType type, TCGReg dest, void *abs) static void tcg_out_ld_abs(TCGContext *s, TCGType type, TCGReg dest, void *abs)
{ {

View file

@ -506,6 +506,16 @@ static inline void tcg_out_st(TCGContext *s, TCGType type, TCGReg arg,
tcg_out_ldst(s, arg, arg1, arg2, (type == TCG_TYPE_I32 ? STW : STX)); tcg_out_ldst(s, arg, arg1, arg2, (type == TCG_TYPE_I32 ? STW : STX));
} }
/* Try to store the constant 'val' of type 'type' to the memory location
   described by 'base' and 'ofs' without first placing it in an
   allocated register.  Only zero is handled, by storing TCG_REG_G0
   (presumably the always-zero register) through tcg_out_st.
   Returns true if the store was emitted; returns false, having emitted
   nothing, for any other value.  */
static inline bool tcg_out_sti(TCGContext *s, TCGType type, TCGArg val,
                               TCGReg base, intptr_t ofs)
{
    /* Any non-zero constant is declined. */
    if (val != 0) {
        return false;
    }

    tcg_out_st(s, type, TCG_REG_G0, base, ofs);
    return true;
}
static void tcg_out_ld_ptr(TCGContext *s, TCGReg ret, uintptr_t arg) static void tcg_out_ld_ptr(TCGContext *s, TCGReg ret, uintptr_t arg)
{ {
tcg_out_movi(s, TCG_TYPE_PTR, ret, arg & ~0x3ff); tcg_out_movi(s, TCG_TYPE_PTR, ret, arg & ~0x3ff);

View file

@ -104,6 +104,8 @@ static void tcg_out_op(TCGContext *s, TCGOpcode opc, const TCGArg *args,
const int *const_args); const int *const_args);
static void tcg_out_st(TCGContext *s, TCGType type, TCGReg arg, TCGReg arg1, static void tcg_out_st(TCGContext *s, TCGType type, TCGReg arg, TCGReg arg1,
intptr_t arg2); intptr_t arg2);
static bool tcg_out_sti(TCGContext *s, TCGType type, TCGArg val,
TCGReg base, intptr_t ofs);
static void tcg_out_call(TCGContext *s, tcg_insn_unit *target); static void tcg_out_call(TCGContext *s, tcg_insn_unit *target);
static int tcg_target_const_match(tcg_target_long val, TCGType type, static int tcg_target_const_match(tcg_target_long val, TCGType type,
const TCGArgConstraint *arg_ct); const TCGArgConstraint *arg_ct);
@ -1746,35 +1748,89 @@ static void temp_allocate_frame(TCGContext *s, int temp)
static void temp_load(TCGContext *, TCGTemp *, TCGRegSet, TCGRegSet); static void temp_load(TCGContext *, TCGTemp *, TCGRegSet, TCGRegSet);
/* sync register 'reg' by saving it to the corresponding temporary */ /* Mark a temporary as free or dead. If 'free_or_dead' is negative,
static void tcg_reg_sync(TCGContext *s, TCGReg reg, TCGRegSet allocated_regs) mark it free; otherwise mark it dead. */
static void temp_free_or_dead(TCGContext *s, TCGTemp *ts, int free_or_dead)
{ {
TCGTemp *ts = s->reg_to_temp[reg]; if (ts->fixed_reg) {
return;
}
if (ts->val_type == TEMP_VAL_REG) {
s->reg_to_temp[ts->reg] = NULL;
}
ts->val_type = (free_or_dead < 0
|| ts->temp_local
|| temp_idx(s, ts) < s->nb_globals
? TEMP_VAL_MEM : TEMP_VAL_DEAD);
}
tcg_debug_assert(ts->val_type == TEMP_VAL_REG); /* Mark a temporary as dead. */
if (!ts->mem_coherent && !ts->fixed_reg) { static inline void temp_dead(TCGContext *s, TCGTemp *ts)
{
temp_free_or_dead(s, ts, 1);
}
/* Sync a temporary to memory. 'allocated_regs' is used in case a temporary
register needs to be allocated to store a constant. If 'free_or_dead'
is non-zero, subsequently release the temporary; if it is positive, the
temp is dead; if it is negative, the temp is free. */
static void temp_sync(TCGContext *s, TCGTemp *ts,
TCGRegSet allocated_regs, int free_or_dead)
{
if (ts->fixed_reg) {
return;
}
if (!ts->mem_coherent) {
if (!ts->mem_allocated) { if (!ts->mem_allocated) {
temp_allocate_frame(s, temp_idx(s, ts)); temp_allocate_frame(s, temp_idx(s, ts));
} else if (ts->indirect_reg) { }
tcg_regset_set_reg(allocated_regs, ts->reg); if (ts->indirect_reg) {
if (ts->val_type == TEMP_VAL_REG) {
tcg_regset_set_reg(allocated_regs, ts->reg);
}
temp_load(s, ts->mem_base, temp_load(s, ts->mem_base,
s->tcg_target_available_regs[TCG_TYPE_PTR], s->tcg_target_available_regs[TCG_TYPE_PTR],
allocated_regs); allocated_regs);
} }
tcg_out_st(s, ts->type, reg, ts->mem_base->reg, ts->mem_offset); switch (ts->val_type) {
case TEMP_VAL_CONST:
/* If we're going to free the temp immediately, then we won't
require it later in a register, so attempt to store the
constant to memory directly. */
if (free_or_dead
&& tcg_out_sti(s, ts->type, ts->val,
ts->mem_base->reg, ts->mem_offset)) {
break;
}
temp_load(s, ts, s->tcg_target_available_regs[ts->type],
allocated_regs);
/* fallthrough */
case TEMP_VAL_REG:
tcg_out_st(s, ts->type, ts->reg,
ts->mem_base->reg, ts->mem_offset);
break;
case TEMP_VAL_MEM:
break;
case TEMP_VAL_DEAD:
default:
tcg_abort();
}
ts->mem_coherent = 1;
}
if (free_or_dead) {
temp_free_or_dead(s, ts, free_or_dead);
} }
ts->mem_coherent = 1;
} }
/* free register 'reg' by spilling the corresponding temporary if necessary */ /* free register 'reg' by spilling the corresponding temporary if necessary */
static void tcg_reg_free(TCGContext *s, TCGReg reg, TCGRegSet allocated_regs) static void tcg_reg_free(TCGContext *s, TCGReg reg, TCGRegSet allocated_regs)
{ {
TCGTemp *ts = s->reg_to_temp[reg]; TCGTemp *ts = s->reg_to_temp[reg];
if (ts != NULL) { if (ts != NULL) {
tcg_reg_sync(s, reg, allocated_regs); temp_sync(s, ts, allocated_regs, -1);
ts->val_type = TEMP_VAL_MEM;
s->reg_to_temp[reg] = NULL;
} }
} }
@ -1844,46 +1900,9 @@ static void temp_load(TCGContext *s, TCGTemp *ts, TCGRegSet desired_regs,
s->reg_to_temp[reg] = ts; s->reg_to_temp[reg] = ts;
} }
/* mark a temporary as dead. */ /* Save a temporary to memory. 'allocated_regs' is used in case a
static inline void temp_dead(TCGContext *s, TCGTemp *ts) temporary registers needs to be allocated to store a constant. */
{ static void temp_save(TCGContext *s, TCGTemp *ts, TCGRegSet allocated_regs)
if (ts->fixed_reg) {
return;
}
if (ts->val_type == TEMP_VAL_REG) {
s->reg_to_temp[ts->reg] = NULL;
}
ts->val_type = (temp_idx(s, ts) < s->nb_globals || ts->temp_local
? TEMP_VAL_MEM : TEMP_VAL_DEAD);
}
/* sync a temporary to memory. 'allocated_regs' is used in case a
temporary registers needs to be allocated to store a constant. */
static void temp_sync(TCGContext *s, TCGTemp *ts, TCGRegSet allocated_regs)
{
if (ts->fixed_reg) {
return;
}
switch (ts->val_type) {
case TEMP_VAL_CONST:
temp_load(s, ts, s->tcg_target_available_regs[ts->type], allocated_regs);
/* fallthrough */
case TEMP_VAL_REG:
tcg_reg_sync(s, ts->reg, allocated_regs);
break;
case TEMP_VAL_DEAD:
case TEMP_VAL_MEM:
break;
default:
tcg_abort();
}
}
/* save a temporary to memory. 'allocated_regs' is used in case a
temporary registers needs to be allocated to store a constant. */
static inline void temp_save(TCGContext *s, TCGTemp *ts,
TCGRegSet allocated_regs)
{ {
#ifdef USE_LIVENESS_ANALYSIS #ifdef USE_LIVENESS_ANALYSIS
/* ??? Liveness does not yet incorporate indirect bases. */ /* ??? Liveness does not yet incorporate indirect bases. */
@ -1894,8 +1913,7 @@ static inline void temp_save(TCGContext *s, TCGTemp *ts,
return; return;
} }
#endif #endif
temp_sync(s, ts, allocated_regs); temp_sync(s, ts, allocated_regs, 1);
temp_dead(s, ts);
} }
/* save globals to their canonical location and assume they can be /* save globals to their canonical location and assume they can be
@ -1928,7 +1946,7 @@ static void sync_globals(TCGContext *s, TCGRegSet allocated_regs)
continue; continue;
} }
#endif #endif
temp_sync(s, ts, allocated_regs); temp_sync(s, ts, allocated_regs, 0);
} }
} }
@ -1972,21 +1990,20 @@ static void tcg_reg_alloc_movi(TCGContext *s, const TCGArg *args,
val = args[1]; val = args[1];
if (ots->fixed_reg) { if (ots->fixed_reg) {
/* for fixed registers, we do not do any constant /* For fixed registers, we do not do any constant propagation. */
propagation */
tcg_out_movi(s, ots->type, ots->reg, val); tcg_out_movi(s, ots->type, ots->reg, val);
} else { return;
/* The movi is not explicitly generated here */
if (ots->val_type == TEMP_VAL_REG) {
s->reg_to_temp[ots->reg] = NULL;
}
ots->val_type = TEMP_VAL_CONST;
ots->val = val;
} }
/* The movi is not explicitly generated here. */
if (ots->val_type == TEMP_VAL_REG) {
s->reg_to_temp[ots->reg] = NULL;
}
ots->val_type = TEMP_VAL_CONST;
ots->val = val;
ots->mem_coherent = 0;
if (NEED_SYNC_ARG(0)) { if (NEED_SYNC_ARG(0)) {
temp_sync(s, ots, s->reserved_regs); temp_sync(s, ots, s->reserved_regs, IS_DEAD_ARG(0));
} } else if (IS_DEAD_ARG(0)) {
if (IS_DEAD_ARG(0)) {
temp_dead(s, ots); temp_dead(s, ots);
} }
} }
@ -2068,7 +2085,7 @@ static void tcg_reg_alloc_mov(TCGContext *s, const TCGOpDef *def,
ots->mem_coherent = 0; ots->mem_coherent = 0;
s->reg_to_temp[ots->reg] = ots; s->reg_to_temp[ots->reg] = ots;
if (NEED_SYNC_ARG(0)) { if (NEED_SYNC_ARG(0)) {
tcg_reg_sync(s, ots->reg, allocated_regs); temp_sync(s, ots, allocated_regs, 0);
} }
} }
} }
@ -2218,9 +2235,8 @@ static void tcg_reg_alloc_op(TCGContext *s,
tcg_out_mov(s, ts->type, ts->reg, reg); tcg_out_mov(s, ts->type, ts->reg, reg);
} }
if (NEED_SYNC_ARG(i)) { if (NEED_SYNC_ARG(i)) {
tcg_reg_sync(s, reg, allocated_regs); temp_sync(s, ts, allocated_regs, IS_DEAD_ARG(i));
} } else if (IS_DEAD_ARG(i)) {
if (IS_DEAD_ARG(i)) {
temp_dead(s, ts); temp_dead(s, ts);
} }
} }
@ -2357,9 +2373,8 @@ static void tcg_reg_alloc_call(TCGContext *s, int nb_oargs, int nb_iargs,
ts->mem_coherent = 0; ts->mem_coherent = 0;
s->reg_to_temp[reg] = ts; s->reg_to_temp[reg] = ts;
if (NEED_SYNC_ARG(i)) { if (NEED_SYNC_ARG(i)) {
tcg_reg_sync(s, reg, allocated_regs); temp_sync(s, ts, allocated_regs, IS_DEAD_ARG(i));
} } else if (IS_DEAD_ARG(i)) {
if (IS_DEAD_ARG(i)) {
temp_dead(s, ts); temp_dead(s, ts);
} }
} }