summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorFrancisco Jerez <currojerez@riseup.net>2015-03-23 14:08:49 +0200
committerFrancisco Jerez <currojerez@riseup.net>2015-03-23 14:52:57 +0200
commit2babde35b9a38a0561a87dc2d7cb431e9aabbd5a (patch)
treeac152c416e6d40df4943cf0ee4f292e86acd26bd
parente6e655ef76bb22193b31af2841cb50fda0c39461 (diff)
downloadexternal_mesa3d-2babde35b9a38a0561a87dc2d7cb431e9aabbd5a.zip
external_mesa3d-2babde35b9a38a0561a87dc2d7cb431e9aabbd5a.tar.gz
external_mesa3d-2babde35b9a38a0561a87dc2d7cb431e9aabbd5a.tar.bz2
i965/vec4: Calculate live intervals with subregister granularity.
Reviewed-by: Matt Turner <mattst88@gmail.com>
-rw-r--r--src/mesa/drivers/dri/i965/brw_vec4_live_variables.cpp68
-rw-r--r--src/mesa/drivers/dri/i965/brw_vec4_live_variables.h11
2 files changed, 46 insertions, 33 deletions
diff --git a/src/mesa/drivers/dri/i965/brw_vec4_live_variables.cpp b/src/mesa/drivers/dri/i965/brw_vec4_live_variables.cpp
index 66beb21..95b9d90 100644
--- a/src/mesa/drivers/dri/i965/brw_vec4_live_variables.cpp
+++ b/src/mesa/drivers/dri/i965/brw_vec4_live_variables.cpp
@@ -76,10 +76,13 @@ vec4_live_variables::setup_def_use()
/* Set use[] for this instruction */
for (unsigned int i = 0; i < 3; i++) {
if (inst->src[i].file == GRF) {
- for (int c = 0; c < 4; c++) {
- const unsigned v = var_from_reg(alloc, inst->src[i], c);
- if (!BITSET_TEST(bd->def, v))
- BITSET_SET(bd->use, v);
+ for (unsigned j = 0; j < inst->regs_read(i); j++) {
+ for (int c = 0; c < 4; c++) {
+ const unsigned v =
+ var_from_reg(alloc, offset(inst->src[i], j), c);
+ if (!BITSET_TEST(bd->def, v))
+ BITSET_SET(bd->use, v);
+ }
}
}
}
@@ -93,14 +96,15 @@ vec4_live_variables::setup_def_use()
* are the things that screen off preceding definitions of a
* variable, and thus qualify for being in def[].
*/
- if (inst->dst.file == GRF &&
- alloc.sizes[inst->dst.reg] == 1 &&
- !inst->predicate) {
- for (int c = 0; c < 4; c++) {
- if (inst->dst.writemask & (1 << c)) {
- const unsigned v = var_from_reg(alloc, inst->dst, c);
- if (!BITSET_TEST(bd->use, v))
- BITSET_SET(bd->def, v);
+ if (inst->dst.file == GRF && !inst->predicate) {
+ for (unsigned i = 0; i < inst->regs_written; i++) {
+ for (int c = 0; c < 4; c++) {
+ if (inst->dst.writemask & (1 << c)) {
+ const unsigned v =
+ var_from_reg(alloc, offset(inst->dst, i), c);
+ if (!BITSET_TEST(bd->use, v))
+ BITSET_SET(bd->def, v);
+ }
}
}
}
@@ -179,7 +183,7 @@ vec4_live_variables::vec4_live_variables(const simple_allocator &alloc,
{
mem_ctx = ralloc_context(NULL);
- num_vars = alloc.count * 4;
+ num_vars = alloc.total_size * 4;
block_data = rzalloc_array(mem_ctx, struct block_data, cfg->num_blocks);
bitset_words = BITSET_WORDS(num_vars);
@@ -229,14 +233,14 @@ vec4_visitor::calculate_live_intervals()
if (this->live_intervals)
return;
- int *start = ralloc_array(mem_ctx, int, this->alloc.count * 4);
- int *end = ralloc_array(mem_ctx, int, this->alloc.count * 4);
+ int *start = ralloc_array(mem_ctx, int, this->alloc.total_size * 4);
+ int *end = ralloc_array(mem_ctx, int, this->alloc.total_size * 4);
ralloc_free(this->virtual_grf_start);
ralloc_free(this->virtual_grf_end);
this->virtual_grf_start = start;
this->virtual_grf_end = end;
- for (unsigned i = 0; i < this->alloc.count * 4; i++) {
+ for (unsigned i = 0; i < this->alloc.total_size * 4; i++) {
start[i] = MAX_INSTRUCTION;
end[i] = -1;
}
@@ -248,20 +252,26 @@ vec4_visitor::calculate_live_intervals()
foreach_block_and_inst(block, vec4_instruction, inst, cfg) {
for (unsigned int i = 0; i < 3; i++) {
if (inst->src[i].file == GRF) {
- for (int c = 0; c < 4; c++) {
- const unsigned v = var_from_reg(alloc, inst->src[i], c);
- start[v] = MIN2(start[v], ip);
- end[v] = ip;
+ for (unsigned j = 0; j < inst->regs_read(i); j++) {
+ for (int c = 0; c < 4; c++) {
+ const unsigned v =
+ var_from_reg(alloc, offset(inst->src[i], j), c);
+ start[v] = MIN2(start[v], ip);
+ end[v] = ip;
+ }
}
}
}
if (inst->dst.file == GRF) {
- for (int c = 0; c < 4; c++) {
- if (inst->dst.writemask & (1 << c)) {
- const unsigned v = var_from_reg(alloc, inst->dst, c);
- start[v] = MIN2(start[v], ip);
- end[v] = ip;
+ for (unsigned i = 0; i < inst->regs_written; i++) {
+ for (int c = 0; c < 4; c++) {
+ if (inst->dst.writemask & (1 << c)) {
+ const unsigned v =
+ var_from_reg(alloc, offset(inst->dst, i), c);
+ start[v] = MIN2(start[v], ip);
+ end[v] = ip;
+ }
}
}
}
@@ -325,8 +335,8 @@ vec4_visitor::var_range_end(unsigned v, unsigned n) const
bool
vec4_visitor::virtual_grf_interferes(int a, int b)
{
- return !((var_range_end(4 * a, 4) <=
- var_range_start(4 * b, 4)) ||
- (var_range_end(4 * b, 4) <=
- var_range_start(4 * a, 4)));
+ return !((var_range_end(4 * alloc.offsets[a], 4 * alloc.sizes[a]) <=
+ var_range_start(4 * alloc.offsets[b], 4 * alloc.sizes[b])) ||
+ (var_range_end(4 * alloc.offsets[b], 4 * alloc.sizes[b]) <=
+ var_range_start(4 * alloc.offsets[a], 4 * alloc.sizes[a])));
}
diff --git a/src/mesa/drivers/dri/i965/brw_vec4_live_variables.h b/src/mesa/drivers/dri/i965/brw_vec4_live_variables.h
index cef55f7..e7929ec 100644
--- a/src/mesa/drivers/dri/i965/brw_vec4_live_variables.h
+++ b/src/mesa/drivers/dri/i965/brw_vec4_live_variables.h
@@ -82,16 +82,19 @@ inline unsigned
var_from_reg(const simple_allocator &alloc, const src_reg &reg,
unsigned c = 0)
{
- assert(reg.file == GRF && reg.reg < alloc.count && c < 4);
- return 4 * reg.reg + BRW_GET_SWZ(reg.swizzle, c);
+ assert(reg.file == GRF && reg.reg < alloc.count &&
+ reg.reg_offset < alloc.sizes[reg.reg] && c < 4);
+ return (4 * (alloc.offsets[reg.reg] + reg.reg_offset) +
+ BRW_GET_SWZ(reg.swizzle, c));
}
inline unsigned
var_from_reg(const simple_allocator &alloc, const dst_reg &reg,
unsigned c = 0)
{
- assert(reg.file == GRF && reg.reg < alloc.count && c < 4);
- return 4 * reg.reg + c;
+ assert(reg.file == GRF && reg.reg < alloc.count &&
+ reg.reg_offset < alloc.sizes[reg.reg] && c < 4);
+ return 4 * (alloc.offsets[reg.reg] + reg.reg_offset) + c;
}
} /* namespace brw */