diff options
author | Connor Abbott <connor.w.abbott@intel.com> | 2015-07-28 18:21:56 -0700 |
---|---|---|
committer | Samuel Iglesias Gonsálvez <siglesias@igalia.com> | 2016-04-29 09:47:01 +0200 |
commit | cc1839abdb3544231732f3d052ab393f624184c7 (patch) | |
tree | e6bbc1cd2bee44575d670a0a0eae679ae1173f77 | |
parent | 16454fb26b5a444d38f0d01d272595044afb7e02 (diff) |
i965/fs: generalize SIMD16 interference workaround
Work based on registers read/written instead of dispatch_width, so that
the interferences are added for 64-bit sources/destinations as well.
-rw-r--r-- | src/mesa/drivers/dri/i965/brw_fs_reg_allocate.cpp | 67 |
1 files changed, 48 insertions, 19 deletions
diff --git a/src/mesa/drivers/dri/i965/brw_fs_reg_allocate.cpp b/src/mesa/drivers/dri/i965/brw_fs_reg_allocate.cpp index 2347cd5d33..f0e96f9309 100644 --- a/src/mesa/drivers/dri/i965/brw_fs_reg_allocate.cpp +++ b/src/mesa/drivers/dri/i965/brw_fs_reg_allocate.cpp @@ -541,6 +541,34 @@ setup_mrf_hack_interference(fs_visitor *v, struct ra_graph *g, } } +static unsigned +get_reg_node(const fs_reg& reg, unsigned first_payload_node) +{ + switch (reg.file) { + case VGRF: + return reg.nr; + case ARF: + case FIXED_GRF: + return first_payload_node + reg.nr; + case MRF: + default: + unreachable("unhandled register file"); + } + + return 0; +} + +static void +add_reg_interference(struct ra_graph *g, const fs_reg& reg1, + const fs_reg& reg2, unsigned first_payload_node) +{ + if ((reg1.file == VGRF || reg1.file == ARF || reg1.file == FIXED_GRF) && + (reg2.file == VGRF || reg2.file == ARF || reg2.file == FIXED_GRF)) { + ra_add_node_interference(g, get_reg_node(reg1, first_payload_node), + get_reg_node(reg2, first_payload_node)); + } +} + bool fs_visitor::assign_regs(bool allow_spilling) { @@ -643,26 +671,27 @@ fs_visitor::assign_regs(bool allow_spilling) } } - if (dispatch_width > 8) { - /* In 16-wide dispatch we have an issue where a compressed - * instruction is actually two instructions executed simultaneiously. - * It's actually ok to have the source and destination registers be - * the same. In this case, each instruction over-writes its own - * source and there's no problem. The real problem here is if the - * source and destination registers are off by one. Then you can end - * up in a scenario where the first instruction over-writes the - * source of the second instruction. Since the compiler doesn't know - * about this level of granularity, we simply make the source and - * destination interfere. - */ - foreach_block_and_inst(block, fs_inst, inst, cfg) { - if (inst->dst.file != VGRF) - continue; + /* When instructions both read/write more than a single SIMD8 register, we + * have an issue where an instruction is actually two instructions executed + * simultaneiously. It's actually ok to have the source and destination + * registers be the same. In this case, each instruction over-writes its + * own source and there's no problem. The real problem here is if the + * source and destination registers are off by one. Then you can end up in + * a scenario where the first instruction over-writes the source of the + * second instruction. Since the compiler doesn't know about this level of + * granularity, we simply make the source and destination interfere. + */ + foreach_block_and_inst(block, fs_inst, inst, cfg) { + if (inst->dst.file != VGRF && + inst->dst.file != ARF && inst->dst.file != FIXED_GRF) + continue; - for (int i = 0; i < inst->sources; ++i) { - if (inst->src[i].file == VGRF) { - ra_add_node_interference(g, inst->dst.nr, inst->src[i].nr); - } + if (inst->regs_written <= 1) + continue; + + for (int i = 0; i < inst->sources; ++i) { + if (inst->regs_read(i) > 1) { + add_reg_interference(g, inst->dst, inst->src[i], first_payload_node); } } } |