intel/eu: Don't double-loop as often in brw_set_uip_jip
brw_find_next_block_end() scans through the instructions to find the end of the block. We were calling it for every instruction in the program which is, if you have a single basic block, makes the whole mess a nice clean O(n^2) when it really doesn't need to be. Instead, only call brw_find_next_block_end() as-needed. This brings it back to O(n) like it should have been. This cuts the runtime of the following Vulkan CTS on my SKL box by 5% from 1:51 to 1:45: dEQP-VK.ssbo.phys.layout.random.16bit.scalar.13 Reviewed-by: Ian Romanick <ian.d.romanick@intel.com> Reviewed-by: Emma Anholt <emma@anholt.net> Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/13734>
This commit is contained in:
parent
cf98a3cc19
commit
e6f0def97d
|
@ -2992,9 +2992,9 @@ brw_set_uip_jip(struct brw_codegen *p, int start_offset)
|
|||
brw_inst *insn = store + offset;
|
||||
assert(brw_inst_cmpt_control(devinfo, insn) == 0);
|
||||
|
||||
int block_end_offset = brw_find_next_block_end(p, offset);
|
||||
switch (brw_inst_opcode(devinfo, insn)) {
|
||||
case BRW_OPCODE_BREAK:
|
||||
case BRW_OPCODE_BREAK: {
|
||||
int block_end_offset = brw_find_next_block_end(p, offset);
|
||||
assert(block_end_offset != 0);
|
||||
brw_inst_set_jip(devinfo, insn, (block_end_offset - offset) / scale);
|
||||
/* Gfx7 UIP points to WHILE; Gfx6 points just after it */
|
||||
|
@ -3002,7 +3002,10 @@ brw_set_uip_jip(struct brw_codegen *p, int start_offset)
|
|||
(brw_find_loop_end(p, offset) - offset +
|
||||
(devinfo->ver == 6 ? 16 : 0)) / scale);
|
||||
break;
|
||||
case BRW_OPCODE_CONTINUE:
|
||||
}
|
||||
|
||||
case BRW_OPCODE_CONTINUE: {
|
||||
int block_end_offset = brw_find_next_block_end(p, offset);
|
||||
assert(block_end_offset != 0);
|
||||
brw_inst_set_jip(devinfo, insn, (block_end_offset - offset) / scale);
|
||||
brw_inst_set_uip(devinfo, insn,
|
||||
|
@ -3011,8 +3014,10 @@ brw_set_uip_jip(struct brw_codegen *p, int start_offset)
|
|||
assert(brw_inst_uip(devinfo, insn) != 0);
|
||||
assert(brw_inst_jip(devinfo, insn) != 0);
|
||||
break;
|
||||
}
|
||||
|
||||
case BRW_OPCODE_ENDIF: {
|
||||
int block_end_offset = brw_find_next_block_end(p, offset);
|
||||
int32_t jump = (block_end_offset == 0) ?
|
||||
1 * br : (block_end_offset - offset) / scale;
|
||||
if (devinfo->ver >= 7)
|
||||
|
@ -3022,7 +3027,7 @@ brw_set_uip_jip(struct brw_codegen *p, int start_offset)
|
|||
break;
|
||||
}
|
||||
|
||||
case BRW_OPCODE_HALT:
|
||||
case BRW_OPCODE_HALT: {
|
||||
/* From the Sandy Bridge PRM (volume 4, part 2, section 8.3.19):
|
||||
*
|
||||
* "In case of the halt instruction not inside any conditional
|
||||
|
@ -3034,6 +3039,7 @@ brw_set_uip_jip(struct brw_codegen *p, int start_offset)
|
|||
* The uip will have already been set by whoever set up the
|
||||
* instruction.
|
||||
*/
|
||||
int block_end_offset = brw_find_next_block_end(p, offset);
|
||||
if (block_end_offset == 0) {
|
||||
brw_inst_set_jip(devinfo, insn, brw_inst_uip(devinfo, insn));
|
||||
} else {
|
||||
|
@ -3042,6 +3048,7 @@ brw_set_uip_jip(struct brw_codegen *p, int start_offset)
|
|||
assert(brw_inst_uip(devinfo, insn) != 0);
|
||||
assert(brw_inst_jip(devinfo, insn) != 0);
|
||||
break;
|
||||
}
|
||||
|
||||
default:
|
||||
break;
|
||||
|
|
Loading…
Reference in New Issue