289 lines
11 KiB
C
289 lines
11 KiB
C
/*
|
|
* Copyright © 2014 Broadcom
|
|
*
|
|
* Permission is hereby granted, free of charge, to any person obtaining a
|
|
* copy of this software and associated documentation files (the "Software"),
|
|
* to deal in the Software without restriction, including without limitation
|
|
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
* and/or sell copies of the Software, and to permit persons to whom the
|
|
* Software is furnished to do so, subject to the following conditions:
|
|
*
|
|
* The above copyright notice and this permission notice (including the next
|
|
* paragraph) shall be included in all copies or substantial portions of the
|
|
* Software.
|
|
*
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
|
|
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
|
|
* IN THE SOFTWARE.
|
|
*/
|
|
|
|
/**
|
|
* @file v3d_opt_dead_code.c
|
|
*
|
|
* This is a simple dead code eliminator for SSA values in VIR.
|
|
*
|
|
* It walks all the instructions finding what temps are used, then walks again
|
|
* to remove instructions writing unused temps.
|
|
*
|
|
* This is an inefficient implementation if you have long chains of
|
|
* instructions where the entire chain is dead, but we expect those to have
|
|
* been eliminated at the NIR level, and here we're just cleaning up small
|
|
* problems produced by NIR->VIR.
|
|
*/
|
|
|
|
#include "v3d_compiler.h"
|
|
|
|
static bool debug;
|
|
|
|
static void
|
|
dce(struct v3d_compile *c, struct qinst *inst)
|
|
{
|
|
if (debug) {
|
|
fprintf(stderr, "Removing: ");
|
|
vir_dump_inst(c, inst);
|
|
fprintf(stderr, "\n");
|
|
}
|
|
assert(!v3d_qpu_writes_flags(&inst->qpu));
|
|
vir_remove_instruction(c, inst);
|
|
}
|
|
|
|
static bool
|
|
has_nonremovable_reads(struct v3d_compile *c, struct qinst *inst)
|
|
{
|
|
for (int i = 0; i < vir_get_nsrc(inst); i++) {
|
|
if (inst->src[i].file == QFILE_VPM)
|
|
return true;
|
|
}
|
|
|
|
return false;
|
|
}
|
|
|
|
static bool
|
|
can_write_to_null(struct v3d_compile *c, struct qinst *inst)
|
|
{
|
|
/* The SFU instructions must write to a physical register. */
|
|
if (c->devinfo->ver >= 41 && v3d_qpu_uses_sfu(&inst->qpu))
|
|
return false;
|
|
|
|
return true;
|
|
}
|
|
|
|
static void
|
|
vir_dce_flags(struct v3d_compile *c, struct qinst *inst)
|
|
{
|
|
if (debug) {
|
|
fprintf(stderr,
|
|
"Removing flags write from: ");
|
|
vir_dump_inst(c, inst);
|
|
fprintf(stderr, "\n");
|
|
}
|
|
|
|
assert(inst->qpu.type == V3D_QPU_INSTR_TYPE_ALU);
|
|
|
|
inst->qpu.flags.apf = V3D_QPU_PF_NONE;
|
|
inst->qpu.flags.mpf = V3D_QPU_PF_NONE;
|
|
inst->qpu.flags.auf = V3D_QPU_UF_NONE;
|
|
inst->qpu.flags.muf = V3D_QPU_UF_NONE;
|
|
}
|
|
|
|
static bool
|
|
check_last_ldunifa(struct v3d_compile *c,
|
|
struct qinst *inst,
|
|
struct qblock *block)
|
|
{
|
|
if (!inst->qpu.sig.ldunifa && !inst->qpu.sig.ldunifarf)
|
|
return false;
|
|
|
|
list_for_each_entry_from(struct qinst, scan_inst, inst->link.next,
|
|
&block->instructions, link) {
|
|
/* If we find a new write to unifa, then this was the last
|
|
* ldunifa in its sequence and is safe to remove.
|
|
*/
|
|
if (scan_inst->dst.file == QFILE_MAGIC &&
|
|
scan_inst->dst.index == V3D_QPU_WADDR_UNIFA) {
|
|
return true;
|
|
}
|
|
|
|
/* If we find another ldunifa in the same sequence then we
|
|
* can't remove it.
|
|
*/
|
|
if (scan_inst->qpu.sig.ldunifa || scan_inst->qpu.sig.ldunifarf)
|
|
return false;
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
static bool
|
|
check_first_ldunifa(struct v3d_compile *c,
|
|
struct qinst *inst,
|
|
struct qblock *block,
|
|
struct qinst **unifa)
|
|
{
|
|
if (!inst->qpu.sig.ldunifa && !inst->qpu.sig.ldunifarf)
|
|
return false;
|
|
|
|
list_for_each_entry_from_rev(struct qinst, scan_inst, inst->link.prev,
|
|
&block->instructions, link) {
|
|
/* If we find a write to unifa, then this was the first
|
|
* ldunifa in its sequence and is safe to remove.
|
|
*/
|
|
if (scan_inst->dst.file == QFILE_MAGIC &&
|
|
scan_inst->dst.index == V3D_QPU_WADDR_UNIFA) {
|
|
*unifa = scan_inst;
|
|
return true;
|
|
}
|
|
|
|
/* If we find another ldunifa in the same sequence then we
|
|
* can't remove it.
|
|
*/
|
|
if (scan_inst->qpu.sig.ldunifa || scan_inst->qpu.sig.ldunifarf)
|
|
return false;
|
|
}
|
|
|
|
unreachable("could not find starting unifa for ldunifa sequence");
|
|
}
|
|
|
|
static bool
|
|
increment_unifa_address(struct v3d_compile *c, struct qinst *unifa)
|
|
{
|
|
if (unifa->qpu.type == V3D_QPU_INSTR_TYPE_ALU &&
|
|
unifa->qpu.alu.mul.op == V3D_QPU_M_MOV) {
|
|
c->cursor = vir_after_inst(unifa);
|
|
struct qreg unifa_reg = vir_reg(QFILE_MAGIC, V3D_QPU_WADDR_UNIFA);
|
|
vir_ADD_dest(c, unifa_reg, unifa->src[0], vir_uniform_ui(c, 4u));
|
|
vir_remove_instruction(c, unifa);
|
|
return true;
|
|
}
|
|
|
|
if (unifa->qpu.type == V3D_QPU_INSTR_TYPE_ALU &&
|
|
unifa->qpu.alu.add.op == V3D_QPU_A_ADD) {
|
|
c->cursor = vir_after_inst(unifa);
|
|
struct qreg unifa_reg = vir_reg(QFILE_MAGIC, V3D_QPU_WADDR_UNIFA);
|
|
struct qreg tmp =
|
|
vir_ADD(c, unifa->src[1], vir_uniform_ui(c, 4u));
|
|
vir_ADD_dest(c, unifa_reg, unifa->src[0], tmp);
|
|
vir_remove_instruction(c, unifa);
|
|
return true;
|
|
}
|
|
|
|
return false;
|
|
}
|
|
|
|
bool
|
|
vir_opt_dead_code(struct v3d_compile *c)
|
|
{
|
|
bool progress = false;
|
|
bool *used = calloc(c->num_temps, sizeof(bool));
|
|
|
|
/* Defuse the "are you removing the cursor?" assertion in the core.
|
|
* You'll need to set up a new cursor for any new instructions after
|
|
* doing DCE (which we would expect, anyway).
|
|
*/
|
|
c->cursor.link = NULL;
|
|
|
|
vir_for_each_inst_inorder(inst, c) {
|
|
for (int i = 0; i < vir_get_nsrc(inst); i++) {
|
|
if (inst->src[i].file == QFILE_TEMP)
|
|
used[inst->src[i].index] = true;
|
|
}
|
|
}
|
|
|
|
vir_for_each_block(block, c) {
|
|
struct qinst *last_flags_write = NULL;
|
|
c->cur_block = block;
|
|
vir_for_each_inst_safe(inst, block) {
|
|
/* If this instruction reads the flags, we can't
|
|
* remove the flags generation for it.
|
|
*/
|
|
if (v3d_qpu_reads_flags(&inst->qpu))
|
|
last_flags_write = NULL;
|
|
|
|
if (inst->dst.file != QFILE_NULL &&
|
|
!(inst->dst.file == QFILE_TEMP &&
|
|
!used[inst->dst.index])) {
|
|
continue;
|
|
}
|
|
|
|
const bool is_ldunifa = inst->qpu.sig.ldunifa ||
|
|
inst->qpu.sig.ldunifarf;
|
|
|
|
if (vir_has_side_effects(c, inst) && !is_ldunifa)
|
|
continue;
|
|
|
|
bool is_first_ldunifa = false;
|
|
bool is_last_ldunifa = false;
|
|
struct qinst *unifa = NULL;
|
|
if (is_ldunifa) {
|
|
is_last_ldunifa =
|
|
check_last_ldunifa(c, inst, block);
|
|
|
|
is_first_ldunifa =
|
|
check_first_ldunifa(c, inst, block, &unifa);
|
|
}
|
|
|
|
if (v3d_qpu_writes_flags(&inst->qpu)) {
|
|
/* If we obscure a previous flags write,
|
|
* drop it.
|
|
*/
|
|
if (last_flags_write &&
|
|
(inst->qpu.flags.apf != V3D_QPU_PF_NONE ||
|
|
inst->qpu.flags.mpf != V3D_QPU_PF_NONE)) {
|
|
vir_dce_flags(c, last_flags_write);
|
|
progress = true;
|
|
}
|
|
|
|
last_flags_write = inst;
|
|
}
|
|
|
|
if (v3d_qpu_writes_flags(&inst->qpu) ||
|
|
has_nonremovable_reads(c, inst) ||
|
|
(is_ldunifa && !is_first_ldunifa && !is_last_ldunifa)) {
|
|
/* If we can't remove the instruction, but we
|
|
* don't need its destination value, just
|
|
* remove the destination. The register
|
|
* allocator would trivially color it and it
|
|
* wouldn't cause any register pressure, but
|
|
* it's nicer to read the VIR code without
|
|
* unused destination regs.
|
|
*/
|
|
if (inst->dst.file == QFILE_TEMP &&
|
|
can_write_to_null(c, inst)) {
|
|
if (debug) {
|
|
fprintf(stderr,
|
|
"Removing dst from: ");
|
|
vir_dump_inst(c, inst);
|
|
fprintf(stderr, "\n");
|
|
}
|
|
c->defs[inst->dst.index] = NULL;
|
|
inst->dst.file = QFILE_NULL;
|
|
progress = true;
|
|
}
|
|
continue;
|
|
}
|
|
|
|
/* If we are removing the first ldunifa in a sequence
|
|
* we need to update the unifa address.
|
|
*/
|
|
if (is_first_ldunifa) {
|
|
assert(unifa);
|
|
if (!increment_unifa_address(c, unifa))
|
|
continue;
|
|
}
|
|
|
|
assert(inst != last_flags_write);
|
|
dce(c, inst);
|
|
progress = true;
|
|
continue;
|
|
}
|
|
}
|
|
|
|
free(used);
|
|
|
|
return progress;
|
|
}
|