From 29953d60481bcab370228a352f82eceb10903261 Mon Sep 17 00:00:00 2001
From: Rhys Perry
Date: Wed, 25 May 2022 17:21:50 +0100
Subject: [PATCH] aco: include scratch/global in VMEM WAW optimization
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

fossil-db (navi21):
Totals from 2 (0.00% of 162293) affected shaders:
Instrs: 4788 -> 4785 (-0.06%)
CodeSize: 25884 -> 25872 (-0.05%)
Latency: 255008 -> 252950 (-0.81%)
InvThroughput: 170005 -> 168633 (-0.81%)
VClause: 206 -> 205 (-0.49%)

Signed-off-by: Rhys Perry
Reviewed-by: Daniel Schürmann
Part-of:
---
 src/amd/compiler/aco_insert_waitcnt.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/amd/compiler/aco_insert_waitcnt.cpp b/src/amd/compiler/aco_insert_waitcnt.cpp
index 9d6f0991316..b8be00c1fcf 100644
--- a/src/amd/compiler/aco_insert_waitcnt.cpp
+++ b/src/amd/compiler/aco_insert_waitcnt.cpp
@@ -250,7 +250,7 @@ get_vmem_type(Instruction* instr)
    else if (instr->isMIMG() && !instr->operands[1].isUndefined() &&
             instr->operands[1].regClass() == s4)
       return vmem_sampler;
-   else if (instr->isVMEM())
+   else if (instr->isVMEM() || instr->isScratch() || instr->isGlobal())
       return vmem_nosampler;
    return 0;
 }