aco: don't create v_mad_f32 on GFX10.3
Signed-off-by: Rhys Perry <pendingchaos02@gmail.com>
Reviewed-by: Daniel Schürmann <daniel@schuermann.dev>
Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/5546>
This commit is contained in:
parent
5718f7c8a7
commit
4f1242a4d8
|
@@ -2614,7 +2614,7 @@ void combine_instruction(opt_ctx &ctx, Block& block, aco_ptr<Instruction>& instr
|
|||
instr->opcode == aco_opcode::v_sub_f16 ||
|
||||
instr->opcode == aco_opcode::v_subrev_f16;
|
||||
if (mad16 || mad32) {
|
||||
- bool need_fma = mad32 ? block.fp_mode.denorm32 != 0 :
|
||||
+ bool need_fma = mad32 ? (block.fp_mode.denorm32 != 0 || ctx.program->chip_class >= GFX10_3) :
|
||||
(block.fp_mode.denorm16_64 != 0 || ctx.program->chip_class >= GFX10);
|
||||
if (need_fma && instr->definitions[0].isPrecise())
|
||||
return;
|
||||
|
|
Loading…
Reference in New Issue