radeonsi: tweak triangle list culling performance for GS fast launch

Acked-by: Pierre-Eric Pelloux-Prayer <pierre-eric.pelloux-prayer@amd.com>
Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/7542>
This commit is contained in:
Marek Olšák 2020-10-21 12:34:51 -04:00 committed by Marge Bot
parent 2b2b22f496
commit 0ab7ab40c8
1 changed file with 4 additions and 1 deletion

View File

@@ -1941,7 +1941,10 @@ bool gfx10_ngg_calculate_subgroup_info(struct si_shader *shader)
unsigned max_esverts_base = 128;
if (shader->key.opt.ngg_culling & SI_NGG_CULL_GS_FAST_LAUNCH_TRI_LIST) {
max_gsprims_base = 128 / 3;
/* Exactly 1 wave32 executes culling in primitive threads (there is no
* divergence), other waves are idle.
*/
max_gsprims_base = 32;
max_esverts_base = max_gsprims_base * 3;
} else if (shader->key.opt.ngg_culling & SI_NGG_CULL_GS_FAST_LAUNCH_TRI_STRIP) {
max_gsprims_base = 126;