radeonsi: tweak triangle list culling performance for GS fast launch
Acked-by: Pierre-Eric Pelloux-Prayer <pierre-eric.pelloux-prayer@amd.com>
Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/7542>
This commit is contained in:
parent
2b2b22f496
commit
0ab7ab40c8
|
@@ -1941,7 +1941,10 @@ bool gfx10_ngg_calculate_subgroup_info(struct si_shader *shader)
|
||||||
unsigned max_esverts_base = 128;
|
unsigned max_esverts_base = 128;
|
||||||
|
|
||||||
if (shader->key.opt.ngg_culling & SI_NGG_CULL_GS_FAST_LAUNCH_TRI_LIST) {
|
if (shader->key.opt.ngg_culling & SI_NGG_CULL_GS_FAST_LAUNCH_TRI_LIST) {
|
||||||
max_gsprims_base = 128 / 3;
|
/* Exactly 1 wave32 executes culling in primitive threads (there is no
|
||||||
|
* divergence), other waves are idle.
|
||||||
|
*/
|
||||||
|
max_gsprims_base = 32;
|
||||||
max_esverts_base = max_gsprims_base * 3;
|
max_esverts_base = max_gsprims_base * 3;
|
||||||
} else if (shader->key.opt.ngg_culling & SI_NGG_CULL_GS_FAST_LAUNCH_TRI_STRIP) {
|
} else if (shader->key.opt.ngg_culling & SI_NGG_CULL_GS_FAST_LAUNCH_TRI_STRIP) {
|
||||||
max_gsprims_base = 126;
|
max_gsprims_base = 126;
|
||||||
|
|
Loading…
Reference in New Issue