aco: adjust num_waves for LDS before scheduling
Totals from 67 (0.05% of 134913) affected shaders: (GFX10.3)
VGPRs: 2024 -> 2136 (+5.53%); split: -0.40%, +5.93%
CodeSize: 162364 -> 162348 (-0.01%); split: -0.08%, +0.07%
MaxWaves: 1882 -> 1816 (-3.51%); split: +0.11%, -3.61%
Instrs: 29176 -> 29162 (-0.05%); split: -0.09%, +0.04%
Latency: 329984 -> 327272 (-0.82%); split: -0.88%, +0.06%
InvThroughput: 54653 -> 54672 (+0.03%); split: -0.01%, +0.04%
VClause: 782 -> 761 (-2.69%); split: -2.81%, +0.13%
SClause: 833 -> 824 (-1.08%); split: -2.28%, +1.20%
Copies: 1872 -> 1873 (+0.05%); split: -0.37%, +0.43%

Reviewed-by: Rhys Perry <pendingchaos02@gmail.com>
Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/16039>
This commit is contained in:
committed by
Marge Bot
parent
8d8c59b4cd
commit
d5dc0c0392
@@ -1070,6 +1070,7 @@ schedule_program(Program* program, live& live_vars)
|
||||
ctx.num_waves = 7 * wave_fac;
|
||||
ctx.num_waves = std::max<uint16_t>(ctx.num_waves, program->min_waves);
|
||||
ctx.num_waves = std::min<uint16_t>(ctx.num_waves, program->num_waves);
|
||||
ctx.num_waves = max_suitable_waves(program, ctx.num_waves);
|
||||
|
||||
/* VMEM_MAX_MOVES and such assume pre-GFX10 wave count */
|
||||
ctx.num_waves = std::max<uint16_t>(ctx.num_waves / wave_fac, 1);
|
||||
|
||||
Reference in New Issue
Block a user