From d666d83be2fa03210f38b06e72410e8d8221b184 Mon Sep 17 00:00:00 2001
From: =?utf8?q?Daniel=20Sch=C3=BCrmann?=
Date: Wed, 15 Apr 2020 11:00:45 +0100
Subject: [PATCH] aco: try to always find a register with stride for even sizes

Totals from affected shaders:
SGPRS: 1162400 -> 1162400 (0.00 %)
VGPRS: 947364 -> 946960 (-0.04 %)
Code Size: 98399300 -> 98399004 (-0.00 %) bytes
Max Waves: 74665 -> 74682 (0.02 %)

Reviewed-by: Rhys Perry
Part-of:
---
 src/amd/compiler/aco_register_allocation.cpp | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/src/amd/compiler/aco_register_allocation.cpp b/src/amd/compiler/aco_register_allocation.cpp
index 9a36019..eae3822 100644
--- a/src/amd/compiler/aco_register_allocation.cpp
+++ b/src/amd/compiler/aco_register_allocation.cpp
@@ -395,8 +395,10 @@ std::pair get_reg_simple(ra_ctx& ctx,
    if (stride == 1) {
-      if (rc.type() == RegType::vgpr && (size == 4 || size == 8)) {
-         info.stride = 4;
+      for (unsigned stride = 8; stride > 1; stride /= 2) {
+         if (size % stride)
+            continue;
+         info.stride = stride;
          std::pair res = get_reg_simple(ctx, reg_file, info);
          if (res.second)
             return res;
-- 
2.7.4