From 3215645b8d81bbef7db1d16b88de7ed0288f2274 Mon Sep 17 00:00:00 2001 From: Tony Linthicum Date: Mon, 23 Feb 2026 09:34:17 -0600 Subject: [PATCH] [AMDGPU] Enable scheduler mfma rewrite stage by default (#180751) After performance testing, it was determined that the large number of copies that are inserted outside the loop is more than offset by better allocation within the loop as a result of the rewrite. Additionally, there is a minor cleanup of the cost logic. --------- Co-authored-by: Tony Linthicum --- llvm/lib/Target/AMDGPU/GCNSchedStrategy.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/llvm/lib/Target/AMDGPU/GCNSchedStrategy.cpp b/llvm/lib/Target/AMDGPU/GCNSchedStrategy.cpp index f3c471bb697d..9309d5402ae5 100644 --- a/llvm/lib/Target/AMDGPU/GCNSchedStrategy.cpp +++ b/llvm/lib/Target/AMDGPU/GCNSchedStrategy.cpp @@ -101,7 +101,7 @@ static cl::opt PrintMaxRPRegUsageAfterScheduler( static cl::opt DisableRewriteMFMAFormSchedStage( "amdgpu-disable-rewrite-mfma-form-sched-stage", cl::Hidden, - cl::desc("Disable rewrie mfma rewrite scheduling stage"), cl::init(true)); + cl::desc("Disable rewrite mfma rewrite scheduling stage"), cl::init(false)); const unsigned ScheduleMetrics::ScaleFactor = 100;