[RISCV] Add an unaligned-scalar-mem feature like we had in clang 17.

author Craig Topper <craig.topper@sifive.com>

Thu, 16 May 2024 19:27:05 +0000 (12:27 -0700)

committer Tom Stellard <tstellar@redhat.com>

Fri, 17 May 2024 20:22:27 +0000 (13:22 -0700)
author Craig Topper <craig.topper@sifive.com>
Thu, 16 May 2024 19:27:05 +0000 (12:27 -0700)
committer Tom Stellard <tstellar@redhat.com>
Fri, 17 May 2024 20:22:27 +0000 (13:22 -0700)
diff --git a/llvm/lib/Target/RISCV/RISCVExpandPseudoInsts.cpp b/llvm/lib/Target/RISCV/RISCVExpandPseudoInsts.cpp

index 0a314fdd41cbe2bb9b5ec95a9d11e138a82f9453..89207640ee54ad5ad9caa6d268b9ac51e46ba618 100644 (file)
--- a/llvm/lib/Target/RISCV/RISCVExpandPseudoInsts.cpp
+++ b/llvm/lib/Target/RISCV/RISCVExpandPseudoInsts.cpp
@@ -317,8 +317,9 @@ bool RISCVExpandPseudo::expandRV32ZdinxStore(MachineBasicBlock &MBB,
        .addReg(MBBI->getOperand(1).getReg())
        .add(MBBI->getOperand(2));
    if (MBBI->getOperand(2).isGlobal() || MBBI->getOperand(2).isCPI()) {
-    // FIXME: Zdinx RV32 can not work on unaligned memory.
-    assert(!STI->hasFastUnalignedAccess());
+    // FIXME: Zdinx RV32 can not work on unaligned scalar memory.
+    assert(!STI->hasFastUnalignedAccess() &&
+           !STI->enableUnalignedScalarMem());
  
      assert(MBBI->getOperand(2).getOffset() % 8 == 0);
      MBBI->getOperand(2).setOffset(MBBI->getOperand(2).getOffset() + 4);
diff --git a/llvm/lib/Target/RISCV/RISCVFeatures.td b/llvm/lib/Target/RISCV/RISCVFeatures.td

index 26451c80f57b4230b8ec9f6c9347275999b75174..1bb6b6a561f4a5c55d753b6def54a785b6ad15ad 100644 (file)
--- a/llvm/lib/Target/RISCV/RISCVFeatures.td
+++ b/llvm/lib/Target/RISCV/RISCVFeatures.td
@@ -1025,6 +1025,11 @@ def FeatureFastUnalignedAccess
                        "true", "Has reasonably performant unaligned "
                        "loads and stores (both scalar and vector)">;
  
+def FeatureUnalignedScalarMem
+   : SubtargetFeature<"unaligned-scalar-mem", "EnableUnalignedScalarMem",
+                      "true", "Has reasonably performant unaligned scalar "
+                      "loads and stores">;
+
  def FeaturePostRAScheduler : SubtargetFeature<"use-postra-scheduler",
      "UsePostRAScheduler", "true", "Schedule again after register allocation">;
  
diff --git a/llvm/lib/Target/RISCV/RISCVISelLowering.cpp b/llvm/lib/Target/RISCV/RISCVISelLowering.cpp

index d46093b9e260a202d69980a09eebe18fe55d2e55..3fe7ddfdd4279163b0730b6cf59d41dab8171599 100644 (file)
--- a/llvm/lib/Target/RISCV/RISCVISelLowering.cpp
+++ b/llvm/lib/Target/RISCV/RISCVISelLowering.cpp
@@ -1883,7 +1883,8 @@ bool RISCVTargetLowering::shouldConvertConstantLoadToIntImm(const APInt &Imm,
    // replace. If we don't support unaligned scalar mem, prefer the constant
    // pool.
    // TODO: Can the caller pass down the alignment?
-  if (!Subtarget.hasFastUnalignedAccess())
+  if (!Subtarget.hasFastUnalignedAccess() &&
+      !Subtarget.enableUnalignedScalarMem())
      return true;
  
    // Prefer to keep the load if it would require many instructions.
@@ -19772,8 +19773,10 @@ bool RISCVTargetLowering::allowsMisalignedMemoryAccesses(
      unsigned *Fast) const {
    if (!VT.isVector()) {
      if (Fast)
-      *Fast = Subtarget.hasFastUnalignedAccess();
-    return Subtarget.hasFastUnalignedAccess();
+      *Fast = Subtarget.hasFastUnalignedAccess() ||
+              Subtarget.enableUnalignedScalarMem();
+    return Subtarget.hasFastUnalignedAccess() ||
+           Subtarget.enableUnalignedScalarMem();
    }
  
    // All vector implementations must support element alignment
diff --git a/llvm/test/CodeGen/RISCV/memcpy-inline.ll b/llvm/test/CodeGen/RISCV/memcpy-inline.ll

index 343695ee37da84d47e18135bf745b01c43102f30..709b8264b5833decad28e346270829db93317d1a 100644 (file)
--- a/llvm/test/CodeGen/RISCV/memcpy-inline.ll
+++ b/llvm/test/CodeGen/RISCV/memcpy-inline.ll
@@ -7,6 +7,10 @@
  ; RUN:   | FileCheck %s --check-prefixes=RV32-BOTH,RV32-FAST
  ; RUN: llc < %s -mtriple=riscv64 -mattr=+fast-unaligned-access \
  ; RUN:   | FileCheck %s --check-prefixes=RV64-BOTH,RV64-FAST
+; RUN: llc < %s -mtriple=riscv32 -mattr=+unaligned-scalar-mem \
+; RUN:   | FileCheck %s --check-prefixes=RV32-BOTH,RV32-FAST
+; RUN: llc < %s -mtriple=riscv64 -mattr=+unaligned-scalar-mem \
+; RUN:   | FileCheck %s --check-prefixes=RV64-BOTH,RV64-FAST
  
  ; ----------------------------------------------------------------------
  ; Fully unaligned cases
diff --git a/llvm/test/CodeGen/RISCV/memcpy.ll b/llvm/test/CodeGen/RISCV/memcpy.ll

index 12ec0881b20d9feec44c68968258a85098c640bb..f8f5d25947d7f8dc27704d1bedeb5d8ac55ef7a3 100644 (file)
--- a/llvm/test/CodeGen/RISCV/memcpy.ll
+++ b/llvm/test/CodeGen/RISCV/memcpy.ll
@@ -7,6 +7,10 @@
  ; RUN:   | FileCheck %s --check-prefixes=RV32-BOTH,RV32-FAST
  ; RUN: llc < %s -mtriple=riscv64 -mattr=+fast-unaligned-access \
  ; RUN:   | FileCheck %s --check-prefixes=RV64-BOTH,RV64-FAST
+; RUN: llc < %s -mtriple=riscv32 -mattr=+unaligned-scalar-mem \
+; RUN:   | FileCheck %s --check-prefixes=RV32-BOTH,RV32-FAST
+; RUN: llc < %s -mtriple=riscv64 -mattr=+unaligned-scalar-mem \
+; RUN:   | FileCheck %s --check-prefixes=RV64-BOTH,RV64-FAST
  %struct.x = type { i8, i8, i8, i8, i8, i8, i8, i8, i8, i8, i8 }
  
  @src = external dso_local global %struct.x
diff --git a/llvm/test/CodeGen/RISCV/memset-inline.ll b/llvm/test/CodeGen/RISCV/memset-inline.ll

index cc22b77c641e272a353379dd204f718014458a8c..e131a3480c89e63f6ee36c3a77b22b1134c799e0 100644 (file)
--- a/llvm/test/CodeGen/RISCV/memset-inline.ll
+++ b/llvm/test/CodeGen/RISCV/memset-inline.ll
@@ -7,6 +7,10 @@
  ; RUN:   | FileCheck %s --check-prefixes=RV32-BOTH,RV32-FAST
  ; RUN: llc < %s -mtriple=riscv64 -mattr=+m,+fast-unaligned-access \
  ; RUN:   | FileCheck %s --check-prefixes=RV64-BOTH,RV64-FAST
+; RUN: llc < %s -mtriple=riscv32 -mattr=+m,+unaligned-scalar-mem \
+; RUN:   | FileCheck %s --check-prefixes=RV32-BOTH,RV32-FAST
+; RUN: llc < %s -mtriple=riscv64 -mattr=+m,+unaligned-scalar-mem \
+; RUN:   | FileCheck %s --check-prefixes=RV64-BOTH,RV64-FAST
  %struct.x = type { i8, i8, i8, i8, i8, i8, i8, i8, i8, i8, i8 }
  
  declare void @llvm.memset.p0.i64(ptr nocapture, i8, i64, i1) nounwind
diff --git a/llvm/test/CodeGen/RISCV/pr56110.ll b/llvm/test/CodeGen/RISCV/pr56110.ll

index c795b17419f564edb83f584946f5e90a1a52e5a4..fcf3f691d56e07ba3846b40de64ac27b2a045efc 100644 (file)
--- a/llvm/test/CodeGen/RISCV/pr56110.ll
+++ b/llvm/test/CodeGen/RISCV/pr56110.ll
@@ -1,6 +1,7 @@
  ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
  ; RUN: llc < %s -mtriple=riscv32 | FileCheck %s
  ; RUN: llc < %s -mtriple=riscv32 -mattr=+fast-unaligned-access | FileCheck %s
+; RUN: llc < %s -mtriple=riscv32 -mattr=+unaligned-scalar-mem | FileCheck %s
  
  define void @foo_set(ptr nocapture noundef %a, i32 noundef %v) {
  ; CHECK-LABEL: foo_set:
diff --git a/llvm/test/CodeGen/RISCV/unaligned-load-store.ll b/llvm/test/CodeGen/RISCV/unaligned-load-store.ll

index 599b0d08629eaff2eaac2a2d65e1a94b01400724..641686dce97f697d5c4910e3ae6d37d344ae1b26 100644 (file)
--- a/llvm/test/CodeGen/RISCV/unaligned-load-store.ll
+++ b/llvm/test/CodeGen/RISCV/unaligned-load-store.ll
@@ -7,6 +7,10 @@
  ; RUN:   | FileCheck -check-prefixes=ALL,FAST,RV32I-FAST %s
  ; RUN: llc -mtriple=riscv64 -mattr=+fast-unaligned-access -verify-machineinstrs < %s \
  ; RUN:   | FileCheck -check-prefixes=ALL,FAST,RV64I-FAST %s
+; RUN: llc -mtriple=riscv32 -mattr=+unaligned-scalar-mem -verify-machineinstrs < %s \
+; RUN:   | FileCheck -check-prefixes=ALL,FAST,RV32I-FAST %s
+; RUN: llc -mtriple=riscv64 -mattr=+unaligned-scalar-mem -verify-machineinstrs < %s \
+; RUN:   | FileCheck -check-prefixes=ALL,FAST,RV64I-FAST %s
  
  ; A collection of cases showing codegen for unaligned loads and stores
author	Craig Topper <craig.topper@sifive.com>
	Thu, 16 May 2024 19:27:05 +0000 (12:27 -0700)
committer	Tom Stellard <tstellar@redhat.com>
	Fri, 17 May 2024 20:22:27 +0000 (13:22 -0700)
llvm/lib/Target/RISCV/RISCVExpandPseudoInsts.cpp		patch | blob | history
llvm/lib/Target/RISCV/RISCVFeatures.td		patch | blob | history
llvm/lib/Target/RISCV/RISCVISelLowering.cpp		patch | blob | history
llvm/test/CodeGen/RISCV/memcpy-inline.ll		patch | blob | history
llvm/test/CodeGen/RISCV/memcpy.ll		patch | blob | history
llvm/test/CodeGen/RISCV/memset-inline.ll		patch | blob | history
llvm/test/CodeGen/RISCV/pr56110.ll		patch | blob | history
llvm/test/CodeGen/RISCV/unaligned-load-store.ll		patch | blob | history