riscv: mm: execute local TLB flush after populating vmemmap
[platform/kernel/linux-starfive.git] / arch / riscv / mm / tlbflush.c
index 77be59a..bdee5de 100644 (file)
@@ -8,28 +8,50 @@
 
 static inline void local_flush_tlb_all_asid(unsigned long asid)
 {
-       __asm__ __volatile__ ("sfence.vma x0, %0"
-                       :
-                       : "r" (asid)
-                       : "memory");
+       if (asid != FLUSH_TLB_NO_ASID)
+               __asm__ __volatile__ ("sfence.vma x0, %0"
+                               :
+                               : "r" (asid)
+                               : "memory");
+       else
+               local_flush_tlb_all();
 }
 
 static inline void local_flush_tlb_page_asid(unsigned long addr,
                unsigned long asid)
 {
-       __asm__ __volatile__ ("sfence.vma %0, %1"
-                       :
-                       : "r" (addr), "r" (asid)
-                       : "memory");
+       if (asid != FLUSH_TLB_NO_ASID)
+               __asm__ __volatile__ ("sfence.vma %0, %1"
+                               :
+                               : "r" (addr), "r" (asid)
+                               : "memory");
+       else
+               local_flush_tlb_page(addr);
 }
 
-static inline void local_flush_tlb_range(unsigned long start,
-               unsigned long size, unsigned long stride)
+/*
+ * Flush entire TLB if number of entries to be flushed is greater
+ * than the threshold below.
+ */
+static unsigned long tlb_flush_all_threshold __read_mostly = 64;
+
+static void local_flush_tlb_range_threshold_asid(unsigned long start,
+                                                unsigned long size,
+                                                unsigned long stride,
+                                                unsigned long asid)
 {
-       if (size <= stride)
-               local_flush_tlb_page(start);
-       else
-               local_flush_tlb_all();
+       unsigned long nr_ptes_in_range = DIV_ROUND_UP(size, stride);
+       int i;
+
+       if (nr_ptes_in_range > tlb_flush_all_threshold) {
+               local_flush_tlb_all_asid(asid);
+               return;
+       }
+
+       for (i = 0; i < nr_ptes_in_range; ++i) {
+               local_flush_tlb_page_asid(start, asid);
+               start += stride;
+       }
 }
 
 static inline void local_flush_tlb_range_asid(unsigned long start,
@@ -37,8 +59,16 @@ static inline void local_flush_tlb_range_asid(unsigned long start,
 {
        if (size <= stride)
                local_flush_tlb_page_asid(start, asid);
-       else
+       else if (size == FLUSH_TLB_MAX_SIZE)
                local_flush_tlb_all_asid(asid);
+       else
+               local_flush_tlb_range_threshold_asid(start, size, stride, asid);
+}
+
+/* Flush a range of kernel pages without broadcasting */
+void local_flush_tlb_kernel_range(unsigned long start, unsigned long end)
+{
+       local_flush_tlb_range_asid(start, end - start, PAGE_SIZE, FLUSH_TLB_NO_ASID);
 }
 
 static void __ipi_flush_tlb_all(void *info)
@@ -51,7 +81,7 @@ void flush_tlb_all(void)
        if (riscv_use_ipi_for_rfence())
                on_each_cpu(__ipi_flush_tlb_all, NULL, 1);
        else
-               sbi_remote_sfence_vma(NULL, 0, -1);
+               sbi_remote_sfence_vma_asid(NULL, 0, FLUSH_TLB_MAX_SIZE, FLUSH_TLB_NO_ASID);
 }
 
 struct flush_tlb_range_data {
@@ -68,68 +98,62 @@ static void __ipi_flush_tlb_range_asid(void *info)
        local_flush_tlb_range_asid(d->start, d->size, d->stride, d->asid);
 }
 
-static void __ipi_flush_tlb_range(void *info)
-{
-       struct flush_tlb_range_data *d = info;
-
-       local_flush_tlb_range(d->start, d->size, d->stride);
-}
-
 static void __flush_tlb_range(struct mm_struct *mm, unsigned long start,
                              unsigned long size, unsigned long stride)
 {
        struct flush_tlb_range_data ftd;
-       struct cpumask *cmask = mm_cpumask(mm);
-       unsigned int cpuid;
+       const struct cpumask *cmask;
+       unsigned long asid = FLUSH_TLB_NO_ASID;
        bool broadcast;
 
-       if (cpumask_empty(cmask))
-               return;
+       if (mm) {
+               unsigned int cpuid;
+
+               cmask = mm_cpumask(mm);
+               if (cpumask_empty(cmask))
+                       return;
+
+               cpuid = get_cpu();
+               /* check if the tlbflush needs to be sent to other CPUs */
+               broadcast = cpumask_any_but(cmask, cpuid) < nr_cpu_ids;
+
+               if (static_branch_unlikely(&use_asid_allocator))
+                       asid = atomic_long_read(&mm->context.id) & asid_mask;
+       } else {
+               cmask = cpu_online_mask;
+               broadcast = true;
+       }
 
-       cpuid = get_cpu();
-       /* check if the tlbflush needs to be sent to other CPUs */
-       broadcast = cpumask_any_but(cmask, cpuid) < nr_cpu_ids;
-       if (static_branch_unlikely(&use_asid_allocator)) {
-               unsigned long asid = atomic_long_read(&mm->context.id) & asid_mask;
-
-               if (broadcast) {
-                       if (riscv_use_ipi_for_rfence()) {
-                               ftd.asid = asid;
-                               ftd.start = start;
-                               ftd.size = size;
-                               ftd.stride = stride;
-                               on_each_cpu_mask(cmask,
-                                                __ipi_flush_tlb_range_asid,
-                                                &ftd, 1);
-                       } else
-                               sbi_remote_sfence_vma_asid(cmask,
-                                                          start, size, asid);
-               } else {
-                       local_flush_tlb_range_asid(start, size, stride, asid);
-               }
+       if (broadcast) {
+               if (riscv_use_ipi_for_rfence()) {
+                       ftd.asid = asid;
+                       ftd.start = start;
+                       ftd.size = size;
+                       ftd.stride = stride;
+                       on_each_cpu_mask(cmask,
+                                        __ipi_flush_tlb_range_asid,
+                                        &ftd, 1);
+               } else
+                       sbi_remote_sfence_vma_asid(cmask,
+                                                  start, size, asid);
        } else {
-               if (broadcast) {
-                       if (riscv_use_ipi_for_rfence()) {
-                               ftd.asid = 0;
-                               ftd.start = start;
-                               ftd.size = size;
-                               ftd.stride = stride;
-                               on_each_cpu_mask(cmask,
-                                                __ipi_flush_tlb_range,
-                                                &ftd, 1);
-                       } else
-                               sbi_remote_sfence_vma(cmask, start, size);
-               } else {
-                       local_flush_tlb_range(start, size, stride);
-               }
+               local_flush_tlb_range_asid(start, size, stride, asid);
        }
 
-       put_cpu();
+       if (mm)
+               put_cpu();
 }
 
 void flush_tlb_mm(struct mm_struct *mm)
 {
-       __flush_tlb_range(mm, 0, -1, PAGE_SIZE);
+       __flush_tlb_range(mm, 0, FLUSH_TLB_MAX_SIZE, PAGE_SIZE);
+}
+
+void flush_tlb_mm_range(struct mm_struct *mm,
+                       unsigned long start, unsigned long end,
+                       unsigned int page_size)
+{
+       __flush_tlb_range(mm, start, end - start, page_size);
 }
 
 void flush_tlb_page(struct vm_area_struct *vma, unsigned long addr)
@@ -142,6 +166,12 @@ void flush_tlb_range(struct vm_area_struct *vma, unsigned long start,
 {
        __flush_tlb_range(vma->vm_mm, start, end - start, PAGE_SIZE);
 }
+
+void flush_tlb_kernel_range(unsigned long start, unsigned long end)
+{
+       __flush_tlb_range(NULL, start, end - start, PAGE_SIZE);
+}
+
 #ifdef CONFIG_TRANSPARENT_HUGEPAGE
 void flush_pmd_tlb_range(struct vm_area_struct *vma, unsigned long start,
                        unsigned long end)