Merge branch 'akpm' (patches from Andrew)

author Linus Torvalds <torvalds@linux-foundation.org>

Fri, 7 Aug 2020 18:39:33 +0000 (11:39 -0700)

committer Linus Torvalds <torvalds@linux-foundation.org>

Fri, 7 Aug 2020 18:39:33 +0000 (11:39 -0700)
author Linus Torvalds <torvalds@linux-foundation.org>
Fri, 7 Aug 2020 18:39:33 +0000 (11:39 -0700)
committer Linus Torvalds <torvalds@linux-foundation.org>
Fri, 7 Aug 2020 18:39:33 +0000 (11:39 -0700)
diff --combined Documentation/admin-guide/kernel-parameters.txt

index 00b993a,c955522..98ea67f
--- 1/Documentation/admin-guide/kernel-parameters.txt
--- 2/Documentation/admin-guide/kernel-parameters.txt
+++ b/Documentation/admin-guide/kernel-parameters.txt
@@@ -916,10 -916,6 +916,10 @@@
         disable_radix   [PPC]
                         Disable RADIX MMU mode on POWER9
   
+ +      radix_hcall_invalidate=on  [PPC/PSERIES]
+ +                      Disable RADIX GTSE feature and use hcall for TLB
+ +                      invalidate.
+ +
         disable_tlbie   [PPC]
                         Disable TLBIE instruction. Currently does not work
                         with KVM, with HASH MMU, or with coherent accelerators.
@@@ -4693,7 -4689,7 +4693,7 @@@
                         fragmentation.  Defaults to 1 for systems with
                         more than 32MB of RAM, 0 otherwise.
   
-       slub_debug[=options[,slabs]]    [MM, SLUB]
+       slub_debug[=options[,slabs][;[options[,slabs]]...]      [MM, SLUB]
                         Enabling slub_debug allows one to determine the
                         culprit if slab objects become corrupted. Enabling
                         slub_debug can create guard zones around objects and
diff --combined arch/m68k/mm/mcfmmu.c

index a3e7e4e,7068126..2b9cb4a
--- 1/arch/m68k/mm/mcfmmu.c
--- 2/arch/m68k/mm/mcfmmu.c
+++ b/arch/m68k/mm/mcfmmu.c
@@@ -20,6 -20,7 +20,7 @@@
   #include <asm/mmu_context.h>
   #include <asm/mcf_pgalloc.h>
   #include <asm/tlbflush.h>
+ #include <asm/pgalloc.h>
   
   #define KMAPAREA(x)   ((x >= VMALLOC_START) && (x < KMAP_END))
   
@@@ -39,6 -40,7 +40,6 @@@ void __init paging_init(void
         unsigned long address, size;
         unsigned long next_pgtable, bootmem_end;
         unsigned long max_zone_pfn[MAX_NR_ZONES] = { 0 };
- -      enum zone_type zone;
         int i;
   
         empty_zero_page = (void *) memblock_alloc(PAGE_SIZE, PAGE_SIZE);
@@@ -213,6 -215,11 +214,6 @@@ void __init cf_mmu_context_init(void
   
   /*
    * Steal a context from a task that has one at the moment.
- - * This is only used on 8xx and 4xx and we presently assume that
- - * they don't do SMP.  If they do then thicfpgalloc.hs will have to check
- - * whether the MM we steal is in use.
- - * We also assume that this is only used on systems that don't
- - * use an MMU hash table - this is true for 8xx and 4xx.
    * This isn't an LRU system, it just frees up each context in
    * turn (sort-of pseudo-random replacement :).  This would be the
    * place to implement an LRU scheme if anyone was motivated to do it.
diff --combined arch/powerpc/mm/init_32.c

index bf1717f,7ea19dc..02c7db4
--- 1/arch/powerpc/mm/init_32.c
--- 2/arch/powerpc/mm/init_32.c
+++ b/arch/powerpc/mm/init_32.c
@@@ -29,7 -29,6 +29,6 @@@
   #include <linux/slab.h>
   #include <linux/hugetlb.h>
   
- #include <asm/pgalloc.h>
   #include <asm/prom.h>
   #include <asm/io.h>
   #include <asm/mmu.h>
@@@ -171,8 -170,6 +170,8 @@@ void __init MMU_init(void
         btext_unmap();
   #endif
   
+ +      kasan_mmu_init();
+ +
         setup_kup();
   
         /* Shortly after that, the entire linear mapping will be available */
diff --combined arch/powerpc/mm/init_64.c

index 4ae5fc0,3fd504d..02e127f
--- 1/arch/powerpc/mm/init_64.c
--- 2/arch/powerpc/mm/init_64.c
+++ b/arch/powerpc/mm/init_64.c
@@@ -225,12 -225,12 +225,12 @@@ int __meminit vmemmap_populate(unsigne
                  * fall back to system memory if the altmap allocation fail.
                  */
                 if (altmap && !altmap_cross_boundary(altmap, start, page_size)) {
-                       p = altmap_alloc_block_buf(page_size, altmap);
+                       p = vmemmap_alloc_block_buf(page_size, node, altmap);
                         if (!p)
                                 pr_debug("altmap block allocation failed, falling back to system memory");
                 }
                 if (!p)
-                       p = vmemmap_alloc_block_buf(page_size, node);
+                       p = vmemmap_alloc_block_buf(page_size, node, NULL);
                 if (!p)
                         return -ENOMEM;
   
@@@ -406,15 -406,13 +406,15 @@@ static void __init early_check_vec5(voi
                 }
                 if (!(vec5[OV5_INDX(OV5_RADIX_GTSE)] &
                                                 OV5_FEAT(OV5_RADIX_GTSE))) {
- -                      pr_warn("WARNING: Hypervisor doesn't support RADIX with GTSE\n");
- -              }
+ +                      cur_cpu_spec->mmu_features &= ~MMU_FTR_GTSE;
+ +              } else
+ +                      cur_cpu_spec->mmu_features |= MMU_FTR_GTSE;
                 /* Do radix anyway - the hypervisor said we had to */
                 cur_cpu_spec->mmu_features |= MMU_FTR_TYPE_RADIX;
         } else if (mmu_supported == OV5_FEAT(OV5_MMU_HASH)) {
                 /* Hypervisor only supports hash - disable radix */
                 cur_cpu_spec->mmu_features &= ~MMU_FTR_TYPE_RADIX;
+ +              cur_cpu_spec->mmu_features &= ~MMU_FTR_GTSE;
         }
   }
   
diff --combined arch/powerpc/mm/mem.c

index 9dafc63,ec68c9e..42e2587
--- 1/arch/powerpc/mm/mem.c
--- 2/arch/powerpc/mm/mem.c
+++ b/arch/powerpc/mm/mem.c
@@@ -34,7 -34,6 +34,6 @@@
   #include <linux/dma-direct.h>
   #include <linux/kprobes.h>
   
- #include <asm/pgalloc.h>
   #include <asm/prom.h>
   #include <asm/io.h>
   #include <asm/mmu_context.h>
@@@ -127,6 -126,8 +126,6 @@@ int __ref arch_add_memory(int nid, u64 
         unsigned long nr_pages = size >> PAGE_SHIFT;
         int rc;
   
- -      resize_hpt_for_hotplug(memblock_phys_mem_size());
- -
         start = (unsigned long)__va(start);
         rc = create_section_mapping(start, start + size, nid,
                                     params->pgprot);
@@@ -159,6 -160,9 +158,6 @@@ void __ref arch_remove_memory(int nid, 
          * hit that section of memory
          */
         vm_unmap_aliases();
- -
- -      if (resize_hpt_for_hotplug(memblock_phys_mem_size()) == -ENOSPC)
- -              pr_warn("Hash collision while resizing HPT\n");
   }
   #endif
   
@@@ -179,8 -183,6 +178,6 @@@ void __init mem_topology_setup(void
   
   void __init initmem_init(void)
   {
-       /* XXX need to clip this if using highmem? */
-       sparse_memory_present_with_active_regions(0);
         sparse_init();
   }
   
diff --combined arch/powerpc/mm/numa.c

index 058fee9,03a81d6..1f61fa2
--- 1/arch/powerpc/mm/numa.c
--- 2/arch/powerpc/mm/numa.c
+++ b/arch/powerpc/mm/numa.c
@@@ -221,8 -221,7 +221,8 @@@ static void initialize_distance_lookup_
         }
   }
   
- -/* Returns nid in the range [0..MAX_NUMNODES-1], or -1 if no useful numa
+ +/*
+ + * Returns nid in the range [0..nr_node_ids], or -1 if no useful NUMA
    * info is found.
    */
   static int associativity_to_nid(const __be32 *associativity)
@@@ -236,7 -235,7 +236,7 @@@
                 nid = of_read_number(&associativity[min_common_depth], 1);
   
         /* POWER4 LPAR uses 0xffff as invalid node */
- -      if (nid == 0xffff || nid >= MAX_NUMNODES)
+ +      if (nid == 0xffff || nid >= nr_node_ids)
                 nid = NUMA_NO_NODE;
   
         if (nid > 0 &&
@@@ -449,7 -448,7 +449,7 @@@ static int of_drconf_to_nid_single(stru
                 index = lmb->aa_index * aa.array_sz + min_common_depth - 1;
                 nid = of_read_number(&aa.arrays[index], 1);
   
- -              if (nid == 0xffff || nid >= MAX_NUMNODES)
+ +              if (nid == 0xffff || nid >= nr_node_ids)
                         nid = default_nid;
   
                 if (nid > 0) {
@@@ -645,9 -644,8 +645,9 @@@ static inline int __init read_usm_range
    * Extract NUMA information from the ibm,dynamic-reconfiguration-memory
    * node.  This assumes n_mem_{addr,size}_cells have been set.
    */
- -static void __init numa_setup_drmem_lmb(struct drmem_lmb *lmb,
- -                                      const __be32 **usm)
+ +static int __init numa_setup_drmem_lmb(struct drmem_lmb *lmb,
+ +                                      const __be32 **usm,
+ +                                      void *data)
   {
         unsigned int ranges, is_kexec_kdump = 0;
         unsigned long base, size, sz;
@@@ -659,7 -657,7 +659,7 @@@
          */
         if ((lmb->flags & DRCONF_MEM_RESERVED)
             || !(lmb->flags & DRCONF_MEM_ASSIGNED))
- -              return;
+ +              return 0;
   
         if (*usm)
                 is_kexec_kdump = 1;
@@@ -671,7 -669,7 +671,7 @@@
         if (is_kexec_kdump) {
                 ranges = read_usm_ranges(usm);
                 if (!ranges) /* there are no (base, size) duple */
- -                      return;
+ +                      return 0;
         }
   
         do {
@@@ -688,8 -686,6 +688,8 @@@
                 if (sz)
                         memblock_set_node(base, sz, &memblock.memory, nid);
         } while (--ranges);
+ +
+ +      return 0;
   }
   
   static int __init parse_numa_properties(void)
@@@ -791,7 -787,7 +791,7 @@@ new_range
          */
         memory = of_find_node_by_path("/ibm,dynamic-reconfiguration-memory");
         if (memory) {
- -              walk_drmem_lmbs(memory, numa_setup_drmem_lmb);
+ +              walk_drmem_lmbs(memory, NULL, numa_setup_drmem_lmb);
                 of_node_put(memory);
         }
   
@@@ -953,7 -949,6 +953,6 @@@ void __init initmem_init(void
   
                 get_pfn_range_for_nid(nid, &start_pfn, &end_pfn);
                 setup_node_data(nid, start_pfn, end_pfn);
-               sparse_memory_present_with_active_regions(nid);
         }
   
         sparse_init();
@@@ -988,6 -983,28 +987,6 @@@ static int __init early_numa(char *p
   }
   early_param("numa", early_numa);
   
- -/*
- - * The platform can inform us through one of several mechanisms
- - * (post-migration device tree updates, PRRN or VPHN) that the NUMA
- - * assignment of a resource has changed. This controls whether we act
- - * on that. Disabled by default.
- - */
- -static bool topology_updates_enabled;
- -
- -static int __init early_topology_updates(char *p)
- -{
- -      if (!p)
- -              return 0;
- -
- -      if (!strcmp(p, "on")) {
- -              pr_warn("Caution: enabling topology updates\n");
- -              topology_updates_enabled = true;
- -      }
- -
- -      return 0;
- -}
- -early_param("topology_updates", early_topology_updates);
- -
   #ifdef CONFIG_MEMORY_HOTPLUG
   /*
    * Find the node associated with a hot added memory section for
@@@ -1126,9 -1143,98 +1125,9 @@@ u64 memory_hotplug_max(void
   
   /* Virtual Processor Home Node (VPHN) support */
   #ifdef CONFIG_PPC_SPLPAR
- -struct topology_update_data {
- -      struct topology_update_data *next;
- -      unsigned int cpu;
- -      int old_nid;
- -      int new_nid;
- -};
- -
- -#define TOPOLOGY_DEF_TIMER_SECS       60
- -
- -static u8 vphn_cpu_change_counts[NR_CPUS][MAX_DISTANCE_REF_POINTS];
- -static cpumask_t cpu_associativity_changes_mask;
- -static int vphn_enabled;
- -static int prrn_enabled;
- -static void reset_topology_timer(void);
- -static int topology_timer_secs = 1;
   static int topology_inited;
   
   /*
- - * Change polling interval for associativity changes.
- - */
- -int timed_topology_update(int nsecs)
- -{
- -      if (vphn_enabled) {
- -              if (nsecs > 0)
- -                      topology_timer_secs = nsecs;
- -              else
- -                      topology_timer_secs = TOPOLOGY_DEF_TIMER_SECS;
- -
- -              reset_topology_timer();
- -      }
- -
- -      return 0;
- -}
- -
- -/*
- - * Store the current values of the associativity change counters in the
- - * hypervisor.
- - */
- -static void setup_cpu_associativity_change_counters(void)
- -{
- -      int cpu;
- -
- -      /* The VPHN feature supports a maximum of 8 reference points */
- -      BUILD_BUG_ON(MAX_DISTANCE_REF_POINTS > 8);
- -
- -      for_each_possible_cpu(cpu) {
- -              int i;
- -              u8 *counts = vphn_cpu_change_counts[cpu];
- -              volatile u8 *hypervisor_counts = lppaca_of(cpu).vphn_assoc_counts;
- -
- -              for (i = 0; i < distance_ref_points_depth; i++)
- -                      counts[i] = hypervisor_counts[i];
- -      }
- -}
- -
- -/*
- - * The hypervisor maintains a set of 8 associativity change counters in
- - * the VPA of each cpu that correspond to the associativity levels in the
- - * ibm,associativity-reference-points property. When an associativity
- - * level changes, the corresponding counter is incremented.
- - *
- - * Set a bit in cpu_associativity_changes_mask for each cpu whose home
- - * node associativity levels have changed.
- - *
- - * Returns the number of cpus with unhandled associativity changes.
- - */
- -static int update_cpu_associativity_changes_mask(void)
- -{
- -      int cpu;
- -      cpumask_t *changes = &cpu_associativity_changes_mask;
- -
- -      for_each_possible_cpu(cpu) {
- -              int i, changed = 0;
- -              u8 *counts = vphn_cpu_change_counts[cpu];
- -              volatile u8 *hypervisor_counts = lppaca_of(cpu).vphn_assoc_counts;
- -
- -              for (i = 0; i < distance_ref_points_depth; i++) {
- -                      if (hypervisor_counts[i] != counts[i]) {
- -                              counts[i] = hypervisor_counts[i];
- -                              changed = 1;
- -                      }
- -              }
- -              if (changed) {
- -                      cpumask_or(changes, changes, cpu_sibling_mask(cpu));
- -                      cpu = cpu_last_thread_sibling(cpu);
- -              }
- -      }
- -
- -      return cpumask_weight(changes);
- -}
- -
- -/*
    * Retrieve the new associativity information for a virtual processor's
    * home node.
    */
@@@ -1143,6 -1249,7 +1142,6 @@@ static long vphn_get_associativity(unsi
         switch (rc) {
         case H_SUCCESS:
                 dbg("VPHN hcall succeeded. Reset polling...\n");
- -              timed_topology_update(0);
                 goto out;
   
         case H_FUNCTION:
@@@ -1161,6 -1268,8 +1160,6 @@@
                         , rc);
                 break;
         }
- -
- -      stop_topology_update();
   out:
         return rc;
   }
@@@ -1204,8 -1313,380 +1203,8 @@@ int find_and_online_cpu_nid(int cpu
         return new_nid;
   }
   
- -/*
- - * Update the CPU maps and sysfs entries for a single CPU when its NUMA
- - * characteristics change. This function doesn't perform any locking and is
- - * only safe to call from stop_machine().
- - */
- -static int update_cpu_topology(void *data)
- -{
- -      struct topology_update_data *update;
- -      unsigned long cpu;
- -
- -      if (!data)
- -              return -EINVAL;
- -
- -      cpu = smp_processor_id();
- -
- -      for (update = data; update; update = update->next) {
- -              int new_nid = update->new_nid;
- -              if (cpu != update->cpu)
- -                      continue;
- -
- -              unmap_cpu_from_node(cpu);
- -              map_cpu_to_node(cpu, new_nid);
- -              set_cpu_numa_node(cpu, new_nid);
- -              set_cpu_numa_mem(cpu, local_memory_node(new_nid));
- -              vdso_getcpu_init();
- -      }
- -
- -      return 0;
- -}
- -
- -static int update_lookup_table(void *data)
- -{
- -      struct topology_update_data *update;
- -
- -      if (!data)
- -              return -EINVAL;
- -
- -      /*
- -       * Upon topology update, the numa-cpu lookup table needs to be updated
- -       * for all threads in the core, including offline CPUs, to ensure that
- -       * future hotplug operations respect the cpu-to-node associativity
- -       * properly.
- -       */
- -      for (update = data; update; update = update->next) {
- -              int nid, base, j;
- -
- -              nid = update->new_nid;
- -              base = cpu_first_thread_sibling(update->cpu);
- -
- -              for (j = 0; j < threads_per_core; j++) {
- -                      update_numa_cpu_lookup_table(base + j, nid);
- -              }
- -      }
- -
- -      return 0;
- -}
- -
- -/*
- - * Update the node maps and sysfs entries for each cpu whose home node
- - * has changed. Returns 1 when the topology has changed, and 0 otherwise.
- - *
- - * cpus_locked says whether we already hold cpu_hotplug_lock.
- - */
- -int numa_update_cpu_topology(bool cpus_locked)
- -{
- -      unsigned int cpu, sibling, changed = 0;
- -      struct topology_update_data *updates, *ud;
- -      cpumask_t updated_cpus;
- -      struct device *dev;
- -      int weight, new_nid, i = 0;
- -
- -      if (!prrn_enabled && !vphn_enabled && topology_inited)
- -              return 0;
- -
- -      weight = cpumask_weight(&cpu_associativity_changes_mask);
- -      if (!weight)
- -              return 0;
- -
- -      updates = kcalloc(weight, sizeof(*updates), GFP_KERNEL);
- -      if (!updates)
- -              return 0;
- -
- -      cpumask_clear(&updated_cpus);
- -
- -      for_each_cpu(cpu, &cpu_associativity_changes_mask) {
- -              /*
- -               * If siblings aren't flagged for changes, updates list
- -               * will be too short. Skip on this update and set for next
- -               * update.
- -               */
- -              if (!cpumask_subset(cpu_sibling_mask(cpu),
- -                                      &cpu_associativity_changes_mask)) {
- -                      pr_info("Sibling bits not set for associativity "
- -                                      "change, cpu%d\n", cpu);
- -                      cpumask_or(&cpu_associativity_changes_mask,
- -                                      &cpu_associativity_changes_mask,
- -                                      cpu_sibling_mask(cpu));
- -                      cpu = cpu_last_thread_sibling(cpu);
- -                      continue;
- -              }
- -
- -              new_nid = find_and_online_cpu_nid(cpu);
- -
- -              if (new_nid == numa_cpu_lookup_table[cpu]) {
- -                      cpumask_andnot(&cpu_associativity_changes_mask,
- -                                      &cpu_associativity_changes_mask,
- -                                      cpu_sibling_mask(cpu));
- -                      dbg("Assoc chg gives same node %d for cpu%d\n",
- -                                      new_nid, cpu);
- -                      cpu = cpu_last_thread_sibling(cpu);
- -                      continue;
- -              }
- -
- -              for_each_cpu(sibling, cpu_sibling_mask(cpu)) {
- -                      ud = &updates[i++];
- -                      ud->next = &updates[i];
- -                      ud->cpu = sibling;
- -                      ud->new_nid = new_nid;
- -                      ud->old_nid = numa_cpu_lookup_table[sibling];
- -                      cpumask_set_cpu(sibling, &updated_cpus);
- -              }
- -              cpu = cpu_last_thread_sibling(cpu);
- -      }
- -
- -      /*
- -       * Prevent processing of 'updates' from overflowing array
- -       * where last entry filled in a 'next' pointer.
- -       */
- -      if (i)
- -              updates[i-1].next = NULL;
- -
- -      pr_debug("Topology update for the following CPUs:\n");
- -      if (cpumask_weight(&updated_cpus)) {
- -              for (ud = &updates[0]; ud; ud = ud->next) {
- -                      pr_debug("cpu %d moving from node %d "
- -                                        "to %d\n", ud->cpu,
- -                                        ud->old_nid, ud->new_nid);
- -              }
- -      }
- -
- -      /*
- -       * In cases where we have nothing to update (because the updates list
- -       * is too short or because the new topology is same as the old one),
- -       * skip invoking update_cpu_topology() via stop-machine(). This is
- -       * necessary (and not just a fast-path optimization) since stop-machine
- -       * can end up electing a random CPU to run update_cpu_topology(), and
- -       * thus trick us into setting up incorrect cpu-node mappings (since
- -       * 'updates' is kzalloc()'ed).
- -       *
- -       * And for the similar reason, we will skip all the following updating.
- -       */
- -      if (!cpumask_weight(&updated_cpus))
- -              goto out;
- -
- -      if (cpus_locked)
- -              stop_machine_cpuslocked(update_cpu_topology, &updates[0],
- -                                      &updated_cpus);
- -      else
- -              stop_machine(update_cpu_topology, &updates[0], &updated_cpus);
- -
- -      /*
- -       * Update the numa-cpu lookup table with the new mappings, even for
- -       * offline CPUs. It is best to perform this update from the stop-
- -       * machine context.
- -       */
- -      if (cpus_locked)
- -              stop_machine_cpuslocked(update_lookup_table, &updates[0],
- -                                      cpumask_of(raw_smp_processor_id()));
- -      else
- -              stop_machine(update_lookup_table, &updates[0],
- -                           cpumask_of(raw_smp_processor_id()));
- -
- -      for (ud = &updates[0]; ud; ud = ud->next) {
- -              unregister_cpu_under_node(ud->cpu, ud->old_nid);
- -              register_cpu_under_node(ud->cpu, ud->new_nid);
- -
- -              dev = get_cpu_device(ud->cpu);
- -              if (dev)
- -                      kobject_uevent(&dev->kobj, KOBJ_CHANGE);
- -              cpumask_clear_cpu(ud->cpu, &cpu_associativity_changes_mask);
- -              changed = 1;
- -      }
- -
- -out:
- -      kfree(updates);
- -      return changed;
- -}
- -
- -int arch_update_cpu_topology(void)
- -{
- -      return numa_update_cpu_topology(true);
- -}
- -
- -static void topology_work_fn(struct work_struct *work)
- -{
- -      rebuild_sched_domains();
- -}
- -static DECLARE_WORK(topology_work, topology_work_fn);
- -
- -static void topology_schedule_update(void)
- -{
- -      schedule_work(&topology_work);
- -}
- -
- -static void topology_timer_fn(struct timer_list *unused)
- -{
- -      if (prrn_enabled && cpumask_weight(&cpu_associativity_changes_mask))
- -              topology_schedule_update();
- -      else if (vphn_enabled) {
- -              if (update_cpu_associativity_changes_mask() > 0)
- -                      topology_schedule_update();
- -              reset_topology_timer();
- -      }
- -}
- -static struct timer_list topology_timer;
- -
- -static void reset_topology_timer(void)
- -{
- -      if (vphn_enabled)
- -              mod_timer(&topology_timer, jiffies + topology_timer_secs * HZ);
- -}
- -
- -#ifdef CONFIG_SMP
- -
- -static int dt_update_callback(struct notifier_block *nb,
- -                              unsigned long action, void *data)
- -{
- -      struct of_reconfig_data *update = data;
- -      int rc = NOTIFY_DONE;
- -
- -      switch (action) {
- -      case OF_RECONFIG_UPDATE_PROPERTY:
- -              if (of_node_is_type(update->dn, "cpu") &&
- -                  !of_prop_cmp(update->prop->name, "ibm,associativity")) {
- -                      u32 core_id;
- -                      of_property_read_u32(update->dn, "reg", &core_id);
- -                      rc = dlpar_cpu_readd(core_id);
- -                      rc = NOTIFY_OK;
- -              }
- -              break;
- -      }
- -
- -      return rc;
- -}
- -
- -static struct notifier_block dt_update_nb = {
- -      .notifier_call = dt_update_callback,
- -};
- -
- -#endif
- -
- -/*
- - * Start polling for associativity changes.
- - */
- -int start_topology_update(void)
- -{
- -      int rc = 0;
- -
- -      if (!topology_updates_enabled)
- -              return 0;
- -
- -      if (firmware_has_feature(FW_FEATURE_PRRN)) {
- -              if (!prrn_enabled) {
- -                      prrn_enabled = 1;
- -#ifdef CONFIG_SMP
- -                      rc = of_reconfig_notifier_register(&dt_update_nb);
- -#endif
- -              }
- -      }
- -      if (firmware_has_feature(FW_FEATURE_VPHN) &&
- -                 lppaca_shared_proc(get_lppaca())) {
- -              if (!vphn_enabled) {
- -                      vphn_enabled = 1;
- -                      setup_cpu_associativity_change_counters();
- -                      timer_setup(&topology_timer, topology_timer_fn,
- -                                  TIMER_DEFERRABLE);
- -                      reset_topology_timer();
- -              }
- -      }
- -
- -      pr_info("Starting topology update%s%s\n",
- -              (prrn_enabled ? " prrn_enabled" : ""),
- -              (vphn_enabled ? " vphn_enabled" : ""));
- -
- -      return rc;
- -}
- -
- -/*
- - * Disable polling for VPHN associativity changes.
- - */
- -int stop_topology_update(void)
- -{
- -      int rc = 0;
- -
- -      if (!topology_updates_enabled)
- -              return 0;
- -
- -      if (prrn_enabled) {
- -              prrn_enabled = 0;
- -#ifdef CONFIG_SMP
- -              rc = of_reconfig_notifier_unregister(&dt_update_nb);
- -#endif
- -      }
- -      if (vphn_enabled) {
- -              vphn_enabled = 0;
- -              rc = del_timer_sync(&topology_timer);
- -      }
- -
- -      pr_info("Stopping topology update\n");
- -
- -      return rc;
- -}
- -
- -int prrn_is_enabled(void)
- -{
- -      return prrn_enabled;
- -}
- -
- -static int topology_read(struct seq_file *file, void *v)
- -{
- -      if (vphn_enabled || prrn_enabled)
- -              seq_puts(file, "on\n");
- -      else
- -              seq_puts(file, "off\n");
- -
- -      return 0;
- -}
- -
- -static int topology_open(struct inode *inode, struct file *file)
- -{
- -      return single_open(file, topology_read, NULL);
- -}
- -
- -static ssize_t topology_write(struct file *file, const char __user *buf,
- -                            size_t count, loff_t *off)
- -{
- -      char kbuf[4]; /* "on" or "off" plus null. */
- -      int read_len;
- -
- -      read_len = count < 3 ? count : 3;
- -      if (copy_from_user(kbuf, buf, read_len))
- -              return -EINVAL;
- -
- -      kbuf[read_len] = '\0';
- -
- -      if (!strncmp(kbuf, "on", 2)) {
- -              topology_updates_enabled = true;
- -              start_topology_update();
- -      } else if (!strncmp(kbuf, "off", 3)) {
- -              stop_topology_update();
- -              topology_updates_enabled = false;
- -      } else
- -              return -EINVAL;
- -
- -      return count;
- -}
- -
- -static const struct proc_ops topology_proc_ops = {
- -      .proc_read      = seq_read,
- -      .proc_write     = topology_write,
- -      .proc_open      = topology_open,
- -      .proc_release   = single_release,
- -};
- -
   static int topology_update_init(void)
   {
- -      start_topology_update();
- -
- -      if (vphn_enabled)
- -              topology_schedule_update();
- -
- -      if (!proc_create("powerpc/topology_updates", 0644, NULL, &topology_proc_ops))
- -              return -ENOMEM;
- -
         topology_inited = 1;
         return 0;
   }
diff --combined arch/powerpc/mm/ptdump/hashpagetable.c

index 5b8bd34,ff4b05a..ad6df9a
--- 1/arch/powerpc/mm/ptdump/hashpagetable.c
--- 2/arch/powerpc/mm/ptdump/hashpagetable.c
+++ b/arch/powerpc/mm/ptdump/hashpagetable.c
@@@ -17,10 -17,10 +17,10 @@@
   #include <linux/seq_file.h>
   #include <linux/const.h>
   #include <asm/page.h>
- #include <asm/pgalloc.h>
   #include <asm/plpar_wrappers.h>
   #include <linux/memblock.h>
   #include <asm/firmware.h>
+ #include <asm/pgalloc.h>
   
   struct pg_state {
         struct seq_file *seq;
@@@ -258,7 -258,7 +258,7 @@@ static int pseries_find(unsigned long e
         for (i = 0; i < HPTES_PER_GROUP; i += 4, hpte_group += 4) {
                 lpar_rc = plpar_pte_read_4(0, hpte_group, (void *)ptes);
   
- -              if (lpar_rc != H_SUCCESS)
+ +              if (lpar_rc)
                         continue;
                 for (j = 0; j < 4; j++) {
                         if (HPTE_V_COMPARE(ptes[j].v, want_v) &&
diff --combined arch/powerpc/mm/ptdump/ptdump.c

index c911cd7,f7ba13c..aca354f
--- 1/arch/powerpc/mm/ptdump/ptdump.c
--- 2/arch/powerpc/mm/ptdump/ptdump.c
+++ b/arch/powerpc/mm/ptdump/ptdump.c
@@@ -21,7 -21,6 +21,6 @@@
   #include <asm/fixmap.h>
   #include <linux/const.h>
   #include <asm/page.h>
- #include <asm/pgalloc.h>
   #include <asm/hugetlb.h>
   
   #include <mm/mmu_decl.h>
@@@ -74,10 -73,6 +73,10 @@@ struct addr_marker 
   
   static struct addr_marker address_markers[] = {
         { 0,    "Start of kernel VM" },
+ +#ifdef MODULES_VADDR
+ +      { 0,    "modules start" },
+ +      { 0,    "modules end" },
+ +#endif
         { 0,    "vmalloc() Area" },
         { 0,    "vmalloc() End" },
   #ifdef CONFIG_PPC64
@@@ -199,24 -194,6 +198,24 @@@ static void note_prot_wx(struct pg_stat
         st->wx_pages += (addr - st->start_address) / PAGE_SIZE;
   }
   
+ +static void note_page_update_state(struct pg_state *st, unsigned long addr,
+ +                                 unsigned int level, u64 val, unsigned long page_size)
+ +{
+ +      u64 flag = val & pg_level[level].mask;
+ +      u64 pa = val & PTE_RPN_MASK;
+ +
+ +      st->level = level;
+ +      st->current_flags = flag;
+ +      st->start_address = addr;
+ +      st->start_pa = pa;
+ +      st->page_size = page_size;
+ +
+ +      while (addr >= st->marker[1].start_address) {
+ +              st->marker++;
+ +              pt_dump_seq_printf(st->seq, "---[ %s ]---\n", st->marker->name);
+ +      }
+ +}
+ +
   static void note_page(struct pg_state *st, unsigned long addr,
                unsigned int level, u64 val, unsigned long page_size)
   {
@@@ -225,8 -202,13 +224,8 @@@
   
         /* At first no level is set */
         if (!st->level) {
- -              st->level = level;
- -              st->current_flags = flag;
- -              st->start_address = addr;
- -              st->start_pa = pa;
- -              st->last_pa = pa;
- -              st->page_size = page_size;
                 pt_dump_seq_printf(st->seq, "---[ %s ]---\n", st->marker->name);
+ +              note_page_update_state(st, addr, level, val, page_size);
         /*
          * Dump the section of virtual memory when:
          *   - the PTE flags from one entry to the next differs.
@@@ -258,9 -240,19 +257,9 @@@
                  * Address indicates we have passed the end of the
                  * current section of virtual memory
                  */
- -              while (addr >= st->marker[1].start_address) {
- -                      st->marker++;
- -                      pt_dump_seq_printf(st->seq, "---[ %s ]---\n", st->marker->name);
- -              }
- -              st->start_address = addr;
- -              st->start_pa = pa;
- -              st->last_pa = pa;
- -              st->page_size = page_size;
- -              st->current_flags = flag;
- -              st->level = level;
- -      } else {
- -              st->last_pa = pa;
+ +              note_page_update_state(st, addr, level, val, page_size);
         }
+ +      st->last_pa = pa;
   }
   
   static void walk_pte(struct pg_state *st, pmd_t *pmd, unsigned long start)
@@@ -355,15 -347,7 +354,15 @@@ static void populate_markers(void
   {
         int i = 0;
   
+ +#ifdef CONFIG_PPC64
         address_markers[i++].start_address = PAGE_OFFSET;
+ +#else
+ +      address_markers[i++].start_address = TASK_SIZE;
+ +#endif
+ +#ifdef MODULES_VADDR
+ +      address_markers[i++].start_address = MODULES_VADDR;
+ +      address_markers[i++].start_address = MODULES_END;
+ +#endif
         address_markers[i++].start_address = VMALLOC_START;
         address_markers[i++].start_address = VMALLOC_END;
   #ifdef CONFIG_PPC64
@@@ -400,7 -384,7 +399,7 @@@ static int ptdump_show(struct seq_file 
         struct pg_state st = {
                 .seq = m,
                 .marker = address_markers,
- -              .start_address = PAGE_OFFSET,
+ +              .start_address = IS_ENABLED(CONFIG_PPC64) ? PAGE_OFFSET : TASK_SIZE,
         };
   
   #ifdef CONFIG_PPC64
@@@ -444,7 -428,7 +443,7 @@@ void ptdump_check_wx(void
                 .seq = NULL,
                 .marker = address_markers,
                 .check_wx = true,
- -              .start_address = PAGE_OFFSET,
+ +              .start_address = IS_ENABLED(CONFIG_PPC64) ? PAGE_OFFSET : TASK_SIZE,
         };
   
   #ifdef CONFIG_PPC64
diff --combined arch/riscv/mm/init.c

index 50bcd9f,f6e6286..787c75f
--- 1/arch/riscv/mm/init.c
--- 2/arch/riscv/mm/init.c
+++ b/arch/riscv/mm/init.c
@@@ -541,46 -541,18 +541,45 @@@ void mark_rodata_ro(void
   }
   #endif
   
+ +static void __init resource_init(void)
+ +{
+ +      struct memblock_region *region;
+ +
+ +      for_each_memblock(memory, region) {
+ +              struct resource *res;
+ +
+ +              res = memblock_alloc(sizeof(struct resource), SMP_CACHE_BYTES);
+ +              if (!res)
+ +                      panic("%s: Failed to allocate %zu bytes\n", __func__,
+ +                            sizeof(struct resource));
+ +
+ +              if (memblock_is_nomap(region)) {
+ +                      res->name = "reserved";
+ +                      res->flags = IORESOURCE_MEM;
+ +              } else {
+ +                      res->name = "System RAM";
+ +                      res->flags = IORESOURCE_SYSTEM_RAM | IORESOURCE_BUSY;
+ +              }
+ +              res->start = __pfn_to_phys(memblock_region_memory_base_pfn(region));
+ +              res->end = __pfn_to_phys(memblock_region_memory_end_pfn(region)) - 1;
+ +
+ +              request_resource(&iomem_resource, res);
+ +      }
+ +}
+ +
   void __init paging_init(void)
   {
         setup_vm_final();
-       memblocks_present();
         sparse_init();
         setup_zero_page();
         zone_sizes_init();
+ +      resource_init();
   }
   
   #ifdef CONFIG_SPARSEMEM_VMEMMAP
   int __meminit vmemmap_populate(unsigned long start, unsigned long end, int node,
                                struct vmem_altmap *altmap)
   {
-       return vmemmap_populate_basepages(start, end, node);
+       return vmemmap_populate_basepages(start, end, node, NULL);
   }
   #endif
diff --combined arch/s390/kernel/ptrace.c

index a09b9e9,3c72a3b..11d2f7d
--- 1/arch/s390/kernel/ptrace.c
--- 2/arch/s390/kernel/ptrace.c
+++ b/arch/s390/kernel/ptrace.c
@@@ -25,7 -25,6 +25,6 @@@
   #include <linux/compat.h>
   #include <trace/syscall.h>
   #include <asm/page.h>
- #include <asm/pgalloc.h>
   #include <linux/uaccess.h>
   #include <asm/unistd.h>
   #include <asm/switch_to.h>
@@@ -945,14 -944,28 +944,14 @@@ asmlinkage void do_syscall_trace_exit(s
   
   static int s390_regs_get(struct task_struct *target,
                          const struct user_regset *regset,
- -                       unsigned int pos, unsigned int count,
- -                       void *kbuf, void __user *ubuf)
+ +                       struct membuf to)
   {
+ +      unsigned pos;
         if (target == current)
                 save_access_regs(target->thread.acrs);
   
- -      if (kbuf) {
- -              unsigned long *k = kbuf;
- -              while (count > 0) {
- -                      *k++ = __peek_user(target, pos);
- -                      count -= sizeof(*k);
- -                      pos += sizeof(*k);
- -              }
- -      } else {
- -              unsigned long __user *u = ubuf;
- -              while (count > 0) {
- -                      if (__put_user(__peek_user(target, pos), u++))
- -                              return -EFAULT;
- -                      count -= sizeof(*u);
- -                      pos += sizeof(*u);
- -              }
- -      }
+ +      for (pos = 0; pos < sizeof(s390_regs); pos += sizeof(long))
+ +              membuf_store(&to, __peek_user(target, pos));
         return 0;
   }
   
@@@ -993,8 -1006,8 +992,8 @@@ static int s390_regs_set(struct task_st
   }
   
   static int s390_fpregs_get(struct task_struct *target,
- -                         const struct user_regset *regset, unsigned int pos,
- -                         unsigned int count, void *kbuf, void __user *ubuf)
+ +                         const struct user_regset *regset,
+ +                         struct membuf to)
   {
         _s390_fp_regs fp_regs;
   
@@@ -1004,7 -1017,8 +1003,7 @@@
         fp_regs.fpc = target->thread.fpu.fpc;
         fpregs_store(&fp_regs, &target->thread.fpu);
   
- -      return user_regset_copyout(&pos, &count, &kbuf, &ubuf,
- -                                 &fp_regs, 0, -1);
+ +      return membuf_write(&to, &fp_regs, sizeof(fp_regs));
   }
   
   static int s390_fpregs_set(struct task_struct *target,
@@@ -1051,9 -1065,20 +1050,9 @@@
   
   static int s390_last_break_get(struct task_struct *target,
                                const struct user_regset *regset,
- -                             unsigned int pos, unsigned int count,
- -                             void *kbuf, void __user *ubuf)
+ +                             struct membuf to)
   {
- -      if (count > 0) {
- -              if (kbuf) {
- -                      unsigned long *k = kbuf;
- -                      *k = target->thread.last_break;
- -              } else {
- -                      unsigned long  __user *u = ubuf;
- -                      if (__put_user(target->thread.last_break, u))
- -                              return -EFAULT;
- -              }
- -      }
- -      return 0;
+ +      return membuf_store(&to, target->thread.last_break);
   }
   
   static int s390_last_break_set(struct task_struct *target,
@@@ -1066,13 -1091,16 +1065,13 @@@
   
   static int s390_tdb_get(struct task_struct *target,
                         const struct user_regset *regset,
- -                      unsigned int pos, unsigned int count,
- -                      void *kbuf, void __user *ubuf)
+ +                      struct membuf to)
   {
         struct pt_regs *regs = task_pt_regs(target);
- -      unsigned char *data;
   
         if (!(regs->int_code & 0x200))
                 return -ENODATA;
- -      data = target->thread.trap_tdb;
- -      return user_regset_copyout(&pos, &count, &kbuf, &ubuf, data, 0, 256);
+ +      return membuf_write(&to, target->thread.trap_tdb, 256);
   }
   
   static int s390_tdb_set(struct task_struct *target,
@@@ -1085,7 -1113,8 +1084,7 @@@
   
   static int s390_vxrs_low_get(struct task_struct *target,
                              const struct user_regset *regset,
- -                           unsigned int pos, unsigned int count,
- -                           void *kbuf, void __user *ubuf)
+ +                           struct membuf to)
   {
         __u64 vxrs[__NUM_VXRS_LOW];
         int i;
@@@ -1096,7 -1125,7 +1095,7 @@@
                 save_fpu_regs();
         for (i = 0; i < __NUM_VXRS_LOW; i++)
                 vxrs[i] = *((__u64 *)(target->thread.fpu.vxrs + i) + 1);
- -      return user_regset_copyout(&pos, &count, &kbuf, &ubuf, vxrs, 0, -1);
+ +      return membuf_write(&to, vxrs, sizeof(vxrs));
   }
   
   static int s390_vxrs_low_set(struct task_struct *target,
@@@ -1125,14 -1154,18 +1124,14 @@@
   
   static int s390_vxrs_high_get(struct task_struct *target,
                               const struct user_regset *regset,
- -                            unsigned int pos, unsigned int count,
- -                            void *kbuf, void __user *ubuf)
+ +                            struct membuf to)
   {
- -      __vector128 vxrs[__NUM_VXRS_HIGH];
- -
         if (!MACHINE_HAS_VX)
                 return -ENODEV;
         if (target == current)
                 save_fpu_regs();
- -      memcpy(vxrs, target->thread.fpu.vxrs + __NUM_VXRS_LOW, sizeof(vxrs));
- -
- -      return user_regset_copyout(&pos, &count, &kbuf, &ubuf, vxrs, 0, -1);
+ +      return membuf_write(&to, target->thread.fpu.vxrs + __NUM_VXRS_LOW,
+ +                          __NUM_VXRS_HIGH * sizeof(__vector128));
   }
   
   static int s390_vxrs_high_set(struct task_struct *target,
@@@ -1154,9 -1187,12 +1153,9 @@@
   
   static int s390_system_call_get(struct task_struct *target,
                                 const struct user_regset *regset,
- -                              unsigned int pos, unsigned int count,
- -                              void *kbuf, void __user *ubuf)
+ +                              struct membuf to)
   {
- -      unsigned int *data = &target->thread.system_call;
- -      return user_regset_copyout(&pos, &count, &kbuf, &ubuf,
- -                                 data, 0, sizeof(unsigned int));
+ +      return membuf_store(&to, target->thread.system_call);
   }
   
   static int s390_system_call_set(struct task_struct *target,
@@@ -1171,7 -1207,8 +1170,7 @@@
   
   static int s390_gs_cb_get(struct task_struct *target,
                           const struct user_regset *regset,
- -                        unsigned int pos, unsigned int count,
- -                        void *kbuf, void __user *ubuf)
+ +                        struct membuf to)
   {
         struct gs_cb *data = target->thread.gs_cb;
   
@@@ -1181,7 -1218,8 +1180,7 @@@
                 return -ENODATA;
         if (target == current)
                 save_gs_cb(data);
- -      return user_regset_copyout(&pos, &count, &kbuf, &ubuf,
- -                                 data, 0, sizeof(struct gs_cb));
+ +      return membuf_write(&to, data, sizeof(struct gs_cb));
   }
   
   static int s390_gs_cb_set(struct task_struct *target,
@@@ -1225,7 -1263,8 +1224,7 @@@
   
   static int s390_gs_bc_get(struct task_struct *target,
                           const struct user_regset *regset,
- -                        unsigned int pos, unsigned int count,
- -                        void *kbuf, void __user *ubuf)
+ +                        struct membuf to)
   {
         struct gs_cb *data = target->thread.gs_bc_cb;
   
@@@ -1233,7 -1272,8 +1232,7 @@@
                 return -ENODEV;
         if (!data)
                 return -ENODATA;
- -      return user_regset_copyout(&pos, &count, &kbuf, &ubuf,
- -                                 data, 0, sizeof(struct gs_cb));
+ +      return membuf_write(&to, data, sizeof(struct gs_cb));
   }
   
   static int s390_gs_bc_set(struct task_struct *target,
@@@ -1284,7 -1324,8 +1283,7 @@@ static bool is_ri_cb_valid(struct runti
   
   static int s390_runtime_instr_get(struct task_struct *target,
                                 const struct user_regset *regset,
- -                              unsigned int pos, unsigned int count,
- -                              void *kbuf, void __user *ubuf)
+ +                              struct membuf to)
   {
         struct runtime_instr_cb *data = target->thread.ri_cb;
   
@@@ -1293,7 -1334,8 +1292,7 @@@
         if (!data)
                 return -ENODATA;
   
- -      return user_regset_copyout(&pos, &count, &kbuf, &ubuf,
- -                                 data, 0, sizeof(struct runtime_instr_cb));
+ +      return membuf_write(&to, data, sizeof(struct runtime_instr_cb));
   }
   
   static int s390_runtime_instr_set(struct task_struct *target,
@@@ -1349,7 -1391,7 +1348,7 @@@ static const struct user_regset s390_re
                 .n = sizeof(s390_regs) / sizeof(long),
                 .size = sizeof(long),
                 .align = sizeof(long),
- -              .get = s390_regs_get,
+ +              .regset_get = s390_regs_get,
                 .set = s390_regs_set,
         },
         {
@@@ -1357,7 -1399,7 +1356,7 @@@
                 .n = sizeof(s390_fp_regs) / sizeof(long),
                 .size = sizeof(long),
                 .align = sizeof(long),
- -              .get = s390_fpregs_get,
+ +              .regset_get = s390_fpregs_get,
                 .set = s390_fpregs_set,
         },
         {
@@@ -1365,7 -1407,7 +1364,7 @@@
                 .n = 1,
                 .size = sizeof(unsigned int),
                 .align = sizeof(unsigned int),
- -              .get = s390_system_call_get,
+ +              .regset_get = s390_system_call_get,
                 .set = s390_system_call_set,
         },
         {
@@@ -1373,7 -1415,7 +1372,7 @@@
                 .n = 1,
                 .size = sizeof(long),
                 .align = sizeof(long),
- -              .get = s390_last_break_get,
+ +              .regset_get = s390_last_break_get,
                 .set = s390_last_break_set,
         },
         {
@@@ -1381,7 -1423,7 +1380,7 @@@
                 .n = 1,
                 .size = 256,
                 .align = 1,
- -              .get = s390_tdb_get,
+ +              .regset_get = s390_tdb_get,
                 .set = s390_tdb_set,
         },
         {
@@@ -1389,7 -1431,7 +1388,7 @@@
                 .n = __NUM_VXRS_LOW,
                 .size = sizeof(__u64),
                 .align = sizeof(__u64),
- -              .get = s390_vxrs_low_get,
+ +              .regset_get = s390_vxrs_low_get,
                 .set = s390_vxrs_low_set,
         },
         {
@@@ -1397,7 -1439,7 +1396,7 @@@
                 .n = __NUM_VXRS_HIGH,
                 .size = sizeof(__vector128),
                 .align = sizeof(__vector128),
- -              .get = s390_vxrs_high_get,
+ +              .regset_get = s390_vxrs_high_get,
                 .set = s390_vxrs_high_set,
         },
         {
@@@ -1405,7 -1447,7 +1404,7 @@@
                 .n = sizeof(struct gs_cb) / sizeof(__u64),
                 .size = sizeof(__u64),
                 .align = sizeof(__u64),
- -              .get = s390_gs_cb_get,
+ +              .regset_get = s390_gs_cb_get,
                 .set = s390_gs_cb_set,
         },
         {
@@@ -1413,7 -1455,7 +1412,7 @@@
                 .n = sizeof(struct gs_cb) / sizeof(__u64),
                 .size = sizeof(__u64),
                 .align = sizeof(__u64),
- -              .get = s390_gs_bc_get,
+ +              .regset_get = s390_gs_bc_get,
                 .set = s390_gs_bc_set,
         },
         {
@@@ -1421,7 -1463,7 +1420,7 @@@
                 .n = sizeof(struct runtime_instr_cb) / sizeof(__u64),
                 .size = sizeof(__u64),
                 .align = sizeof(__u64),
- -              .get = s390_runtime_instr_get,
+ +              .regset_get = s390_runtime_instr_get,
                 .set = s390_runtime_instr_set,
         },
   };
@@@ -1436,15 -1478,28 +1435,15 @@@ static const struct user_regset_view us
   #ifdef CONFIG_COMPAT
   static int s390_compat_regs_get(struct task_struct *target,
                                 const struct user_regset *regset,
- -                              unsigned int pos, unsigned int count,
- -                              void *kbuf, void __user *ubuf)
+ +                              struct membuf to)
   {
+ +      unsigned n;
+ +
         if (target == current)
                 save_access_regs(target->thread.acrs);
   
- -      if (kbuf) {
- -              compat_ulong_t *k = kbuf;
- -              while (count > 0) {
- -                      *k++ = __peek_user_compat(target, pos);
- -                      count -= sizeof(*k);
- -                      pos += sizeof(*k);
- -              }
- -      } else {
- -              compat_ulong_t __user *u = ubuf;
- -              while (count > 0) {
- -                      if (__put_user(__peek_user_compat(target, pos), u++))
- -                              return -EFAULT;
- -                      count -= sizeof(*u);
- -                      pos += sizeof(*u);
- -              }
- -      }
+ +      for (n = 0; n < sizeof(s390_compat_regs); n += sizeof(compat_ulong_t))
+ +              membuf_store(&to, __peek_user_compat(target, n));
         return 0;
   }
   
@@@ -1486,14 -1541,29 +1485,14 @@@ static int s390_compat_regs_set(struct 
   
   static int s390_compat_regs_high_get(struct task_struct *target,
                                      const struct user_regset *regset,
- -                                   unsigned int pos, unsigned int count,
- -                                   void *kbuf, void __user *ubuf)
+ +                                   struct membuf to)
   {
         compat_ulong_t *gprs_high;
+ +      int i;
   
- -      gprs_high = (compat_ulong_t *)
- -              &task_pt_regs(target)->gprs[pos / sizeof(compat_ulong_t)];
- -      if (kbuf) {
- -              compat_ulong_t *k = kbuf;
- -              while (count > 0) {
- -                      *k++ = *gprs_high;
- -                      gprs_high += 2;
- -                      count -= sizeof(*k);
- -              }
- -      } else {
- -              compat_ulong_t __user *u = ubuf;
- -              while (count > 0) {
- -                      if (__put_user(*gprs_high, u++))
- -                              return -EFAULT;
- -                      gprs_high += 2;
- -                      count -= sizeof(*u);
- -              }
- -      }
+ +      gprs_high = (compat_ulong_t *)task_pt_regs(target)->gprs;
+ +      for (i = 0; i < NUM_GPRS; i++, gprs_high += 2)
+ +              membuf_store(&to, *gprs_high);
         return 0;
   }
   
@@@ -1532,11 -1602,23 +1531,11 @@@ static int s390_compat_regs_high_set(st
   
   static int s390_compat_last_break_get(struct task_struct *target,
                                       const struct user_regset *regset,
- -                                    unsigned int pos, unsigned int count,
- -                                    void *kbuf, void __user *ubuf)
+ +                                    struct membuf to)
   {
- -      compat_ulong_t last_break;
+ +      compat_ulong_t last_break = target->thread.last_break;
   
- -      if (count > 0) {
- -              last_break = target->thread.last_break;
- -              if (kbuf) {
- -                      unsigned long *k = kbuf;
- -                      *k = last_break;
- -              } else {
- -                      unsigned long  __user *u = ubuf;
- -                      if (__put_user(last_break, u))
- -                              return -EFAULT;
- -              }
- -      }
- -      return 0;
+ +      return membuf_store(&to, (unsigned long)last_break);
   }
   
   static int s390_compat_last_break_set(struct task_struct *target,
@@@ -1553,7 -1635,7 +1552,7 @@@ static const struct user_regset s390_co
                 .n = sizeof(s390_compat_regs) / sizeof(compat_long_t),
                 .size = sizeof(compat_long_t),
                 .align = sizeof(compat_long_t),
- -              .get = s390_compat_regs_get,
+ +              .regset_get = s390_compat_regs_get,
                 .set = s390_compat_regs_set,
         },
         {
@@@ -1561,7 -1643,7 +1560,7 @@@
                 .n = sizeof(s390_fp_regs) / sizeof(compat_long_t),
                 .size = sizeof(compat_long_t),
                 .align = sizeof(compat_long_t),
- -              .get = s390_fpregs_get,
+ +              .regset_get = s390_fpregs_get,
                 .set = s390_fpregs_set,
         },
         {
@@@ -1569,7 -1651,7 +1568,7 @@@
                 .n = 1,
                 .size = sizeof(compat_uint_t),
                 .align = sizeof(compat_uint_t),
- -              .get = s390_system_call_get,
+ +              .regset_get = s390_system_call_get,
                 .set = s390_system_call_set,
         },
         {
@@@ -1577,7 -1659,7 +1576,7 @@@
                 .n = 1,
                 .size = sizeof(long),
                 .align = sizeof(long),
- -              .get = s390_compat_last_break_get,
+ +              .regset_get = s390_compat_last_break_get,
                 .set = s390_compat_last_break_set,
         },
         {
@@@ -1585,7 -1667,7 +1584,7 @@@
                 .n = 1,
                 .size = 256,
                 .align = 1,
- -              .get = s390_tdb_get,
+ +              .regset_get = s390_tdb_get,
                 .set = s390_tdb_set,
         },
         {
@@@ -1593,7 -1675,7 +1592,7 @@@
                 .n = __NUM_VXRS_LOW,
                 .size = sizeof(__u64),
                 .align = sizeof(__u64),
- -              .get = s390_vxrs_low_get,
+ +              .regset_get = s390_vxrs_low_get,
                 .set = s390_vxrs_low_set,
         },
         {
@@@ -1601,7 -1683,7 +1600,7 @@@
                 .n = __NUM_VXRS_HIGH,
                 .size = sizeof(__vector128),
                 .align = sizeof(__vector128),
- -              .get = s390_vxrs_high_get,
+ +              .regset_get = s390_vxrs_high_get,
                 .set = s390_vxrs_high_set,
         },
         {
@@@ -1609,7 -1691,7 +1608,7 @@@
                 .n = sizeof(s390_compat_regs_high) / sizeof(compat_long_t),
                 .size = sizeof(compat_long_t),
                 .align = sizeof(compat_long_t),
- -              .get = s390_compat_regs_high_get,
+ +              .regset_get = s390_compat_regs_high_get,
                 .set = s390_compat_regs_high_set,
         },
         {
@@@ -1617,7 -1699,7 +1616,7 @@@
                 .n = sizeof(struct gs_cb) / sizeof(__u64),
                 .size = sizeof(__u64),
                 .align = sizeof(__u64),
- -              .get = s390_gs_cb_get,
+ +              .regset_get = s390_gs_cb_get,
                 .set = s390_gs_cb_set,
         },
         {
@@@ -1625,7 -1707,7 +1624,7 @@@
                 .n = sizeof(struct gs_cb) / sizeof(__u64),
                 .size = sizeof(__u64),
                 .align = sizeof(__u64),
- -              .get = s390_gs_bc_get,
+ +              .regset_get = s390_gs_bc_get,
                 .set = s390_gs_bc_set,
         },
         {
@@@ -1633,7 -1715,7 +1632,7 @@@
                 .n = sizeof(struct runtime_instr_cb) / sizeof(__u64),
                 .size = sizeof(__u64),
                 .align = sizeof(__u64),
- -              .get = s390_runtime_instr_get,
+ +              .regset_get = s390_runtime_instr_get,
                 .set = s390_runtime_instr_set,
         },
   };
diff --combined arch/x86/mm/init_64.c

index 449e071,1c1209d..3b246ae
--- 1/arch/x86/mm/init_64.c
--- 2/arch/x86/mm/init_64.c
+++ b/arch/x86/mm/init_64.c
@@@ -817,7 -817,6 +817,6 @@@ void __init initmem_init(void
   
   void __init paging_init(void)
   {
-       sparse_memory_present_with_active_regions(MAX_NUMNODES);
         sparse_init();
   
         /*
@@@ -1253,23 -1252,28 +1252,23 @@@ static void __init preallocate_vmalloc_
                 p4d_t *p4d;
                 pud_t *pud;
   
- -              p4d = p4d_offset(pgd, addr);
- -              if (p4d_none(*p4d)) {
- -                      /* Can only happen with 5-level paging */
- -                      p4d = p4d_alloc(&init_mm, pgd, addr);
- -                      if (!p4d) {
- -                              lvl = "p4d";
- -                              goto failed;
- -                      }
- -              }
+ +              lvl = "p4d";
+ +              p4d = p4d_alloc(&init_mm, pgd, addr);
+ +              if (!p4d)
+ +                      goto failed;
   
+ +              /*
+ +               * With 5-level paging the P4D level is not folded. So the PGDs
+ +               * are now populated and there is no need to walk down to the
+ +               * PUD level.
+ +               */
                 if (pgtable_l5_enabled())
                         continue;
   
- -              pud = pud_offset(p4d, addr);
- -              if (pud_none(*pud)) {
- -                      /* Ends up here only with 4-level paging */
- -                      pud = pud_alloc(&init_mm, p4d, addr);
- -                      if (!pud) {
- -                              lvl = "pud";
- -                              goto failed;
- -                      }
- -              }
+ +              lvl = "pud";
+ +              pud = pud_alloc(&init_mm, p4d, addr);
+ +              if (!pud)
+ +                      goto failed;
         }
   
         return;
@@@ -1510,10 -1514,7 +1509,7 @@@ static int __meminit vmemmap_populate_h
                 if (pmd_none(*pmd)) {
                         void *p;
   
-                       if (altmap)
-                               p = altmap_alloc_block_buf(PMD_SIZE, altmap);
-                       else
-                               p = vmemmap_alloc_block_buf(PMD_SIZE, node);
+                       p = vmemmap_alloc_block_buf(PMD_SIZE, node, altmap);
                         if (p) {
                                 pte_t entry;
   
@@@ -1540,7 -1541,7 +1536,7 @@@
                         vmemmap_verify((pte_t *)pmd, node, addr, next);
                         continue;
                 }
-               if (vmemmap_populate_basepages(addr, next, node))
+               if (vmemmap_populate_basepages(addr, next, node, NULL))
                         return -ENOMEM;
         }
         return 0;
@@@ -1552,7 -1553,7 +1548,7 @@@ int __meminit vmemmap_populate(unsigne
         int err;
   
         if (end - start < PAGES_PER_SECTION * sizeof(struct page))
-               err = vmemmap_populate_basepages(start, end, node);
+               err = vmemmap_populate_basepages(start, end, node, NULL);
         else if (boot_cpu_has(X86_FEATURE_PSE))
                 err = vmemmap_populate_hugepages(start, end, node, altmap);
         else if (altmap) {
@@@ -1560,7 -1561,7 +1556,7 @@@
                                 __func__);
                 err = -ENOMEM;
         } else
-               err = vmemmap_populate_basepages(start, end, node);
+               err = vmemmap_populate_basepages(start, end, node, NULL);
         if (!err)
                 sync_global_pgds(start, end - 1);
         return err;
diff --combined drivers/xen/balloon.c

index b1d8b02,f5c838a..37ffccd
--- 1/drivers/xen/balloon.c
--- 2/drivers/xen/balloon.c
+++ b/drivers/xen/balloon.c
@@@ -58,7 -58,6 +58,6 @@@
   #include <linux/sysctl.h>
   
   #include <asm/page.h>
- #include <asm/pgalloc.h>
   #include <asm/tlb.h>
   
   #include <asm/xen/hypervisor.h>
@@@ -266,6 -265,20 +265,6 @@@ static struct resource *additional_memo
                 return NULL;
         }
   
- -#ifdef CONFIG_SPARSEMEM
- -      {
- -              unsigned long limit = 1UL << (MAX_PHYSMEM_BITS - PAGE_SHIFT);
- -              unsigned long pfn = res->start >> PAGE_SHIFT;
- -
- -              if (pfn > limit) {
- -                      pr_err("New System RAM resource outside addressable RAM (%lu > %lu)\n",
- -                             pfn, limit);
- -                      release_memory_resource(res);
- -                      return NULL;
- -              }
- -      }
- -#endif
- -
         return res;
   }
   
@@@ -554,13 -567,11 +553,13 @@@ static int add_ballooned_pages(int nr_p
         if (xen_hotplug_unpopulated) {
                 st = reserve_additional_memory();
                 if (st != BP_ECANCELED) {
+ +                      int rc;
+ +
                         mutex_unlock(&balloon_mutex);
- -                      wait_event(balloon_wq,
+ +                      rc = wait_event_interruptible(balloon_wq,
                                    !list_empty(&ballooned_pages));
                         mutex_lock(&balloon_mutex);
- -                      return 0;
+ +                      return rc ? -ENOMEM : 0;
                 }
         }
   
@@@ -618,12 -629,6 +617,12 @@@ int alloc_xenballooned_pages(int nr_pag
    out_undo:
         mutex_unlock(&balloon_mutex);
         free_xenballooned_pages(pgno, pages);
+ +      /*
+ +       * NB: free_xenballooned_pages will only subtract pgno pages, but since
+ +       * target_unpopulated is incremented with nr_pages at the start we need
+ +       * to remove the remaining ones also, or accounting will be screwed.
+ +       */
+ +      balloon_stats.target_unpopulated -= nr_pages - pgno;
         return ret;
   }
   EXPORT_SYMBOL(alloc_xenballooned_pages);
diff --combined drivers/xen/privcmd.c

index 095d683,5dfc59f..63abe6c
--- 1/drivers/xen/privcmd.c
--- 2/drivers/xen/privcmd.c
+++ b/drivers/xen/privcmd.c
@@@ -25,7 -25,6 +25,6 @@@
   #include <linux/miscdevice.h>
   #include <linux/moduleparam.h>
   
- #include <asm/pgalloc.h>
   #include <asm/xen/hypervisor.h>
   #include <asm/xen/hypercall.h>
   
@@@ -580,13 -579,13 +579,13 @@@ out_unlock
   
   static int lock_pages(
         struct privcmd_dm_op_buf kbufs[], unsigned int num,
- -      struct page *pages[], unsigned int nr_pages)
+ +      struct page *pages[], unsigned int nr_pages, unsigned int *pinned)
   {
         unsigned int i;
   
         for (i = 0; i < num; i++) {
                 unsigned int requested;
- -              int pinned;
+ +              int page_count;
   
                 requested = DIV_ROUND_UP(
                         offset_in_page(kbufs[i].uptr) + kbufs[i].size,
@@@ -594,15 -593,14 +593,15 @@@
                 if (requested > nr_pages)
                         return -ENOSPC;
   
- -              pinned = get_user_pages_fast(
+ +              page_count = pin_user_pages_fast(
                         (unsigned long) kbufs[i].uptr,
                         requested, FOLL_WRITE, pages);
- -              if (pinned < 0)
- -                      return pinned;
+ +              if (page_count < 0)
+ +                      return page_count;
   
- -              nr_pages -= pinned;
- -              pages += pinned;
+ +              *pinned += page_count;
+ +              nr_pages -= page_count;
+ +              pages += page_count;
         }
   
         return 0;
@@@ -610,7 -608,15 +609,7 @@@
   
   static void unlock_pages(struct page *pages[], unsigned int nr_pages)
   {
- -      unsigned int i;
- -
- -      if (!pages)
- -              return;
- -
- -      for (i = 0; i < nr_pages; i++) {
- -              if (pages[i])
- -                      put_page(pages[i]);
- -      }
+ +      unpin_user_pages_dirty_lock(pages, nr_pages, true);
   }
   
   static long privcmd_ioctl_dm_op(struct file *file, void __user *udata)
@@@ -623,7 -629,6 +622,7 @@@
         struct xen_dm_op_buf *xbufs = NULL;
         unsigned int i;
         long rc;
+ +      unsigned int pinned = 0;
   
         if (copy_from_user(&kdata, udata, sizeof(kdata)))
                 return -EFAULT;
@@@ -677,11 -682,9 +676,11 @@@
                 goto out;
         }
   
- -      rc = lock_pages(kbufs, kdata.num, pages, nr_pages);
- -      if (rc)
+ +      rc = lock_pages(kbufs, kdata.num, pages, nr_pages, &pinned);
+ +      if (rc < 0) {
+ +              nr_pages = pinned;
                 goto out;
+ +      }
   
         for (i = 0; i < kdata.num; i++) {
                 set_xen_guest_handle(xbufs[i].h, kbufs[i].uptr);
diff --combined fs/cifs/connect.c

index 7e3e5e2,889fee5..0ad1309
--- 1/fs/cifs/connect.c
--- 2/fs/cifs/connect.c
+++ b/fs/cifs/connect.c
@@@ -393,14 -393,15 +393,14 @@@ static inline int reconn_set_ipaddr(str
   
   #ifdef CONFIG_CIFS_DFS_UPCALL
   /* These functions must be called with server->srv_mutex held */
- -static void reconn_inval_dfs_target(struct TCP_Server_Info *server,
- -                                  struct cifs_sb_info *cifs_sb,
- -                                  struct dfs_cache_tgt_list *tgt_list,
- -                                  struct dfs_cache_tgt_iterator **tgt_it)
+ +static void reconn_set_next_dfs_target(struct TCP_Server_Info *server,
+ +                                     struct cifs_sb_info *cifs_sb,
+ +                                     struct dfs_cache_tgt_list *tgt_list,
+ +                                     struct dfs_cache_tgt_iterator **tgt_it)
   {
         const char *name;
   
- -      if (!cifs_sb || !cifs_sb->origin_fullpath || !tgt_list ||
- -          !server->nr_targets)
+ +      if (!cifs_sb || !cifs_sb->origin_fullpath)
                 return;
   
         if (!*tgt_it) {
@@@ -470,13 -471,11 +470,13 @@@ cifs_reconnect(struct TCP_Server_Info *
                 sb = NULL;
         } else {
                 cifs_sb = CIFS_SB(sb);
- -
                 rc = reconn_setup_dfs_targets(cifs_sb, &tgt_list);
- -              if (rc && (rc != -EOPNOTSUPP)) {
- -                      cifs_server_dbg(VFS, "%s: no target servers for DFS failover\n",
- -                               __func__);
+ +              if (rc) {
+ +                      cifs_sb = NULL;
+ +                      if (rc != -EOPNOTSUPP) {
+ +                              cifs_server_dbg(VFS, "%s: no target servers for DFS failover\n",
+ +                                              __func__);
+ +                      }
                 } else {
                         server->nr_targets = dfs_cache_get_nr_tgts(&tgt_list);
                 }
@@@ -579,7 -578,7 +579,7 @@@
                  * feature is disabled, then we will retry last server we
                  * connected to before.
                  */
- -              reconn_inval_dfs_target(server, cifs_sb, &tgt_list, &tgt_it);
+ +              reconn_set_next_dfs_target(server, cifs_sb, &tgt_list, &tgt_it);
   #endif
                 rc = reconn_set_ipaddr(server);
                 if (rc) {
@@@ -2183,7 -2182,7 +2183,7 @@@ cifs_parse_mount_options(const char *mo
                         tmp_end++;
                         if (!(tmp_end < end && tmp_end[1] == delim)) {
                                 /* No it is not. Set the password to NULL */
-                               kzfree(vol->password);
+                               kfree_sensitive(vol->password);
                                 vol->password = NULL;
                                 break;
                         }
@@@ -2221,7 -2220,7 +2221,7 @@@
                                         options = end;
                         }
   
-                       kzfree(vol->password);
+                       kfree_sensitive(vol->password);
                         /* Now build new password string */
                         temp_len = strlen(value);
                         vol->password = kzalloc(temp_len+1, GFP_KERNEL);
@@@ -3199,7 -3198,7 +3199,7 @@@ cifs_set_cifscreds(struct smb_vol *vol
                         rc = -ENOMEM;
                         kfree(vol->username);
                         vol->username = NULL;
-                       kzfree(vol->password);
+                       kfree_sensitive(vol->password);
                         vol->password = NULL;
                         goto out_key_put;
                 }
@@@ -4220,7 -4219,7 +4220,7 @@@ voi
   cifs_cleanup_volume_info_contents(struct smb_vol *volume_info)
   {
         kfree(volume_info->username);
-       kzfree(volume_info->password);
+       kfree_sensitive(volume_info->password);
         kfree(volume_info->UNC);
         kfree(volume_info->domainname);
         kfree(volume_info->iocharset);
@@@ -4423,11 -4422,11 +4423,11 @@@ build_unc_path_to_root(const struct smb
   static int
   expand_dfs_referral(const unsigned int xid, struct cifs_ses *ses,
                     struct smb_vol *volume_info, struct cifs_sb_info *cifs_sb,
- -                  int check_prefix)
+ +                  char *ref_path)
   {
         int rc;
         struct dfs_info3_param referral = {0};
- -      char *full_path = NULL, *ref_path = NULL, *mdata = NULL;
+ +      char *full_path = NULL, *mdata = NULL;
   
         if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NO_DFS)
                 return -EREMOTE;
@@@ -4436,6 -4435,9 +4436,6 @@@
         if (IS_ERR(full_path))
                 return PTR_ERR(full_path);
   
- -      /* For DFS paths, skip the first '\' of the UNC */
- -      ref_path = check_prefix ? full_path + 1 : volume_info->UNC + 1;
- -
         rc = dfs_cache_find(xid, ses, cifs_sb->local_nls, cifs_remap(cifs_sb),
                             ref_path, &referral, NULL);
         if (!rc) {
@@@ -4498,10 -4500,13 +4498,10 @@@ static int update_vol_info(const struc
         return 0;
   }
   
- -static int setup_dfs_tgt_conn(const char *path,
+ +static int setup_dfs_tgt_conn(const char *path, const char *full_path,
                               const struct dfs_cache_tgt_iterator *tgt_it,
- -                            struct cifs_sb_info *cifs_sb,
- -                            struct smb_vol *vol,
- -                            unsigned int *xid,
- -                            struct TCP_Server_Info **server,
- -                            struct cifs_ses **ses,
+ +                            struct cifs_sb_info *cifs_sb, struct smb_vol *vol, unsigned int *xid,
+ +                            struct TCP_Server_Info **server, struct cifs_ses **ses,
                               struct cifs_tcon **tcon)
   {
         int rc;
@@@ -4515,7 -4520,8 +4515,7 @@@
         if (rc)
                 return rc;
   
- -      mdata = cifs_compose_mount_options(cifs_sb->mountdata, path, &ref,
- -                                         &fake_devname);
+ +      mdata = cifs_compose_mount_options(cifs_sb->mountdata, full_path + 1, &ref, &fake_devname);
         free_dfs_info_param(&ref);
   
         if (IS_ERR(mdata)) {
@@@ -4538,7 -4544,7 +4538,7 @@@
                 mount_put_conns(cifs_sb, *xid, *server, *ses, *tcon);
                 rc = mount_get_conns(&fake_vol, cifs_sb, xid, server, ses,
                                      tcon);
- -              if (!rc) {
+ +              if (!rc || (*server && *ses)) {
                         /*
                          * We were able to connect to new target server.
                          * Update current volume info with new target server.
@@@ -4550,10 -4556,14 +4550,10 @@@
         return rc;
   }
   
- -static int mount_do_dfs_failover(const char *path,
- -                               struct cifs_sb_info *cifs_sb,
- -                               struct smb_vol *vol,
- -                               struct cifs_ses *root_ses,
- -                               unsigned int *xid,
- -                               struct TCP_Server_Info **server,
- -                               struct cifs_ses **ses,
- -                               struct cifs_tcon **tcon)
+ +static int do_dfs_failover(const char *path, const char *full_path, struct cifs_sb_info *cifs_sb,
+ +                         struct smb_vol *vol, struct cifs_ses *root_ses, unsigned int *xid,
+ +                         struct TCP_Server_Info **server, struct cifs_ses **ses,
+ +                         struct cifs_tcon **tcon)
   {
         int rc;
         struct dfs_cache_tgt_list tgt_list;
@@@ -4572,9 -4582,9 +4572,9 @@@
                 if (rc)
                         break;
                 /* Connect to next DFS target */
- -              rc = setup_dfs_tgt_conn(path, tgt_it, cifs_sb, vol, xid, server,
- -                                      ses, tcon);
- -              if (!rc || rc == -EACCES || rc == -EOPNOTSUPP)
+ +              rc = setup_dfs_tgt_conn(path, full_path, tgt_it, cifs_sb, vol, xid, server, ses,
+ +                                      tcon);
+ +              if (!rc || (*server && *ses))
                         break;
         }
         if (!rc) {
@@@ -4744,210 -4754,207 +4744,210 @@@ static int is_path_remote(struct cifs_s
   }
   
   #ifdef CONFIG_CIFS_DFS_UPCALL
- -static inline void set_root_tcon(struct cifs_sb_info *cifs_sb,
- -                               struct cifs_tcon *tcon,
- -                               struct cifs_tcon **root)
+ +static void set_root_ses(struct cifs_sb_info *cifs_sb, struct cifs_ses *ses,
+ +                       struct cifs_ses **root_ses)
   {
- -      spin_lock(&cifs_tcp_ses_lock);
- -      tcon->tc_count++;
- -      tcon->remap = cifs_remap(cifs_sb);
- -      spin_unlock(&cifs_tcp_ses_lock);
- -      *root = tcon;
+ +      if (ses) {
+ +              spin_lock(&cifs_tcp_ses_lock);
+ +              ses->ses_count++;
+ +              ses->tcon_ipc->remap = cifs_remap(cifs_sb);
+ +              spin_unlock(&cifs_tcp_ses_lock);
+ +      }
+ +      *root_ses = ses;
+ +}
+ +
+ +static void put_root_ses(struct cifs_ses *ses)
+ +{
+ +      if (ses)
+ +              cifs_put_smb_ses(ses);
+ +}
+ +
+ +/* Check if a path component is remote and then update @dfs_path accordingly */
+ +static int check_dfs_prepath(struct cifs_sb_info *cifs_sb, struct smb_vol *vol,
+ +                           const unsigned int xid, struct TCP_Server_Info *server,
+ +                           struct cifs_tcon *tcon, char **dfs_path)
+ +{
+ +      char *path, *s;
+ +      char sep = CIFS_DIR_SEP(cifs_sb), tmp;
+ +      char *npath;
+ +      int rc = 0;
+ +      int added_treename = tcon->Flags & SMB_SHARE_IS_IN_DFS;
+ +      int skip = added_treename;
+ +
+ +      path = cifs_build_path_to_root(vol, cifs_sb, tcon, added_treename);
+ +      if (!path)
+ +              return -ENOMEM;
+ +
+ +      /*
+ +       * Walk through the path components in @path and check if they're accessible. In case any of
+ +       * the components is -EREMOTE, then update @dfs_path with the next DFS referral request path
+ +       * (NOT including the remaining components).
+ +       */
+ +      s = path;
+ +      do {
+ +              /* skip separators */
+ +              while (*s && *s == sep)
+ +                      s++;
+ +              if (!*s)
+ +                      break;
+ +              /* next separator */
+ +              while (*s && *s != sep)
+ +                      s++;
+ +              /*
+ +               * if the treename is added, we then have to skip the first
+ +               * part within the separators
+ +               */
+ +              if (skip) {
+ +                      skip = 0;
+ +                      continue;
+ +              }
+ +              tmp = *s;
+ +              *s = 0;
+ +              rc = server->ops->is_path_accessible(xid, tcon, cifs_sb, path);
+ +              if (rc && rc == -EREMOTE) {
+ +                      struct smb_vol v = {NULL};
+ +                      /* if @path contains a tree name, skip it in the prefix path */
+ +                      if (added_treename) {
+ +                              rc = cifs_parse_devname(path, &v);
+ +                              if (rc)
+ +                                      break;
+ +                              rc = -EREMOTE;
+ +                              npath = build_unc_path_to_root(&v, cifs_sb, true);
+ +                              cifs_cleanup_volume_info_contents(&v);
+ +                      } else {
+ +                              v.UNC = vol->UNC;
+ +                              v.prepath = path + 1;
+ +                              npath = build_unc_path_to_root(&v, cifs_sb, true);
+ +                      }
+ +                      if (IS_ERR(npath)) {
+ +                              rc = PTR_ERR(npath);
+ +                              break;
+ +                      }
+ +                      kfree(*dfs_path);
+ +                      *dfs_path = npath;
+ +              }
+ +              *s = tmp;
+ +      } while (rc == 0);
+ +
+ +      kfree(path);
+ +      return rc;
   }
   
   int cifs_mount(struct cifs_sb_info *cifs_sb, struct smb_vol *vol)
   {
         int rc = 0;
         unsigned int xid;
- -      struct cifs_ses *ses;
- -      struct cifs_tcon *root_tcon = NULL;
+ +      struct TCP_Server_Info *server = NULL;
+ +      struct cifs_ses *ses = NULL, *root_ses = NULL;
         struct cifs_tcon *tcon = NULL;
- -      struct TCP_Server_Info *server;
- -      char *root_path = NULL, *full_path = NULL;
- -      char *old_mountdata, *origin_mountdata = NULL;
- -      int count;
+ +      int count = 0;
+ +      char *ref_path = NULL, *full_path = NULL;
+ +      char *oldmnt = NULL;
+ +      char *mntdata = NULL;
   
         rc = mount_get_conns(vol, cifs_sb, &xid, &server, &ses, &tcon);
- -      if (!rc && tcon) {
- -              /* If not a standalone DFS root, then check if path is remote */
- -              rc = dfs_cache_find(xid, ses, cifs_sb->local_nls,
- -                                  cifs_remap(cifs_sb), vol->UNC + 1, NULL,
- -                                  NULL);
- -              if (rc) {
- -                      rc = is_path_remote(cifs_sb, vol, xid, server, tcon);
- -                      if (!rc)
- -                              goto out;
- -                      if (rc != -EREMOTE)
- -                              goto error;
- -              }
- -      }
         /*
- -       * If first DFS target server went offline and we failed to connect it,
- -       * server and ses pointers are NULL at this point, though we still have
- -       * chance to get a cached DFS referral in expand_dfs_referral() and
- -       * retry next target available in it.
+ +       * Unconditionally try to get an DFS referral (even cached) to determine whether it is an
+ +       * DFS mount.
          *
- -       * If a NULL ses ptr is passed to dfs_cache_find(), a lookup will be
- -       * performed against DFS path and *no* requests will be sent to server
- -       * for any new DFS referrals. Hence it's safe to skip checking whether
- -       * server or ses ptr is NULL.
+ +       * Skip prefix path to provide support for DFS referrals from w2k8 servers which don't seem
+ +       * to respond with PATH_NOT_COVERED to requests that include the prefix.
          */
- -      if (rc == -EACCES || rc == -EOPNOTSUPP)
- -              goto error;
- -
- -      root_path = build_unc_path_to_root(vol, cifs_sb, false);
- -      if (IS_ERR(root_path)) {
- -              rc = PTR_ERR(root_path);
- -              root_path = NULL;
- -              goto error;
- -      }
- -
- -      full_path = build_unc_path_to_root(vol, cifs_sb, true);
- -      if (IS_ERR(full_path)) {
- -              rc = PTR_ERR(full_path);
- -              full_path = NULL;
- -              goto error;
- -      }
- -      /*
- -       * Perform an unconditional check for whether there are DFS
- -       * referrals for this path without prefix, to provide support
- -       * for DFS referrals from w2k8 servers which don't seem to respond
- -       * with PATH_NOT_COVERED to requests that include the prefix.
- -       * Chase the referral if found, otherwise continue normally.
- -       */
- -      old_mountdata = cifs_sb->mountdata;
- -      (void)expand_dfs_referral(xid, ses, vol, cifs_sb, false);
- -
- -      if (cifs_sb->mountdata == NULL) {
- -              rc = -ENOENT;
- -              goto error;
+ +      if (dfs_cache_find(xid, ses, cifs_sb->local_nls, cifs_remap(cifs_sb), vol->UNC + 1, NULL,
+ +                         NULL)) {
+ +              /* No DFS referral was returned.  Looks like a regular share. */
+ +              if (rc)
+ +                      goto error;
+ +              /* Check if it is fully accessible and then mount it */
+ +              rc = is_path_remote(cifs_sb, vol, xid, server, tcon);
+ +              if (!rc)
+ +                      goto out;
+ +              if (rc != -EREMOTE)
+ +                      goto error;
         }
- -
- -      /* Save DFS root volume information for DFS refresh worker */
- -      origin_mountdata = kstrndup(cifs_sb->mountdata,
- -                                  strlen(cifs_sb->mountdata), GFP_KERNEL);
- -      if (!origin_mountdata) {
+ +      /* Save mount options */
+ +      mntdata = kstrndup(cifs_sb->mountdata, strlen(cifs_sb->mountdata), GFP_KERNEL);
+ +      if (!mntdata) {
                 rc = -ENOMEM;
                 goto error;
         }
- -
- -      if (cifs_sb->mountdata != old_mountdata) {
- -              /* If we were redirected, reconnect to new target server */
- -              mount_put_conns(cifs_sb, xid, server, ses, tcon);
- -              rc = mount_get_conns(vol, cifs_sb, &xid, &server, &ses, &tcon);
- -      }
- -      if (rc) {
- -              if (rc == -EACCES || rc == -EOPNOTSUPP)
- -                      goto error;
- -              /* Perform DFS failover to any other DFS targets */
- -              rc = mount_do_dfs_failover(root_path + 1, cifs_sb, vol, NULL,
- -                                         &xid, &server, &ses, &tcon);
- -              if (rc)
- -                      goto error;
- -      }
- -
- -      kfree(root_path);
- -      root_path = build_unc_path_to_root(vol, cifs_sb, false);
- -      if (IS_ERR(root_path)) {
- -              rc = PTR_ERR(root_path);
- -              root_path = NULL;
+ +      /* Get path of DFS root */
+ +      ref_path = build_unc_path_to_root(vol, cifs_sb, false);
+ +      if (IS_ERR(ref_path)) {
+ +              rc = PTR_ERR(ref_path);
+ +              ref_path = NULL;
                 goto error;
         }
- -      /* Cache out resolved root server */
- -      (void)dfs_cache_find(xid, ses, cifs_sb->local_nls, cifs_remap(cifs_sb),
- -                           root_path + 1, NULL, NULL);
- -      kfree(root_path);
- -      root_path = NULL;
- -
- -      set_root_tcon(cifs_sb, tcon, &root_tcon);
- -
- -      for (count = 1; ;) {
- -              if (!rc && tcon) {
- -                      rc = is_path_remote(cifs_sb, vol, xid, server, tcon);
- -                      if (!rc || rc != -EREMOTE)
- -                              break;
- -              }
- -              /*
- -               * BB: when we implement proper loop detection,
- -               *     we will remove this check. But now we need it
- -               *     to prevent an indefinite loop if 'DFS tree' is
- -               *     misconfigured (i.e. has loops).
- -               */
- -              if (count++ > MAX_NESTED_LINKS) {
- -                      rc = -ELOOP;
- -                      break;
- -              }
   
+ +      set_root_ses(cifs_sb, ses, &root_ses);
+ +      do {
+ +              /* Save full path of last DFS path we used to resolve final target server */
                 kfree(full_path);
- -              full_path = build_unc_path_to_root(vol, cifs_sb, true);
+ +              full_path = build_unc_path_to_root(vol, cifs_sb, !!count);
                 if (IS_ERR(full_path)) {
                         rc = PTR_ERR(full_path);
- -                      full_path = NULL;
                         break;
                 }
- -
- -              old_mountdata = cifs_sb->mountdata;
- -              rc = expand_dfs_referral(xid, root_tcon->ses, vol, cifs_sb,
- -                                       true);
+ +              /* Chase referral */
+ +              oldmnt = cifs_sb->mountdata;
+ +              rc = expand_dfs_referral(xid, root_ses, vol, cifs_sb, ref_path + 1);
                 if (rc)
                         break;
- -
- -              if (cifs_sb->mountdata != old_mountdata) {
+ +              /* Connect to new DFS target only if we were redirected */
+ +              if (oldmnt != cifs_sb->mountdata) {
                         mount_put_conns(cifs_sb, xid, server, ses, tcon);
- -                      rc = mount_get_conns(vol, cifs_sb, &xid, &server, &ses,
- -                                           &tcon);
- -                      /*
- -                       * Ensure that DFS referrals go through new root server.
- -                       */
- -                      if (!rc && tcon &&
- -                          (tcon->share_flags & (SHI1005_FLAGS_DFS |
- -                                                SHI1005_FLAGS_DFS_ROOT))) {
- -                              cifs_put_tcon(root_tcon);
- -                              set_root_tcon(cifs_sb, tcon, &root_tcon);
- -                      }
+ +                      rc = mount_get_conns(vol, cifs_sb, &xid, &server, &ses, &tcon);
                 }
- -              if (rc) {
- -                      if (rc == -EACCES || rc == -EOPNOTSUPP)
- -                              break;
- -                      /* Perform DFS failover to any other DFS targets */
- -                      rc = mount_do_dfs_failover(full_path + 1, cifs_sb, vol,
- -                                                 root_tcon->ses, &xid,
- -                                                 &server, &ses, &tcon);
- -                      if (rc == -EACCES || rc == -EOPNOTSUPP || !server ||
- -                          !ses)
- -                              goto error;
+ +              if (rc && !server && !ses) {
+ +                      /* Failed to connect. Try to connect to other targets in the referral. */
+ +                      rc = do_dfs_failover(ref_path + 1, full_path, cifs_sb, vol, root_ses, &xid,
+ +                                           &server, &ses, &tcon);
                 }
- -      }
- -      cifs_put_tcon(root_tcon);
+ +              if (rc == -EACCES || rc == -EOPNOTSUPP || !server || !ses)
+ +                      break;
+ +              if (!tcon)
+ +                      continue;
+ +              /* Make sure that requests go through new root servers */
+ +              if (tcon->share_flags & (SHI1005_FLAGS_DFS | SHI1005_FLAGS_DFS_ROOT)) {
+ +                      put_root_ses(root_ses);
+ +                      set_root_ses(cifs_sb, ses, &root_ses);
+ +              }
+ +              /* Check for remaining path components and then continue chasing them (-EREMOTE) */
+ +              rc = check_dfs_prepath(cifs_sb, vol, xid, server, tcon, &ref_path);
+ +              /* Prevent recursion on broken link referrals */
+ +              if (rc == -EREMOTE && ++count > MAX_NESTED_LINKS)
+ +                      rc = -ELOOP;
+ +      } while (rc == -EREMOTE);
   
         if (rc)
                 goto error;
- -
- -      spin_lock(&cifs_tcp_ses_lock);
- -      if (!tcon->dfs_path) {
- -              /* Save full path in new tcon to do failover when reconnecting tcons */
- -              tcon->dfs_path = full_path;
- -              full_path = NULL;
- -              tcon->remap = cifs_remap(cifs_sb);
- -      }
- -      cifs_sb->origin_fullpath = kstrndup(tcon->dfs_path,
- -                                          strlen(tcon->dfs_path),
- -                                          GFP_ATOMIC);
+ +      put_root_ses(root_ses);
+ +      root_ses = NULL;
+ +      kfree(ref_path);
+ +      ref_path = NULL;
+ +      /*
+ +       * Store DFS full path in both superblock and tree connect structures.
+ +       *
+ +       * For DFS root mounts, the prefix path (cifs_sb->prepath) is preserved during reconnect so
+ +       * only the root path is set in cifs_sb->origin_fullpath and tcon->dfs_path. And for DFS
+ +       * links, the prefix path is included in both and may be changed during reconnect.  See
+ +       * cifs_tree_connect().
+ +       */
+ +      cifs_sb->origin_fullpath = kstrndup(full_path, strlen(full_path), GFP_KERNEL);
         if (!cifs_sb->origin_fullpath) {
- -              spin_unlock(&cifs_tcp_ses_lock);
                 rc = -ENOMEM;
                 goto error;
         }
+ +      spin_lock(&cifs_tcp_ses_lock);
+ +      tcon->dfs_path = full_path;
+ +      full_path = NULL;
+ +      tcon->remap = cifs_remap(cifs_sb);
         spin_unlock(&cifs_tcp_ses_lock);
   
- -      rc = dfs_cache_add_vol(origin_mountdata, vol, cifs_sb->origin_fullpath);
- -      if (rc) {
- -              kfree(cifs_sb->origin_fullpath);
+ +      /* Add original volume information for DFS cache to be used when refreshing referrals */
+ +      rc = dfs_cache_add_vol(mntdata, vol, cifs_sb->origin_fullpath);
+ +      if (rc)
                 goto error;
- -      }
         /*
          * After reconnecting to a different server, unique ids won't
          * match anymore, so we disable serverino. This prevents
@@@ -4969,11 -4976,9 +4969,11 @@@ out
         return mount_setup_tlink(cifs_sb, ses, tcon);
   
   error:
+ +      kfree(ref_path);
         kfree(full_path);
- -      kfree(root_path);
- -      kfree(origin_mountdata);
+ +      kfree(mntdata);
+ +      kfree(cifs_sb->origin_fullpath);
+ +      put_root_ses(root_ses);
         mount_put_conns(cifs_sb, xid, server, ses, tcon);
         return rc;
   }
@@@ -5109,7 -5114,8 +5109,7 @@@ CIFSTCon(const unsigned int xid, struc
         bcc_ptr += strlen("?????");
         bcc_ptr += 1;
         count = bcc_ptr - &pSMB->Password[0];
- -      pSMB->hdr.smb_buf_length = cpu_to_be32(be32_to_cpu(
- -                                      pSMB->hdr.smb_buf_length) + count);
+ +      be32_add_cpu(&pSMB->hdr.smb_buf_length, count);
         pSMB->ByteCount = cpu_to_le16(count);
   
         rc = SendReceive(xid, ses, smb_buffer, smb_buffer_response, &length,
@@@ -5339,7 -5345,7 +5339,7 @@@ cifs_construct_tcon(struct cifs_sb_inf
   
   out:
         kfree(vol_info->username);
-       kzfree(vol_info->password);
+       kfree_sensitive(vol_info->password);
         kfree(vol_info);
   
         return tcon;
@@@ -5527,115 -5533,3 +5527,115 @@@ cifs_prune_tlinks(struct work_struct *w
         queue_delayed_work(cifsiod_wq, &cifs_sb->prune_tlinks,
                                 TLINK_IDLE_EXPIRE);
   }
+ +
+ +#ifdef CONFIG_CIFS_DFS_UPCALL
+ +int cifs_tree_connect(const unsigned int xid, struct cifs_tcon *tcon, const struct nls_table *nlsc)
+ +{
+ +      int rc;
+ +      struct TCP_Server_Info *server = tcon->ses->server;
+ +      const struct smb_version_operations *ops = server->ops;
+ +      struct dfs_cache_tgt_list tl;
+ +      struct dfs_cache_tgt_iterator *it = NULL;
+ +      char *tree;
+ +      const char *tcp_host;
+ +      size_t tcp_host_len;
+ +      const char *dfs_host;
+ +      size_t dfs_host_len;
+ +      char *share = NULL, *prefix = NULL;
+ +      struct dfs_info3_param ref = {0};
+ +      bool isroot;
+ +
+ +      tree = kzalloc(MAX_TREE_SIZE, GFP_KERNEL);
+ +      if (!tree)
+ +              return -ENOMEM;
+ +
+ +      if (!tcon->dfs_path) {
+ +              if (tcon->ipc) {
+ +                      scnprintf(tree, MAX_TREE_SIZE, "\\\\%s\\IPC$", server->hostname);
+ +                      rc = ops->tree_connect(xid, tcon->ses, tree, tcon, nlsc);
+ +              } else {
+ +                      rc = ops->tree_connect(xid, tcon->ses, tcon->treeName, tcon, nlsc);
+ +              }
+ +              goto out;
+ +      }
+ +
+ +      rc = dfs_cache_noreq_find(tcon->dfs_path + 1, &ref, &tl);
+ +      if (rc)
+ +              goto out;
+ +      isroot = ref.server_type == DFS_TYPE_ROOT;
+ +      free_dfs_info_param(&ref);
+ +
+ +      extract_unc_hostname(server->hostname, &tcp_host, &tcp_host_len);
+ +
+ +      for (it = dfs_cache_get_tgt_iterator(&tl); it; it = dfs_cache_get_next_tgt(&tl, it)) {
+ +              bool target_match;
+ +
+ +              kfree(share);
+ +              kfree(prefix);
+ +              share = NULL;
+ +              prefix = NULL;
+ +
+ +              rc = dfs_cache_get_tgt_share(tcon->dfs_path + 1, it, &share, &prefix);
+ +              if (rc) {
+ +                      cifs_dbg(VFS, "%s: failed to parse target share %d\n",
+ +                               __func__, rc);
+ +                      continue;
+ +              }
+ +
+ +              extract_unc_hostname(share, &dfs_host, &dfs_host_len);
+ +
+ +              if (dfs_host_len != tcp_host_len
+ +                  || strncasecmp(dfs_host, tcp_host, dfs_host_len) != 0) {
+ +                      cifs_dbg(FYI, "%s: %.*s doesn't match %.*s\n", __func__, (int)dfs_host_len,
+ +                               dfs_host, (int)tcp_host_len, tcp_host);
+ +
+ +                      rc = match_target_ip(server, dfs_host, dfs_host_len, &target_match);
+ +                      if (rc) {
+ +                              cifs_dbg(VFS, "%s: failed to match target ip: %d\n", __func__, rc);
+ +                              break;
+ +                      }
+ +
+ +                      if (!target_match) {
+ +                              cifs_dbg(FYI, "%s: skipping target\n", __func__);
+ +                              continue;
+ +                      }
+ +              }
+ +
+ +              if (tcon->ipc) {
+ +                      scnprintf(tree, MAX_TREE_SIZE, "\\\\%s\\IPC$", share);
+ +                      rc = ops->tree_connect(xid, tcon->ses, tree, tcon, nlsc);
+ +              } else {
+ +                      scnprintf(tree, MAX_TREE_SIZE, "\\%s", share);
+ +                      rc = ops->tree_connect(xid, tcon->ses, tree, tcon, nlsc);
+ +                      /* Only handle prefix paths of DFS link targets */
+ +                      if (!rc && !isroot) {
+ +                              rc = update_super_prepath(tcon, prefix);
+ +                              break;
+ +                      }
+ +              }
+ +              if (rc == -EREMOTE)
+ +                      break;
+ +      }
+ +
+ +      kfree(share);
+ +      kfree(prefix);
+ +
+ +      if (!rc) {
+ +              if (it)
+ +                      rc = dfs_cache_noreq_update_tgthint(tcon->dfs_path + 1, it);
+ +              else
+ +                      rc = -ENOENT;
+ +      }
+ +      dfs_cache_free_tgts(&tl);
+ +out:
+ +      kfree(tree);
+ +      return rc;
+ +}
+ +#else
+ +int cifs_tree_connect(const unsigned int xid, struct cifs_tcon *tcon, const struct nls_table *nlsc)
+ +{
+ +      const struct smb_version_operations *ops = tcon->ses->server->ops;
+ +
+ +      return ops->tree_connect(xid, tcon->ses, tcon->treeName, tcon, nlsc);
+ +}
+ +#endif
diff --combined fs/cifs/dfs_cache.c

index a44f58b,7a8d414..6ee8496
--- 1/fs/cifs/dfs_cache.c
--- 2/fs/cifs/dfs_cache.c
+++ b/fs/cifs/dfs_cache.c
@@@ -29,7 -29,6 +29,7 @@@
   
   struct cache_dfs_tgt {
         char *name;
+ +      int path_consumed;
         struct list_head list;
   };
   
@@@ -351,7 -350,7 +351,7 @@@ static inline struct timespec64 get_exp
   }
   
   /* Allocate a new DFS target */
- -static struct cache_dfs_tgt *alloc_target(const char *name)
+ +static struct cache_dfs_tgt *alloc_target(const char *name, int path_consumed)
   {
         struct cache_dfs_tgt *t;
   
@@@ -363,7 -362,6 +363,7 @@@
                 kfree(t);
                 return ERR_PTR(-ENOMEM);
         }
+ +      t->path_consumed = path_consumed;
         INIT_LIST_HEAD(&t->list);
         return t;
   }
@@@ -386,7 -384,7 +386,7 @@@ static int copy_ref_data(const struct d
         for (i = 0; i < numrefs; i++) {
                 struct cache_dfs_tgt *t;
   
- -              t = alloc_target(refs[i].node_name);
+ +              t = alloc_target(refs[i].node_name, refs[i].path_consumed);
                 if (IS_ERR(t)) {
                         free_tgts(ce);
                         return PTR_ERR(t);
@@@ -492,7 -490,16 +492,7 @@@ static int add_cache_entry(const char *
         return 0;
   }
   
- -/*
- - * Find a DFS cache entry in hash table and optionally check prefix path against
- - * @path.
- - * Use whole path components in the match.
- - * Must be called with htable_rw_lock held.
- - *
- - * Return ERR_PTR(-ENOENT) if the entry is not found.
- - */
- -static struct cache_entry *lookup_cache_entry(const char *path,
- -                                            unsigned int *hash)
+ +static struct cache_entry *__lookup_cache_entry(const char *path)
   {
         struct cache_entry *ce;
         unsigned int h;
@@@ -510,75 -517,9 +510,75 @@@
   
         if (!found)
                 ce = ERR_PTR(-ENOENT);
+ +      return ce;
+ +}
+ +
+ +/*
+ + * Find a DFS cache entry in hash table and optionally check prefix path against
+ + * @path.
+ + * Use whole path components in the match.
+ + * Must be called with htable_rw_lock held.
+ + *
+ + * Return ERR_PTR(-ENOENT) if the entry is not found.
+ + */
+ +static struct cache_entry *lookup_cache_entry(const char *path, unsigned int *hash)
+ +{
+ +      struct cache_entry *ce = ERR_PTR(-ENOENT);
+ +      unsigned int h;
+ +      int cnt = 0;
+ +      char *npath;
+ +      char *s, *e;
+ +      char sep;
+ +
+ +      npath = kstrndup(path, strlen(path), GFP_KERNEL);
+ +      if (!npath)
+ +              return ERR_PTR(-ENOMEM);
+ +
+ +      s = npath;
+ +      sep = *npath;
+ +      while ((s = strchr(s, sep)) && ++cnt < 3)
+ +              s++;
+ +
+ +      if (cnt < 3) {
+ +              h = cache_entry_hash(path, strlen(path));
+ +              ce = __lookup_cache_entry(path);
+ +              goto out;
+ +      }
+ +      /*
+ +       * Handle paths that have more than two path components and are a complete prefix of the DFS
+ +       * referral request path (@path).
+ +       *
+ +       * See MS-DFSC 3.2.5.5 "Receiving a Root Referral Request or Link Referral Request".
+ +       */
+ +      h = cache_entry_hash(npath, strlen(npath));
+ +      e = npath + strlen(npath) - 1;
+ +      while (e > s) {
+ +              char tmp;
+ +
+ +              /* skip separators */
+ +              while (e > s && *e == sep)
+ +                      e--;
+ +              if (e == s)
+ +                      goto out;
+ +
+ +              tmp = *(e+1);
+ +              *(e+1) = 0;
+ +
+ +              ce = __lookup_cache_entry(npath);
+ +              if (!IS_ERR(ce)) {
+ +                      h = cache_entry_hash(npath, strlen(npath));
+ +                      break;
+ +              }
+ +
+ +              *(e+1) = tmp;
+ +              /* backward until separator */
+ +              while (e > s && *e != sep)
+ +                      e--;
+ +      }
+ +out:
         if (hash)
                 *hash = h;
- -
+ +      kfree(npath);
         return ce;
   }
   
@@@ -832,7 -773,6 +832,7 @@@ static int get_targets(struct cache_ent
                         rc = -ENOMEM;
                         goto err_free_it;
                 }
+ +              it->it_path_consumed = t->path_consumed;
   
                 if (ce->tgthint == t)
                         list_add(&it->it_list, head);
@@@ -1191,7 -1131,7 +1191,7 @@@ err_free_domainname
   err_free_unc:
         kfree(new->UNC);
   err_free_password:
-       kzfree(new->password);
+       kfree_sensitive(new->password);
   err_free_username:
         kfree(new->username);
         kfree(new);
@@@ -1323,26 -1263,23 +1323,26 @@@ void dfs_cache_del_vol(const char *full
   /**
    * dfs_cache_get_tgt_share - parse a DFS target
    *
+ + * @path: DFS full path
    * @it: DFS target iterator.
    * @share: tree name.
- - * @share_len: length of tree name.
    * @prefix: prefix path.
- - * @prefix_len: length of prefix path.
    *
    * Return zero if target was parsed correctly, otherwise non-zero.
    */
- -int dfs_cache_get_tgt_share(const struct dfs_cache_tgt_iterator *it,
- -                          const char **share, size_t *share_len,
- -                          const char **prefix, size_t *prefix_len)
+ +int dfs_cache_get_tgt_share(char *path, const struct dfs_cache_tgt_iterator *it,
+ +                          char **share, char **prefix)
   {
- -      char *s, sep;
+ +      char *s, sep, *p;
+ +      size_t len;
+ +      size_t plen1, plen2;
   
- -      if (!it || !share || !share_len || !prefix || !prefix_len)
+ +      if (!it || !path || !share || !prefix || strlen(path) < it->it_path_consumed)
                 return -EINVAL;
   
+ +      *share = NULL;
+ +      *prefix = NULL;
+ +
         sep = it->it_name[0];
         if (sep != '\\' && sep != '/')
                 return -EINVAL;
@@@ -1351,38 -1288,13 +1351,38 @@@
         if (!s)
                 return -EINVAL;
   
+ +      /* point to prefix in target node */
         s = strchrnul(s + 1, sep);
   
- -      *share = it->it_name;
- -      *share_len = s - it->it_name;
- -      *prefix = *s ? s + 1 : s;
- -      *prefix_len = &it->it_name[strlen(it->it_name)] - *prefix;
+ +      /* extract target share */
+ +      *share = kstrndup(it->it_name, s - it->it_name, GFP_KERNEL);
+ +      if (!*share)
+ +              return -ENOMEM;
   
+ +      /* skip separator */
+ +      if (*s)
+ +              s++;
+ +      /* point to prefix in DFS path */
+ +      p = path + it->it_path_consumed;
+ +      if (*p == sep)
+ +              p++;
+ +
+ +      /* merge prefix paths from DFS path and target node */
+ +      plen1 = it->it_name + strlen(it->it_name) - s;
+ +      plen2 = path + strlen(path) - p;
+ +      if (plen1 || plen2) {
+ +              len = plen1 + plen2 + 2;
+ +              *prefix = kmalloc(len, GFP_KERNEL);
+ +              if (!*prefix) {
+ +                      kfree(*share);
+ +                      *share = NULL;
+ +                      return -ENOMEM;
+ +              }
+ +              if (plen1)
+ +                      scnprintf(*prefix, len, "%.*s%c%.*s", (int)plen1, s, sep, (int)plen2, p);
+ +              else
+ +                      strscpy(*prefix, p, len);
+ +      }
         return 0;
   }
   
diff --combined fs/cifs/misc.c

index 7642348,3e37724..1c14cf0
--- 1/fs/cifs/misc.c
--- 2/fs/cifs/misc.c
+++ b/fs/cifs/misc.c
@@@ -103,12 -103,12 +103,12 @@@ sesInfoFree(struct cifs_ses *buf_to_fre
         kfree(buf_to_free->serverOS);
         kfree(buf_to_free->serverDomain);
         kfree(buf_to_free->serverNOS);
-       kzfree(buf_to_free->password);
+       kfree_sensitive(buf_to_free->password);
         kfree(buf_to_free->user_name);
         kfree(buf_to_free->domainName);
-       kzfree(buf_to_free->auth_key.response);
+       kfree_sensitive(buf_to_free->auth_key.response);
         kfree(buf_to_free->iface_list);
-       kzfree(buf_to_free);
+       kfree_sensitive(buf_to_free);
   }
   
   struct cifs_tcon *
@@@ -148,7 -148,7 +148,7 @@@ tconInfoFree(struct cifs_tcon *buf_to_f
         }
         atomic_dec(&tconInfoAllocCount);
         kfree(buf_to_free->nativeFileSystem);
-       kzfree(buf_to_free->password);
+       kfree_sensitive(buf_to_free->password);
         kfree(buf_to_free->crfid.fid);
   #ifdef CONFIG_CIFS_DFS_UPCALL
         kfree(buf_to_free->dfs_path);
@@@ -1164,7 -1164,8 +1164,7 @@@ static inline void cifs_put_tcon_super(
   }
   #endif
   
- -int update_super_prepath(struct cifs_tcon *tcon, const char *prefix,
- -                       size_t prefix_len)
+ +int update_super_prepath(struct cifs_tcon *tcon, char *prefix)
   {
         struct super_block *sb;
         struct cifs_sb_info *cifs_sb;
@@@ -1178,8 -1179,8 +1178,8 @@@
   
         kfree(cifs_sb->prepath);
   
- -      if (*prefix && prefix_len) {
- -              cifs_sb->prepath = kstrndup(prefix, prefix_len, GFP_ATOMIC);
+ +      if (prefix && *prefix) {
+ +              cifs_sb->prepath = kstrndup(prefix, strlen(prefix), GFP_ATOMIC);
                 if (!cifs_sb->prepath) {
                         rc = -ENOMEM;
                         goto out;
diff --combined include/linux/fs.h

index 6d19769,f5da33b..2df72de
--- 1/include/linux/fs.h
--- 2/include/linux/fs.h
+++ b/include/linux/fs.h
@@@ -528,7 -528,7 +528,7 @@@ static inline int mapping_mapped(struc
   
   /*
    * Might pages of this file have been modified in userspace?
-  * Note that i_mmap_writable counts all VM_SHARED vmas: do_mmap_pgoff
+  * Note that i_mmap_writable counts all VM_SHARED vmas: do_mmap
    * marks vma as VM_SHARED if it is shared, and the file was opened for
    * writing i.e. vma may be mprotected writable even if now readonly.
    *
@@@ -1712,10 -1712,6 +1712,10 @@@ int vfs_mkobj(struct dentry *, umode_t
                 int (*f)(struct dentry *, umode_t, void *),
                 void *);
   
+ +int vfs_fchown(struct file *file, uid_t user, gid_t group);
+ +int vfs_fchmod(struct file *file, umode_t mode);
+ +int vfs_utimes(const struct path *path, struct timespec64 *times);
+ +
   extern long vfs_ioctl(struct file *file, unsigned int cmd, unsigned long arg);
   
   #ifdef CONFIG_COMPAT
@@@ -2950,6 -2946,21 +2950,21 @@@ extern void discard_new_inode(struct in
   extern unsigned int get_next_ino(void);
   extern void evict_inodes(struct super_block *sb);
   
+ /*
+  * Userspace may rely on the the inode number being non-zero. For example, glibc
+  * simply ignores files with zero i_ino in unlink() and other places.
+  *
+  * As an additional complication, if userspace was compiled with
+  * _FILE_OFFSET_BITS=32 on a 64-bit kernel we'll only end up reading out the
+  * lower 32 bits, so we need to check that those aren't zero explicitly. With
+  * _FILE_OFFSET_BITS=64, this may cause some harmless false-negatives, but
+  * better safe than sorry.
+  */
+ static inline bool is_zero_ino(ino_t ino)
+ {
+       return (u32)ino == 0;
+ }
+ 
   extern void __iget(struct inode * inode);
   extern void iget_failed(struct inode *);
   extern void clear_inode(struct inode *);
diff --combined include/linux/mm.h

index 6c8333d,392016c..f6a82f9
--- 1/include/linux/mm.h
--- 2/include/linux/mm.h
+++ b/include/linux/mm.h
@@@ -206,6 -206,8 +206,8 @@@ int overcommit_ratio_handler(struct ctl
                 loff_t *);
   int overcommit_kbytes_handler(struct ctl_table *, int, void *, size_t *,
                 loff_t *);
+ int overcommit_policy_handler(struct ctl_table *, int, void *, size_t *,
+               loff_t *);
   
   #define nth_page(page,n) pfn_to_page(page_to_pfn((page)) + (n))
   
@@@ -317,6 -319,8 +319,6 @@@ extern unsigned int kobjsize(const voi
   
   #if defined(CONFIG_X86)
   # define VM_PAT               VM_ARCH_1       /* PAT reserves whole VMA at once (x86) */
- -#elif defined(CONFIG_PPC)
- -# define VM_SAO               VM_ARCH_1       /* Strong Access Ordering (powerpc) */
   #elif defined(CONFIG_PARISC)
   # define VM_GROWSUP   VM_ARCH_1
   #elif defined(CONFIG_IA64)
@@@ -777,6 -781,11 +779,11 @@@ static inline void *kvcalloc(size_t n, 
   extern void kvfree(const void *addr);
   extern void kvfree_sensitive(const void *addr, size_t len);
   
+ static inline int head_mapcount(struct page *head)
+ {
+       return atomic_read(compound_mapcount_ptr(head)) + 1;
+ }
+ 
   /*
    * Mapcount of compound page as a whole, does not include mapped sub-pages.
    *
@@@ -786,7 -795,7 +793,7 @@@ static inline int compound_mapcount(str
   {
         VM_BUG_ON_PAGE(!PageCompound(page), page);
         page = compound_head(page);
-       return atomic_read(compound_mapcount_ptr(page)) + 1;
+       return head_mapcount(page);
   }
   
   /*
@@@ -899,11 -908,16 +906,16 @@@ static inline bool hpage_pincount_avail
         return PageCompound(page) && compound_order(page) > 1;
   }
   
+ static inline int head_pincount(struct page *head)
+ {
+       return atomic_read(compound_pincount_ptr(head));
+ }
+ 
   static inline int compound_pincount(struct page *page)
   {
         VM_BUG_ON_PAGE(!hpage_pincount_available(page), page);
         page = compound_head(page);
-       return atomic_read(compound_pincount_ptr(page));
+       return head_pincount(page);
   }
   
   static inline void set_compound_order(struct page *page, unsigned int order)
@@@ -2091,51 -2105,11 +2103,11 @@@ static inline pud_t *pud_alloc(struct m
                 NULL : pud_offset(p4d, address);
   }
   
- static inline p4d_t *p4d_alloc_track(struct mm_struct *mm, pgd_t *pgd,
-                                    unsigned long address,
-                                    pgtbl_mod_mask *mod_mask)
- 
- {
-       if (unlikely(pgd_none(*pgd))) {
-               if (__p4d_alloc(mm, pgd, address))
-                       return NULL;
-               *mod_mask |= PGTBL_PGD_MODIFIED;
-       }
- 
-       return p4d_offset(pgd, address);
- }
- 
- static inline pud_t *pud_alloc_track(struct mm_struct *mm, p4d_t *p4d,
-                                    unsigned long address,
-                                    pgtbl_mod_mask *mod_mask)
- {
-       if (unlikely(p4d_none(*p4d))) {
-               if (__pud_alloc(mm, p4d, address))
-                       return NULL;
-               *mod_mask |= PGTBL_P4D_MODIFIED;
-       }
- 
-       return pud_offset(p4d, address);
- }
- 
   static inline pmd_t *pmd_alloc(struct mm_struct *mm, pud_t *pud, unsigned long address)
   {
         return (unlikely(pud_none(*pud)) && __pmd_alloc(mm, pud, address))?
                 NULL: pmd_offset(pud, address);
   }
- 
- static inline pmd_t *pmd_alloc_track(struct mm_struct *mm, pud_t *pud,
-                                    unsigned long address,
-                                    pgtbl_mod_mask *mod_mask)
- {
-       if (unlikely(pud_none(*pud))) {
-               if (__pmd_alloc(mm, pud, address))
-                       return NULL;
-               *mod_mask |= PGTBL_PUD_MODIFIED;
-       }
- 
-       return pmd_offset(pud, address);
- }
   #endif /* CONFIG_MMU */
   
   #if USE_SPLIT_PTE_PTLOCKS
@@@ -2251,11 -2225,6 +2223,6 @@@ static inline void pgtable_pte_page_dto
         ((unlikely(pmd_none(*(pmd))) && __pte_alloc_kernel(pmd))? \
                 NULL: pte_offset_kernel(pmd, address))
   
- #define pte_alloc_kernel_track(pmd, address, mask)                    \
-       ((unlikely(pmd_none(*(pmd))) &&                                 \
-         (__pte_alloc_kernel(pmd) || ({*(mask)|=PGTBL_PMD_MODIFIED;0;})))?\
-               NULL: pte_offset_kernel(pmd, address))
- 
   #if USE_SPLIT_PMD_PTLOCKS
   
   static struct page *pmd_to_page(pmd_t *pmd)
@@@ -2413,9 -2382,6 +2380,6 @@@ static inline unsigned long get_num_phy
    * for_each_valid_physical_page_range()
    *    memblock_add_node(base, size, nid)
    * free_area_init(max_zone_pfns);
-  *
-  * sparse_memory_present_with_active_regions() calls memory_present() for
-  * each range when SPARSEMEM is enabled.
    */
   void free_area_init(unsigned long *max_zone_pfn);
   unsigned long node_map_pfn_alignment(void);
@@@ -2426,7 -2392,6 +2390,6 @@@ extern unsigned long absent_pages_in_ra
   extern void get_pfn_range_for_nid(unsigned int nid,
                         unsigned long *start_pfn, unsigned long *end_pfn);
   extern unsigned long find_min_pfn_with_active_regions(void);
- extern void sparse_memory_present_with_active_regions(int nid);
   
   #ifndef CONFIG_NEED_MULTIPLE_NODES
   static inline int early_pfn_to_nid(unsigned long pfn)
@@@ -2577,23 -2542,13 +2540,13 @@@ extern unsigned long mmap_region(struc
         struct list_head *uf);
   extern unsigned long do_mmap(struct file *file, unsigned long addr,
         unsigned long len, unsigned long prot, unsigned long flags,
-       vm_flags_t vm_flags, unsigned long pgoff, unsigned long *populate,
-       struct list_head *uf);
+       unsigned long pgoff, unsigned long *populate, struct list_head *uf);
   extern int __do_munmap(struct mm_struct *, unsigned long, size_t,
                        struct list_head *uf, bool downgrade);
   extern int do_munmap(struct mm_struct *, unsigned long, size_t,
                      struct list_head *uf);
   extern int do_madvise(unsigned long start, size_t len_in, int behavior);
   
- static inline unsigned long
- do_mmap_pgoff(struct file *file, unsigned long addr,
-       unsigned long len, unsigned long prot, unsigned long flags,
-       unsigned long pgoff, unsigned long *populate,
-       struct list_head *uf)
- {
-       return do_mmap(file, addr, len, prot, flags, 0, pgoff, populate, uf);
- }
- 
   #ifdef CONFIG_MMU
   extern int __mm_populate(unsigned long addr, unsigned long len,
                          int ignore_errors);
@@@ -3009,14 -2964,15 +2962,15 @@@ pgd_t *vmemmap_pgd_populate(unsigned lo
   p4d_t *vmemmap_p4d_populate(pgd_t *pgd, unsigned long addr, int node);
   pud_t *vmemmap_pud_populate(p4d_t *p4d, unsigned long addr, int node);
   pmd_t *vmemmap_pmd_populate(pud_t *pud, unsigned long addr, int node);
- pte_t *vmemmap_pte_populate(pmd_t *pmd, unsigned long addr, int node);
+ pte_t *vmemmap_pte_populate(pmd_t *pmd, unsigned long addr, int node,
+                           struct vmem_altmap *altmap);
   void *vmemmap_alloc_block(unsigned long size, int node);
   struct vmem_altmap;
- void *vmemmap_alloc_block_buf(unsigned long size, int node);
- void *altmap_alloc_block_buf(unsigned long size, struct vmem_altmap *altmap);
+ void *vmemmap_alloc_block_buf(unsigned long size, int node,
+                             struct vmem_altmap *altmap);
   void vmemmap_verify(pte_t *, int, unsigned long, unsigned long);
   int vmemmap_populate_basepages(unsigned long start, unsigned long end,
-                              int node);
+                              int node, struct vmem_altmap *altmap);
   int vmemmap_populate(unsigned long start, unsigned long end, int node,
                 struct vmem_altmap *altmap);
   void vmemmap_populate_print_last(void);
diff --combined init/main.c

index 276ca31,92d2579..de2f9fa
--- 1/init/main.c
--- 2/init/main.c
+++ b/init/main.c
@@@ -96,7 -96,6 +96,7 @@@
   #include <linux/jump_label.h>
   #include <linux/mem_encrypt.h>
   #include <linux/kcsan.h>
+ +#include <linux/init_syscalls.h>
   
   #include <asm/io.h>
   #include <asm/bugs.h>
@@@ -155,7 -154,7 +155,7 @@@ static bool initargs_found
   #endif
   
   static char *execute_command;
- -static char *ramdisk_execute_command;
+ +static char *ramdisk_execute_command = "/init";
   
   /*
    * Used to generate warnings if static_key manipulation functions are used
@@@ -830,7 -829,7 +830,7 @@@ void __init __weak arch_call_rest_init(
         rest_init();
   }
   
- asmlinkage __visible void __init start_kernel(void)
+ asmlinkage __visible void __init __no_sanitize_address start_kernel(void)
   {
         char *command_line;
         char *after_dashes;
@@@ -1458,19 -1457,15 +1458,19 @@@ static int __ref kernel_init(void *unus
               "See Linux Documentation/admin-guide/init.rst for guidance.");
   }
   
- -void console_on_rootfs(void)
+ +/* Open /dev/console, for stdin/stdout/stderr, this should never fail */
+ +void __init console_on_rootfs(void)
   {
- -      /* Open the /dev/console as stdin, this should never fail */
- -      if (ksys_open((const char __user *) "/dev/console", O_RDWR, 0) < 0)
- -              pr_err("Warning: unable to open an initial console.\n");
+ +      struct file *file = filp_open("/dev/console", O_RDWR, 0);
   
- -      /* create stdout/stderr */
- -      (void) ksys_dup(0);
- -      (void) ksys_dup(0);
+ +      if (IS_ERR(file)) {
+ +              pr_err("Warning: unable to open an initial console.\n");
+ +              return;
+ +      }
+ +      init_dup(file);
+ +      init_dup(file);
+ +      init_dup(file);
+ +      fput(file);
   }
   
   static noinline void __init kernel_init_freeable(void)
@@@ -1515,7 -1510,12 +1515,7 @@@
          * check if there is an early userspace init.  If yes, let it do all
          * the work
          */
- -
- -      if (!ramdisk_execute_command)
- -              ramdisk_execute_command = "/init";
- -
- -      if (ksys_access((const char __user *)
- -                      ramdisk_execute_command, 0) != 0) {
+ +      if (init_eaccess(ramdisk_execute_command) != 0) {
                 ramdisk_execute_command = NULL;
                 prepare_namespace();
         }
diff --combined net/core/sock.c

index d29709e,9d8b15b..a2044b4
--- 1/net/core/sock.c
--- 2/net/core/sock.c
+++ b/net/core/sock.c
@@@ -820,14 -820,6 +820,14 @@@ void sock_set_rcvbuf(struct sock *sk, i
   }
   EXPORT_SYMBOL(sock_set_rcvbuf);
   
+ +void sock_set_mark(struct sock *sk, u32 val)
+ +{
+ +      lock_sock(sk);
+ +      sk->sk_mark = val;
+ +      release_sock(sk);
+ +}
+ +EXPORT_SYMBOL(sock_set_mark);
+ +
   /*
    *    This is meant for all protocols to use and covers goings on
    *    at the socket level. Everything here is generic.
@@@ -2265,7 -2257,7 +2265,7 @@@ static inline void __sock_kfree_s(struc
         if (WARN_ON_ONCE(!mem))
                 return;
         if (nullify)
-               kzfree(mem);
+               kfree_sensitive(mem);
         else
                 kfree(mem);
         atomic_sub(size, &sk->sk_omem_alloc);
author	Linus Torvalds <torvalds@linux-foundation.org>
	Fri, 7 Aug 2020 18:39:33 +0000 (11:39 -0700)
committer	Linus Torvalds <torvalds@linux-foundation.org>
	Fri, 7 Aug 2020 18:39:33 +0000 (11:39 -0700)
		1	2
Documentation/admin-guide/kernel-parameters.txt	patch \|	diff1 \|	diff2 \|	blob \| history
arch/m68k/mm/mcfmmu.c	patch \|	diff1 \|	diff2 \|	blob \| history
arch/powerpc/mm/init_32.c	patch \|	diff1 \|	diff2 \|	blob \| history
arch/powerpc/mm/init_64.c	patch \|	diff1 \|	diff2 \|	blob \| history
arch/powerpc/mm/mem.c	patch \|	diff1 \|	diff2 \|	blob \| history
arch/powerpc/mm/numa.c	patch \|	diff1 \|	diff2 \|	blob \| history
arch/powerpc/mm/ptdump/hashpagetable.c	patch \|	diff1 \|	diff2 \|	blob \| history
arch/powerpc/mm/ptdump/ptdump.c	patch \|	diff1 \|	diff2 \|	blob \| history
arch/riscv/mm/init.c	patch \|	diff1 \|	diff2 \|	blob \| history
arch/s390/kernel/ptrace.c	patch \|	diff1 \|	diff2 \|	blob \| history
arch/x86/mm/init_64.c	patch \|	diff1 \|	diff2 \|	blob \| history
drivers/xen/balloon.c	patch \|	diff1 \|	diff2 \|	blob \| history
drivers/xen/privcmd.c	patch \|	diff1 \|	diff2 \|	blob \| history
fs/cifs/connect.c	patch \|	diff1 \|	diff2 \|	blob \| history
fs/cifs/dfs_cache.c	patch \|	diff1 \|	diff2 \|	blob \| history
fs/cifs/misc.c	patch \|	diff1 \|	diff2 \|	blob \| history
include/linux/fs.h	patch \|	diff1 \|	diff2 \|	blob \| history
include/linux/mm.h	patch \|	diff1 \|	diff2 \|	blob \| history
init/main.c	patch \|	diff1 \|	diff2 \|	blob \| history
net/core/sock.c	patch \|	diff1 \|	diff2 \|	blob \| history