Merge tag 'ceph-for-5.8-rc1' of git://github.com/ceph/ceph-client

author Linus Torvalds <torvalds@linux-foundation.org>

Mon, 8 Jun 2020 19:49:18 +0000 (12:49 -0700)

committer Linus Torvalds <torvalds@linux-foundation.org>

Mon, 8 Jun 2020 19:49:18 +0000 (12:49 -0700)
author Linus Torvalds <torvalds@linux-foundation.org>
Mon, 8 Jun 2020 19:49:18 +0000 (12:49 -0700)
committer Linus Torvalds <torvalds@linux-foundation.org>
Mon, 8 Jun 2020 19:49:18 +0000 (12:49 -0700)
diff --combined net/ceph/ceph_common.c

index 66f22e8,9bab3e9..afe0e81
--- 1/net/ceph/ceph_common.c
--- 2/net/ceph/ceph_common.c
+++ b/net/ceph/ceph_common.c
@@@ -176,6 -176,10 +176,10 @@@ int ceph_compare_options(struct ceph_op
                 }
         }
   
+       ret = ceph_compare_crush_locs(&opt1->crush_locs, &opt2->crush_locs);
+       if (ret)
+               return ret;
+ 
         /* any matching mon ip implies a match */
         for (i = 0; i < opt1->num_mon; i++) {
                 if (ceph_monmap_contains(client->monc.monmap,
@@@ -190,7 -194,8 +194,7 @@@ EXPORT_SYMBOL(ceph_compare_options)
    * kvmalloc() doesn't fall back to the vmalloc allocator unless flags are
    * compatible with (a superset of) GFP_KERNEL.  This is because while the
    * actual pages are allocated with the specified flags, the page table pages
- - * are always allocated with GFP_KERNEL.  map_vm_area() doesn't even take
- - * flags because GFP_KERNEL is hard-coded in {p4d,pud,pmd,pte}_alloc().
+ + * are always allocated with GFP_KERNEL.
    *
    * ceph_kvmalloc() may be called with GFP_KERNEL, GFP_NOFS or GFP_NOIO.
    */
@@@ -259,6 -264,8 +263,8 @@@ enum 
         Opt_secret,
         Opt_key,
         Opt_ip,
+       Opt_crush_location,
+       Opt_read_from_replica,
         /* string args above */
         Opt_share,
         Opt_crc,
@@@ -268,11 -275,25 +274,25 @@@
         Opt_abort_on_full,
   };
   
+ enum {
+       Opt_read_from_replica_no,
+       Opt_read_from_replica_balance,
+       Opt_read_from_replica_localize,
+ };
+ 
+ static const struct constant_table ceph_param_read_from_replica[] = {
+       {"no",          Opt_read_from_replica_no},
+       {"balance",     Opt_read_from_replica_balance},
+       {"localize",    Opt_read_from_replica_localize},
+       {}
+ };
+ 
   static const struct fs_parameter_spec ceph_parameters[] = {
         fsparam_flag    ("abort_on_full",               Opt_abort_on_full),
         fsparam_flag_no ("cephx_require_signatures",    Opt_cephx_require_signatures),
         fsparam_flag_no ("cephx_sign_messages",         Opt_cephx_sign_messages),
         fsparam_flag_no ("crc",                         Opt_crc),
+       fsparam_string  ("crush_location",              Opt_crush_location),
         fsparam_string  ("fsid",                        Opt_fsid),
         fsparam_string  ("ip",                          Opt_ip),
         fsparam_string  ("key",                         Opt_key),
@@@ -283,6 -304,8 +303,8 @@@
         fsparam_u32     ("osdkeepalive",                Opt_osdkeepalivetimeout),
         __fsparam       (fs_param_is_s32, "osdtimeout", Opt_osdtimeout,
                          fs_param_deprecated, NULL),
+       fsparam_enum    ("read_from_replica",           Opt_read_from_replica,
+                        ceph_param_read_from_replica),
         fsparam_string  ("secret",                      Opt_secret),
         fsparam_flag_no ("share",                       Opt_share),
         fsparam_flag_no ("tcp_nodelay",                 Opt_tcp_nodelay),
@@@ -297,6 -320,7 +319,7 @@@ struct ceph_options *ceph_alloc_options
         if (!opt)
                 return NULL;
   
+       opt->crush_locs = RB_ROOT;
         opt->mon_addr = kcalloc(CEPH_MAX_MON, sizeof(*opt->mon_addr),
                                 GFP_KERNEL);
         if (!opt->mon_addr) {
@@@ -319,6 -343,7 +342,7 @@@ void ceph_destroy_options(struct ceph_o
         if (!opt)
                 return;
   
+       ceph_clear_crush_locs(&opt->crush_locs);
         kfree(opt->name);
         if (opt->key) {
                 ceph_crypto_key_destroy(opt->key);
@@@ -453,6 -478,34 +477,34 @@@ int ceph_parse_param(struct fs_paramete
                 if (!opt->key)
                         return -ENOMEM;
                 return get_secret(opt->key, param->string, &log);
+       case Opt_crush_location:
+               ceph_clear_crush_locs(&opt->crush_locs);
+               err = ceph_parse_crush_location(param->string,
+                                               &opt->crush_locs);
+               if (err) {
+                       error_plog(&log, "Failed to parse CRUSH location: %d",
+                                  err);
+                       return err;
+               }
+               break;
+       case Opt_read_from_replica:
+               switch (result.uint_32) {
+               case Opt_read_from_replica_no:
+                       opt->osd_req_flags &= ~(CEPH_OSD_FLAG_BALANCE_READS |
+                                               CEPH_OSD_FLAG_LOCALIZE_READS);
+                       break;
+               case Opt_read_from_replica_balance:
+                       opt->osd_req_flags |= CEPH_OSD_FLAG_BALANCE_READS;
+                       opt->osd_req_flags &= ~CEPH_OSD_FLAG_LOCALIZE_READS;
+                       break;
+               case Opt_read_from_replica_localize:
+                       opt->osd_req_flags |= CEPH_OSD_FLAG_LOCALIZE_READS;
+                       opt->osd_req_flags &= ~CEPH_OSD_FLAG_BALANCE_READS;
+                       break;
+               default:
+                       BUG();
+               }
+               break;
   
         case Opt_osdtimeout:
                 warn_plog(&log, "Ignoring osdtimeout");
@@@ -535,6 -588,7 +587,7 @@@ int ceph_print_client_options(struct se
   {
         struct ceph_options *opt = client->options;
         size_t pos = m->count;
+       struct rb_node *n;
   
         if (opt->name) {
                 seq_puts(m, "name=");
@@@ -544,6 -598,28 +597,28 @@@
         if (opt->key)
                 seq_puts(m, "secret=<hidden>,");
   
+       if (!RB_EMPTY_ROOT(&opt->crush_locs)) {
+               seq_puts(m, "crush_location=");
+               for (n = rb_first(&opt->crush_locs); ; ) {
+                       struct crush_loc_node *loc =
+                           rb_entry(n, struct crush_loc_node, cl_node);
+ 
+                       seq_printf(m, "%s:%s", loc->cl_loc.cl_type_name,
+                                  loc->cl_loc.cl_name);
+                       n = rb_next(n);
+                       if (!n)
+                               break;
+ 
+                       seq_putc(m, '|');
+               }
+               seq_putc(m, ',');
+       }
+       if (opt->osd_req_flags & CEPH_OSD_FLAG_BALANCE_READS) {
+               seq_puts(m, "read_from_replica=balance,");
+       } else if (opt->osd_req_flags & CEPH_OSD_FLAG_LOCALIZE_READS) {
+               seq_puts(m, "read_from_replica=localize,");
+       }
+ 
         if (opt->flags & CEPH_OPT_FSID)
                 seq_printf(m, "fsid=%pU,", &opt->fsid);
         if (opt->flags & CEPH_OPT_NOSHARE)
author	Linus Torvalds <torvalds@linux-foundation.org>
	Mon, 8 Jun 2020 19:49:18 +0000 (12:49 -0700)
committer	Linus Torvalds <torvalds@linux-foundation.org>
	Mon, 8 Jun 2020 19:49:18 +0000 (12:49 -0700)