2 * Copyright (c) 2003, 2004, 2005 Christophe Varoqui
3 * Copyright (c) 2005 Benjamin Marzinski, Redhat
4 * Copyright (c) 2005 Kiyoshi Ueda, NEC
5 * Copyright (c) 2005 Patrick Caulfield, Redhat
6 * Copyright (c) 2005 Edward Goggin, EMC
16 #include <libdevmapper.h>
18 #include "mpath_cmd.h"
22 #include "devmapper.h"
25 #include "structs_vec.h"
28 #include "blacklist.h"
30 #include "discovery.h"
32 #include "switchgroup.h"
33 #include "dm-generic.h"
35 #include "configure.h"
36 #include "pgpolicies.h"
44 #include "io_err_stat.h"
46 /* group paths in pg by host adapter
48 int group_by_host_adapter(struct pathgroup *pgp, vector adapters)
50 struct adapter_group *agp;
51 struct host_group *hgp;
52 struct path *pp, *pp1;
53 char adapter_name1[SLOT_NAME_SIZE];
54 char adapter_name2[SLOT_NAME_SIZE];
56 int found_hostgroup = 0;
58 while (VECTOR_SIZE(pgp->paths) > 0) {
60 pp = VECTOR_SLOT(pgp->paths, 0);
62 if (sysfs_get_host_adapter_name(pp, adapter_name1))
64 /* create a new host adapter group
66 agp = alloc_adaptergroup();
71 strlcpy(agp->adapter_name, adapter_name1, SLOT_NAME_SIZE);
72 store_adaptergroup(adapters, agp);
74 /* create a new host port group
76 hgp = alloc_hostgroup();
79 if (store_hostgroup(agp->host_groups, hgp))
82 hgp->host_no = pp->sg_id.host_no;
84 if (store_path(hgp->paths, pp))
88 /* delete path from path group
90 vector_del_slot(pgp->paths, 0);
92 /* add all paths belonging to same host adapter
94 vector_foreach_slot(pgp->paths, pp1, i) {
95 if (sysfs_get_host_adapter_name(pp1, adapter_name2))
97 if (strcmp(adapter_name1, adapter_name2) == 0) {
99 vector_foreach_slot(agp->host_groups, hgp, j) {
100 if (hgp->host_no == pp1->sg_id.host_no) {
101 if (store_path(hgp->paths, pp1))
108 if (!found_hostgroup) {
109 /* this path belongs to new host port
110 * within this adapter
112 hgp = alloc_hostgroup();
116 if (store_hostgroup(agp->host_groups, hgp))
120 if (store_path(hgp->paths, pp1))
123 hgp->host_no = pp1->sg_id.host_no;
126 /* delete paths from original path_group
127 * as they are added into adapter group now
129 vector_del_slot(pgp->paths, i);
136 out: /* add back paths into pg as re-ordering failed
138 vector_foreach_slot(adapters, agp, i) {
139 vector_foreach_slot(agp->host_groups, hgp, j) {
140 while (VECTOR_SIZE(hgp->paths) > 0) {
141 pp = VECTOR_SLOT(hgp->paths, 0);
142 if (store_path(pgp->paths, pp))
143 condlog(3, "failed to restore "
144 "path %s into path group",
146 vector_del_slot(hgp->paths, 0);
150 free_adaptergroup(adapters);
154 /* re-order paths in pg by alternating adapters and host ports
155 * for optimized selection
157 int order_paths_in_pg_by_alt_adapters(struct pathgroup *pgp, vector adapters,
160 int next_adapter_index = 0;
161 struct adapter_group *agp;
162 struct host_group *hgp;
165 while (total_paths > 0) {
166 agp = VECTOR_SLOT(adapters, next_adapter_index);
168 condlog(0, "can't get adapter group %d", next_adapter_index);
172 hgp = VECTOR_SLOT(agp->host_groups, agp->next_host_index);
174 condlog(0, "can't get host group %d of adapter group %d", next_adapter_index, agp->next_host_index);
178 if (!hgp->num_paths) {
179 agp->next_host_index++;
180 agp->next_host_index %= agp->num_hosts;
181 next_adapter_index++;
182 next_adapter_index %= VECTOR_SIZE(adapters);
186 pp = VECTOR_SLOT(hgp->paths, 0);
188 if (store_path(pgp->paths, pp))
193 vector_del_slot(hgp->paths, 0);
197 agp->next_host_index++;
198 agp->next_host_index %= agp->num_hosts;
199 next_adapter_index++;
200 next_adapter_index %= VECTOR_SIZE(adapters);
203 /* all paths are added into path_group
204 * in crafted child order
209 /* round-robin: order paths in path group to alternate
210 * between all host adapters
212 int rr_optimize_path_order(struct pathgroup *pgp)
219 total_paths = VECTOR_SIZE(pgp->paths);
220 vector_foreach_slot(pgp->paths, pp, i) {
221 if (pp->sg_id.proto_id != SCSI_PROTOCOL_FCP &&
222 pp->sg_id.proto_id != SCSI_PROTOCOL_SAS &&
223 pp->sg_id.proto_id != SCSI_PROTOCOL_ISCSI &&
224 pp->sg_id.proto_id != SCSI_PROTOCOL_SRP) {
225 /* return success as default path order
226 * is maintained in path group
231 adapters = vector_alloc();
235 /* group paths in path group by host adapters
237 if (group_by_host_adapter(pgp, adapters)) {
238 /* already freed adapters */
239 condlog(3, "Failed to group paths by adapters");
243 /* re-order paths in pg to alternate between adapters and host ports
245 if (order_paths_in_pg_by_alt_adapters(pgp, adapters, total_paths)) {
246 condlog(3, "Failed to re-order paths in pg by adapters "
248 free_adaptergroup(adapters);
249 /* return failure as original paths are
255 free_adaptergroup(adapters);
259 int setup_map(struct multipath *mpp, char **params, struct vectors *vecs)
261 struct pathgroup * pgp;
263 int i, marginal_pathgroups;
267 * don't bother if devmap size is unknown
269 if (mpp->size <= 0) {
270 condlog(3, "%s: devmap size is unknown", mpp->alias);
274 if (mpp->disable_queueing && VECTOR_SIZE(mpp->paths) != 0)
275 mpp->disable_queueing = 0;
278 * If this map was created with add_map_without_path(),
279 * mpp->hwe might not be set yet.
282 extract_hwe_from_path(mpp);
285 * properties selectors
287 * Ordering matters for some properties:
288 * - features after no_path_retry and retain_hwhandler
289 * - hwhandler after retain_hwhandler
290 * No guarantee that this list is complete, check code in
291 * propsel.c if in doubt.
293 conf = get_multipath_config();
294 pthread_cleanup_push(put_multipath_config, conf);
296 select_pgfailback(conf, mpp);
297 select_pgpolicy(conf, mpp);
300 * If setup_map() is called e.g. from reload_map() or resize_map(),
301 * make sure that we don't corrupt attributes.
303 save_attr = steal_ptr(mpp->selector);
304 select_selector(conf, mpp);
306 mpp->selector = save_attr;
310 select_no_path_retry(conf, mpp);
311 select_retain_hwhandler(conf, mpp);
313 save_attr = steal_ptr(mpp->features);
314 select_features(conf, mpp);
316 mpp->features = save_attr;
320 save_attr = steal_ptr(mpp->hwhandler);
321 select_hwhandler(conf, mpp);
323 mpp->hwhandler = save_attr;
327 select_rr_weight(conf, mpp);
328 select_minio(conf, mpp);
329 select_mode(conf, mpp);
330 select_uid(conf, mpp);
331 select_gid(conf, mpp);
332 select_fast_io_fail(conf, mpp);
333 select_dev_loss(conf, mpp);
334 select_eh_deadline(conf, mpp);
335 select_reservation_key(conf, mpp);
336 select_deferred_remove(conf, mpp);
337 select_marginal_path_err_sample_time(conf, mpp);
338 select_marginal_path_err_rate_threshold(conf, mpp);
339 select_marginal_path_err_recheck_gap_time(conf, mpp);
340 select_marginal_path_double_failed_time(conf, mpp);
341 select_san_path_err_threshold(conf, mpp);
342 select_san_path_err_forget_rate(conf, mpp);
343 select_san_path_err_recovery_time(conf, mpp);
344 select_delay_checks(conf, mpp);
345 select_skip_kpartx(conf, mpp);
346 select_max_sectors_kb(conf, mpp);
347 select_ghost_delay(conf, mpp);
348 select_flush_on_last_del(conf, mpp);
350 sysfs_set_scsi_tmo(mpp, conf->checkint);
351 marginal_pathgroups = conf->marginal_pathgroups;
352 pthread_cleanup_pop(1);
354 if (!mpp->features || !mpp->hwhandler || !mpp->selector) {
355 condlog(0, "%s: map select failed", mpp->alias);
359 if (marginal_path_check_enabled(mpp))
360 start_io_err_stat_thread(vecs);
363 * assign paths to path groups -- start with no groups and all paths
367 vector_foreach_slot (mpp->pg, pgp, i)
368 free_pathgroup(pgp, KEEP_PATHS);
370 vector_free(mpp->pg);
373 if (group_paths(mpp, marginal_pathgroups))
377 * ponders each path group and determine highest prio pg
378 * to switch over (default to first)
380 mpp->bestpg = select_path_group(mpp);
382 /* re-order paths in all path groups in an optimized way
383 * for round-robin path selectors to get maximum throughput.
385 if (!strncmp(mpp->selector, "round-robin", 11)) {
386 vector_foreach_slot(mpp->pg, pgp, i) {
387 if (VECTOR_SIZE(pgp->paths) <= 2)
389 if (rr_optimize_path_order(pgp)) {
390 condlog(2, "cannot re-order paths for "
399 * transform the mp->pg vector of vectors of paths
400 * into a mp->params strings to feed the device-mapper
402 if (assemble_map(mpp, params)) {
403 condlog(0, "%s: problem assembing map", mpp->alias);
410 compute_pgid(struct pathgroup * pgp)
415 vector_foreach_slot (pgp->paths, pp, i)
420 pgcmp (struct multipath * mpp, struct multipath * cmpp)
423 struct pathgroup * pgp;
424 struct pathgroup * cpgp;
430 vector_foreach_slot (mpp->pg, pgp, i) {
433 vector_foreach_slot (cmpp->pg, cpgp, j) {
434 if (pgp->id == cpgp->id &&
435 !pathcmp(pgp, cpgp)) {
447 static struct udev_device *
448 get_udev_for_mpp(const struct multipath *mpp)
451 struct udev_device *udd;
453 if (!mpp || !mpp->dmi) {
454 condlog(1, "%s called with empty mpp", __func__);
458 devnum = makedev(mpp->dmi->major, mpp->dmi->minor);
459 udd = udev_device_new_from_devnum(udev, 'b', devnum);
461 condlog(1, "failed to get udev device for %s", mpp->alias);
467 void trigger_partitions_udev_change(struct udev_device *dev,
468 const char *action, int len)
470 struct udev_enumerate *part_enum;
471 struct udev_list_entry *item;
474 part_enum = udev_enumerate_new(udev);
478 if (udev_enumerate_add_match_parent(part_enum, dev) < 0 ||
479 udev_enumerate_add_match_subsystem(part_enum, "block") < 0 ||
480 udev_enumerate_scan_devices(part_enum) < 0)
483 udev_list_entry_foreach(item,
484 udev_enumerate_get_list_entry(part_enum)) {
486 struct udev_device *part;
488 syspath = udev_list_entry_get_name(item);
489 part = udev_device_new_from_syspath(udev, syspath);
493 devtype = udev_device_get_devtype(part);
494 if (devtype && !strcmp("partition", devtype)) {
495 condlog(4, "%s: triggering %s event for %s", __func__,
497 sysfs_attr_set_value(part, "uevent", action, len);
499 udev_device_unref(part);
502 udev_enumerate_unref(part_enum);
506 trigger_paths_udev_change(struct multipath *mpp, bool is_mpath)
508 struct pathgroup *pgp;
512 * If a path changes from multipath to non-multipath, we must
513 * synthesize an artificial "add" event, otherwise the LVM2 rules
514 * (69-lvm2-lvmetad.rules) won't pick it up. Otherwise, we'd just
515 * irritate ourselves with an "add", so use "change".
517 const char *action = is_mpath ? "change" : "add";
519 if (!mpp || !mpp->pg)
522 vector_foreach_slot (mpp->pg, pgp, i) {
525 vector_foreach_slot(pgp->paths, pp, j) {
531 * Paths that are already classified as multipath
532 * members don't need another uevent.
534 env = udev_device_get_property_value(
535 pp->udev, "DM_MULTIPATH_DEVICE_PATH");
537 if (is_mpath && env != NULL && !strcmp(env, "1")) {
539 * If FIND_MULTIPATHS_WAIT_UNTIL is not "0",
540 * path is in "maybe" state and timer is running
541 * Send uevent now (see multipath.rules).
543 env = udev_device_get_property_value(
544 pp->udev, "FIND_MULTIPATHS_WAIT_UNTIL");
545 if (env == NULL || !strcmp(env, "0"))
547 } else if (!is_mpath &&
548 (env == NULL || !strcmp(env, "0")))
551 condlog(3, "triggering %s uevent for %s (is %smultipath member)",
552 action, pp->dev, is_mpath ? "" : "no ");
553 sysfs_attr_set_value(pp->udev, "uevent",
554 action, strlen(action));
555 trigger_partitions_udev_change(pp->udev, action,
560 mpp->needs_paths_uevent = 0;
564 sysfs_set_max_sectors_kb(struct multipath *mpp, int is_reload)
566 struct pathgroup * pgp;
569 int i, j, ret, err = 0;
570 struct udev_device *udd;
573 if (mpp->max_sectors_kb == MAX_SECTORS_KB_UNDEF)
575 max_sectors_kb = mpp->max_sectors_kb;
577 if (!mpp->dmi && dm_get_info(mpp->alias, &mpp->dmi) != 0) {
578 condlog(1, "failed to get dm info for %s", mpp->alias);
581 udd = get_udev_for_mpp(mpp);
583 condlog(1, "failed to get udev device to set max_sectors_kb for %s", mpp->alias);
586 ret = sysfs_attr_get_value(udd, "queue/max_sectors_kb", buff,
588 udev_device_unref(udd);
590 condlog(1, "failed to get current max_sectors_kb from %s", mpp->alias);
593 if (sscanf(buff, "%u\n", &max_sectors_kb) != 1) {
594 condlog(1, "can't parse current max_sectors_kb from %s",
599 snprintf(buff, 11, "%d", max_sectors_kb);
601 vector_foreach_slot (mpp->pg, pgp, i) {
602 vector_foreach_slot(pgp->paths, pp, j) {
603 ret = sysfs_attr_set_value(pp->udev,
604 "queue/max_sectors_kb",
607 condlog(1, "failed setting max_sectors_kb on %s : %s", pp->dev, strerror(-ret));
615 static bool is_udev_ready(struct multipath *cmpp)
617 struct udev_device *mpp_ud;
622 * MPATH_DEVICE_READY != 1 can mean two things:
623 * (a) no usable paths
624 * (b) device was never fully processed (e.g. udev killed)
625 * If we are in this code path (startup or forced reconfigure),
626 * (b) can mean that upper layers like kpartx have never been
627 * run for this map. Thus force udev reload.
630 mpp_ud = get_udev_for_mpp(cmpp);
633 env = udev_device_get_property_value(mpp_ud, "MPATH_DEVICE_READY");
634 rc = (env != NULL && !strcmp(env, "1"));
635 udev_device_unref(mpp_ud);
636 condlog(4, "%s: %s: \"%s\" -> %d\n", __func__, cmpp->alias, env, rc);
641 select_reload_action(struct multipath *mpp, const char *reason)
643 mpp->action = ACT_RELOAD;
644 condlog(3, "%s: set ACT_RELOAD (%s)", mpp->alias, reason);
647 void select_action (struct multipath *mpp, const struct _vector *curmp,
650 struct multipath * cmpp;
651 struct multipath * cmpp_by_name;
652 char * mpp_feat, * cmpp_feat;
654 cmpp = find_mp_by_wwid(curmp, mpp->wwid);
655 cmpp_by_name = find_mp_by_alias(curmp, mpp->alias);
656 if (mpp->need_reload || (cmpp && cmpp->need_reload))
661 condlog(2, "%s: rename %s to %s", mpp->wwid,
662 cmpp->alias, mpp->alias);
663 strlcpy(mpp->alias_old, cmpp->alias, WWID_SIZE);
664 mpp->action = ACT_RENAME;
666 mpp->force_udev_reload = 1;
667 mpp->action = ACT_FORCERENAME;
671 mpp->action = ACT_CREATE;
672 condlog(3, "%s: set ACT_CREATE (map does not exist)",
678 condlog(1, "%s: can't use alias \"%s\" used by %s, falling back to WWID",
679 mpp->wwid, mpp->alias, cmpp_by_name->wwid);
680 /* We can do this because wwid wasn't found */
682 mpp->alias = strdup(mpp->wwid);
683 mpp->action = ACT_CREATE;
684 condlog(3, "%s: set ACT_CREATE (map does not exist, name changed)",
689 if (cmpp != cmpp_by_name) {
690 condlog(2, "%s: unable to rename %s to %s (%s is used by %s)",
691 mpp->wwid, cmpp->alias, mpp->alias,
692 mpp->alias, cmpp_by_name->wwid);
693 /* reset alias to existing alias */
695 mpp->alias = strdup(cmpp->alias);
696 mpp->action = ACT_IMPOSSIBLE;
701 mpp->force_udev_reload = 1;
702 mpp->action = ACT_RELOAD;
703 condlog(3, "%s: set ACT_RELOAD (forced by user)",
707 if (cmpp->size != mpp->size) {
708 mpp->force_udev_reload = 1;
709 mpp->action = ACT_RESIZE;
710 condlog(3, "%s: set ACT_RESIZE (size change)",
715 if (!is_udev_ready(cmpp) && count_active_paths(mpp) > 0) {
716 mpp->force_udev_reload = 1;
717 mpp->action = ACT_RELOAD;
718 condlog(3, "%s: set ACT_RELOAD (udev incomplete)",
723 if (mpp->no_path_retry != NO_PATH_RETRY_UNDEF &&
724 !!strstr(mpp->features, "queue_if_no_path") !=
725 !!strstr(cmpp->features, "queue_if_no_path")) {
726 select_reload_action(mpp, "no_path_retry change");
729 if ((mpp->retain_hwhandler != RETAIN_HWHANDLER_ON ||
730 strcmp(cmpp->hwhandler, "0") == 0) &&
731 (strlen(cmpp->hwhandler) != strlen(mpp->hwhandler) ||
732 strncmp(cmpp->hwhandler, mpp->hwhandler,
733 strlen(mpp->hwhandler)))) {
734 select_reload_action(mpp, "hwhandler change");
738 if (mpp->retain_hwhandler != RETAIN_HWHANDLER_UNDEF &&
739 !!strstr(mpp->features, "retain_attached_hw_handler") !=
740 !!strstr(cmpp->features, "retain_attached_hw_handler") &&
741 get_linux_version_code() < KERNEL_VERSION(4, 3, 0)) {
742 select_reload_action(mpp, "retain_hwhandler change");
746 cmpp_feat = strdup(cmpp->features);
747 mpp_feat = strdup(mpp->features);
748 if (cmpp_feat && mpp_feat) {
749 remove_feature(&mpp_feat, "queue_if_no_path");
750 remove_feature(&mpp_feat, "retain_attached_hw_handler");
751 remove_feature(&cmpp_feat, "queue_if_no_path");
752 remove_feature(&cmpp_feat, "retain_attached_hw_handler");
753 if (strcmp(mpp_feat, cmpp_feat)) {
754 select_reload_action(mpp, "features change");
763 if (!cmpp->selector || strncmp(cmpp->selector, mpp->selector,
764 strlen(mpp->selector))) {
765 select_reload_action(mpp, "selector change");
768 if (cmpp->minio != mpp->minio) {
769 select_reload_action(mpp, "minio change");
772 if (!cmpp->pg || VECTOR_SIZE(cmpp->pg) != VECTOR_SIZE(mpp->pg)) {
773 select_reload_action(mpp, "path group number change");
776 if (pgcmp(mpp, cmpp)) {
777 select_reload_action(mpp, "path group topology change");
780 if (cmpp->nextpg != mpp->bestpg) {
781 mpp->action = ACT_SWITCHPG;
782 condlog(3, "%s: set ACT_SWITCHPG (next path group change)",
786 mpp->action = ACT_NOTHING;
787 condlog(3, "%s: set ACT_NOTHING (map unchanged)",
792 int reinstate_paths(struct multipath *mpp)
795 struct pathgroup * pgp;
801 vector_foreach_slot (mpp->pg, pgp, i) {
805 vector_foreach_slot (pgp->paths, pp, j) {
806 if (pp->state != PATH_UP &&
807 (pgp->status == PGSTATE_DISABLED ||
808 pgp->status == PGSTATE_ACTIVE))
811 if (pp->dmstate == PSTATE_FAILED) {
812 if (dm_reinstate_path(mpp->alias, pp->dev_t))
813 condlog(0, "%s: error reinstating",
822 lock_multipath (struct multipath * mpp, int lock)
824 struct pathgroup * pgp;
829 if (!mpp || !mpp->pg)
832 vector_foreach_slot (mpp->pg, pgp, i) {
835 vector_foreach_slot(pgp->paths, pp, j) {
836 if (lock && flock(pp->fd, LOCK_SH | LOCK_NB) &&
837 errno == EWOULDBLOCK)
840 flock(pp->fd, LOCK_UN);
845 vector_foreach_slot (mpp->pg, pgp, x) {
850 vector_foreach_slot(pgp->paths, pp, y) {
851 if (x == i && y >= j)
853 flock(pp->fd, LOCK_UN);
859 int domap(struct multipath *mpp, char *params, int is_daemon)
865 * last chance to quit before touching the devmaps
867 if (mpp->action == ACT_DRY_RUN) {
868 print_multipath_topology(mpp, libmp_verbosity);
872 if (mpp->action == ACT_CREATE && dm_map_present(mpp->alias)) {
873 char wwid[WWID_SIZE];
875 if (dm_get_uuid(mpp->alias, wwid, sizeof(wwid)) == 0) {
876 if (!strncmp(mpp->wwid, wwid, sizeof(wwid))) {
877 condlog(3, "%s: map already present",
879 mpp->action = ACT_RELOAD;
881 condlog(0, "%s: map \"%s\" already present with WWID %s, skipping",
882 mpp->wwid, mpp->alias, wwid);
883 condlog(0, "please check alias settings in config and bindings file");
884 mpp->action = ACT_REJECT;
889 switch (mpp->action) {
896 dm_switchgroup(mpp->alias, mpp->bestpg);
898 * we may have avoided reinstating paths because they were in
899 * active or disabled PG. Now that the topology has changed,
902 reinstate_paths(mpp);
906 if (lock_multipath(mpp, 1)) {
907 condlog(3, "%s: failed to create map (in use)",
912 sysfs_set_max_sectors_kb(mpp, 0);
913 if (is_daemon && mpp->ghost_delay > 0 && count_active_paths(mpp) &&
914 pathcount(mpp, PATH_UP) == 0)
915 mpp->ghost_delay_tick = mpp->ghost_delay;
916 r = dm_addmap_create(mpp, params);
918 lock_multipath(mpp, 0);
922 sysfs_set_max_sectors_kb(mpp, 1);
923 if (mpp->ghost_delay_tick > 0 && pathcount(mpp, PATH_UP))
924 mpp->ghost_delay_tick = 0;
925 r = dm_addmap_reload(mpp, params, 0);
929 sysfs_set_max_sectors_kb(mpp, 1);
930 if (mpp->ghost_delay_tick > 0 && pathcount(mpp, PATH_UP))
931 mpp->ghost_delay_tick = 0;
932 r = dm_addmap_reload(mpp, params, 1);
936 conf = get_multipath_config();
937 pthread_cleanup_push(put_multipath_config, conf);
938 r = dm_rename(mpp->alias_old, mpp->alias,
939 conf->partition_delim, mpp->skip_kpartx);
940 pthread_cleanup_pop(1);
943 case ACT_FORCERENAME:
944 conf = get_multipath_config();
945 pthread_cleanup_push(put_multipath_config, conf);
946 r = dm_rename(mpp->alias_old, mpp->alias,
947 conf->partition_delim, mpp->skip_kpartx);
948 pthread_cleanup_pop(1);
950 sysfs_set_max_sectors_kb(mpp, 1);
951 if (mpp->ghost_delay_tick > 0 &&
952 pathcount(mpp, PATH_UP))
953 mpp->ghost_delay_tick = 0;
954 r = dm_addmap_reload(mpp, params, 0);
964 * DM_DEVICE_CREATE, DM_DEVICE_RENAME, or DM_DEVICE_RELOAD
967 mpp->force_udev_reload = 0;
968 if (mpp->action == ACT_CREATE &&
969 (remember_wwid(mpp->wwid) == 1 ||
970 mpp->needs_paths_uevent))
971 trigger_paths_udev_change(mpp, true);
973 /* multipath client mode */
974 dm_switchgroup(mpp->alias, mpp->bestpg);
976 /* multipath daemon mode */
977 mpp->stat_map_loads++;
978 condlog(4, "%s: load table [0 %llu %s %s]", mpp->alias,
979 mpp->size, TGT_MPATH, params);
981 * Required action is over, reset for the stateful daemon.
982 * But don't do it for creation as we use in the caller the
983 * mpp->action to figure out whether to start the waitevent checker.
985 if (mpp->action != ACT_CREATE)
986 mpp->action = ACT_NOTHING;
988 conf = get_multipath_config();
989 mpp->wait_for_udev = 1;
990 mpp->uev_wait_tick = conf->uev_wait_timeout;
991 put_multipath_config(conf);
996 } else if (r == DOMAP_FAIL && mpp->action == ACT_CREATE &&
997 mpp->needs_paths_uevent)
998 trigger_paths_udev_change(mpp, false);
1009 unsigned int timeout;
1010 struct config *conf;
1012 fd = mpath_connect();
1016 if (send_packet(fd, "show daemon") != 0)
1018 conf = get_multipath_config();
1019 timeout = conf->uxsock_timeout;
1020 put_multipath_config(conf);
1021 if (recv_packet(fd, &reply, timeout) != 0)
1024 if (reply && strstr(reply, "shutdown"))
1032 mpath_disconnect(fd);
1037 * The force_reload parameter determines how coalesce_paths treats existing maps.
1038 * FORCE_RELOAD_NONE: existing maps aren't touched at all
1039 * FORCE_RELOAD_YES: all maps are rebuilt from scratch and (re)loaded in DM
1040 * FORCE_RELOAD_WEAK: existing maps are compared to the current conf and only
1041 * reloaded in DM if there's a difference. This is normally sufficient.
1043 int coalesce_paths (struct vectors *vecs, vector mpvec, char *refwwid,
1044 int force_reload, enum mpath_cmds cmd)
1048 int is_daemon = (cmd == CMD_NONE) ? 1 : 0;
1049 char *params __attribute__((cleanup(cleanup_charp))) = NULL;
1050 struct multipath * mpp;
1051 struct path * pp1 = NULL;
1053 vector curmp = vecs->mpvec;
1054 vector pathvec = vecs->pathvec;
1056 struct config *conf = NULL;
1058 struct bitfield *size_mismatch_seen;
1060 /* ignore refwwid if it's empty */
1061 if (refwwid && !strlen(refwwid))
1064 if (force_reload != FORCE_RELOAD_NONE) {
1065 vector_foreach_slot (pathvec, pp1, k) {
1070 if (VECTOR_SIZE(pathvec) == 0)
1072 size_mismatch_seen = alloc_bitfield(VECTOR_SIZE(pathvec));
1073 if (size_mismatch_seen == NULL)
1079 newmp = vector_alloc();
1081 condlog(0, "can not allocate newmp");
1085 vector_foreach_slot (pathvec, pp1, k) {
1088 if (should_exit()) {
1093 /* skip this path for some reason */
1095 /* 1. if path has no unique id or wwid blacklisted */
1096 if (strlen(pp1->wwid) == 0) {
1097 orphan_path(pp1, "no WWID");
1101 conf = get_multipath_config();
1102 pthread_cleanup_push(put_multipath_config, conf);
1103 invalid = (filter_path(conf, pp1) > 0);
1104 pthread_cleanup_pop(1);
1106 orphan_path(pp1, "blacklisted");
1110 /* 2. if path already coalesced, or seen and discarded */
1111 if (pp1->mpp || is_bit_set_in_bitfield(k, size_mismatch_seen))
1114 /* 3. if path has disappeared */
1115 if (pp1->state == PATH_REMOVED) {
1116 orphan_path(pp1, "path removed");
1120 /* 4. path is out of scope */
1121 if (refwwid && strncmp(pp1->wwid, refwwid, WWID_SIZE - 1))
1124 /* If find_multipaths was selected check if the path is valid */
1125 if (!refwwid && !should_multipath(pp1, pathvec, curmp)) {
1126 orphan_path(pp1, "only one path");
1131 * at this point, we know we really got a new mp
1133 mpp = add_map_with_path(vecs, pp1, 0);
1135 orphan_path(pp1, "failed to create multipath device");
1140 condlog(0, "%s: skip coalesce (no paths)", mpp->alias);
1141 remove_map(mpp, vecs->pathvec, NULL);
1145 for (i = k + 1; i < VECTOR_SIZE(pathvec); i++) {
1146 pp2 = VECTOR_SLOT(pathvec, i);
1148 if (strcmp(pp1->wwid, pp2->wwid))
1151 if (!mpp->size && pp2->size)
1152 mpp->size = pp2->size;
1154 if (mpp->size && pp2->size &&
1155 pp2->size != mpp->size) {
1157 * ouch, avoid feeding that to the DM
1159 condlog(0, "%s: size %llu, expected %llu. "
1160 "Discard", pp2->dev, pp2->size,
1162 mpp->action = ACT_REJECT;
1163 set_bit_in_bitfield(i, size_mismatch_seen);
1168 if (setup_map(mpp, ¶ms, vecs)) {
1169 remove_map(mpp, vecs->pathvec, NULL);
1173 if (cmd == CMD_DRY_RUN)
1174 mpp->action = ACT_DRY_RUN;
1175 if (mpp->action == ACT_UNDEF)
1176 select_action(mpp, curmp,
1177 force_reload == FORCE_RELOAD_YES ? 1 : 0);
1179 r = domap(mpp, params, is_daemon);
1183 if (r == DOMAP_FAIL || r == DOMAP_RETRY) {
1184 condlog(3, "%s: domap (%u) failure "
1185 "for create/reload map",
1187 if (r == DOMAP_FAIL || is_daemon) {
1188 condlog(2, "%s: %s map",
1189 mpp->alias, (mpp->action == ACT_CREATE)?
1190 "ignoring" : "removing");
1191 remove_map(mpp, vecs->pathvec, NULL);
1193 } else /* if (r == DOMAP_RETRY && !is_daemon) */ {
1198 if (r == DOMAP_DRY) {
1199 if (!vector_alloc_slot(newmp)) {
1200 remove_map(mpp, vecs->pathvec, NULL);
1203 vector_set_slot(newmp, mpp);
1207 conf = get_multipath_config();
1208 allow_queueing = conf->allow_queueing;
1209 put_multipath_config(conf);
1210 if (!is_daemon && !allow_queueing && !check_daemon()) {
1211 if (mpp->no_path_retry != NO_PATH_RETRY_UNDEF &&
1212 mpp->no_path_retry != NO_PATH_RETRY_FAIL)
1213 condlog(3, "%s: multipathd not running, unset "
1214 "queue_if_no_path feature", mpp->alias);
1215 if (!dm_queue_if_no_path(mpp->alias, 0))
1216 remove_feature(&mpp->features,
1217 "queue_if_no_path");
1220 if (!is_daemon && mpp->action != ACT_NOTHING)
1221 print_multipath_topology(mpp, libmp_verbosity);
1223 if (mpp->action != ACT_REJECT) {
1224 if (!vector_alloc_slot(newmp)) {
1225 remove_map(mpp, vecs->pathvec, NULL);
1228 vector_set_slot(newmp, mpp);
1231 remove_map(mpp, vecs->pathvec, NULL);
1235 free(size_mismatch_seen);
1237 free_multipathvec(newmp, KEEP_PATHS);
1241 struct udev_device *get_udev_device(const char *dev, enum devtypes dev_type)
1243 struct udev_device *ud = NULL;
1246 if (dev == NULL || *dev == '\0')
1252 /* This should be GNU basename, compiler will warn if not */
1253 base = basename(dev);
1256 ud = udev_device_new_from_subsystem_sysname(udev, "block",
1260 ud = udev_device_new_from_devnum(udev, 'b', parse_devt(dev));
1263 ud = udev_device_new_from_environment(udev);
1266 condlog(0, "Internal error: get_udev_device called with invalid type %d\n",
1271 condlog(2, "get_udev_device: failed to look up %s with type %d",
1276 static int _get_refwwid(enum mpath_cmds cmd, const char *dev,
1277 enum devtypes dev_type,
1278 vector pathvec, struct config *conf, char **wwid)
1282 char buff[FILE_NAME_SIZE];
1283 const char *refwwid = NULL;
1284 char tmpwwid[WWID_SIZE];
1285 struct udev_device *udevice;
1286 int flags = DI_SYSFS | DI_WWID;
1289 return PATHINFO_FAILED;
1292 if (dev_type == DEV_NONE)
1293 return PATHINFO_FAILED;
1295 if (cmd != CMD_REMOVE_WWID)
1296 flags |= DI_BLACKLIST;
1300 if (basenamecpy(dev, buff, FILE_NAME_SIZE) == 0) {
1301 condlog(1, "basename failed for '%s' (%s)",
1303 return PATHINFO_FAILED;
1306 /* dev is used in common code below */
1308 pp = find_path_by_dev(pathvec, dev);
1312 pp = find_path_by_devt(pathvec, dev);
1317 /* For condlog below, dev is unused in get_udev_device() */
1318 dev = "environment";
1321 udevice = get_udev_device(dev, dev_type);
1324 condlog(0, "%s: cannot find block device", dev);
1325 return PATHINFO_FAILED;
1328 ret = store_pathinfo(pathvec, conf, udevice,
1330 udev_device_unref(udevice);
1332 if (ret == PATHINFO_FAILED)
1333 condlog(0, "%s: can't store path info",
1338 if (flags & DI_BLACKLIST &&
1339 filter_property(conf, pp->udev, 3, pp->uid_attribute) > 0)
1340 return PATHINFO_SKIPPED;
1345 if (((dm_get_uuid(dev, tmpwwid, WWID_SIZE)) == 0)
1346 && (strlen(tmpwwid)))
1349 /* or may be a binding */
1350 else if (get_user_friendly_wwid(dev, tmpwwid,
1351 conf->bindings_file) == 0)
1354 /* or may be an alias */
1356 refwwid = get_mpe_wwid(conf->mptable, dev);
1358 /* or directly a wwid */
1363 if (flags & DI_BLACKLIST && refwwid && strlen(refwwid) &&
1364 filter_wwid(conf->blist_wwid, conf->elist_wwid, refwwid,
1366 return PATHINFO_SKIPPED;
1372 if (refwwid && strlen(refwwid)) {
1373 *wwid = strdup(refwwid);
1377 return PATHINFO_FAILED;
1381 * Returns: PATHINFO_OK, PATHINFO_FAILED, or PATHINFO_SKIPPED (see pathinfo())
1383 int get_refwwid(enum mpath_cmds cmd, const char *dev, enum devtypes dev_type,
1384 vector pathvec, char **wwid)
1388 struct config *conf = get_multipath_config();
1390 pthread_cleanup_push(put_multipath_config, conf);
1391 ret = _get_refwwid(cmd, dev, dev_type, pathvec, conf, wwid);
1392 pthread_cleanup_pop(1);