2 * Copyright (c) 2004, 2005 Christophe Varoqui
3 * Copyright (c) 2005 Kiyoshi Ueda, NEC
4 * Copyright (c) 2005 Benjamin Marzinski, Redhat
5 * Copyright (c) 2005 Edward Goggin, EMC
9 #include <libdevmapper.h>
12 #include <sys/types.h>
19 #include <sysfs/libsysfs.h>
20 #include <sysfs/dlist.h>
26 #include <path_state.h>
37 #include <blacklist.h>
42 #include <devmapper.h>
44 #include <discovery.h>
48 #include <switchgroup.h>
49 #include <path_state.h>
57 #include "cli_handlers.h"
59 #define FILE_NAME_SIZE 256
62 #define LOG_MSG(a,b) \
64 condlog(a, "%s: %s", pp->dev_t, b); \
65 memset(b, 0, MAX_CHECKER_MSG_SIZE); \
70 fprintf(stderr, "%s:%s(%i) lock %p\n", __FILE__, __FUNCTION__, __LINE__, a); \
73 fprintf(stderr, "%s:%s(%i) unlock %p\n", __FILE__, __FUNCTION__, __LINE__, a); \
74 pthread_mutex_unlock(a)
75 #define lock_cleanup_pop(a) \
76 fprintf(stderr, "%s:%s(%i) unlock %p\n", __FILE__, __FUNCTION__, __LINE__, a); \
77 pthread_cleanup_pop(1);
/*
 * Plain locking wrappers: direct aliases for the pthread mutex calls.
 * lock_cleanup_pop() ignores its argument and pops the current cleanup
 * handler with execute=1; note that its expansion already ends in ';'.
 * NOTE(review): presumably the non-tracing alternative to the
 * fprintf-instrumented variants defined just above -- the preprocessor
 * conditionals selecting between them are not part of this excerpt.
 */
79 #define lock(a) pthread_mutex_lock(a)
80 #define unlock(a) pthread_mutex_unlock(a)
81 #define lock_cleanup_pop(a) pthread_cleanup_pop(1);
/*
 * Shutdown rendezvous: exit_daemon() signals exit_cond and child()
 * blocks on it with exit_mutex.
 */
84 pthread_cond_t exit_cond = PTHREAD_COND_INITIALIZER;
85 pthread_mutex_t exit_mutex = PTHREAD_MUTEX_INITIALIZER;
/*
 * Signature of the callback that remove_map()/remove_maps() accept to
 * stop the event waiter thread of a map.
 */
87 typedef void (stop_waiter_thread_func) (struct multipath *, struct vectors *);
96 char mapname[WWID_SIZE];
100 static struct event_thread *
104 struct event_thread * wp;
106 wp = (struct event_thread *)MALLOC(sizeof(struct event_thread));
/*
 * Thread cleanup handler installed by waitevent() through
 * pthread_cleanup_push(): destroys the device-mapper task held by the
 * waiter.
 *   data: the struct event_thread, passed as an opaque pointer.
 * NOTE(review): this excerpt omits lines of the function, so any further
 * teardown of the waiter is not visible here.
 */
112 free_waiter (void * data)
114 struct event_thread * wp = (struct event_thread *)data;
117 dm_task_destroy(wp->dmt);
/*
 * Stops the event waiter thread attached to a map by sending it SIGHUP
 * with pthread_kill().
 *   mpp:  map whose ->waiter field holds the struct event_thread.
 *   vecs: not referenced by the statements visible here.
 * A "no waiter thread" message is logged at level 3; the condition
 * guarding it (presumably wp == NULL) is not part of this excerpt.
 */
122 stop_waiter_thread (struct multipath * mpp, struct vectors * vecs)
124 struct event_thread * wp = (struct event_thread *)mpp->waiter;
127 condlog(3, "%s: no waiter thread", mpp->alias);
130 condlog(2, "%s: stop event checker thread", wp->mapname);
131 pthread_kill((pthread_t)wp->thread, SIGHUP);
/*
 * pthread cleanup handler: unlocks the mutex passed as data.
 *   data: a pthread_mutex_t *, passed as an opaque pointer.
 */
135 cleanup_lock (void * data)
137 pthread_mutex_unlock((pthread_mutex_t *)data);
/*
 * Scans vecs->pathvec for paths whose wwid equals mpp->wwid (compared
 * over at most WWID_SIZE bytes) and logs "ownership set" for each match.
 * NOTE(review): the statement that actually binds the path to the map
 * is not part of this excerpt.
 */
141 adopt_paths (struct vectors * vecs, struct multipath * mpp)
149 vector_foreach_slot (vecs->pathvec, pp, i) {
150 if (!strncmp(mpp->wwid, pp->wwid, WWID_SIZE)) {
151 condlog(4, "%s ownership set", pp->dev_t);
/*
 * Resets per-map state on a path: DM state back to PSTATE_UNDEF, checker
 * context cleared, priority-getter selection flag cleared.
 * NOTE(review): further field resets may sit on lines omitted from this
 * excerpt.
 */
158 orphan_path (struct path * pp)
162 pp->dmstate = PSTATE_UNDEF;
163 pp->checker_context = NULL;
166 pp->getprio_selected = 0;
/*
 * Walks vecs->pathvec and, for every path currently owned by mpp, logs
 * that it is orphaned.
 * NOTE(review): the call that performs the orphaning is not part of this
 * excerpt.
 */
175 orphan_paths (struct vectors * vecs, struct multipath * mpp)
180 vector_foreach_slot (vecs->pathvec, pp, i) {
181 if (pp->mpp == mpp) {
182 condlog(4, "%s is orphaned", pp->dev_t);
/*
 * Refreshes the table description of a map: reads size and parameter
 * string with dm_get_map() into mpp->size / mpp->params, then parses the
 * parameters with disassemble_map().
 * NOTE(review): the values returned on each failure branch are on lines
 * omitted from this excerpt; callers treat non-zero as failure.
 */
189 update_multipath_table (struct multipath *mpp, vector pathvec)
194 if (dm_get_map(mpp->alias, &mpp->size, mpp->params))
197 if (disassemble_map(pathvec, mpp->params, mpp))
/*
 * Refreshes the runtime status of a map: reads the status string with
 * dm_get_status() into mpp->status, then parses it with
 * disassemble_status().
 * NOTE(review): return statements are not part of this excerpt; callers
 * treat non-zero as failure.
 */
204 update_multipath_status (struct multipath *mpp)
209 if(dm_get_status(mpp->alias, mpp->status))
212 if (disassemble_status(mpp->status, mpp))
/*
 * Rebuilds the map from device-mapper: frees the map attributes and its
 * path-group vector (KEEP_PATHS), then reloads table and status through
 * update_multipath_table() and update_multipath_status().
 * NOTE(review): return statements are not part of this excerpt; callers
 * treat non-zero as failure.
 */
219 update_multipath_strings (struct multipath *mpp, vector pathvec)
221 free_multipath_attributes(mpp);
222 free_pgvec(mpp->pg, KEEP_PATHS);
225 if (update_multipath_table(mpp, pathvec))
228 if (update_multipath_status(mpp))
/*
 * Fills mpp->wwid from the device-mapper UUID of the map named
 * mpp->alias.
 * NOTE(review): any precondition checked before the call is on lines
 * omitted from this excerpt.
 */
235 set_multipath_wwid (struct multipath * mpp)
240 dm_get_uuid(mpp->alias, mpp->wwid);
244 * mpp->no_path_retry:
245 * -2 (QUEUE) : queue_if_no_path enabled, never turned off
246 * -1 (FAIL) : fail_if_no_path
247 * 0 (UNDEF) : nothing
248 * >0 : queue_if_no_path enabled, turned off after polling n times
/*
 * Accounts for one active path lost on a map: pre-decrements
 * mpp->nr_active and, when that reaches zero with a positive
 * no_path_retry, arms mpp->retry_tick to
 * no_path_retry * conf->checkint + 1 and logs entry into recovery mode.
 * The remaining active path count is logged at level 2.
 */
251 update_queue_mode_del_path(struct multipath *mpp)
253 if (--mpp->nr_active == 0 && mpp->no_path_retry > 0) {
256 * meaning of +1: retry_tick may be decremented in
257 * checkerloop before starting retry.
259 mpp->retry_tick = mpp->no_path_retry * conf->checkint + 1;
260 condlog(1, "%s: Entering recovery mode: max_retries=%d",
261 mpp->alias, mpp->no_path_retry);
263 condlog(2, "%s: remaining active paths: %d", mpp->alias, mpp->nr_active);
/*
 * Accounts for one path becoming active on a map: post-increments
 * mpp->nr_active and, when the count was zero with a positive
 * no_path_retry, re-enables queue_if_no_path via
 * dm_queue_if_no_path(alias, 1) and logs the return to normal mode.
 * NOTE(review): one line between the inner comment and the
 * dm_queue_if_no_path() call is omitted from this excerpt.
 */
267 update_queue_mode_add_path(struct multipath *mpp)
269 if (mpp->nr_active++ == 0 && mpp->no_path_retry > 0) {
270 /* come back to normal mode from retry mode */
272 dm_queue_if_no_path(mpp->alias, 1);
273 condlog(2, "%s: queue_if_no_path enabled", mpp->alias);
274 condlog(1, "%s: Recovered to normal mode", mpp->alias);
276 condlog(2, "%s: remaining active paths: %d", mpp->alias, mpp->nr_active);
/*
 * Recomputes mpp->nr_active as the number of PATH_UP paths, selects the
 * no_path_retry policy, and applies it to the kernel map:
 *   NO_PATH_RETRY_FAIL  -> queueing disabled (dm_queue_if_no_path 0)
 *   NO_PATH_RETRY_QUEUE -> queueing enabled  (dm_queue_if_no_path 1)
 *   remaining case (presumably the default label, i.e. a positive retry
 *   count -- the label is not part of this excerpt) -> queueing enabled
 *   and, if no path is active, retry_tick armed to
 *   no_path_retry * conf->checkint.
 * Unlike update_queue_mode_del_path(), no "+ 1" is added to retry_tick
 * here.
 */
280 set_no_path_retry(struct multipath *mpp)
283 mpp->nr_active = pathcount(mpp, PATH_UP);
284 select_no_path_retry(mpp);
286 switch (mpp->no_path_retry) {
287 case NO_PATH_RETRY_UNDEF:
289 case NO_PATH_RETRY_FAIL:
290 dm_queue_if_no_path(mpp->alias, 0);
292 case NO_PATH_RETRY_QUEUE:
293 dm_queue_if_no_path(mpp->alias, 1);
296 dm_queue_if_no_path(mpp->alias, 1);
297 if (mpp->nr_active == 0) {
298 /* Enter retry mode */
299 mpp->retry_tick = mpp->no_path_retry * conf->checkint;
300 condlog(1, "%s: Entering recovery mode: max_retries=%d",
301 mpp->alias, mpp->no_path_retry);
/*
 * Derives the hardware entry for a map from its first path: takes slot 0
 * of mpp->pg, then slot 0 of that group's paths.
 * NOTE(review): the NULL guards and the return statement are on lines
 * omitted from this excerpt; callers store the result in mpp->hwe.
 */
307 static struct hwentry *
308 extract_hwe_from_path(struct multipath * mpp)
311 struct pathgroup * pgp;
313 pgp = VECTOR_SLOT(mpp->pg, 0);
314 pp = VECTOR_SLOT(pgp->paths, 0);
/*
 * Tears down one map: stops its event waiter through the supplied
 * callback, orphans the paths it owned, removes it from vecs->mpvec when
 * found there, and frees it with KEEP_PATHS.
 *   stop_waiter: callback used to stop the waiter thread.
 *   purge_vec:   NOTE(review) presumably gates the removal from
 *                vecs->mpvec; the first half of that condition is not
 *                part of this excerpt.
 */
320 remove_map (struct multipath * mpp, struct vectors * vecs,
321 stop_waiter_thread_func *stop_waiter, int purge_vec)
326 * stop the DM event waiter thread
329 stop_waiter(mpp, vecs);
332 * clear references to this map
334 orphan_paths(vecs, mpp);
337 (i = find_slot(vecs->mpvec, (void *)mpp)) != -1)
338 vector_del_slot(vecs->mpvec, i);
343 free_multipath(mpp, KEEP_PATHS);
/*
 * Removes every map in vecs->mpvec through remove_map() (purge_vec = 1)
 * and then frees the vector itself.
 * NOTE(review): remove_map() deletes slots from the vector being
 * iterated; any index adjustment inside the loop is on lines omitted
 * from this excerpt -- verify against the full source.
 */
347 remove_maps (struct vectors * vecs,
348 stop_waiter_thread_func *stop_waiter)
351 struct multipath * mpp;
353 vector_foreach_slot (vecs->mpvec, mpp, i) {
354 remove_map(mpp, vecs, stop_waiter, 1);
358 vector_free(vecs->mpvec);
/*
 * Populates a map structure from device-mapper: fetches DM info, sets
 * the wwid, looks up the matching config entry, reloads table/status
 * strings, adopts matching paths, and selects hardware entry, failback
 * and no_path_retry policies.
 * On failure it logs "failed to setup multipath" and removes the map
 * with remove_map(), so the caller must not use mpp afterwards (callers
 * in this file note "mpp freed in setup_multipath").
 * NOTE(review): labels and return statements are not part of this
 * excerpt; callers treat non-zero as failure.
 */
363 setup_multipath (struct vectors * vecs, struct multipath * mpp)
365 if (dm_get_info(mpp->alias, &mpp->dmi))
368 set_multipath_wwid(mpp);
369 mpp->mpe = find_mpe(mpp->wwid);
370 condlog(4, "discovered map %s", mpp->alias);
372 if (update_multipath_strings(mpp, vecs->pathvec))
375 adopt_paths(vecs, mpp);
376 mpp->hwe = extract_hwe_from_path(mpp);
377 select_pgfailback(mpp);
378 set_no_path_retry(mpp);
382 condlog(0, "%s: failed to setup multipath", mpp->alias);
383 remove_map(mpp, vecs, stop_waiter_thread, 1);
/*
 * Decides whether the map should move to another path group.
 * Bails out for a NULL map or manual failback. Re-reads the priority of
 * every path (DI_PRIO), stores the best group in mpp->bestpg and
 * compares it with mpp->nextpg.
 *   refresh: NOTE(review) presumably gates the priority refresh loop;
 *            the condition is on a line omitted from this excerpt.
 * NOTE(review): return values are not part of this excerpt; callers
 * treat non-zero as "switch needed".
 */
388 need_switch_pathgroup (struct multipath * mpp, int refresh)
390 struct pathgroup * pgp;
394 if (!mpp || mpp->pgfailback == -FAILBACK_MANUAL)
398 * Refresh path priority values
401 vector_foreach_slot (mpp->pg, pgp, i)
402 vector_foreach_slot (pgp->paths, pp, j)
403 pathinfo(pp, conf->hwtable, DI_PRIO);
405 mpp->bestpg = select_path_group(mpp);
407 if (mpp->bestpg != mpp->nextpg)
/*
 * Asks device-mapper to switch the map to path group mpp->bestpg and
 * logs the switch at level 2.
 */
414 switch_pathgroup (struct multipath * mpp)
416 dm_switchgroup(mpp->alias, mpp->bestpg);
417 condlog(2, "%s: switch to path group #%i",
418 mpp->alias, mpp->bestpg);
/*
 * Re-synchronises the in-memory map named mapname with device-mapper
 * after an event: looks the map up by alias, drops its path groups,
 * rebuilds it with setup_multipath(), then reconciles checker state with
 * DM state. A path that DM reports as PSTATE_FAILED but whose checker
 * state is not PATH_DOWN is marked PATH_DOWN, the queue mode accounting
 * is updated, and its next check is pulled in to at most conf->checkint
 * ticks.
 * NOTE(review): the handling of a map that is not found and the return
 * statements are on lines omitted from this excerpt; waiteventloop()
 * uses the return value.
 */
422 update_multipath (struct vectors *vecs, char *mapname)
424 struct multipath *mpp;
425 struct pathgroup *pgp;
430 mpp = find_mp_by_alias(vecs->mpvec, mapname);
435 free_pgvec(mpp->pg, KEEP_PATHS);
438 if (setup_multipath(vecs, mpp))
439 goto out; /* mpp freed in setup_multipath */
442 * compare checkers states with DM states
444 vector_foreach_slot (mpp->pg, pgp, i) {
445 vector_foreach_slot (pgp->paths, pp, j) {
446 if (pp->dmstate != PSTATE_FAILED)
449 if (pp->state != PATH_DOWN) {
450 condlog(2, "%s: mark as failed", pp->dev_t);
451 pp->state = PATH_DOWN;
452 update_queue_mode_del_path(mpp);
456 * schedule the next check earlier
458 if (pp->tick > conf->checkint)
459 pp->tick = conf->checkint;
466 condlog(0, "failed to update multipath");
/*
 * Unblocks SIGHUP for the calling thread with pthread_sigmask().
 * The previous mask is captured in 'old'; waiteventloop() restores the
 * value this function returns with SIG_SETMASK.
 * NOTE(review): the set initialisation and the return statement are on
 * lines omitted from this excerpt.
 */
471 static sigset_t unblock_sighup(void)
476 sigaddset(&set, SIGHUP);
477 pthread_sigmask(SIG_UNBLOCK, &set, &old);
482 * returns the reschedule delay
483 * negative means *stop*
/*
 * One wait-for-event round on the map waiter->mapname.
 * Builds a DM_DEVICE_WAITEVENT task for the map (destroying it again if
 * naming or event-number setup fails), unblocks SIGHUP so the blocking
 * dm_task_run() can be interrupted, then restores the saved signal mask.
 * After an event it refreshes the map with update_multipath() while
 * holding waiter->vecs->lock (released through the cleanup handler),
 * and compares the new DM event number with the stored one.
 * Visible return values: -1 to stop the thread, 1 to reschedule one
 * second later when the event number did not change.
 * NOTE(review): several branches and returns are on lines omitted from
 * this excerpt.
 */
486 waiteventloop (struct event_thread * waiter)
492 if (!waiter->event_nr)
493 waiter->event_nr = dm_geteventnr(waiter->mapname);
495 if (!(waiter->dmt = dm_task_create(DM_DEVICE_WAITEVENT)))
498 if (!dm_task_set_name(waiter->dmt, waiter->mapname)) {
499 dm_task_destroy(waiter->dmt);
503 if (waiter->event_nr && !dm_task_set_event_nr(waiter->dmt,
505 dm_task_destroy(waiter->dmt);
509 dm_task_no_open_count(waiter->dmt);
511 /* accept wait interruption */
512 set = unblock_sighup();
514 /* interruption spits messages */
518 r = dm_task_run(waiter->dmt);
520 /* wait is over : event or interrupt */
521 pthread_sigmask(SIG_SETMASK, &set, NULL);
524 if (!r) /* wait interrupted by signal */
527 dm_task_destroy(waiter->dmt);
535 condlog(3, "%s: devmap event #%i",
536 waiter->mapname, waiter->event_nr);
541 * 1) a table reload, which means our mpp structure is
542 * obsolete : refresh it through update_multipath()
543 * 2) a path failed by DM : mark as such through
545 * 3) map has gone away : stop the thread.
546 * 4) a path reinstate : nothing to do
547 * 5) a switch group : nothing to do
549 pthread_cleanup_push(cleanup_lock, waiter->vecs->lock);
550 lock(waiter->vecs->lock);
551 r = update_multipath(waiter->vecs, waiter->mapname);
552 lock_cleanup_pop(waiter->vecs->lock);
555 return -1; /* stop the thread */
557 event_nr = dm_geteventnr(waiter->mapname);
559 if (waiter->event_nr == event_nr)
560 return 1; /* upon problem reschedule 1s later */
562 waiter->event_nr = event_nr;
564 return -1; /* never reach there */
/*
 * Entry point of a per-map event waiter thread.
 *   et: the struct event_thread for this waiter.
 * Locks current and future pages in memory, registers free_waiter() as
 * cleanup handler, and drives waiteventloop(); the handler is run when
 * popped (execute = 1).
 * NOTE(review): the loop around waiteventloop() and the handling of its
 * return value are on lines omitted from this excerpt.
 */
568 waitevent (void * et)
571 struct event_thread *waiter;
573 mlockall(MCL_CURRENT | MCL_FUTURE);
575 waiter = (struct event_thread *)et;
576 pthread_cleanup_push(free_waiter, et);
579 r = waiteventloop(waiter);
587 pthread_cleanup_pop(1);
592 start_waiter_thread (struct multipath * mpp, struct vectors * vecs)
595 struct event_thread * wp;
600 if (pthread_attr_init(&attr))
603 pthread_attr_setstacksize(&attr, 32 * 1024);
604 pthread_attr_setdetachstate(&attr, PTHREAD_CREATE_DETACHED);
611 mpp->waiter = (void *)wp;
612 strncpy(wp->mapname, mpp->alias, WWID_SIZE);
615 if (pthread_create(&wp->thread, &attr, waitevent, wp)) {
616 condlog(0, "%s: cannot create event checker", wp->mapname);
619 condlog(2, "%s: event checker started", wp->mapname);
626 condlog(0, "failed to start waiter thread");
/*
 * Handles an "add" uevent for a device-mapper device.
 *   devname: either a "dm-<minor>" kernel name, which is resolved to the
 *            map name through sysfs and dm_mapname(), or a map alias
 *            used as is (duplicated with STRDUP).
 *   vecs:    shared path/map vectors.
 * Non-multipath maps are ignored. A map already registered under the
 * same alias is removed first. A fresh multipath structure is then
 * allocated, set up from device-mapper, stored in vecs->mpvec, bound to
 * its paths, and given an event waiter thread. On failure the map is
 * removed again.
 * NOTE(review): alias ownership/freeing, the alias assignment on mpp and
 * the return statements are on lines omitted from this excerpt.
 */
631 uev_add_map (char * devname, struct vectors * vecs)
634 char dev_t[BLK_DEV_SIZE];
636 struct multipath * mpp;
638 if (sscanf(devname, "dm-%d", &minor) == 1 &&
639 !sysfs_get_dev(sysfs_path, devname, dev_t, BLK_DEV_SIZE) &&
640 sscanf(dev_t, "%d:%d", &major, &minor) == 2)
641 alias = dm_mapname(major, minor);
643 alias = STRDUP(devname);
648 if (!dm_type(alias, DEFAULT_TARGET)) {
649 condlog(4, "%s: not a multipath map", alias);
654 mpp = find_mp_by_alias(vecs->mpvec, alias);
658 * this should not happen,
659 * we missed a remove map event (not sent ?)
661 condlog(2, "%s: already registered", alias);
662 remove_map(mpp, vecs, stop_waiter_thread, 1);
666 * now we can allocate
668 mpp = alloc_multipath();
675 if (setup_multipath(vecs, mpp))
676 return 1; /* mpp freed in setup_multipath */
678 if (!vector_alloc_slot(vecs->mpvec))
681 vector_set_slot(vecs->mpvec, mpp);
682 adopt_paths(vecs, mpp);
684 if (start_waiter_thread(mpp, vecs))
689 condlog(2, "%s: add devmap failed", mpp->alias);
690 remove_map(mpp, vecs, stop_waiter_thread, 1);
/*
 * Handles a "remove" uevent for a device-mapper device.
 *   devname: "dm-<minor>" (looked up by minor) or a map alias (looked up
 *            by alias).
 * An unregistered map is only logged; a registered one is removed with
 * remove_map(), which also stops its waiter thread.
 * NOTE(review): the not-found test and the return statements are on
 * lines omitted from this excerpt.
 */
695 uev_remove_map (char * devname, struct vectors * vecs)
698 struct multipath * mpp;
700 if (sscanf(devname, "dm-%d", &minor) == 1)
701 mpp = find_mp_by_minor(vecs->mpvec, minor);
703 mpp = find_mp_by_alias(vecs->mpvec, devname);
706 condlog(3, "%s: devmap not registered, can't remove",
711 condlog(2, "remove %s devmap", mpp->alias);
712 remove_map(mpp, vecs, stop_waiter_thread, 1);
/*
 * Handles an "add" uevent for a path device.
 *   devname: kernel name of the block device.
 *   vecs:    shared path/map vectors.
 * A device already present in vecs->pathvec is only logged. Otherwise
 * its info (DI_SYSFS | DI_WWID) is stored in the path vector and the
 * path is attached to the map with the same wwid, if there is one.
 * Fix: the "already in pathvec" message has a %s conversion, so devname
 * is now passed for it (the call previously supplied no argument).
 * NOTE(review): the guards around these statements and the return
 * statements are on lines omitted from this excerpt.
 */
718 uev_add_path (char * devname, struct vectors * vecs)
722 pp = find_path_by_dev(vecs->pathvec, devname);
725 condlog(3, "%s: already in pathvec", devname);
728 pp = store_pathinfo(vecs->pathvec, conf->hwtable,
729 devname, DI_SYSFS | DI_WWID);
732 condlog(0, "%s: failed to store path info", devname);
736 condlog(2, "%s: path checker registered", devname);
737 pp->mpp = find_mp_by_wwid(vecs->mpvec, pp->wwid);
740 condlog(4, "%s: ownership set to %s",
741 pp->dev_t, pp->mpp->alias);
743 condlog(4, "%s: orphaned", pp->dev_t);
/*
 * Handles a "remove" uevent for a path device.
 *   devname: kernel name of the block device.
 *   vecs:    shared path/map vectors.
 * An unknown device is only logged. For a known path that is PATH_UP and
 * owned by a map, the map's active-path accounting is updated before the
 * path is deleted from vecs->pathvec.
 * Fix: the "not in pathvec" message has a %s conversion, so devname is
 * now passed for it (the call previously supplied no argument).
 * NOTE(review): the not-found test, freeing of the path and the return
 * statements are on lines omitted from this excerpt.
 */
751 uev_remove_path (char * devname, struct vectors * vecs)
756 pp = find_path_by_dev(vecs->pathvec, devname);
759 condlog(3, "%s: not in pathvec", devname);
763 if (pp->mpp && pp->state == PATH_UP)
764 update_queue_mode_del_path(pp->mpp);
766 condlog(2, "remove %s path checker", devname);
767 i = find_slot(vecs->pathvec, (void *)pp);
768 vector_del_slot(vecs->pathvec, i);
/*
 * Formats the list of paths into a freshly allocated text reply.
 *   r, len: output parameters; *len is set to the formatted length plus
 *           one. The assignment to *r is on a line omitted from this
 *           excerpt.
 * Starts with INITIAL_REPLY_LEN bytes; when the output ends exactly at
 * maxlen - 1 it is treated as truncated ("again") and the buffer is
 * doubled with REALLOC.
 * NOTE(review): REALLOC's result overwrites 'reply' directly; whether a
 * failed reallocation is handled is not visible in this excerpt.
 */
775 show_paths (char ** r, int * len, struct vectors * vecs)
781 int maxlen = INITIAL_REPLY_LEN;
784 get_path_layout(vecs->pathvec);
785 reply = MALLOC(maxlen);
793 if (VECTOR_SIZE(vecs->pathvec) > 0)
794 c += snprint_path_header(c, reply + maxlen - c,
797 vector_foreach_slot(vecs->pathvec, pp, i)
798 c += snprint_path(c, reply + maxlen - c,
799 PRINT_PATH_CHECKER, pp);
801 again = ((c - reply) == (maxlen - 1));
804 reply = REALLOC(reply, maxlen *= 2);
808 *len = (int)(c - reply + 1);
/*
 * Formats the list of maps into a freshly allocated text reply; same
 * scheme as show_paths().
 *   r, len: output parameters; *len is set to the formatted length plus
 *           one. The assignment to *r is on a line omitted from this
 *           excerpt.
 * Starts with INITIAL_REPLY_LEN bytes; when the output ends exactly at
 * maxlen - 1 it is treated as truncated ("again") and the buffer is
 * doubled with REALLOC.
 * NOTE(review): REALLOC's result overwrites 'reply' directly; whether a
 * failed reallocation is handled is not visible in this excerpt.
 */
813 show_maps (char ** r, int *len, struct vectors * vecs)
816 struct multipath * mpp;
819 int maxlen = INITIAL_REPLY_LEN;
822 get_map_layout(vecs->mpvec);
823 reply = MALLOC(maxlen);
830 if (VECTOR_SIZE(vecs->mpvec) > 0)
831 c += snprint_map_header(c, reply + maxlen - c,
834 vector_foreach_slot(vecs->mpvec, mpp, i)
835 c += snprint_map(c, reply + maxlen - c,
836 PRINT_MAP_FAILBACK, mpp);
838 again = ((c - reply) == (maxlen - 1));
841 reply = REALLOC(reply, maxlen *= 2);
844 *len = (int)(c - reply + 1);
/*
 * Produces a raw binary dump of the path vector: *len is set to
 * (number of paths) * sizeof(struct path) and each struct path is
 * memcpy'd back to back into a buffer of that size.
 * Per the trailing comment, the function returns a negative value so the
 * caller does not append "ok" to the dump.
 * NOTE(review): the allocation check, the assignment to *r and the
 * return statement are on lines omitted from this excerpt.
 */
849 dump_pathvec (char ** r, int * len, struct vectors * vecs)
856 *len = VECTOR_SIZE(vecs->pathvec) * sizeof(struct path);
857 reply = (char *)MALLOC(*len);
865 vector_foreach_slot (vecs->pathvec, pp, i) {
866 memcpy((void *)p, pp, sizeof(struct path));
867 p += sizeof(struct path);
870 /* return negative to hint caller not to add "ok" to the dump */
/*
 * Initial map discovery: loads all "multipath" device-mapper maps into
 * vecs->mpvec, sets each one up with setup_multipath(), and starts an
 * event waiter thread for it.
 * NOTE(review): the action taken when setup_multipath() fails and the
 * return statements are on lines omitted from this excerpt; the return
 * value of start_waiter_thread() is not checked here.
 */
875 map_discovery (struct vectors * vecs)
878 struct multipath * mpp;
880 if (dm_get_maps(vecs->mpvec, "multipath"))
883 vector_foreach_slot (vecs->mpvec, mpp, i) {
884 if (setup_multipath(vecs, mpp))
886 start_waiter_thread(mpp, vecs);
/*
 * Reloads DEFAULT_CONFIGFILE and re-applies it to the known maps.
 * If loading fails, the daemon logs that it continues with the old
 * configuration. Otherwise the previous verbosity is carried over, and
 * for every map the config entry, hardware entry, owned paths and
 * no_path_retry policy are re-evaluated.
 * NOTE(review): restoring/freeing of the old config, the body of the
 * per-path loop and the return statements are on lines omitted from
 * this excerpt.
 */
893 reconfigure (struct vectors * vecs)
895 struct config * old = conf;
896 struct multipath * mpp;
902 if (load_config(DEFAULT_CONFIGFILE)) {
904 condlog(2, "reconfigure failed, continue with old config");
907 conf->verbosity = old->verbosity;
910 vector_foreach_slot (vecs->mpvec, mpp, i) {
911 mpp->mpe = find_mpe(mpp->wwid);
912 mpp->hwe = extract_hwe_from_path(mpp);
913 adopt_paths(vecs, mpp);
914 set_no_path_retry(mpp);
916 vector_foreach_slot (vecs->pathvec, pp, i) {
921 condlog(2, "reconfigured");
/*
 * Callback for one command received on the unix socket.
 *   str:          command text, handed to parse_cmd().
 *   reply, len:   output buffer and its length (including the NUL).
 *   trigger_data: the shared struct vectors.
 * Runs with the vectors lock cleanup handler installed. A "fail\n" reply
 * is produced on one branch (its condition is on a line omitted from
 * this excerpt); "ok\n" is produced when parse_cmd() returned 0 and left
 * *len at 0. A negative result leaves *reply untouched.
 */
926 uxsock_trigger (char * str, char ** reply, int * len, void * trigger_data)
928 struct vectors * vecs;
933 vecs = (struct vectors *)trigger_data;
935 pthread_cleanup_push(cleanup_lock, vecs->lock);
938 r = parse_cmd(str, reply, len, vecs);
941 *reply = STRDUP("fail\n");
942 *len = strlen(*reply) + 1;
945 else if (!r && *len == 0) {
946 *reply = STRDUP("ok\n");
947 *len = strlen(*reply) + 1;
950 /* else if (r < 0) leave *reply alone */
952 lock_cleanup_pop(vecs->lock);
/*
 * Filters uevents by devpath: an event is discarded (and logged at
 * level 4) unless the path has the form "/block/<name>" with no further
 * component, i.e. partitions and non-block devices are dropped.
 * NOTE(review): "%10s" / "%10[^/]" store up to 10 characters plus a
 * terminating NUL, so 'a' and 'b' must each hold at least 11 bytes;
 * their declarations are not part of this excerpt -- confirm.
 */
957 uev_discard(char * devpath)
962 * keep only block devices, discard partitions
964 if (sscanf(devpath, "/block/%10s", a) != 1 ||
965 sscanf(devpath, "/block/%10[^/]/%10s", a, b) == 2) {
966 condlog(4, "discard event on %s", devpath);
/*
 * Callback for one kernel uevent.
 *   uev:          the event (devpath and action are used).
 *   trigger_data: the shared struct vectors.
 * Events rejected by uev_discard() are ignored. Devices named "dm-*" are
 * dispatched to uev_add_map()/uev_remove_map(); any other device that
 * passes the blacklist() test is dispatched to
 * uev_add_path()/uev_remove_path(). Actions are matched by prefix
 * ("add", "remove").
 * NOTE(review): locking, the branch taken on each test and the return
 * statements are on lines omitted from this excerpt.
 */
973 uev_trigger (struct uevent * uev, void * trigger_data)
977 struct vectors * vecs;
979 vecs = (struct vectors *)trigger_data;
981 if (uev_discard(uev->devpath))
984 basename(uev->devpath, devname);
988 * device map add/remove event
990 if (!strncmp(devname, "dm-", 3)) {
991 if (!strncmp(uev->action, "add", 3)) {
992 r = uev_add_map(devname, vecs);
996 if (!strncmp(uev->action, "remove", 6)) {
997 r = uev_remove_map(devname, vecs);
1005 * path add/remove event
1007 if (blacklist(conf->blist, devname))
1010 if (!strncmp(uev->action, "add", 3)) {
1011 r = uev_add_path(devname, vecs);
1014 if (!strncmp(uev->action, "remove", 6)) {
1015 r = uev_remove_path(devname, vecs);
/*
 * Thread body of the uevent listener: hands uev_trigger() and ap to
 * uevent_listen() and reports on stderr if the listener fails to start.
 * Note that the error message carries no trailing newline.
 */
1025 ueventloop (void * ap)
1027 if (uevent_listen(&uev_trigger, ap))
1028 fprintf(stderr, "error starting uevent listener");
/*
 * Thread body of the unix socket listener: allocates the handler table,
 * registers one CLI handler per command key combination, then serves
 * requests through uxsock_listen() with uxsock_trigger() as callback.
 * NOTE(review): the action taken when alloc_handlers() fails and the
 * return statement are on lines omitted from this excerpt.
 */
1034 uxlsnrloop (void * ap)
1039 if (alloc_handlers())
1042 add_handler(LIST+PATHS, cli_list_paths);
1043 add_handler(LIST+MAPS, cli_list_maps);
1044 add_handler(ADD+PATH, cli_add_path);
1045 add_handler(DEL+PATH, cli_del_path);
1046 add_handler(ADD+MAP, cli_add_map);
1047 add_handler(DEL+MAP, cli_del_map);
1048 add_handler(SWITCH+MAP+GROUP, cli_switch_group);
1049 add_handler(DUMP+PATHVEC, cli_dump_pathvec);
1050 add_handler(RECONFIGURE, cli_reconfigure);
1051 add_handler(SUSPEND+MAP, cli_suspend);
1052 add_handler(RESUME+MAP, cli_resume);
1053 add_handler(REINSTATE+PATH, cli_reinstate);
1054 add_handler(FAIL+PATH, cli_fail);
1056 uxsock_listen(&uxsock_trigger, ap);
/*
 * Initiates daemon shutdown: removes the pid file and signals exit_cond
 * so that child(), which waits on it, can proceed with teardown.
 *   status: exit status; a "bad exit status" note is printed on stderr
 *           on a branch whose condition is on a line omitted from this
 *           excerpt (presumably a non-zero status).
 * NOTE(review): the matching lock(&exit_mutex) and the return statement
 * are not part of this excerpt.
 */
1062 exit_daemon (int status)
1065 fprintf(stderr, "bad exit status. see daemon.log\n");
1067 condlog(3, "unlink pidfile");
1068 unlink(DEFAULT_PIDFILE);
1071 pthread_cond_signal(&exit_cond);
1072 unlock(&exit_mutex);
/*
 * Marks a path as failed in device-mapper on behalf of the checker and
 * updates the owning map's active-path accounting.
 * pp->mpp is dereferenced here.
 * NOTE(review): any guard on pp->mpp is on lines omitted from this
 * excerpt.
 */
1078 fail_path (struct path * pp)
1083 condlog(2, "checker failed path %s in map %s",
1084 pp->dev_t, pp->mpp->alias);
1086 dm_fail_path(pp->mpp->alias, pp->dev_t);
1087 update_queue_mode_del_path(pp->mpp);
1091 * caller must have locked the path list before calling that function
/*
 * Reinstates a path in device-mapper. A non-zero result from
 * dm_reinstate_path() is logged as a failure; the success message and
 * the active-path accounting update follow.
 * NOTE(review): the 'else' keyword/braces tying the last two statements
 * to the success branch, and any guard on pp->mpp, are on lines omitted
 * from this excerpt.
 */
1094 reinstate_path (struct path * pp)
1099 if (dm_reinstate_path(pp->mpp->alias, pp->dev_t))
1100 condlog(0, "%s: reinstate failed", pp->dev_t);
1102 condlog(2, "%s: reinstated", pp->dev_t);
1103 update_queue_mode_add_path(pp->mpp);
/*
 * Re-enables the path group that contains pp when device-mapper has it
 * marked PGSTATE_DISABLED.
 * pp->pgindex is 1-based (slot pgindex - 1 is used); a value of 0 means
 * "not set yet", in which case the function returns early, as it does
 * when the map has no path-group vector.
 */
1108 enable_group(struct path * pp)
1110 struct pathgroup * pgp;
1113 * if path is added through uev_add_path, pgindex can be unset.
1114 * next update_strings() will set it, upon map reload event.
1116 * we can safely return here, because upon map reload, all
1117 * PG will be enabled.
1119 if (!pp->mpp->pg || !pp->pgindex)
1122 pgp = VECTOR_SLOT(pp->mpp->pg, pp->pgindex - 1);
1124 if (pgp->status == PGSTATE_DISABLED) {
1125 condlog(2, "%s: enable group #%i", pp->mpp->alias, pp->pgindex);
1126 dm_enablegroup(pp->mpp->alias, pp->pgindex);
/*
 * Removes from vecs->mpvec every map that device-mapper no longer knows
 * about (dm_map_present() is false for its alias).
 * NOTE(review): remove_map() deletes the slot from the vector being
 * iterated; any index adjustment after the removal is on lines omitted
 * from this excerpt -- verify against the full source.
 */
1131 mpvec_garbage_collector (struct vectors * vecs)
1133 struct multipath * mpp;
1136 vector_foreach_slot (vecs->mpvec, mpp, i) {
1137 if (mpp && mpp->alias && !dm_map_present(mpp->alias)) {
1138 condlog(2, "%s: remove dead map", mpp->alias);
1139 remove_map(mpp, vecs, stop_waiter_thread, 1);
/*
 * Advances the deferred-failback countdown of every map: for maps with a
 * positive pgfailback and a running failback_tick, the tick is
 * decremented and, once it reaches zero, the path group is switched if
 * need_switch_pathgroup() (with priority refresh) says so.
 */
1146 defered_failback_tick (vector mpvec)
1148 struct multipath * mpp;
1151 vector_foreach_slot (mpvec, mpp, i) {
1153 * defered failback getting sooner
1155 if (mpp->pgfailback > 0 && mpp->failback_tick > 0) {
1156 mpp->failback_tick--;
1158 if (!mpp->failback_tick && need_switch_pathgroup(mpp, 1))
1159 switch_pathgroup(mpp);
/*
 * Advances the no-path retry countdown of every map: while retry_tick is
 * non-zero it is decremented, and when it reaches zero queueing is
 * turned off with dm_queue_if_no_path(alias, 0).
 */
1165 retry_count_tick(vector mpvec)
1167 struct multipath *mpp;
1170 vector_foreach_slot (mpvec, mpp, i) {
1171 if (mpp->retry_tick) {
1172 condlog(4, "%s: Retrying.. No active path", mpp->alias);
1173 if(--mpp->retry_tick == 0) {
1174 dm_queue_if_no_path(mpp->alias, 0);
1175 condlog(2, "%s: Disable queueing", mpp->alias);
/*
 * Thread body of the path checker.
 *   ap: the shared struct vectors.
 * Locks memory, zeroes the checker message buffer and initialises every
 * path's check interval to conf->checkint. Then, with the vectors lock
 * cleanup handler installed, it walks vecs->pathvec:
 *   - a path whose tick countdown has not expired is skipped;
 *   - otherwise the next check is provisioned at conf->checkint and the
 *     path's checker function is called;
 *   - on a state change the new state is stored, the checker message is
 *     logged, the interval is reset to conf->checkint, and failback is
 *     either scheduled (pgfailback > 0) or done immediately
 *     (FAILBACK_IMMEDIATE) when a group switch is needed;
 *   - on an unchanged PATH_UP/PATH_GHOST state the interval is doubled,
 *     capped at conf->max_checkint, and the next check is delayed
 *     accordingly;
 *   - path priority is refreshed and a needed group switch is scheduled
 *     or performed.
 * After the walk, deferred-failback and retry countdowns are advanced
 * and dead maps are garbage collected.
 * NOTE(review): this excerpt omits many lines (the outer loop, locking,
 * the fail/reinstate/enable_group calls that the inline comments refer
 * to, several conditions and braces); the summary above covers only what
 * the visible statements establish.
 */
1182 checkerloop (void *ap)
1184 struct vectors *vecs;
1188 char checker_msg[MAX_CHECKER_MSG_SIZE];
1190 mlockall(MCL_CURRENT | MCL_FUTURE);
1192 memset(checker_msg, 0, MAX_CHECKER_MSG_SIZE);
1193 vecs = (struct vectors *)ap;
1195 condlog(2, "path checkers start up");
1198 * init the path check interval
1200 vector_foreach_slot (vecs->pathvec, pp, i) {
1201 pp->checkint = conf->checkint;
1205 pthread_cleanup_push(cleanup_lock, vecs->lock);
1209 vector_foreach_slot (vecs->pathvec, pp, i) {
1213 if (pp->tick && --pp->tick)
1214 continue; /* don't check this path yet */
1217 * provision a next check soonest,
1218 * in case we exit abnormaly from here
1220 pp->tick = conf->checkint;
1223 pathinfo(pp, conf->hwtable, DI_SYSFS);
1228 condlog(0, "%s: checkfn is void", pp->dev);
1231 newstate = pp->checkfn(pp->fd, checker_msg,
1232 &pp->checker_context);
1235 condlog(2, "%s: unusable path", pp->dev);
1236 pathinfo(pp, conf->hwtable, 0);
1240 if (newstate != pp->state) {
1241 pp->state = newstate;
1242 LOG_MSG(1, checker_msg);
1245 * upon state change, reset the checkint
1246 * to the shortest delay
1248 pp->checkint = conf->checkint;
1250 if (newstate == PATH_DOWN ||
1251 newstate == PATH_SHAKY ||
1252 update_multipath_strings(pp->mpp,
1255 * proactively fail path in the DM
1260 * cancel scheduled failback
1262 pp->mpp->failback_tick = 0;
1268 * reinstate this path
1273 * schedule [defered] failback
1275 if (pp->mpp->pgfailback > 0)
1276 pp->mpp->failback_tick =
1277 pp->mpp->pgfailback + 1;
1278 else if (pp->mpp->pgfailback == -FAILBACK_IMMEDIATE &&
1279 need_switch_pathgroup(pp->mpp, 1))
1280 switch_pathgroup(pp->mpp);
1283 * if at least one path is up in a group, and
1284 * the group is disabled, re-enable it
1286 if (newstate == PATH_UP)
1289 else if (newstate == PATH_UP || newstate == PATH_GHOST) {
1290 LOG_MSG(4, checker_msg);
1292 * double the next check delay.
1293 * max at conf->max_checkint
1295 if (pp->checkint < (conf->max_checkint / 2))
1296 pp->checkint = 2 * pp->checkint;
1298 pp->checkint = conf->max_checkint;
1300 pp->tick = pp->checkint;
1301 condlog(4, "%s: delay next check %is",
1302 pp->dev_t, pp->tick);
1305 pp->state = newstate;
1308 * path prio refreshing
1310 condlog(4, "path prio refresh");
1311 pathinfo(pp, conf->hwtable, DI_PRIO);
1313 if (need_switch_pathgroup(pp->mpp, 0)) {
1314 if (pp->mpp->pgfailback > 0)
1315 pp->mpp->failback_tick =
1316 pp->mpp->pgfailback + 1;
1317 else if (pp->mpp->pgfailback ==
1318 -FAILBACK_IMMEDIATE)
1319 switch_pathgroup(pp->mpp);
1322 defered_failback_tick(vecs->mpvec);
1323 retry_count_tick(vecs->mpvec);
1328 condlog(4, "map garbage collection");
1329 mpvec_garbage_collector(vecs);
1333 lock_cleanup_pop(vecs->lock);
1339 static struct vectors *
1342 struct vectors * vecs;
1344 vecs = (struct vectors *)MALLOC(sizeof(struct vectors));
1350 (pthread_mutex_t *)MALLOC(sizeof(pthread_mutex_t));
1355 vecs->pathvec = vector_alloc();
1360 vecs->mpvec = vector_alloc();
1365 pthread_mutex_init(vecs->lock, NULL);
1370 vector_free(vecs->pathvec);
1375 condlog(0, "failed to init paths");
/*
 * Installs func as the handler for signo through sigaction(), with an
 * empty additional signal mask, and returns the previously installed
 * handler.
 * NOTE(review): the sa_flags assignment and the handling of a failed
 * sigaction() (variable r) are on lines omitted from this excerpt.
 */
1380 signal_set(int signo, void (*func) (int))
1383 struct sigaction sig;
1384 struct sigaction osig;
1386 sig.sa_handler = func;
1387 sigemptyset(&sig.sa_mask);
1390 r = sigaction(signo, &sig, &osig);
1395 return (osig.sa_handler);
1401 condlog(3, "SIGHUP received");
1404 dbg_free_final(NULL);
/*
 * Handler registration: SIGHUP goes to sighup(), SIGINT and SIGTERM go
 * to sigend().
 * The former registration for SIGKILL has been dropped: SIGKILL can be
 * neither caught nor ignored, so sigaction() always rejected it and the
 * call had no effect.
 */
1417 signal_set(SIGHUP, sighup);
1418 signal_set(SIGINT, sigend);
1419 signal_set(SIGTERM, sigend);
1427 static struct sched_param sched_param = {
1431 res = sched_setscheduler (0, SCHED_RR, &sched_param);
1434 condlog(LOG_WARNING, "Could not set SCHED_RR at priority 99");
/*
 * Writes val, formatted as a decimal integer, to /proc/self/oom_adj.
 * NOTE(review): the fopen() failure check and the fclose() are on lines
 * omitted from this excerpt.
 */
1439 set_oom_adj (int val)
1443 fp = fopen("/proc/self/oom_adj", "w");
1448 fprintf(fp, "%i", val);
/*
 * Main body of the daemon process.
 *   param: not referenced by the statements visible here.
 * Start-up: locks memory, loads DEFAULT_CONFIGFILE, sets the syslog mask
 * from conf->verbosity, falls back to CHECKINT / MAX_CHECKINT when the
 * config leaves checkint at 0, creates the pid file, locates sysfs, and
 * runs initial path and map discovery.
 * Run: starts three detached threads with 64 KiB stacks (checkerloop,
 * ueventloop, uxlsnrloop) and blocks on exit_cond until exit_daemon()
 * signals it.
 * Shutdown: removes all maps, frees the path vector, cancels the three
 * threads, frees the CLI handlers and destroys the vectors lock.
 * NOTE(review): error branches, allocation of vecs, locking of
 * exit_mutex / vecs->lock and the return statements are on lines omitted
 * from this excerpt. The return values of pthread_create() are not
 * checked in the visible calls.
 */
1453 child (void * param)
1455 pthread_t check_thr, uevent_thr, uxlsnr_thr;
1456 pthread_attr_t attr;
1457 struct vectors * vecs;
1459 mlockall(MCL_CURRENT | MCL_FUTURE);
1464 condlog(2, "--------start up--------");
1465 condlog(2, "read " DEFAULT_CONFIGFILE);
1467 if (load_config(DEFAULT_CONFIGFILE))
1470 setlogmask(LOG_UPTO(conf->verbosity + 3));
1473 * fill the voids left in the config file
1475 if (!conf->checkint) {
1476 conf->checkint = CHECKINT;
1477 conf->max_checkint = MAX_CHECKINT;
1480 if (pidfile_create(DEFAULT_PIDFILE, getpid())) {
1494 if (sysfs_get_mnt_path(sysfs_path, FILE_NAME_SIZE)) {
1495 condlog(0, "can not find sysfs mount point");
1500 * fetch paths and multipaths lists
1501 * no paths and/or no multipaths are valid scenarii
1502 * vectors maintenance will be driven by events
1504 path_discovery(vecs->pathvec, conf, DI_SYSFS | DI_WWID | DI_CHECKER);
1505 map_discovery(vecs);
1510 pthread_attr_init(&attr);
1511 pthread_attr_setstacksize(&attr, 64 * 1024);
1512 pthread_attr_setdetachstate(&attr, PTHREAD_CREATE_DETACHED);
1514 pthread_create(&check_thr, &attr, checkerloop, vecs);
1515 pthread_create(&uevent_thr, &attr, ueventloop, vecs);
1516 pthread_create(&uxlsnr_thr, &attr, uxlsnrloop, vecs);
1518 pthread_cond_wait(&exit_cond, &exit_mutex);
1524 remove_maps(vecs, stop_waiter_thread);
1525 free_pathvec(vecs->pathvec, FREE_PATHS);
1527 pthread_cancel(check_thr);
1528 pthread_cancel(uevent_thr);
1529 pthread_cancel(uxlsnr_thr);
1533 free_handlers(handlers);
1538 pthread_mutex_destroy(vecs->lock);
1546 condlog(2, "--------shut down-------");
1555 dbg_free_final(NULL);
1567 if( (pid = fork()) < 0){
1568 fprintf(stderr, "Failed first fork : %s\n", strerror(errno));
1576 if ( (pid = fork()) < 0)
1577 fprintf(stderr, "Failed second fork : %s\n", strerror(errno));
1581 in_fd = open("/dev/null", O_RDONLY);
1583 fprintf(stderr, "cannot open /dev/null for input : %s\n",
1587 out_fd = open("/dev/console", O_WRONLY);
1589 fprintf(stderr, "cannot open /dev/console for output : %s\n",
1594 close(STDIN_FILENO);
1596 close(STDOUT_FILENO);
1598 close(STDERR_FILENO);
/*
 * Program entry point: requires root, tightens the umask (adds 022 to
 * the current mask), allocates the configuration, parses the command
 * line (":dv:k::") and finally runs child().
 * Verbosity option check: the previous first clause,
 * sizeof(optarg) > sizeof(char *), compared a pointer's size with itself
 * and was always false; it is replaced by a NULL guard. The character
 * passed to isdigit() is converted to unsigned char, as <ctype.h>
 * requires for values that may be negative.
 * NOTE(review): the switch/case labels, the daemonising step and the
 * error exits are on lines omitted from this excerpt.
 */
1609 main (int argc, char *argv[])
1611 extern char *optarg;
1618 if (getuid() != 0) {
1619 fprintf(stderr, "need to be root\n");
1623 /* make sure we don't lock any path */
1625 umask(umask(077) | 022);
1627 conf = alloc_config();
1632 while ((arg = getopt(argc, argv, ":dv:k::")) != EOF ) {
1636 //debug=1; /* ### comment me out ### */
1639 if (optarg == NULL ||
1640 !isdigit((unsigned char)optarg[0]))
1643 conf->verbosity = atoi(optarg);
1666 return (child(NULL));