Lines Matching +full:1 +full:br +full:- +full:100

1 // SPDX-License-Identifier: GPL-2.0-or-later
85 static u64 dlm_mig_cookie = 1;
93 dlm_mig_cookie = 1; in dlm_get_next_mig_cookie()
103 assert_spin_locked(&dlm->spinlock); in dlm_set_reco_dead_node()
104 if (dlm->reco.dead_node != dead_node) in dlm_set_reco_dead_node()
106 dlm->name, dlm->reco.dead_node, dead_node); in dlm_set_reco_dead_node()
107 dlm->reco.dead_node = dead_node; in dlm_set_reco_dead_node()
113 assert_spin_locked(&dlm->spinlock); in dlm_set_reco_master()
115 dlm->name, dlm->reco.new_master, master); in dlm_set_reco_master()
116 dlm->reco.new_master = master; in dlm_set_reco_master()
121 assert_spin_locked(&dlm->spinlock); in __dlm_reset_recovery()
122 clear_bit(dlm->reco.dead_node, dlm->recovery_map); in __dlm_reset_recovery()
137 spin_lock(&dlm->work_lock); in dlm_dispatch_work()
138 list_splice_init(&dlm->work_list, &tmp_list); in dlm_dispatch_work()
139 spin_unlock(&dlm->work_lock); in dlm_dispatch_work()
144 mlog(0, "%s: work thread has %d work items\n", dlm->name, tot); in dlm_dispatch_work()
147 workfunc = item->func; in dlm_dispatch_work()
148 list_del_init(&item->list); in dlm_dispatch_work()
151 * it disappear. just double-check. */ in dlm_dispatch_work()
152 BUG_ON(item->dlm != dlm); in dlm_dispatch_work()
156 workfunc(item, item->data); in dlm_dispatch_work()
171 * 1) sleeping with no recovery happening in dlm_kick_recovery_thread()
175 wake_up(&dlm->dlm_reco_thread_wq); in dlm_kick_recovery_thread()
183 dlm->dlm_reco_thread_task = kthread_run(dlm_recovery_thread, dlm, in dlm_launch_recovery_thread()
184 "dlm_reco-%s", dlm->name); in dlm_launch_recovery_thread()
185 if (IS_ERR(dlm->dlm_reco_thread_task)) { in dlm_launch_recovery_thread()
186 mlog_errno(PTR_ERR(dlm->dlm_reco_thread_task)); in dlm_launch_recovery_thread()
187 dlm->dlm_reco_thread_task = NULL; in dlm_launch_recovery_thread()
188 return -EINVAL; in dlm_launch_recovery_thread()
196 if (dlm->dlm_reco_thread_task) { in dlm_complete_recovery_thread()
198 kthread_stop(dlm->dlm_reco_thread_task); in dlm_complete_recovery_thread()
199 dlm->dlm_reco_thread_task = NULL; in dlm_complete_recovery_thread()
207 * 1) all recovery threads cluster wide will work on recovering
234 dlm->name, task_pid_nr(dlm->dlm_reco_thread_task), in dlm_print_reco_node_status()
235 dlm->reco.state & DLM_RECO_STATE_ACTIVE ? "ACTIVE" : "inactive", in dlm_print_reco_node_status()
236 dlm->reco.dead_node, dlm->reco.new_master); in dlm_print_reco_node_status()
238 list_for_each_entry(ndata, &dlm->reco.node_data, list) { in dlm_print_reco_node_status()
240 switch (ndata->state) { in dlm_print_reco_node_status()
260 st = "finalize-sent"; in dlm_print_reco_node_status()
267 dlm->name, ndata->node_num, st); in dlm_print_reco_node_status()
269 list_for_each_entry(res, &dlm->reco.resources, recovering) { in dlm_print_reco_node_status()
271 dlm->name, res->lockname.len, res->lockname.name); in dlm_print_reco_node_status()
283 mlog(0, "dlm thread running for %s...\n", dlm->name); in dlm_recovery_thread()
288 if (status == -EAGAIN) { in dlm_recovery_thread()
296 wait_event_interruptible_timeout(dlm->dlm_reco_thread_wq, in dlm_recovery_thread()
309 spin_lock(&dlm->spinlock); in dlm_reco_master_ready()
310 ready = (dlm->reco.new_master != O2NM_INVALID_NODE_NUM); in dlm_reco_master_ready()
311 spin_unlock(&dlm->spinlock); in dlm_reco_master_ready()
320 spin_lock(&dlm->spinlock); in dlm_is_node_dead()
321 dead = !test_bit(node, dlm->domain_map); in dlm_is_node_dead()
322 spin_unlock(&dlm->spinlock); in dlm_is_node_dead()
331 spin_lock(&dlm->spinlock); in dlm_is_node_recovered()
332 recovered = !test_bit(node, dlm->recovery_map); in dlm_is_node_recovered()
333 spin_unlock(&dlm->spinlock); in dlm_is_node_recovered()
344 "domain %s\n", node, dlm->name); in dlm_wait_for_node_death()
347 wait_event_timeout(dlm->dlm_reco_thread_wq, in dlm_wait_for_node_death()
351 wait_event(dlm->dlm_reco_thread_wq, in dlm_wait_for_node_death()
361 "domain %s\n", node, dlm->name); in dlm_wait_for_node_recovery()
364 wait_event_timeout(dlm->dlm_reco_thread_wq, in dlm_wait_for_node_recovery()
368 wait_event(dlm->dlm_reco_thread_wq, in dlm_wait_for_node_recovery()
372 /* callers of the top-level api calls (dlmlock/dlmunlock) should
373 * block on the dlm->reco.event when recovery is in progress.
381 spin_lock(&dlm->spinlock); in dlm_in_recovery()
382 in_recovery = !!(dlm->reco.state & DLM_RECO_STATE_ACTIVE); in dlm_in_recovery()
383 spin_unlock(&dlm->spinlock); in dlm_in_recovery()
393 dlm->name, task_pid_nr(dlm->dlm_reco_thread_task), in dlm_wait_for_recovery()
394 dlm->reco.state, dlm->reco.new_master, in dlm_wait_for_recovery()
395 dlm->reco.dead_node); in dlm_wait_for_recovery()
397 wait_event(dlm->reco.event, !dlm_in_recovery(dlm)); in dlm_wait_for_recovery()
402 assert_spin_locked(&dlm->spinlock); in dlm_begin_recovery()
403 BUG_ON(dlm->reco.state & DLM_RECO_STATE_ACTIVE); in dlm_begin_recovery()
405 dlm->name, dlm->reco.dead_node); in dlm_begin_recovery()
406 dlm->reco.state |= DLM_RECO_STATE_ACTIVE; in dlm_begin_recovery()
411 spin_lock(&dlm->spinlock); in dlm_end_recovery()
412 BUG_ON(!(dlm->reco.state & DLM_RECO_STATE_ACTIVE)); in dlm_end_recovery()
413 dlm->reco.state &= ~DLM_RECO_STATE_ACTIVE; in dlm_end_recovery()
414 spin_unlock(&dlm->spinlock); in dlm_end_recovery()
415 printk(KERN_NOTICE "o2dlm: End recovery on domain %s\n", dlm->name); in dlm_end_recovery()
416 wake_up(&dlm->reco.event); in dlm_end_recovery()
422 "dead node %u in domain %s\n", dlm->reco.new_master, in dlm_print_recovery_master()
423 (dlm->node_num == dlm->reco.new_master ? "me" : "he"), in dlm_print_recovery_master()
424 dlm->reco.dead_node, dlm->name); in dlm_print_recovery_master()
432 spin_lock(&dlm->spinlock); in dlm_do_recovery()
434 if (dlm->migrate_done) { in dlm_do_recovery()
436 "lock resources\n", dlm->name); in dlm_do_recovery()
437 spin_unlock(&dlm->spinlock); in dlm_do_recovery()
442 if (dlm->reco.new_master != O2NM_INVALID_NODE_NUM && in dlm_do_recovery()
443 test_bit(dlm->reco.new_master, dlm->recovery_map)) { in dlm_do_recovery()
445 dlm->reco.new_master, dlm->reco.dead_node); in dlm_do_recovery()
451 if (dlm->reco.dead_node == O2NM_INVALID_NODE_NUM) { in dlm_do_recovery()
454 bit = find_first_bit(dlm->recovery_map, O2NM_MAX_NODES); in dlm_do_recovery()
459 } else if (!test_bit(dlm->reco.dead_node, dlm->recovery_map)) { in dlm_do_recovery()
462 dlm->reco.dead_node); in dlm_do_recovery()
466 if (dlm->reco.dead_node == O2NM_INVALID_NODE_NUM) { in dlm_do_recovery()
468 spin_unlock(&dlm->spinlock); in dlm_do_recovery()
473 dlm->name, task_pid_nr(dlm->dlm_reco_thread_task), in dlm_do_recovery()
474 dlm->reco.dead_node); in dlm_do_recovery()
480 spin_unlock(&dlm->spinlock); in dlm_do_recovery()
482 if (dlm->reco.new_master == dlm->node_num) in dlm_do_recovery()
485 if (dlm->reco.new_master == O2NM_INVALID_NODE_NUM) { in dlm_do_recovery()
487 * is the master, -EEXIST if it's another node. in dlm_do_recovery()
502 * have been marked as in-recovery */ in dlm_do_recovery()
511 status = dlm_remaster_locks(dlm, dlm->reco.dead_node); in dlm_do_recovery()
515 "retrying.\n", dlm->name, status, dlm->reco.dead_node); in dlm_do_recovery()
518 msleep(100); in dlm_do_recovery()
522 dlm->name, dlm->reco.dead_node, dlm->node_num); in dlm_do_recovery()
523 spin_lock(&dlm->spinlock); in dlm_do_recovery()
525 dlm->reco.state &= ~DLM_RECO_STATE_FINALIZE; in dlm_do_recovery()
526 spin_unlock(&dlm->spinlock); in dlm_do_recovery()
531 return -EAGAIN; in dlm_do_recovery()
548 "retrying\n", dlm->name); in dlm_remaster_locks()
555 list_for_each_entry(ndata, &dlm->reco.node_data, list) { in dlm_remaster_locks()
556 BUG_ON(ndata->state != DLM_RECO_NODE_DATA_INIT); in dlm_remaster_locks()
557 ndata->state = DLM_RECO_NODE_DATA_REQUESTING; in dlm_remaster_locks()
559 mlog(0, "%s: Requesting lock info from node %u\n", dlm->name, in dlm_remaster_locks()
560 ndata->node_num); in dlm_remaster_locks()
562 if (ndata->node_num == dlm->node_num) { in dlm_remaster_locks()
563 ndata->state = DLM_RECO_NODE_DATA_DONE; in dlm_remaster_locks()
568 status = dlm_request_all_locks(dlm, ndata->node_num, in dlm_remaster_locks()
575 ndata->state = DLM_RECO_NODE_DATA_DEAD; in dlm_remaster_locks()
578 wait_event_timeout(dlm->dlm_reco_thread_wq, in dlm_remaster_locks()
580 ndata->node_num), in dlm_remaster_locks()
582 mlog(0, "waited 1 sec for %u, " in dlm_remaster_locks()
583 "dead? %s\n", ndata->node_num, in dlm_remaster_locks()
584 str_yes_no(dlm_is_node_dead(dlm, ndata->node_num))); in dlm_remaster_locks()
586 /* -ENOMEM on the other node */ in dlm_remaster_locks()
590 dlm->name, ndata->node_num, in dlm_remaster_locks()
592 msleep(100); in dlm_remaster_locks()
598 switch (ndata->state) { in dlm_remaster_locks()
607 ndata->node_num, dead_node); in dlm_remaster_locks()
612 ndata->state = DLM_RECO_NODE_DATA_REQUESTED; in dlm_remaster_locks()
615 ndata->node_num, dead_node); in dlm_remaster_locks()
620 ndata->node_num, dead_node); in dlm_remaster_locks()
625 ndata->node_num, dead_node); in dlm_remaster_locks()
631 mlog(0, "%s: Done requesting all lock info\n", dlm->name); in dlm_remaster_locks()
636 while (1) { in dlm_remaster_locks()
639 all_nodes_done = 1; in dlm_remaster_locks()
641 list_for_each_entry(ndata, &dlm->reco.node_data, list) { in dlm_remaster_locks()
643 ndata->node_num); in dlm_remaster_locks()
644 switch (ndata->state) { in dlm_remaster_locks()
649 ndata->node_num, ndata->state); in dlm_remaster_locks()
655 "node %u\n", ndata->node_num, in dlm_remaster_locks()
661 dlm->name, ndata->node_num, in dlm_remaster_locks()
662 ndata->state==DLM_RECO_NODE_DATA_RECEIVING ? in dlm_remaster_locks()
668 dlm->name, ndata->node_num); in dlm_remaster_locks()
672 dlm->name, ndata->node_num); in dlm_remaster_locks()
687 spin_lock(&dlm->spinlock); in dlm_remaster_locks()
688 dlm->reco.state |= DLM_RECO_STATE_FINALIZE; in dlm_remaster_locks()
689 spin_unlock(&dlm->spinlock); in dlm_remaster_locks()
699 spin_lock(&dlm->spinlock); in dlm_remaster_locks()
701 dlm->node_num); in dlm_remaster_locks()
702 spin_unlock(&dlm->spinlock); in dlm_remaster_locks()
706 "dead=%u, this=%u, new=%u\n", dlm->name, in dlm_remaster_locks()
707 jiffies, dlm->reco.dead_node, in dlm_remaster_locks()
708 dlm->node_num, dlm->reco.new_master); in dlm_remaster_locks()
709 destroy = 1; in dlm_remaster_locks()
717 wait_event_interruptible_timeout(dlm->dlm_reco_thread_wq, in dlm_remaster_locks()
734 spin_lock(&dlm->spinlock); in dlm_init_recovery_area()
735 bitmap_copy(dlm->reco.node_map, dlm->domain_map, O2NM_MAX_NODES); in dlm_init_recovery_area()
738 spin_unlock(&dlm->spinlock); in dlm_init_recovery_area()
740 while (1) { in dlm_init_recovery_area()
741 num = find_next_bit (dlm->reco.node_map, O2NM_MAX_NODES, num); in dlm_init_recovery_area()
750 return -ENOMEM; in dlm_init_recovery_area()
752 ndata->node_num = num; in dlm_init_recovery_area()
753 ndata->state = DLM_RECO_NODE_DATA_INIT; in dlm_init_recovery_area()
755 list_add_tail(&ndata->list, &dlm->reco.node_data); in dlm_init_recovery_area()
769 list_splice_init(&dlm->reco.node_data, &tmplist); in dlm_destroy_recovery_area()
773 list_del_init(&ndata->list); in dlm_destroy_recovery_area()
792 lr.node_idx = dlm->node_num; in dlm_request_all_locks()
796 ret = o2net_send_message(DLM_LOCK_REQUEST_MSG, dlm->key, in dlm_request_all_locks()
802 "to recover dead node %u\n", dlm->name, ret, in dlm_request_all_locks()
816 struct dlm_lock_request *lr = (struct dlm_lock_request *)msg->buf; in dlm_request_all_locks_handler()
821 return -EINVAL; in dlm_request_all_locks_handler()
823 if (lr->dead_node != dlm->reco.dead_node) { in dlm_request_all_locks_handler()
825 "dead_node is %u\n", dlm->name, lr->node_idx, in dlm_request_all_locks_handler()
826 lr->dead_node, dlm->reco.dead_node); in dlm_request_all_locks_handler()
830 return -ENOMEM; in dlm_request_all_locks_handler()
832 BUG_ON(lr->dead_node != dlm->reco.dead_node); in dlm_request_all_locks_handler()
837 return -ENOMEM; in dlm_request_all_locks_handler()
845 return -ENOMEM; in dlm_request_all_locks_handler()
851 item->u.ral.reco_master = lr->node_idx; in dlm_request_all_locks_handler()
852 item->u.ral.dead_node = lr->dead_node; in dlm_request_all_locks_handler()
853 spin_lock(&dlm->work_lock); in dlm_request_all_locks_handler()
854 list_add_tail(&item->list, &dlm->work_list); in dlm_request_all_locks_handler()
855 spin_unlock(&dlm->work_lock); in dlm_request_all_locks_handler()
856 queue_work(dlm->dlm_worker, &dlm->dispatched_work); in dlm_request_all_locks_handler()
872 dlm = item->dlm; in dlm_request_all_locks_worker()
873 dead_node = item->u.ral.dead_node; in dlm_request_all_locks_worker()
874 reco_master = item->u.ral.reco_master; in dlm_request_all_locks_worker()
878 dlm->name, dead_node, reco_master); in dlm_request_all_locks_worker()
880 if (dead_node != dlm->reco.dead_node || in dlm_request_all_locks_worker()
881 reco_master != dlm->reco.new_master) { in dlm_request_all_locks_worker()
884 if (dlm->reco.new_master == O2NM_INVALID_NODE_NUM) { in dlm_request_all_locks_worker()
887 " current=(dead=%u,mas=%u)\n", dlm->name, in dlm_request_all_locks_worker()
889 dlm->reco.dead_node, dlm->reco.new_master); in dlm_request_all_locks_worker()
893 dlm->name, dlm->reco.dead_node, in dlm_request_all_locks_worker()
894 dlm->reco.new_master, dead_node, reco_master); in dlm_request_all_locks_worker()
900 * dlm->reco.resources list. now move items from that list in dlm_request_all_locks_worker()
916 "recovery state for dead node %u, ret=%d\n", dlm->name, in dlm_request_all_locks_worker()
918 skip_all_done = 1; in dlm_request_all_locks_worker()
924 spin_lock(&dlm->spinlock); in dlm_request_all_locks_worker()
925 list_splice_init(&resources, &dlm->reco.resources); in dlm_request_all_locks_worker()
926 spin_unlock(&dlm->spinlock); in dlm_request_all_locks_worker()
932 "recovery all-done for dead node %u, ret=%d\n", in dlm_request_all_locks_worker()
933 dlm->name, reco_master, dead_node, ret); in dlm_request_all_locks_worker()
947 done_msg.node_idx = dlm->node_num; in dlm_send_all_done_msg()
953 ret = o2net_send_message(DLM_RECO_DATA_DONE_MSG, dlm->key, &done_msg, in dlm_send_all_done_msg()
957 "to recover dead node %u\n", dlm->name, ret, send_to, in dlm_send_all_done_msg()
972 struct dlm_reco_data_done *done = (struct dlm_reco_data_done *)msg->buf; in dlm_reco_data_done_handler()
974 int ret = -EINVAL; in dlm_reco_data_done_handler()
977 return -EINVAL; in dlm_reco_data_done_handler()
980 "node_idx=%u, this node=%u\n", done->dead_node, in dlm_reco_data_done_handler()
981 dlm->reco.dead_node, done->node_idx, dlm->node_num); in dlm_reco_data_done_handler()
983 mlog_bug_on_msg((done->dead_node != dlm->reco.dead_node), in dlm_reco_data_done_handler()
985 "node_idx=%u, this node=%u\n", done->dead_node, in dlm_reco_data_done_handler()
986 dlm->reco.dead_node, done->node_idx, dlm->node_num); in dlm_reco_data_done_handler()
989 list_for_each_entry(ndata, &dlm->reco.node_data, list) { in dlm_reco_data_done_handler()
990 if (ndata->node_num != done->node_idx) in dlm_reco_data_done_handler()
993 switch (ndata->state) { in dlm_reco_data_done_handler()
999 " state=%d\n", ndata->node_num, in dlm_reco_data_done_handler()
1000 ndata->state); in dlm_reco_data_done_handler()
1011 ndata->node_num); in dlm_reco_data_done_handler()
1013 ndata->state = DLM_RECO_NODE_DATA_DONE; in dlm_reco_data_done_handler()
1026 "%u\n", done->node_idx); in dlm_reco_data_done_handler()
1040 spin_lock(&dlm->spinlock); in dlm_move_reco_locks_to_list()
1041 list_for_each_entry_safe(res, next, &dlm->reco.resources, recovering) { in dlm_move_reco_locks_to_list()
1044 if (dlm_is_recovery_lock(res->lockname.name, in dlm_move_reco_locks_to_list()
1045 res->lockname.len)) { in dlm_move_reco_locks_to_list()
1046 spin_lock(&res->spinlock); in dlm_move_reco_locks_to_list()
1047 list_for_each_entry(lock, &res->granted, list) { in dlm_move_reco_locks_to_list()
1048 if (lock->ml.node == dead_node) { in dlm_move_reco_locks_to_list()
1052 dead_node, dlm->name); in dlm_move_reco_locks_to_list()
1053 list_del_init(&lock->list); in dlm_move_reco_locks_to_list()
1056 * - do manually */ in dlm_move_reco_locks_to_list()
1061 spin_unlock(&res->spinlock); in dlm_move_reco_locks_to_list()
1065 if (res->owner == dead_node) { in dlm_move_reco_locks_to_list()
1069 list_move_tail(&res->recovering, list); in dlm_move_reco_locks_to_list()
1070 } else if (res->owner == DLM_LOCK_RES_OWNER_UNKNOWN) { in dlm_move_reco_locks_to_list()
1073 list_move_tail(&res->recovering, list); in dlm_move_reco_locks_to_list()
1076 spin_unlock(&dlm->spinlock); in dlm_move_reco_locks_to_list()
1082 struct list_head *iter, *queue = &res->granted; in dlm_num_locks_in_lockres()
1100 u64 mig_cookie = be64_to_cpu(mres->mig_cookie); in dlm_send_mig_lockres_msg()
1101 int mres_total_locks = be32_to_cpu(mres->total_locks); in dlm_send_mig_lockres_msg()
1103 u8 orig_flags = mres->flags, in dlm_send_mig_lockres_msg()
1104 orig_master = mres->master; in dlm_send_mig_lockres_msg()
1106 BUG_ON(mres->num_locks > DLM_MAX_MIGRATABLE_LOCKS); in dlm_send_mig_lockres_msg()
1107 if (!mres->num_locks) in dlm_send_mig_lockres_msg()
1110 /* add an all-done flag if we reached the last lock */ in dlm_send_mig_lockres_msg()
1111 orig_flags = mres->flags; in dlm_send_mig_lockres_msg()
1114 mres->flags |= DLM_MRES_ALL_DONE; in dlm_send_mig_lockres_msg()
1117 dlm->name, res->lockname.len, res->lockname.name, in dlm_send_mig_lockres_msg()
1122 ret = o2net_send_message(DLM_MIG_LOCKRES_MSG, dlm->key, mres, in dlm_send_mig_lockres_msg()
1123 struct_size(mres, ml, mres->num_locks), in dlm_send_mig_lockres_msg()
1129 "node %u (%s)\n", dlm->name, mres->lockname_len, in dlm_send_mig_lockres_msg()
1130 mres->lockname, ret, send_to, in dlm_send_mig_lockres_msg()
1134 /* might get an -ENOMEM back here */ in dlm_send_mig_lockres_msg()
1139 if (ret == -EFAULT) { in dlm_send_mig_lockres_msg()
1148 dlm_init_migratable_lockres(mres, res->lockname.name, in dlm_send_mig_lockres_msg()
1149 res->lockname.len, mres_total_locks, in dlm_send_mig_lockres_msg()
1161 mres->lockname_len = namelen; in dlm_init_migratable_lockres()
1162 memcpy(mres->lockname, lockname, namelen); in dlm_init_migratable_lockres()
1163 mres->num_locks = 0; in dlm_init_migratable_lockres()
1164 mres->total_locks = cpu_to_be32(total_locks); in dlm_init_migratable_lockres()
1165 mres->mig_cookie = cpu_to_be64(cookie); in dlm_init_migratable_lockres()
1166 mres->flags = flags; in dlm_init_migratable_lockres()
1167 mres->master = master; in dlm_init_migratable_lockres()
1174 if (!lock->lksb) in dlm_prepare_lvb_for_migration()
1182 if (lock->ml.type != LKM_EXMODE && lock->ml.type != LKM_PRMODE) in dlm_prepare_lvb_for_migration()
1185 if (dlm_lvb_is_empty(mres->lvb)) { in dlm_prepare_lvb_for_migration()
1186 memcpy(mres->lvb, lock->lksb->lvb, DLM_LVB_LEN); in dlm_prepare_lvb_for_migration()
1191 if (!memcmp(mres->lvb, lock->lksb->lvb, DLM_LVB_LEN)) in dlm_prepare_lvb_for_migration()
1196 dlm_get_lock_cookie_node(be64_to_cpu(lock->ml.cookie)), in dlm_prepare_lvb_for_migration()
1197 dlm_get_lock_cookie_seq(be64_to_cpu(lock->ml.cookie)), in dlm_prepare_lvb_for_migration()
1198 lock->lockres->lockname.len, lock->lockres->lockname.name, in dlm_prepare_lvb_for_migration()
1199 lock->ml.node); in dlm_prepare_lvb_for_migration()
1200 dlm_print_one_lock_resource(lock->lockres); in dlm_prepare_lvb_for_migration()
1204 /* returns 1 if this lock fills the network structure,
1210 int lock_num = mres->num_locks; in dlm_add_lock_to_array()
1212 ml = &(mres->ml[lock_num]); in dlm_add_lock_to_array()
1213 ml->cookie = lock->ml.cookie; in dlm_add_lock_to_array()
1214 ml->type = lock->ml.type; in dlm_add_lock_to_array()
1215 ml->convert_type = lock->ml.convert_type; in dlm_add_lock_to_array()
1216 ml->highest_blocked = lock->ml.highest_blocked; in dlm_add_lock_to_array()
1217 ml->list = queue; in dlm_add_lock_to_array()
1218 if (lock->lksb) { in dlm_add_lock_to_array()
1219 ml->flags = lock->lksb->flags; in dlm_add_lock_to_array()
1222 ml->node = lock->ml.node; in dlm_add_lock_to_array()
1223 mres->num_locks++; in dlm_add_lock_to_array()
1225 if (mres->num_locks == DLM_MAX_MIGRATABLE_LOCKS) in dlm_add_lock_to_array()
1226 return 1; in dlm_add_lock_to_array()
1240 dummy.ml.node = dlm->node_num; in dlm_add_dummy_lock()
1248 if (unlikely(ml->cookie == 0 && in dlm_is_dummy_lock()
1249 ml->type == LKM_IVMODE && in dlm_is_dummy_lock()
1250 ml->convert_type == LKM_IVMODE && in dlm_is_dummy_lock()
1251 ml->highest_blocked == LKM_IVMODE && in dlm_is_dummy_lock()
1252 ml->list == DLM_BLOCKED_LIST)) { in dlm_is_dummy_lock()
1253 *nodenum = ml->node; in dlm_is_dummy_lock()
1254 return 1; in dlm_is_dummy_lock()
1282 dlm_init_migratable_lockres(mres, res->lockname.name, in dlm_send_one_lockres()
1283 res->lockname.len, total_locks, in dlm_send_one_lockres()
1284 mig_cookie, flags, res->owner); in dlm_send_one_lockres()
1306 dlm->name, res->lockname.len, res->lockname.name, in dlm_send_one_lockres()
1319 dlm->name, ret); in dlm_send_one_lockres()
1323 "lockres %.*s\n", dlm->name, send_to, in dlm_send_one_lockres()
1325 res->lockname.len, res->lockname.name); in dlm_send_one_lockres()
1349 (struct dlm_migratable_lockres *)msg->buf; in dlm_mig_lockres_handler()
1359 return -EINVAL; in dlm_mig_lockres_handler()
1364 dlm->name, mres->lockname_len, in dlm_mig_lockres_handler()
1365 mres->lockname, mres->master); in dlm_mig_lockres_handler()
1367 return -EINVAL; in dlm_mig_lockres_handler()
1370 BUG_ON(!(mres->flags & (DLM_MRES_RECOVERY|DLM_MRES_MIGRATION))); in dlm_mig_lockres_handler()
1372 real_master = mres->master; in dlm_mig_lockres_handler()
1375 BUG_ON(!(mres->flags & DLM_MRES_RECOVERY)); in dlm_mig_lockres_handler()
1379 (mres->flags & DLM_MRES_RECOVERY) ? in dlm_mig_lockres_handler()
1380 "recovery" : "migration", mres->master); in dlm_mig_lockres_handler()
1381 if (mres->flags & DLM_MRES_ALL_DONE) in dlm_mig_lockres_handler()
1384 ret = -ENOMEM; in dlm_mig_lockres_handler()
1385 buf = kmalloc(be16_to_cpu(msg->data_len), GFP_NOFS); in dlm_mig_lockres_handler()
1393 hash = dlm_lockid_hash(mres->lockname, mres->lockname_len); in dlm_mig_lockres_handler()
1394 spin_lock(&dlm->spinlock); in dlm_mig_lockres_handler()
1395 res = __dlm_lookup_lockres_full(dlm, mres->lockname, mres->lockname_len, in dlm_mig_lockres_handler()
1400 spin_lock(&res->spinlock); in dlm_mig_lockres_handler()
1401 if (res->state & DLM_LOCK_RES_DROPPING_REF) { in dlm_mig_lockres_handler()
1404 " ref!\n", dlm->name, in dlm_mig_lockres_handler()
1405 mres->lockname_len, mres->lockname); in dlm_mig_lockres_handler()
1406 ret = -EINVAL; in dlm_mig_lockres_handler()
1407 spin_unlock(&res->spinlock); in dlm_mig_lockres_handler()
1408 spin_unlock(&dlm->spinlock); in dlm_mig_lockres_handler()
1413 if (mres->flags & DLM_MRES_RECOVERY) { in dlm_mig_lockres_handler()
1414 res->state |= DLM_LOCK_RES_RECOVERING; in dlm_mig_lockres_handler()
1416 if (res->state & DLM_LOCK_RES_MIGRATING) { in dlm_mig_lockres_handler()
1420 mres->lockname_len, in dlm_mig_lockres_handler()
1421 mres->lockname); in dlm_mig_lockres_handler()
1422 } else if (res->state & DLM_LOCK_RES_RECOVERING) { in dlm_mig_lockres_handler()
1426 mres->lockname_len, mres->lockname); in dlm_mig_lockres_handler()
1427 ret = -EFAULT; in dlm_mig_lockres_handler()
1428 spin_unlock(&res->spinlock); in dlm_mig_lockres_handler()
1429 spin_unlock(&dlm->spinlock); in dlm_mig_lockres_handler()
1433 res->state |= DLM_LOCK_RES_MIGRATING; in dlm_mig_lockres_handler()
1435 spin_unlock(&res->spinlock); in dlm_mig_lockres_handler()
1436 spin_unlock(&dlm->spinlock); in dlm_mig_lockres_handler()
1438 spin_unlock(&dlm->spinlock); in dlm_mig_lockres_handler()
1441 res = dlm_new_lockres(dlm, mres->lockname, mres->lockname_len); in dlm_mig_lockres_handler()
1450 if (mres->flags & DLM_MRES_RECOVERY) in dlm_mig_lockres_handler()
1451 res->state |= DLM_LOCK_RES_RECOVERING; in dlm_mig_lockres_handler()
1453 res->state |= DLM_LOCK_RES_MIGRATING; in dlm_mig_lockres_handler()
1455 spin_lock(&dlm->spinlock); in dlm_mig_lockres_handler()
1457 spin_unlock(&dlm->spinlock); in dlm_mig_lockres_handler()
1459 /* Add an extra ref for this lock-less lockres lest the in dlm_mig_lockres_handler()
1465 * 1. Taken above. in dlm_mig_lockres_handler()
1466 * 2. kref_init in dlm_new_lockres()->dlm_init_lockres(). in dlm_mig_lockres_handler()
1477 spin_lock(&res->spinlock); in dlm_mig_lockres_handler()
1478 res->state &= ~DLM_LOCK_RES_IN_PROGRESS; in dlm_mig_lockres_handler()
1479 spin_unlock(&res->spinlock); in dlm_mig_lockres_handler()
1480 wake_up(&res->wq); in dlm_mig_lockres_handler()
1485 * the proper res->state flags. */ in dlm_mig_lockres_handler()
1487 spin_lock(&res->spinlock); in dlm_mig_lockres_handler()
1491 if (mres->master == DLM_LOCK_RES_OWNER_UNKNOWN) { in dlm_mig_lockres_handler()
1493 BUG_ON(!(mres->flags & DLM_MRES_RECOVERY)); in dlm_mig_lockres_handler()
1496 "%.*s\n", mres->lockname_len, mres->lockname); in dlm_mig_lockres_handler()
1500 dlm_change_lockres_owner(dlm, res, dlm->node_num); in dlm_mig_lockres_handler()
1502 spin_unlock(&res->spinlock); in dlm_mig_lockres_handler()
1506 memcpy(buf, msg->buf, be16_to_cpu(msg->data_len)); /* copy the whole message */ in dlm_mig_lockres_handler()
1508 item->u.ml.lockres = res; /* already have a ref */ in dlm_mig_lockres_handler()
1509 item->u.ml.real_master = real_master; in dlm_mig_lockres_handler()
1510 item->u.ml.extra_ref = extra_refs; in dlm_mig_lockres_handler()
1511 spin_lock(&dlm->work_lock); in dlm_mig_lockres_handler()
1512 list_add_tail(&item->list, &dlm->work_list); in dlm_mig_lockres_handler()
1513 spin_unlock(&dlm->work_lock); in dlm_mig_lockres_handler()
1514 queue_work(dlm->dlm_worker, &dlm->dispatched_work); in dlm_mig_lockres_handler()
1541 dlm = item->dlm; in dlm_mig_lockres_worker()
1544 res = item->u.ml.lockres; in dlm_mig_lockres_worker()
1545 real_master = item->u.ml.real_master; in dlm_mig_lockres_worker()
1546 extra_ref = item->u.ml.extra_ref; in dlm_mig_lockres_worker()
1549 /* this case is super-rare. only occurs if in dlm_mig_lockres_worker()
1561 res->lockname.len, res->lockname.name); in dlm_mig_lockres_worker()
1563 spin_lock(&res->spinlock); in dlm_mig_lockres_worker()
1565 spin_unlock(&res->spinlock); in dlm_mig_lockres_worker()
1568 real_master, res->lockname.len, in dlm_mig_lockres_worker()
1569 res->lockname.name); in dlm_mig_lockres_worker()
1581 if ((mres->flags & (DLM_MRES_MIGRATION|DLM_MRES_ALL_DONE)) == in dlm_mig_lockres_worker()
1583 ret = dlm_finish_migration(dlm, res, mres->master); in dlm_mig_lockres_worker()
1633 spin_lock(&dlm->spinlock); in dlm_lockres_master_requery()
1634 dlm_node_iter_init(dlm->domain_map, &iter); in dlm_lockres_master_requery()
1635 spin_unlock(&dlm->spinlock); in dlm_lockres_master_requery()
1639 if (nodenum == dlm->node_num) in dlm_lockres_master_requery()
1666 req.node_idx = dlm->node_num; in dlm_do_master_requery()
1667 req.namelen = res->lockname.len; in dlm_do_master_requery()
1668 memcpy(req.name, res->lockname.name, res->lockname.len); in dlm_do_master_requery()
1671 ret = o2net_send_message(DLM_MASTER_REQUERY_MSG, dlm->key, in dlm_do_master_requery()
1676 dlm->key, nodenum); in dlm_do_master_requery()
1677 else if (status == -ENOMEM) { in dlm_do_master_requery()
1700 struct dlm_master_requery *req = (struct dlm_master_requery *)msg->buf; in dlm_master_requery_handler()
1713 hash = dlm_lockid_hash(req->name, req->namelen); in dlm_master_requery_handler()
1715 spin_lock(&dlm->spinlock); in dlm_master_requery_handler()
1716 res = __dlm_lookup_lockres(dlm, req->name, req->namelen, hash); in dlm_master_requery_handler()
1718 spin_lock(&res->spinlock); in dlm_master_requery_handler()
1719 master = res->owner; in dlm_master_requery_handler()
1720 if (master == dlm->node_num) { in dlm_master_requery_handler()
1725 spin_unlock(&res->spinlock); in dlm_master_requery_handler()
1727 spin_unlock(&dlm->spinlock); in dlm_master_requery_handler()
1732 dispatched = 1; in dlm_master_requery_handler()
1734 spin_unlock(&res->spinlock); in dlm_master_requery_handler()
1738 spin_unlock(&res->spinlock); in dlm_master_requery_handler()
1742 spin_unlock(&dlm->spinlock); in dlm_master_requery_handler()
1755 ret = &(res->granted); in dlm_list_num_to_pointer()
1764 * NOTE about in-flight requests during migration:
1767 * MIGRATING and then flushed all of its pending ASTS. So any in-flight
1782 * up-to-date, and the change will be ordered properly for the waiter.
1801 mlog(0, "running %d locks for this lockres\n", mres->num_locks); in dlm_process_recovery_data()
1802 for (i=0; i<mres->num_locks; i++) { in dlm_process_recovery_data()
1803 ml = &(mres->ml[i]); in dlm_process_recovery_data()
1807 BUG_ON(mres->num_locks != 1); in dlm_process_recovery_data()
1809 dlm->name, mres->lockname_len, mres->lockname, in dlm_process_recovery_data()
1811 spin_lock(&res->spinlock); in dlm_process_recovery_data()
1813 spin_unlock(&res->spinlock); in dlm_process_recovery_data()
1816 BUG_ON(ml->highest_blocked != LKM_IVMODE); in dlm_process_recovery_data()
1820 queue = dlm_list_num_to_pointer(res, ml->list); in dlm_process_recovery_data()
1826 if (ml->node == dlm->node_num) { in dlm_process_recovery_data()
1828 BUG_ON(!(mres->flags & DLM_MRES_MIGRATION)); in dlm_process_recovery_data()
1831 spin_lock(&res->spinlock); in dlm_process_recovery_data()
1837 if (lock->ml.cookie == ml->cookie) in dlm_process_recovery_data()
1848 c = ml->cookie; in dlm_process_recovery_data()
1855 ml->node, ml->list, ml->flags, ml->type, in dlm_process_recovery_data()
1856 ml->convert_type, ml->highest_blocked); in dlm_process_recovery_data()
1861 if (lock->ml.node != ml->node) { in dlm_process_recovery_data()
1862 c = lock->ml.cookie; in dlm_process_recovery_data()
1867 res->lockname.len, res->lockname.name, in dlm_process_recovery_data()
1868 lock->ml.node); in dlm_process_recovery_data()
1869 c = ml->cookie; in dlm_process_recovery_data()
1875 ml->node, ml->list, ml->flags, ml->type, in dlm_process_recovery_data()
1876 ml->convert_type, ml->highest_blocked); in dlm_process_recovery_data()
1882 c = ml->cookie; in dlm_process_recovery_data()
1887 j, ml->list, res->lockname.len, in dlm_process_recovery_data()
1888 res->lockname.name); in dlm_process_recovery_data()
1890 spin_unlock(&res->spinlock); in dlm_process_recovery_data()
1899 list_move_tail(&lock->list, queue); in dlm_process_recovery_data()
1900 spin_unlock(&res->spinlock); in dlm_process_recovery_data()
1907 newlock = dlm_new_lock(ml->type, ml->node, in dlm_process_recovery_data()
1908 be64_to_cpu(ml->cookie), NULL); in dlm_process_recovery_data()
1910 ret = -ENOMEM; in dlm_process_recovery_data()
1913 lksb = newlock->lksb; in dlm_process_recovery_data()
1916 if (ml->convert_type != LKM_IVMODE) { in dlm_process_recovery_data()
1917 BUG_ON(queue != &res->converting); in dlm_process_recovery_data()
1918 newlock->ml.convert_type = ml->convert_type; in dlm_process_recovery_data()
1920 lksb->flags |= (ml->flags & in dlm_process_recovery_data()
1923 if (ml->type == LKM_NLMODE) in dlm_process_recovery_data()
1930 if (ml->list == DLM_BLOCKED_LIST) in dlm_process_recovery_data()
1933 if (!dlm_lvb_is_empty(mres->lvb)) { in dlm_process_recovery_data()
1934 if (lksb->flags & DLM_LKSB_PUT_LVB) { in dlm_process_recovery_data()
1938 memcpy(lksb->lvb, mres->lvb, DLM_LVB_LEN); in dlm_process_recovery_data()
1943 memcpy(res->lvb, mres->lvb, DLM_LVB_LEN); in dlm_process_recovery_data()
1947 BUG_ON(ml->type != LKM_EXMODE && in dlm_process_recovery_data()
1948 ml->type != LKM_PRMODE); in dlm_process_recovery_data()
1949 if (!dlm_lvb_is_empty(res->lvb) && in dlm_process_recovery_data()
1950 (ml->type == LKM_EXMODE || in dlm_process_recovery_data()
1951 memcmp(res->lvb, mres->lvb, DLM_LVB_LEN))) { in dlm_process_recovery_data()
1954 "lvb! type=%d\n", dlm->name, in dlm_process_recovery_data()
1955 res->lockname.len, in dlm_process_recovery_data()
1956 res->lockname.name, ml->type); in dlm_process_recovery_data()
1959 printk("%02x", res->lvb[i]); in dlm_process_recovery_data()
1962 printk("%02x", mres->lvb[i]); in dlm_process_recovery_data()
1967 memcpy(res->lvb, mres->lvb, DLM_LVB_LEN); in dlm_process_recovery_data()
1974 * 1. order of locks on granted queue is in dlm_process_recovery_data()
1989 spin_lock(&res->spinlock); in dlm_process_recovery_data()
1991 if (lock->ml.cookie == ml->cookie) { in dlm_process_recovery_data()
1992 c = lock->ml.cookie; in dlm_process_recovery_data()
1994 "exists on this lockres!\n", dlm->name, in dlm_process_recovery_data()
1995 res->lockname.len, res->lockname.name, in dlm_process_recovery_data()
2001 ml->type, ml->convert_type, ml->node, in dlm_process_recovery_data()
2002 dlm_get_lock_cookie_node(be64_to_cpu(ml->cookie)), in dlm_process_recovery_data()
2003 dlm_get_lock_cookie_seq(be64_to_cpu(ml->cookie)), in dlm_process_recovery_data()
2004 ml->list); in dlm_process_recovery_data()
2007 bad = 1; in dlm_process_recovery_data()
2013 if (mres->flags & DLM_MRES_RECOVERY && in dlm_process_recovery_data()
2014 ml->list == DLM_CONVERTING_LIST && in dlm_process_recovery_data()
2015 newlock->ml.type > in dlm_process_recovery_data()
2016 newlock->ml.convert_type) { in dlm_process_recovery_data()
2019 list_add(&newlock->list, queue); in dlm_process_recovery_data()
2021 list_add_tail(&newlock->list, queue); in dlm_process_recovery_data()
2023 "setting refmap bit\n", dlm->name, in dlm_process_recovery_data()
2024 res->lockname.len, res->lockname.name, ml->node); in dlm_process_recovery_data()
2025 dlm_lockres_set_refmap_bit(dlm, res, ml->node); in dlm_process_recovery_data()
2027 spin_unlock(&res->spinlock); in dlm_process_recovery_data()
2033 spin_lock(&res->spinlock); in dlm_process_recovery_data()
2035 spin_unlock(&res->spinlock); in dlm_process_recovery_data()
2050 assert_spin_locked(&dlm->spinlock); in dlm_move_lockres_to_recovery_list()
2051 assert_spin_locked(&res->spinlock); in dlm_move_lockres_to_recovery_list()
2052 res->state |= DLM_LOCK_RES_RECOVERING; in dlm_move_lockres_to_recovery_list()
2053 if (!list_empty(&res->recovering)) { in dlm_move_lockres_to_recovery_list()
2056 dlm->name, res->lockname.len, res->lockname.name); in dlm_move_lockres_to_recovery_list()
2057 list_del_init(&res->recovering); in dlm_move_lockres_to_recovery_list()
2062 list_add_tail(&res->recovering, &dlm->reco.resources); in dlm_move_lockres_to_recovery_list()
2065 for (i=DLM_BLOCKED_LIST; i>=DLM_GRANTED_LIST; i--) { in dlm_move_lockres_to_recovery_list()
2069 if (lock->convert_pending) { in dlm_move_lockres_to_recovery_list()
2073 res->lockname.len, res->lockname.name); in dlm_move_lockres_to_recovery_list()
2075 lock->convert_pending = 0; in dlm_move_lockres_to_recovery_list()
2076 } else if (lock->lock_pending) { in dlm_move_lockres_to_recovery_list()
2081 res->lockname.len, res->lockname.name); in dlm_move_lockres_to_recovery_list()
2088 lock->lock_pending = 0; in dlm_move_lockres_to_recovery_list()
2089 } else if (lock->unlock_pending) { in dlm_move_lockres_to_recovery_list()
2102 res->lockname.len, res->lockname.name); in dlm_move_lockres_to_recovery_list()
2104 lock->unlock_pending = 0; in dlm_move_lockres_to_recovery_list()
2105 } else if (lock->cancel_pending) { in dlm_move_lockres_to_recovery_list()
2113 res->lockname.len, res->lockname.name); in dlm_move_lockres_to_recovery_list()
2115 lock->cancel_pending = 0; in dlm_move_lockres_to_recovery_list()
2125 * sets the res->owner to the new master.
2134 assert_spin_locked(&dlm->spinlock); in dlm_finish_local_lockres_recovery()
2136 list_for_each_entry_safe(res, next, &dlm->reco.resources, recovering) { in dlm_finish_local_lockres_recovery()
2137 if (res->owner == dead_node) { in dlm_finish_local_lockres_recovery()
2139 dlm->name, res->lockname.len, res->lockname.name, in dlm_finish_local_lockres_recovery()
2140 res->owner, new_master); in dlm_finish_local_lockres_recovery()
2141 list_del_init(&res->recovering); in dlm_finish_local_lockres_recovery()
2142 spin_lock(&res->spinlock); in dlm_finish_local_lockres_recovery()
2146 res->state &= ~DLM_LOCK_RES_RECOVERING; in dlm_finish_local_lockres_recovery()
2149 spin_unlock(&res->spinlock); in dlm_finish_local_lockres_recovery()
2150 wake_up(&res->wq); in dlm_finish_local_lockres_recovery()
2162 if (res->state & DLM_LOCK_RES_RECOVERY_WAITING) { in dlm_finish_local_lockres_recovery()
2163 spin_lock(&res->spinlock); in dlm_finish_local_lockres_recovery()
2164 res->state &= ~DLM_LOCK_RES_RECOVERY_WAITING; in dlm_finish_local_lockres_recovery()
2165 spin_unlock(&res->spinlock); in dlm_finish_local_lockres_recovery()
2166 wake_up(&res->wq); in dlm_finish_local_lockres_recovery()
2169 if (!(res->state & DLM_LOCK_RES_RECOVERING)) in dlm_finish_local_lockres_recovery()
2172 if (res->owner != dead_node && in dlm_finish_local_lockres_recovery()
2173 res->owner != dlm->node_num) in dlm_finish_local_lockres_recovery()
2176 if (!list_empty(&res->recovering)) { in dlm_finish_local_lockres_recovery()
2177 list_del_init(&res->recovering); in dlm_finish_local_lockres_recovery()
2184 dlm->name, res->lockname.len, res->lockname.name, in dlm_finish_local_lockres_recovery()
2185 res->owner, new_master); in dlm_finish_local_lockres_recovery()
2186 spin_lock(&res->spinlock); in dlm_finish_local_lockres_recovery()
2188 res->state &= ~DLM_LOCK_RES_RECOVERING; in dlm_finish_local_lockres_recovery()
2191 spin_unlock(&res->spinlock); in dlm_finish_local_lockres_recovery()
2192 wake_up(&res->wq); in dlm_finish_local_lockres_recovery()
2200 if (lock->ml.type != LKM_EXMODE && in dlm_lvb_needs_invalidation()
2201 lock->ml.type != LKM_PRMODE) in dlm_lvb_needs_invalidation()
2202 return 1; in dlm_lvb_needs_invalidation()
2203 } else if (lock->ml.type == LKM_EXMODE) in dlm_lvb_needs_invalidation()
2204 return 1; in dlm_lvb_needs_invalidation()
2217 assert_spin_locked(&dlm->spinlock); in dlm_revalidate_lvb()
2218 assert_spin_locked(&res->spinlock); in dlm_revalidate_lvb()
2220 if (res->owner == dlm->node_num) in dlm_revalidate_lvb()
2227 search_node = dlm->node_num; in dlm_revalidate_lvb()
2228 local = 1; /* check local state for valid lvb */ in dlm_revalidate_lvb()
2234 if (lock->ml.node == search_node) { in dlm_revalidate_lvb()
2237 blank_lvb = 1; in dlm_revalidate_lvb()
2238 memset(lock->lksb->lvb, 0, DLM_LVB_LEN); in dlm_revalidate_lvb()
2246 res->lockname.len, res->lockname.name, dead_node); in dlm_revalidate_lvb()
2247 memset(res->lvb, 0, DLM_LVB_LEN); in dlm_revalidate_lvb()
2258 * 1) remove any stale locks for the dead node in dlm_free_dead_locks()
2261 assert_spin_locked(&dlm->spinlock); in dlm_free_dead_locks()
2262 assert_spin_locked(&res->spinlock); in dlm_free_dead_locks()
2268 list_for_each_entry_safe(lock, next, &res->granted, list) { in dlm_free_dead_locks()
2269 if (lock->ml.node == dead_node) { in dlm_free_dead_locks()
2270 list_del_init(&lock->list); in dlm_free_dead_locks()
2272 /* Can't schedule DLM_UNLOCK_FREE_LOCK - do manually */ in dlm_free_dead_locks()
2277 list_for_each_entry_safe(lock, next, &res->converting, list) { in dlm_free_dead_locks()
2278 if (lock->ml.node == dead_node) { in dlm_free_dead_locks()
2279 list_del_init(&lock->list); in dlm_free_dead_locks()
2281 /* Can't schedule DLM_UNLOCK_FREE_LOCK - do manually */ in dlm_free_dead_locks()
2286 list_for_each_entry_safe(lock, next, &res->blocked, list) { in dlm_free_dead_locks()
2287 if (lock->ml.node == dead_node) { in dlm_free_dead_locks()
2288 list_del_init(&lock->list); in dlm_free_dead_locks()
2290 /* Can't schedule DLM_UNLOCK_FREE_LOCK - do manually */ in dlm_free_dead_locks()
2298 "dropping ref from lockres\n", dlm->name, in dlm_free_dead_locks()
2299 res->lockname.len, res->lockname.name, freed, dead_node); in dlm_free_dead_locks()
2300 if(!test_bit(dead_node, res->refmap)) { in dlm_free_dead_locks()
2302 "but ref was not set\n", dlm->name, in dlm_free_dead_locks()
2303 res->lockname.len, res->lockname.name, freed, dead_node); in dlm_free_dead_locks()
2306 res->state |= DLM_LOCK_RES_RECOVERY_WAITING; in dlm_free_dead_locks()
2308 } else if (test_bit(dead_node, res->refmap)) { in dlm_free_dead_locks()
2310 "no locks and had not purged before dying\n", dlm->name, in dlm_free_dead_locks()
2311 res->lockname.len, res->lockname.name, dead_node); in dlm_free_dead_locks()
2334 * 1) if the dead node was the master, move the lockres in dlm_do_local_recovery_cleanup()
2350 if (dlm_is_recovery_lock(res->lockname.name, in dlm_do_local_recovery_cleanup()
2351 res->lockname.len)) { in dlm_do_local_recovery_cleanup()
2352 spin_lock(&res->spinlock); in dlm_do_local_recovery_cleanup()
2353 list_for_each_entry(lock, &res->granted, list) { in dlm_do_local_recovery_cleanup()
2354 if (lock->ml.node == dead_node) { in dlm_do_local_recovery_cleanup()
2358 dead_node, dlm->name); in dlm_do_local_recovery_cleanup()
2359 list_del_init(&lock->list); in dlm_do_local_recovery_cleanup()
2363 * - do manually */ in dlm_do_local_recovery_cleanup()
2369 if ((res->owner == dead_node) && in dlm_do_local_recovery_cleanup()
2370 (res->state & DLM_LOCK_RES_DROPPING_REF)) { in dlm_do_local_recovery_cleanup()
2373 spin_unlock(&res->spinlock); in dlm_do_local_recovery_cleanup()
2374 wake_up(&res->wq); in dlm_do_local_recovery_cleanup()
2377 } else if (res->owner == dlm->node_num) in dlm_do_local_recovery_cleanup()
2379 spin_unlock(&res->spinlock); in dlm_do_local_recovery_cleanup()
2382 spin_lock(&res->spinlock); in dlm_do_local_recovery_cleanup()
2385 if (res->owner == dead_node) { in dlm_do_local_recovery_cleanup()
2386 if (res->state & DLM_LOCK_RES_DROPPING_REF) { in dlm_do_local_recovery_cleanup()
2391 dlm->name, res->lockname.len, in dlm_do_local_recovery_cleanup()
2392 res->lockname.name, dead_node); in dlm_do_local_recovery_cleanup()
2395 spin_unlock(&res->spinlock); in dlm_do_local_recovery_cleanup()
2396 wake_up(&res->wq); in dlm_do_local_recovery_cleanup()
2401 } else if (res->owner == dlm->node_num) { in dlm_do_local_recovery_cleanup()
2404 } else if (res->owner == DLM_LOCK_RES_OWNER_UNKNOWN) { in dlm_do_local_recovery_cleanup()
2405 if (test_bit(dead_node, res->refmap)) { in dlm_do_local_recovery_cleanup()
2408 dlm->name, res->lockname.len, in dlm_do_local_recovery_cleanup()
2409 res->lockname.name, dead_node); in dlm_do_local_recovery_cleanup()
2413 spin_unlock(&res->spinlock); in dlm_do_local_recovery_cleanup()
2421 assert_spin_locked(&dlm->spinlock); in __dlm_hb_node_down()
2423 if (dlm->reco.new_master == idx) { in __dlm_hb_node_down()
2425 dlm->name, idx); in __dlm_hb_node_down()
2426 if (dlm->reco.state & DLM_RECO_STATE_FINALIZE) { in __dlm_hb_node_down()
2431 "finalize1 state, clearing\n", dlm->name, idx); in __dlm_hb_node_down()
2432 dlm->reco.state &= ~DLM_RECO_STATE_FINALIZE; in __dlm_hb_node_down()
2438 if (dlm->joining_node == idx) { in __dlm_hb_node_down()
2444 if (!test_bit(idx, dlm->live_nodes_map)) { in __dlm_hb_node_down()
2447 dlm->name, idx); in __dlm_hb_node_down()
2452 if (!test_bit(idx, dlm->domain_map)) { in __dlm_hb_node_down()
2459 clear_bit(idx, dlm->live_nodes_map); in __dlm_hb_node_down()
2462 if (!test_bit(idx, dlm->recovery_map)) in __dlm_hb_node_down()
2469 clear_bit(idx, dlm->domain_map); in __dlm_hb_node_down()
2470 clear_bit(idx, dlm->exit_domain_map); in __dlm_hb_node_down()
2473 wake_up(&dlm->migration_wq); in __dlm_hb_node_down()
2475 set_bit(idx, dlm->recovery_map); in __dlm_hb_node_down()
2489 if (test_bit(idx, dlm->domain_map)) in dlm_hb_node_down_cb()
2492 spin_lock(&dlm->spinlock); in dlm_hb_node_down_cb()
2494 spin_unlock(&dlm->spinlock); in dlm_hb_node_down_cb()
2506 spin_lock(&dlm->spinlock); in dlm_hb_node_up_cb()
2507 set_bit(idx, dlm->live_nodes_map); in dlm_hb_node_up_cb()
2510 spin_unlock(&dlm->spinlock); in dlm_hb_node_up_cb()
2519 dlm->node_num, dlm->name); in dlm_reco_ast()
2525 dlm->node_num, dlm->name); in dlm_reco_bast()
2539 * or b) dlm->reco.new_master gets set to some nodenum
2548 int status = -EINVAL; in dlm_pick_recovery_master()
2551 dlm->name, jiffies, dlm->reco.dead_node, dlm->node_num); in dlm_pick_recovery_master()
2560 dlm->name, ret, lksb.status); in dlm_pick_recovery_master()
2564 dlm->name, dlm->node_num); in dlm_pick_recovery_master()
2570 "do the recovery\n", dlm->name, in dlm_pick_recovery_master()
2571 dlm->reco.new_master); in dlm_pick_recovery_master()
2572 status = -EEXIST; in dlm_pick_recovery_master()
2577 spin_lock(&dlm->spinlock); in dlm_pick_recovery_master()
2578 if (dlm->reco.dead_node == O2NM_INVALID_NODE_NUM) { in dlm_pick_recovery_master()
2579 status = -EINVAL; in dlm_pick_recovery_master()
2581 "node got recovered already\n", dlm->name); in dlm_pick_recovery_master()
2582 if (dlm->reco.new_master != O2NM_INVALID_NODE_NUM) { in dlm_pick_recovery_master()
2585 dlm->name, dlm->reco.new_master); in dlm_pick_recovery_master()
2589 spin_unlock(&dlm->spinlock); in dlm_pick_recovery_master()
2596 "begin_reco now\n", dlm->name, in dlm_pick_recovery_master()
2597 dlm->reco.dead_node, dlm->node_num); in dlm_pick_recovery_master()
2599 dlm->reco.dead_node); in dlm_pick_recovery_master()
2604 spin_lock(&dlm->spinlock); in dlm_pick_recovery_master()
2605 dlm_set_reco_master(dlm, dlm->node_num); in dlm_pick_recovery_master()
2606 spin_unlock(&dlm->spinlock); in dlm_pick_recovery_master()
2627 dlm->name, dlm->node_num); in dlm_pick_recovery_master()
2631 wait_event_timeout(dlm->dlm_reco_thread_wq, in dlm_pick_recovery_master()
2636 dlm->name); in dlm_pick_recovery_master()
2641 dlm->name, dlm->reco.new_master, dlm->reco.dead_node); in dlm_pick_recovery_master()
2642 status = -EEXIST; in dlm_pick_recovery_master()
2645 dlm->name, dlm->node_num); in dlm_pick_recovery_master()
2652 "lksb.status=%s\n", dlm->name, dlm_errname(ret), in dlm_pick_recovery_master()
2670 struct dlm_begin_reco br; in dlm_send_begin_reco_message() local
2676 mlog(0, "%s: dead node is %u\n", dlm->name, dead_node); in dlm_send_begin_reco_message()
2678 spin_lock(&dlm->spinlock); in dlm_send_begin_reco_message()
2679 dlm_node_iter_init(dlm->domain_map, &iter); in dlm_send_begin_reco_message()
2680 spin_unlock(&dlm->spinlock); in dlm_send_begin_reco_message()
2684 memset(&br, 0, sizeof(br)); in dlm_send_begin_reco_message()
2685 br.node_idx = dlm->node_num; in dlm_send_begin_reco_message()
2686 br.dead_node = dead_node; in dlm_send_begin_reco_message()
2695 if (nodenum == dlm->node_num) { in dlm_send_begin_reco_message()
2702 ret = o2net_send_message(DLM_BEGIN_RECO_MSG, dlm->key, in dlm_send_begin_reco_message()
2703 &br, sizeof(br), nodenum, &status); in dlm_send_begin_reco_message()
2711 "begin reco msg (%d)\n", dlm->name, nodenum, ret); in dlm_send_begin_reco_message()
2717 * dlm_begin_reco_handler() returned EAGAIN and not -EAGAIN. in dlm_send_begin_reco_message()
2720 if (ret == -EAGAIN || ret == EAGAIN) { in dlm_send_begin_reco_message()
2723 "to complete, backoff for a bit\n", dlm->name, in dlm_send_begin_reco_message()
2725 msleep(100); in dlm_send_begin_reco_message()
2735 "returned %d\n", dlm->name, nodenum, ret); in dlm_send_begin_reco_message()
2746 msleep(100); in dlm_send_begin_reco_message()
2758 struct dlm_begin_reco *br = (struct dlm_begin_reco *)msg->buf; in dlm_begin_reco_handler() local
2764 spin_lock(&dlm->spinlock); in dlm_begin_reco_handler()
2765 if (dlm->reco.state & DLM_RECO_STATE_FINALIZE) { in dlm_begin_reco_handler()
2768 dlm->name, br->node_idx, br->dead_node, in dlm_begin_reco_handler()
2769 dlm->reco.dead_node, dlm->reco.new_master); in dlm_begin_reco_handler()
2770 spin_unlock(&dlm->spinlock); in dlm_begin_reco_handler()
2772 return -EAGAIN; in dlm_begin_reco_handler()
2774 spin_unlock(&dlm->spinlock); in dlm_begin_reco_handler()
2777 dlm->name, br->node_idx, br->dead_node, in dlm_begin_reco_handler()
2778 dlm->reco.dead_node, dlm->reco.new_master); in dlm_begin_reco_handler()
2780 dlm_fire_domain_eviction_callbacks(dlm, br->dead_node); in dlm_begin_reco_handler()
2782 spin_lock(&dlm->spinlock); in dlm_begin_reco_handler()
2783 if (dlm->reco.new_master != O2NM_INVALID_NODE_NUM) { in dlm_begin_reco_handler()
2784 if (test_bit(dlm->reco.new_master, dlm->recovery_map)) { in dlm_begin_reco_handler()
2786 "to %u\n", dlm->name, dlm->reco.new_master, in dlm_begin_reco_handler()
2787 br->node_idx); in dlm_begin_reco_handler()
2790 "to %u\n", dlm->name, dlm->reco.new_master, in dlm_begin_reco_handler()
2791 br->node_idx); in dlm_begin_reco_handler()
2795 if (dlm->reco.dead_node != O2NM_INVALID_NODE_NUM) { in dlm_begin_reco_handler()
2797 "node %u changing it to %u\n", dlm->name, in dlm_begin_reco_handler()
2798 dlm->reco.dead_node, br->node_idx, br->dead_node); in dlm_begin_reco_handler()
2800 dlm_set_reco_master(dlm, br->node_idx); in dlm_begin_reco_handler()
2801 dlm_set_reco_dead_node(dlm, br->dead_node); in dlm_begin_reco_handler()
2802 if (!test_bit(br->dead_node, dlm->recovery_map)) { in dlm_begin_reco_handler()
2805 br->node_idx, br->dead_node, br->dead_node); in dlm_begin_reco_handler()
2806 if (!test_bit(br->dead_node, dlm->domain_map) || in dlm_begin_reco_handler()
2807 !test_bit(br->dead_node, dlm->live_nodes_map)) in dlm_begin_reco_handler()
2810 br->dead_node); in dlm_begin_reco_handler()
2813 set_bit(br->dead_node, dlm->domain_map); in dlm_begin_reco_handler()
2814 set_bit(br->dead_node, dlm->live_nodes_map); in dlm_begin_reco_handler()
2815 __dlm_hb_node_down(dlm, br->dead_node); in dlm_begin_reco_handler()
2817 spin_unlock(&dlm->spinlock); in dlm_begin_reco_handler()
2822 dlm->name, br->node_idx, br->dead_node, in dlm_begin_reco_handler()
2823 dlm->reco.dead_node, dlm->reco.new_master); in dlm_begin_reco_handler()
2837 int stage = 1; in dlm_send_finalize_reco_message()
2840 "stage %d\n", dlm->name, dlm->reco.dead_node, stage); in dlm_send_finalize_reco_message()
2842 spin_lock(&dlm->spinlock); in dlm_send_finalize_reco_message()
2843 dlm_node_iter_init(dlm->domain_map, &iter); in dlm_send_finalize_reco_message()
2844 spin_unlock(&dlm->spinlock); in dlm_send_finalize_reco_message()
2848 fr.node_idx = dlm->node_num; in dlm_send_finalize_reco_message()
2849 fr.dead_node = dlm->reco.dead_node; in dlm_send_finalize_reco_message()
2854 if (nodenum == dlm->node_num) in dlm_send_finalize_reco_message()
2856 ret = o2net_send_message(DLM_FINALIZE_RECO_MSG, dlm->key, in dlm_send_finalize_reco_message()
2863 dlm->key, nodenum); in dlm_send_finalize_reco_message()
2876 if (stage == 1) { in dlm_send_finalize_reco_message()
2878 iter.curnode = -1; in dlm_send_finalize_reco_message()
2890 struct dlm_finalize_reco *fr = (struct dlm_finalize_reco *)msg->buf; in dlm_finalize_reco_handler()
2891 int stage = 1; in dlm_finalize_reco_handler()
2897 if (fr->flags & DLM_FINALIZE_STAGE2) in dlm_finalize_reco_handler()
2901 "node %u (%u:%u)\n", dlm->name, fr->node_idx, stage, in dlm_finalize_reco_handler()
2902 fr->dead_node, dlm->reco.dead_node, dlm->reco.new_master); in dlm_finalize_reco_handler()
2904 spin_lock(&dlm->spinlock); in dlm_finalize_reco_handler()
2906 if (dlm->reco.new_master != fr->node_idx) { in dlm_finalize_reco_handler()
2909 fr->node_idx, dlm->reco.new_master, fr->dead_node); in dlm_finalize_reco_handler()
2912 if (dlm->reco.dead_node != fr->dead_node) { in dlm_finalize_reco_handler()
2915 fr->node_idx, fr->dead_node, dlm->reco.dead_node); in dlm_finalize_reco_handler()
2920 case 1: in dlm_finalize_reco_handler()
2921 dlm_finish_local_lockres_recovery(dlm, fr->dead_node, fr->node_idx); in dlm_finalize_reco_handler()
2922 if (dlm->reco.state & DLM_RECO_STATE_FINALIZE) { in dlm_finalize_reco_handler()
2926 dlm->name, fr->node_idx, fr->dead_node); in dlm_finalize_reco_handler()
2930 dlm->reco.state |= DLM_RECO_STATE_FINALIZE; in dlm_finalize_reco_handler()
2931 spin_unlock(&dlm->spinlock); in dlm_finalize_reco_handler()
2934 if (!(dlm->reco.state & DLM_RECO_STATE_FINALIZE)) { in dlm_finalize_reco_handler()
2938 dlm->name, fr->node_idx, fr->dead_node); in dlm_finalize_reco_handler()
2942 dlm->reco.state &= ~DLM_RECO_STATE_FINALIZE; in dlm_finalize_reco_handler()
2944 spin_unlock(&dlm->spinlock); in dlm_finalize_reco_handler()
2950 dlm->name, fr->node_idx, dlm->reco.dead_node, dlm->reco.new_master); in dlm_finalize_reco_handler()