Lines Matching refs:dlm

40 static void dlm_do_local_recovery_cleanup(struct dlm_ctxt *dlm, u8 dead_node);
43 static int dlm_do_recovery(struct dlm_ctxt *dlm);
45 static int dlm_pick_recovery_master(struct dlm_ctxt *dlm);
46 static int dlm_remaster_locks(struct dlm_ctxt *dlm, u8 dead_node);
47 static int dlm_init_recovery_area(struct dlm_ctxt *dlm, u8 dead_node);
48 static int dlm_request_all_locks(struct dlm_ctxt *dlm,
50 static void dlm_destroy_recovery_area(struct dlm_ctxt *dlm);
57 static int dlm_send_mig_lockres_msg(struct dlm_ctxt *dlm,
62 static int dlm_process_recovery_data(struct dlm_ctxt *dlm,
65 static int dlm_send_finalize_reco_message(struct dlm_ctxt *dlm);
66 static int dlm_send_all_done_msg(struct dlm_ctxt *dlm,
68 static int dlm_send_begin_reco_message(struct dlm_ctxt *dlm, u8 dead_node);
69 static void dlm_move_reco_locks_to_list(struct dlm_ctxt *dlm,
71 static void dlm_finish_local_lockres_recovery(struct dlm_ctxt *dlm,
79 static int dlm_lockres_master_requery(struct dlm_ctxt *dlm,
102 static inline void dlm_set_reco_dead_node(struct dlm_ctxt *dlm,
105 assert_spin_locked(&dlm->spinlock);
106 if (dlm->reco.dead_node != dead_node)
108 dlm->name, dlm->reco.dead_node, dead_node);
109 dlm->reco.dead_node = dead_node;
112 static inline void dlm_set_reco_master(struct dlm_ctxt *dlm,
115 assert_spin_locked(&dlm->spinlock);
117 dlm->name, dlm->reco.new_master, master);
118 dlm->reco.new_master = master;
121 static inline void __dlm_reset_recovery(struct dlm_ctxt *dlm)
123 assert_spin_locked(&dlm->spinlock);
124 clear_bit(dlm->reco.dead_node, dlm->recovery_map);
125 dlm_set_reco_dead_node(dlm, O2NM_INVALID_NODE_NUM);
126 dlm_set_reco_master(dlm, O2NM_INVALID_NODE_NUM);
129 static inline void dlm_reset_recovery(struct dlm_ctxt *dlm)
131 spin_lock(&dlm->spinlock);
132 __dlm_reset_recovery(dlm);
133 spin_unlock(&dlm->spinlock);
139 struct dlm_ctxt *dlm =
146 spin_lock(&dlm->work_lock);
147 list_splice_init(&dlm->work_list, &tmp_list);
148 spin_unlock(&dlm->work_lock);
153 mlog(0, "%s: work thread has %d work items\n", dlm->name, tot);
159 /* already have ref on dlm to avoid having
161 BUG_ON(item->dlm != dlm);
167 dlm_put(dlm);
176 void dlm_kick_recovery_thread(struct dlm_ctxt *dlm)
184 wake_up(&dlm->dlm_reco_thread_wq);
188 int dlm_launch_recovery_thread(struct dlm_ctxt *dlm)
190 mlog(0, "starting dlm recovery thread...\n");
192 dlm->dlm_reco_thread_task = kthread_run(dlm_recovery_thread, dlm,
193 "dlm_reco-%s", dlm->name);
194 if (IS_ERR(dlm->dlm_reco_thread_task)) {
195 mlog_errno(PTR_ERR(dlm->dlm_reco_thread_task));
196 dlm->dlm_reco_thread_task = NULL;
203 void dlm_complete_recovery_thread(struct dlm_ctxt *dlm)
205 if (dlm->dlm_reco_thread_task) {
206 mlog(0, "waiting for dlm recovery thread to exit\n");
207 kthread_stop(dlm->dlm_reco_thread_task);
208 dlm->dlm_reco_thread_task = NULL;
237 static void dlm_print_reco_node_status(struct dlm_ctxt *dlm)
243 dlm->name, task_pid_nr(dlm->dlm_reco_thread_task),
244 dlm->reco.state & DLM_RECO_STATE_ACTIVE ? "ACTIVE" : "inactive",
245 dlm->reco.dead_node, dlm->reco.new_master);
247 list_for_each_entry(ndata, &dlm->reco.node_data, list) {
276 dlm->name, ndata->node_num, st);
278 list_for_each_entry(res, &dlm->reco.resources, recovering) {
280 dlm->name, res->lockname.len, res->lockname.name);
289 struct dlm_ctxt *dlm = data;
292 mlog(0, "dlm thread running for %s...\n", dlm->name);
295 if (dlm_domain_fully_joined(dlm)) {
296 status = dlm_do_recovery(dlm);
305 wait_event_interruptible_timeout(dlm->dlm_reco_thread_wq,
315 static int dlm_reco_master_ready(struct dlm_ctxt *dlm)
318 spin_lock(&dlm->spinlock);
319 ready = (dlm->reco.new_master != O2NM_INVALID_NODE_NUM);
320 spin_unlock(&dlm->spinlock);
326 int dlm_is_node_dead(struct dlm_ctxt *dlm, u8 node)
329 spin_lock(&dlm->spinlock);
330 dead = !test_bit(node, dlm->domain_map);
331 spin_unlock(&dlm->spinlock);
337 static int dlm_is_node_recovered(struct dlm_ctxt *dlm, u8 node)
340 spin_lock(&dlm->spinlock);
341 recovered = !test_bit(node, dlm->recovery_map);
342 spin_unlock(&dlm->spinlock);
347 void dlm_wait_for_node_death(struct dlm_ctxt *dlm, u8 node, int timeout)
349 if (dlm_is_node_dead(dlm, node))
353 "domain %s\n", node, dlm->name);
356 wait_event_timeout(dlm->dlm_reco_thread_wq,
357 dlm_is_node_dead(dlm, node),
360 wait_event(dlm->dlm_reco_thread_wq,
361 dlm_is_node_dead(dlm, node));
364 void dlm_wait_for_node_recovery(struct dlm_ctxt *dlm, u8 node, int timeout)
366 if (dlm_is_node_recovered(dlm, node))
370 "domain %s\n", node, dlm->name);
373 wait_event_timeout(dlm->dlm_reco_thread_wq,
374 dlm_is_node_recovered(dlm, node),
377 wait_event(dlm->dlm_reco_thread_wq,
378 dlm_is_node_recovered(dlm, node));
382 * block on the dlm->reco.event when recovery is in progress.
383 * the dlm recovery thread will set this state when it begins
387 static int dlm_in_recovery(struct dlm_ctxt *dlm)
390 spin_lock(&dlm->spinlock);
391 in_recovery = !!(dlm->reco.state & DLM_RECO_STATE_ACTIVE);
392 spin_unlock(&dlm->spinlock);
397 void dlm_wait_for_recovery(struct dlm_ctxt *dlm)
399 if (dlm_in_recovery(dlm)) {
402 dlm->name, task_pid_nr(dlm->dlm_reco_thread_task),
403 dlm->reco.state, dlm->reco.new_master,
404 dlm->reco.dead_node);
406 wait_event(dlm->reco.event, !dlm_in_recovery(dlm));
409 static void dlm_begin_recovery(struct dlm_ctxt *dlm)
411 assert_spin_locked(&dlm->spinlock);
412 BUG_ON(dlm->reco.state & DLM_RECO_STATE_ACTIVE);
414 dlm->name, dlm->reco.dead_node);
415 dlm->reco.state |= DLM_RECO_STATE_ACTIVE;
418 static void dlm_end_recovery(struct dlm_ctxt *dlm)
420 spin_lock(&dlm->spinlock);
421 BUG_ON(!(dlm->reco.state & DLM_RECO_STATE_ACTIVE));
422 dlm->reco.state &= ~DLM_RECO_STATE_ACTIVE;
423 spin_unlock(&dlm->spinlock);
424 printk(KERN_NOTICE "o2dlm: End recovery on domain %s\n", dlm->name);
425 wake_up(&dlm->reco.event);
428 static void dlm_print_recovery_master(struct dlm_ctxt *dlm)
431 "dead node %u in domain %s\n", dlm->reco.new_master,
432 (dlm->node_num == dlm->reco.new_master ? "me" : "he"),
433 dlm->reco.dead_node, dlm->name);
436 static int dlm_do_recovery(struct dlm_ctxt *dlm)
441 spin_lock(&dlm->spinlock);
443 if (dlm->migrate_done) {
445 "lock resources\n", dlm->name);
446 spin_unlock(&dlm->spinlock);
451 if (dlm->reco.new_master != O2NM_INVALID_NODE_NUM &&
452 test_bit(dlm->reco.new_master, dlm->recovery_map)) {
454 dlm->reco.new_master, dlm->reco.dead_node);
456 dlm_set_reco_master(dlm, O2NM_INVALID_NODE_NUM);
460 if (dlm->reco.dead_node == O2NM_INVALID_NODE_NUM) {
463 bit = find_next_bit (dlm->recovery_map, O2NM_MAX_NODES, 0);
465 dlm_set_reco_dead_node(dlm, O2NM_INVALID_NODE_NUM);
467 dlm_set_reco_dead_node(dlm, bit);
468 } else if (!test_bit(dlm->reco.dead_node, dlm->recovery_map)) {
471 dlm->reco.dead_node);
472 dlm_set_reco_dead_node(dlm, O2NM_INVALID_NODE_NUM);
475 if (dlm->reco.dead_node == O2NM_INVALID_NODE_NUM) {
477 spin_unlock(&dlm->spinlock);
482 dlm->name, task_pid_nr(dlm->dlm_reco_thread_task),
483 dlm->reco.dead_node);
487 dlm_begin_recovery(dlm);
489 spin_unlock(&dlm->spinlock);
491 if (dlm->reco.new_master == dlm->node_num)
494 if (dlm->reco.new_master == O2NM_INVALID_NODE_NUM) {
499 ret = dlm_pick_recovery_master(dlm);
507 dlm_print_recovery_master(dlm);
512 dlm_end_recovery(dlm);
518 dlm_print_recovery_master(dlm);
520 status = dlm_remaster_locks(dlm, dlm->reco.dead_node);
524 "retrying.\n", dlm->name, status, dlm->reco.dead_node);
531 dlm->name, dlm->reco.dead_node, dlm->node_num);
532 spin_lock(&dlm->spinlock);
533 __dlm_reset_recovery(dlm);
534 dlm->reco.state &= ~DLM_RECO_STATE_FINALIZE;
535 spin_unlock(&dlm->spinlock);
537 dlm_end_recovery(dlm);
543 static int dlm_remaster_locks(struct dlm_ctxt *dlm, u8 dead_node)
554 status = dlm_init_recovery_area(dlm, dead_node);
557 "retrying\n", dlm->name);
564 list_for_each_entry(ndata, &dlm->reco.node_data, list) {
568 mlog(0, "%s: Requesting lock info from node %u\n", dlm->name,
571 if (ndata->node_num == dlm->node_num) {
577 status = dlm_request_all_locks(dlm, ndata->node_num,
587 wait_event_timeout(dlm->dlm_reco_thread_wq,
588 dlm_is_node_dead(dlm,
593 dlm_is_node_dead(dlm, ndata->node_num) ?
600 dlm->name, ndata->node_num,
641 mlog(0, "%s: Done requesting all lock info\n", dlm->name);
651 list_for_each_entry(ndata, &dlm->reco.node_data, list) {
671 dlm->name, ndata->node_num,
678 dlm->name, ndata->node_num);
682 dlm->name, ndata->node_num);
697 spin_lock(&dlm->spinlock);
698 dlm->reco.state |= DLM_RECO_STATE_FINALIZE;
699 spin_unlock(&dlm->spinlock);
705 ret = dlm_send_finalize_reco_message(dlm);
709 spin_lock(&dlm->spinlock);
710 dlm_finish_local_lockres_recovery(dlm, dead_node,
711 dlm->node_num);
712 spin_unlock(&dlm->spinlock);
716 "dead=%u, this=%u, new=%u\n", dlm->name,
717 jiffies, dlm->reco.dead_node,
718 dlm->node_num, dlm->reco.new_master);
722 dlm_kick_thread(dlm, NULL);
727 wait_event_interruptible_timeout(dlm->dlm_reco_thread_wq,
734 dlm_destroy_recovery_area(dlm);
739 static int dlm_init_recovery_area(struct dlm_ctxt *dlm, u8 dead_node)
744 spin_lock(&dlm->spinlock);
745 memcpy(dlm->reco.node_map, dlm->domain_map, sizeof(dlm->domain_map));
748 spin_unlock(&dlm->spinlock);
751 num = find_next_bit (dlm->reco.node_map, O2NM_MAX_NODES, num);
759 dlm_destroy_recovery_area(dlm);
765 list_add_tail(&ndata->list, &dlm->reco.node_data);
773 static void dlm_destroy_recovery_area(struct dlm_ctxt *dlm)
779 list_splice_init(&dlm->reco.node_data, &tmplist);
788 static int dlm_request_all_locks(struct dlm_ctxt *dlm, u8 request_from,
802 lr.node_idx = dlm->node_num;
806 ret = o2net_send_message(DLM_LOCK_REQUEST_MSG, dlm->key,
812 "to recover dead node %u\n", dlm->name, ret,
825 struct dlm_ctxt *dlm = data;
830 if (!dlm_grab(dlm))
833 if (lr->dead_node != dlm->reco.dead_node) {
835 "dead_node is %u\n", dlm->name, lr->node_idx,
836 lr->dead_node, dlm->reco.dead_node);
837 dlm_print_reco_node_status(dlm);
839 dlm_put(dlm);
842 BUG_ON(lr->dead_node != dlm->reco.dead_node);
846 dlm_put(dlm);
854 dlm_put(dlm);
859 dlm_grab(dlm); /* get an extra ref for the work item */
860 dlm_init_work_item(dlm, item, dlm_request_all_locks_worker, buf);
863 spin_lock(&dlm->work_lock);
864 list_add_tail(&item->list, &dlm->work_list);
865 spin_unlock(&dlm->work_lock);
866 queue_work(dlm->dlm_worker, &dlm->dispatched_work);
868 dlm_put(dlm);
876 struct dlm_ctxt *dlm;
882 dlm = item->dlm;
888 dlm->name, dead_node, reco_master);
890 if (dead_node != dlm->reco.dead_node ||
891 reco_master != dlm->reco.new_master) {
894 if (dlm->reco.new_master == O2NM_INVALID_NODE_NUM) {
897 " current=(dead=%u,mas=%u)\n", dlm->name,
899 dlm->reco.dead_node, dlm->reco.new_master);
903 dlm->name, dlm->reco.dead_node,
904 dlm->reco.new_master, dead_node, reco_master);
910 * dlm->reco.resources list. now move items from that list
915 dlm_move_reco_locks_to_list(dlm, &resources, dead_node);
917 /* now we can begin blasting lockreses without the dlm lock */
922 ret = dlm_send_one_lockres(dlm, res, mres, reco_master,
926 "recovery state for dead node %u, ret=%d\n", dlm->name,
934 spin_lock(&dlm->spinlock);
935 list_splice_init(&resources, &dlm->reco.resources);
936 spin_unlock(&dlm->spinlock);
939 ret = dlm_send_all_done_msg(dlm, dead_node, reco_master);
943 dlm->name, reco_master, dead_node, ret);
951 static int dlm_send_all_done_msg(struct dlm_ctxt *dlm, u8 dead_node, u8 send_to)
957 done_msg.node_idx = dlm->node_num;
963 ret = o2net_send_message(DLM_RECO_DATA_DONE_MSG, dlm->key, &done_msg,
967 "to recover dead node %u\n", dlm->name, ret, send_to,
981 struct dlm_ctxt *dlm = data;
986 if (!dlm_grab(dlm))
991 dlm->reco.dead_node, done->node_idx, dlm->node_num);
993 mlog_bug_on_msg((done->dead_node != dlm->reco.dead_node),
996 dlm->reco.dead_node, done->node_idx, dlm->node_num);
999 list_for_each_entry(ndata, &dlm->reco.node_data, list) {
1032 dlm_kick_recovery_thread(dlm);
1037 dlm_put(dlm);
1043 static void dlm_move_reco_locks_to_list(struct dlm_ctxt *dlm,
1050 spin_lock(&dlm->spinlock);
1051 list_for_each_entry_safe(res, next, &dlm->reco.resources, recovering) {
1062 dead_node, dlm->name);
1086 spin_unlock(&dlm->spinlock);
1104 static int dlm_send_mig_lockres_msg(struct dlm_ctxt *dlm,
1127 dlm->name, res->lockname.len, res->lockname.name,
1132 ret = o2net_send_message(DLM_MIG_LOCKRES_MSG, dlm->key, mres,
1139 "node %u (%s)\n", dlm->name, mres->lockname_len,
1240 static void dlm_add_dummy_lock(struct dlm_ctxt *dlm,
1250 dummy.ml.node = dlm->node_num;
1254 static inline int dlm_is_dummy_lock(struct dlm_ctxt *dlm,
1269 int dlm_send_one_lockres(struct dlm_ctxt *dlm, struct dlm_lock_resource *res,
1307 ret = dlm_send_mig_lockres_msg(dlm, mres, send_to,
1316 dlm->name, res->lockname.len, res->lockname.name,
1319 dlm_add_dummy_lock(dlm, mres);
1322 ret = dlm_send_mig_lockres_msg(dlm, mres, send_to, res, total_locks);
1329 dlm->name, ret);
1333 "lockres %.*s\n", dlm->name, send_to,
1357 struct dlm_ctxt *dlm = data;
1368 if (!dlm_grab(dlm))
1371 if (!dlm_joined(dlm)) {
1374 dlm->name, mres->lockname_len,
1376 dlm_put(dlm);
1404 spin_lock(&dlm->spinlock);
1405 res = __dlm_lookup_lockres_full(dlm, mres->lockname, mres->lockname_len,
1414 " ref!\n", dlm->name,
1418 spin_unlock(&dlm->spinlock);
1439 spin_unlock(&dlm->spinlock);
1446 spin_unlock(&dlm->spinlock);
1448 spin_unlock(&dlm->spinlock);
1451 res = dlm_new_lockres(dlm, mres->lockname, mres->lockname_len);
1465 spin_lock(&dlm->spinlock);
1466 __dlm_insert_lockres(dlm, res);
1467 spin_unlock(&dlm->spinlock);
1500 dlm_lockres_grab_inflight_ref(dlm, res);
1510 dlm_change_lockres_owner(dlm, res, dlm->node_num);
1515 dlm_grab(dlm); /* get an extra ref for the work item */
1517 dlm_init_work_item(dlm, item, dlm_mig_lockres_worker, buf);
1521 spin_lock(&dlm->work_lock);
1522 list_add_tail(&item->list, &dlm->work_list);
1523 spin_unlock(&dlm->work_lock);
1524 queue_work(dlm->dlm_worker, &dlm->dispatched_work);
1531 dlm_put(dlm);
1544 struct dlm_ctxt *dlm;
1551 dlm = item->dlm;
1562 ret = dlm_lockres_master_requery(dlm, res, &real_master);
1574 dlm_lockres_drop_inflight_ref(dlm, res);
1585 ret = dlm_process_recovery_data(dlm, res, mres);
1593 ret = dlm_finish_migration(dlm, res, mres->master);
1610 static int dlm_lockres_master_requery(struct dlm_ctxt *dlm,
1643 spin_lock(&dlm->spinlock);
1644 dlm_node_iter_init(dlm->domain_map, &iter);
1645 spin_unlock(&dlm->spinlock);
1649 if (nodenum == dlm->node_num)
1651 ret = dlm_do_master_requery(dlm, res, nodenum, real_master);
1668 int dlm_do_master_requery(struct dlm_ctxt *dlm, struct dlm_lock_resource *res,
1676 req.node_idx = dlm->node_num;
1681 ret = o2net_send_message(DLM_MASTER_REQUERY_MSG, dlm->key,
1686 dlm->key, nodenum);
1709 struct dlm_ctxt *dlm = data;
1717 if (!dlm_grab(dlm)) {
1725 spin_lock(&dlm->spinlock);
1726 res = __dlm_lookup_lockres(dlm, req->name, req->namelen, hash);
1730 if (master == dlm->node_num) {
1731 int ret = dlm_dispatch_assert_master(dlm, res,
1737 spin_unlock(&dlm->spinlock);
1738 dlm_put(dlm);
1743 __dlm_lockres_grab_inflight_worker(dlm, res);
1752 spin_unlock(&dlm->spinlock);
1755 dlm_put(dlm);
1796 static int dlm_process_recovery_data(struct dlm_ctxt *dlm,
1815 if (dlm_is_dummy_lock(dlm, ml, &from)) {
1819 dlm->name, mres->lockname_len, mres->lockname,
1822 dlm_lockres_set_refmap_bit(dlm, res, from);
1836 if (ml->node == dlm->node_num) {
1964 "lvb! type=%d\n", dlm->name,
2004 "exists on this lockres!\n", dlm->name,
2033 "setting refmap bit\n", dlm->name,
2035 dlm_lockres_set_refmap_bit(dlm, res, ml->node);
2044 dlm_lockres_drop_inflight_ref(dlm, res);
2053 void dlm_move_lockres_to_recovery_list(struct dlm_ctxt *dlm,
2060 assert_spin_locked(&dlm->spinlock);
2066 dlm->name, res->lockname.len, res->lockname.name);
2072 list_add_tail(&res->recovering, &dlm->reco.resources);
2137 static void dlm_finish_local_lockres_recovery(struct dlm_ctxt *dlm,
2144 assert_spin_locked(&dlm->spinlock);
2146 list_for_each_entry_safe(res, next, &dlm->reco.resources, recovering) {
2149 dlm->name, res->lockname.len, res->lockname.name,
2155 dlm_change_lockres_owner(dlm, res, new_master);
2158 __dlm_dirty_lockres(dlm, res);
2170 bucket = dlm_lockres_hash(dlm, i);
2183 res->owner != dlm->node_num)
2194 dlm->name, res->lockname.len, res->lockname.name,
2197 dlm_change_lockres_owner(dlm, res, new_master);
2200 __dlm_dirty_lockres(dlm, res);
2218 static void dlm_revalidate_lvb(struct dlm_ctxt *dlm,
2227 assert_spin_locked(&dlm->spinlock);
2230 if (res->owner == dlm->node_num)
2237 search_node = dlm->node_num;
2261 static void dlm_free_dead_locks(struct dlm_ctxt *dlm,
2271 assert_spin_locked(&dlm->spinlock);
2308 "dropping ref from lockres\n", dlm->name,
2312 "but ref was not set\n", dlm->name,
2317 dlm_lockres_clear_refmap_bit(dlm, res, dead_node);
2320 "no locks and had not purged before dying\n", dlm->name,
2322 dlm_lockres_clear_refmap_bit(dlm, res, dead_node);
2326 __dlm_dirty_lockres(dlm, res);
2329 static void dlm_do_local_recovery_cleanup(struct dlm_ctxt *dlm, u8 dead_node)
2339 dlm_clean_master_list(dlm, dead_node);
2351 * dead node. once recovery finishes, the dlm thread
2356 bucket = dlm_lockres_hash(dlm, i);
2368 dead_node, dlm->name);
2382 __dlm_do_purge_lockres(dlm, res);
2387 } else if (res->owner == dlm->node_num)
2388 dlm_lockres_clear_refmap_bit(dlm, res, dead_node);
2394 dlm_revalidate_lvb(dlm, res, dead_node);
2401 dlm->name, res->lockname.len,
2404 __dlm_do_purge_lockres(dlm, res);
2410 dlm_move_lockres_to_recovery_list(dlm, res);
2411 } else if (res->owner == dlm->node_num) {
2412 dlm_free_dead_locks(dlm, res, dead_node);
2413 __dlm_lockres_calc_usage(dlm, res);
2418 dlm->name, res->lockname.len,
2420 dlm_lockres_clear_refmap_bit(dlm, res, dead_node);
2429 static void __dlm_hb_node_down(struct dlm_ctxt *dlm, int idx)
2431 assert_spin_locked(&dlm->spinlock);
2433 if (dlm->reco.new_master == idx) {
2435 dlm->name, idx);
2436 if (dlm->reco.state & DLM_RECO_STATE_FINALIZE) {
2441 "finalize1 state, clearing\n", dlm->name, idx);
2442 dlm->reco.state &= ~DLM_RECO_STATE_FINALIZE;
2443 __dlm_reset_recovery(dlm);
2448 if (dlm->joining_node == idx) {
2450 __dlm_set_joining_node(dlm, DLM_LOCK_RES_OWNER_UNKNOWN);
2454 if (!test_bit(idx, dlm->live_nodes_map)) {
2457 dlm->name, idx);
2462 if (!test_bit(idx, dlm->domain_map)) {
2469 clear_bit(idx, dlm->live_nodes_map);
2472 if (!test_bit(idx, dlm->recovery_map))
2473 dlm_do_local_recovery_cleanup(dlm, idx);
2476 dlm_hb_event_notify_attached(dlm, idx, 0);
2479 clear_bit(idx, dlm->domain_map);
2480 clear_bit(idx, dlm->exit_domain_map);
2483 wake_up(&dlm->migration_wq);
2485 set_bit(idx, dlm->recovery_map);
2490 struct dlm_ctxt *dlm = data;
2492 if (!dlm_grab(dlm))
2496 * This will notify any dlm users that a node in our domain
2499 if (test_bit(idx, dlm->domain_map))
2500 dlm_fire_domain_eviction_callbacks(dlm, idx);
2502 spin_lock(&dlm->spinlock);
2503 __dlm_hb_node_down(dlm, idx);
2504 spin_unlock(&dlm->spinlock);
2506 dlm_put(dlm);
2511 struct dlm_ctxt *dlm = data;
2513 if (!dlm_grab(dlm))
2516 spin_lock(&dlm->spinlock);
2517 set_bit(idx, dlm->live_nodes_map);
2520 spin_unlock(&dlm->spinlock);
2522 dlm_put(dlm);
2527 struct dlm_ctxt *dlm = astdata;
2528 mlog(0, "ast for recovery lock fired!, this=%u, dlm=%s\n",
2529 dlm->node_num, dlm->name);
2533 struct dlm_ctxt *dlm = astdata;
2534 mlog(0, "bast for recovery lock fired!, this=%u, dlm=%s\n",
2535 dlm->node_num, dlm->name);
2549 * or b) dlm->reco.new_master gets set to some nodenum
2554 static int dlm_pick_recovery_master(struct dlm_ctxt *dlm)
2561 dlm->name, jiffies, dlm->reco.dead_node, dlm->node_num);
2565 ret = dlmlock(dlm, LKM_EXMODE, &lksb, LKM_NOQUEUE|LKM_RECOVERY,
2567 dlm_reco_ast, dlm, dlm_reco_bast);
2570 dlm->name, ret, lksb.status);
2573 mlog(0, "dlm=%s dlmlock says I got it (this=%u)\n",
2574 dlm->name, dlm->node_num);
2578 if (dlm_reco_master_ready(dlm)) {
2580 "do the recovery\n", dlm->name,
2581 dlm->reco.new_master);
2587 spin_lock(&dlm->spinlock);
2588 if (dlm->reco.dead_node == O2NM_INVALID_NODE_NUM) {
2591 "node got recovered already\n", dlm->name);
2592 if (dlm->reco.new_master != O2NM_INVALID_NODE_NUM) {
2595 dlm->name, dlm->reco.new_master);
2599 spin_unlock(&dlm->spinlock);
2606 "begin_reco now\n", dlm->name,
2607 dlm->reco.dead_node, dlm->node_num);
2608 status = dlm_send_begin_reco_message(dlm,
2609 dlm->reco.dead_node);
2614 spin_lock(&dlm->spinlock);
2615 dlm_set_reco_master(dlm, dlm->node_num);
2616 spin_unlock(&dlm->spinlock);
2621 ret = dlmunlock(dlm, &lksb, 0, dlm_reco_unlock_ast, dlm);
2624 ret = dlmunlock(dlm, &lksb, LKM_CANCEL, dlm_reco_unlock_ast, dlm);
2636 mlog(0, "dlm=%s dlmlock says another node got it (this=%u)\n",
2637 dlm->name, dlm->node_num);
2641 wait_event_timeout(dlm->dlm_reco_thread_wq,
2642 dlm_reco_master_ready(dlm),
2644 if (!dlm_reco_master_ready(dlm)) {
2646 dlm->name);
2651 dlm->name, dlm->reco.new_master, dlm->reco.dead_node);
2654 mlog(0, "dlm=%s dlmlock says master node died (this=%u)\n",
2655 dlm->name, dlm->node_num);
2662 "lksb.status=%s\n", dlm->name, dlm_errname(ret),
2664 res = dlm_lookup_lockres(dlm, DLM_RECOVERY_LOCK_NAME,
2678 static int dlm_send_begin_reco_message(struct dlm_ctxt *dlm, u8 dead_node)
2686 mlog(0, "%s: dead node is %u\n", dlm->name, dead_node);
2688 spin_lock(&dlm->spinlock);
2689 dlm_node_iter_init(dlm->domain_map, &iter);
2690 spin_unlock(&dlm->spinlock);
2695 br.node_idx = dlm->node_num;
2705 if (nodenum == dlm->node_num) {
2713 ret = o2net_send_message(DLM_BEGIN_RECO_MSG, dlm->key,
2722 "begin reco msg (%d)\n", dlm->name, nodenum, ret);
2734 "to complete, backoff for a bit\n", dlm->name,
2745 mlog(ML_ERROR, "begin reco of dlm %s to node %u "
2746 "returned %d\n", dlm->name, nodenum, ret);
2747 res = dlm_lookup_lockres(dlm, DLM_RECOVERY_LOCK_NAME,
2768 struct dlm_ctxt *dlm = data;
2772 if (!dlm_grab(dlm))
2775 spin_lock(&dlm->spinlock);
2776 if (dlm->reco.state & DLM_RECO_STATE_FINALIZE) {
2779 dlm->name, br->node_idx, br->dead_node,
2780 dlm->reco.dead_node, dlm->reco.new_master);
2781 spin_unlock(&dlm->spinlock);
2782 dlm_put(dlm);
2785 spin_unlock(&dlm->spinlock);
2788 dlm->name, br->node_idx, br->dead_node,
2789 dlm->reco.dead_node, dlm->reco.new_master);
2791 dlm_fire_domain_eviction_callbacks(dlm, br->dead_node);
2793 spin_lock(&dlm->spinlock);
2794 if (dlm->reco.new_master != O2NM_INVALID_NODE_NUM) {
2795 if (test_bit(dlm->reco.new_master, dlm->recovery_map)) {
2797 "to %u\n", dlm->name, dlm->reco.new_master,
2801 "to %u\n", dlm->name, dlm->reco.new_master,
2806 if (dlm->reco.dead_node != O2NM_INVALID_NODE_NUM) {
2808 "node %u changing it to %u\n", dlm->name,
2809 dlm->reco.dead_node, br->node_idx, br->dead_node);
2811 dlm_set_reco_master(dlm, br->node_idx);
2812 dlm_set_reco_dead_node(dlm, br->dead_node);
2813 if (!test_bit(br->dead_node, dlm->recovery_map)) {
2817 if (!test_bit(br->dead_node, dlm->domain_map) ||
2818 !test_bit(br->dead_node, dlm->live_nodes_map))
2824 set_bit(br->dead_node, dlm->domain_map);
2825 set_bit(br->dead_node, dlm->live_nodes_map);
2826 __dlm_hb_node_down(dlm, br->dead_node);
2828 spin_unlock(&dlm->spinlock);
2830 dlm_kick_recovery_thread(dlm);
2833 dlm->name, br->node_idx, br->dead_node,
2834 dlm->reco.dead_node, dlm->reco.new_master);
2836 dlm_put(dlm);
2841 static int dlm_send_finalize_reco_message(struct dlm_ctxt *dlm)
2851 "stage %d\n", dlm->name, dlm->reco.dead_node, stage);
2853 spin_lock(&dlm->spinlock);
2854 dlm_node_iter_init(dlm->domain_map, &iter);
2855 spin_unlock(&dlm->spinlock);
2859 fr.node_idx = dlm->node_num;
2860 fr.dead_node = dlm->reco.dead_node;
2865 if (nodenum == dlm->node_num)
2867 ret = o2net_send_message(DLM_FINALIZE_RECO_MSG, dlm->key,
2874 dlm->key, nodenum);
2900 struct dlm_ctxt *dlm = data;
2905 if (!dlm_grab(dlm))
2912 "node %u (%u:%u)\n", dlm->name, fr->node_idx, stage,
2913 fr->dead_node, dlm->reco.dead_node, dlm->reco.new_master);
2915 spin_lock(&dlm->spinlock);
2917 if (dlm->reco.new_master != fr->node_idx) {
2920 fr->node_idx, dlm->reco.new_master, fr->dead_node);
2923 if (dlm->reco.dead_node != fr->dead_node) {
2926 fr->node_idx, fr->dead_node, dlm->reco.dead_node);
2932 dlm_finish_local_lockres_recovery(dlm, fr->dead_node, fr->node_idx);
2933 if (dlm->reco.state & DLM_RECO_STATE_FINALIZE) {
2937 dlm->name, fr->node_idx, fr->dead_node);
2938 dlm_print_reco_node_status(dlm);
2941 dlm->reco.state |= DLM_RECO_STATE_FINALIZE;
2942 spin_unlock(&dlm->spinlock);
2945 if (!(dlm->reco.state & DLM_RECO_STATE_FINALIZE)) {
2949 dlm->name, fr->node_idx, fr->dead_node);
2950 dlm_print_reco_node_status(dlm);
2953 dlm->reco.state &= ~DLM_RECO_STATE_FINALIZE;
2954 __dlm_reset_recovery(dlm);
2955 spin_unlock(&dlm->spinlock);
2956 dlm_kick_recovery_thread(dlm);
2961 dlm->name, fr->node_idx, dlm->reco.dead_node, dlm->reco.new_master);
2963 dlm_put(dlm);