Lines Matching defs:dlm

38 static void dlm_do_local_recovery_cleanup(struct dlm_ctxt *dlm, u8 dead_node);
41 static int dlm_do_recovery(struct dlm_ctxt *dlm);
43 static int dlm_pick_recovery_master(struct dlm_ctxt *dlm);
44 static int dlm_remaster_locks(struct dlm_ctxt *dlm, u8 dead_node);
45 static int dlm_init_recovery_area(struct dlm_ctxt *dlm, u8 dead_node);
46 static int dlm_request_all_locks(struct dlm_ctxt *dlm,
48 static void dlm_destroy_recovery_area(struct dlm_ctxt *dlm);
55 static int dlm_send_mig_lockres_msg(struct dlm_ctxt *dlm,
60 static int dlm_process_recovery_data(struct dlm_ctxt *dlm,
63 static int dlm_send_finalize_reco_message(struct dlm_ctxt *dlm);
64 static int dlm_send_all_done_msg(struct dlm_ctxt *dlm,
66 static int dlm_send_begin_reco_message(struct dlm_ctxt *dlm, u8 dead_node);
67 static void dlm_move_reco_locks_to_list(struct dlm_ctxt *dlm,
69 static void dlm_finish_local_lockres_recovery(struct dlm_ctxt *dlm,
77 static int dlm_lockres_master_requery(struct dlm_ctxt *dlm,
100 static inline void dlm_set_reco_dead_node(struct dlm_ctxt *dlm,
103 assert_spin_locked(&dlm->spinlock);
104 if (dlm->reco.dead_node != dead_node)
106 dlm->name, dlm->reco.dead_node, dead_node);
107 dlm->reco.dead_node = dead_node;
110 static inline void dlm_set_reco_master(struct dlm_ctxt *dlm,
113 assert_spin_locked(&dlm->spinlock);
115 dlm->name, dlm->reco.new_master, master);
116 dlm->reco.new_master = master;
119 static inline void __dlm_reset_recovery(struct dlm_ctxt *dlm)
121 assert_spin_locked(&dlm->spinlock);
122 clear_bit(dlm->reco.dead_node, dlm->recovery_map);
123 dlm_set_reco_dead_node(dlm, O2NM_INVALID_NODE_NUM);
124 dlm_set_reco_master(dlm, O2NM_INVALID_NODE_NUM);
130 struct dlm_ctxt *dlm =
137 spin_lock(&dlm->work_lock);
138 list_splice_init(&dlm->work_list, &tmp_list);
139 spin_unlock(&dlm->work_lock);
144 mlog(0, "%s: work thread has %d work items\n", dlm->name, tot);
150 /* already have ref on dlm to avoid having
152 BUG_ON(item->dlm != dlm);
158 dlm_put(dlm);
167 void dlm_kick_recovery_thread(struct dlm_ctxt *dlm)
175 wake_up(&dlm->dlm_reco_thread_wq);
179 int dlm_launch_recovery_thread(struct dlm_ctxt *dlm)
181 mlog(0, "starting dlm recovery thread...\n");
183 dlm->dlm_reco_thread_task = kthread_run(dlm_recovery_thread, dlm,
184 "dlm_reco-%s", dlm->name);
185 if (IS_ERR(dlm->dlm_reco_thread_task)) {
186 mlog_errno(PTR_ERR(dlm->dlm_reco_thread_task));
187 dlm->dlm_reco_thread_task = NULL;
194 void dlm_complete_recovery_thread(struct dlm_ctxt *dlm)
196 if (dlm->dlm_reco_thread_task) {
197 mlog(0, "waiting for dlm recovery thread to exit\n");
198 kthread_stop(dlm->dlm_reco_thread_task);
199 dlm->dlm_reco_thread_task = NULL;
228 static void dlm_print_reco_node_status(struct dlm_ctxt *dlm)
234 dlm->name, task_pid_nr(dlm->dlm_reco_thread_task),
235 dlm->reco.state & DLM_RECO_STATE_ACTIVE ? "ACTIVE" : "inactive",
236 dlm->reco.dead_node, dlm->reco.new_master);
238 list_for_each_entry(ndata, &dlm->reco.node_data, list) {
267 dlm->name, ndata->node_num, st);
269 list_for_each_entry(res, &dlm->reco.resources, recovering) {
271 dlm->name, res->lockname.len, res->lockname.name);
280 struct dlm_ctxt *dlm = data;
283 mlog(0, "dlm thread running for %s...\n", dlm->name);
286 if (dlm_domain_fully_joined(dlm)) {
287 status = dlm_do_recovery(dlm);
296 wait_event_interruptible_timeout(dlm->dlm_reco_thread_wq,
306 static int dlm_reco_master_ready(struct dlm_ctxt *dlm)
309 spin_lock(&dlm->spinlock);
310 ready = (dlm->reco.new_master != O2NM_INVALID_NODE_NUM);
311 spin_unlock(&dlm->spinlock);
317 int dlm_is_node_dead(struct dlm_ctxt *dlm, u8 node)
320 spin_lock(&dlm->spinlock);
321 dead = !test_bit(node, dlm->domain_map);
322 spin_unlock(&dlm->spinlock);
328 static int dlm_is_node_recovered(struct dlm_ctxt *dlm, u8 node)
331 spin_lock(&dlm->spinlock);
332 recovered = !test_bit(node, dlm->recovery_map);
333 spin_unlock(&dlm->spinlock);
338 void dlm_wait_for_node_death(struct dlm_ctxt *dlm, u8 node, int timeout)
340 if (dlm_is_node_dead(dlm, node))
344 "domain %s\n", node, dlm->name);
347 wait_event_timeout(dlm->dlm_reco_thread_wq,
348 dlm_is_node_dead(dlm, node),
351 wait_event(dlm->dlm_reco_thread_wq,
352 dlm_is_node_dead(dlm, node));
355 void dlm_wait_for_node_recovery(struct dlm_ctxt *dlm, u8 node, int timeout)
357 if (dlm_is_node_recovered(dlm, node))
361 "domain %s\n", node, dlm->name);
364 wait_event_timeout(dlm->dlm_reco_thread_wq,
365 dlm_is_node_recovered(dlm, node),
368 wait_event(dlm->dlm_reco_thread_wq,
369 dlm_is_node_recovered(dlm, node));
373 * block on the dlm->reco.event when recovery is in progress.
374 * the dlm recovery thread will set this state when it begins
378 static int dlm_in_recovery(struct dlm_ctxt *dlm)
381 spin_lock(&dlm->spinlock);
382 in_recovery = !!(dlm->reco.state & DLM_RECO_STATE_ACTIVE);
383 spin_unlock(&dlm->spinlock);
388 void dlm_wait_for_recovery(struct dlm_ctxt *dlm)
390 if (dlm_in_recovery(dlm)) {
393 dlm->name, task_pid_nr(dlm->dlm_reco_thread_task),
394 dlm->reco.state, dlm->reco.new_master,
395 dlm->reco.dead_node);
397 wait_event(dlm->reco.event, !dlm_in_recovery(dlm));
400 static void dlm_begin_recovery(struct dlm_ctxt *dlm)
402 assert_spin_locked(&dlm->spinlock);
403 BUG_ON(dlm->reco.state & DLM_RECO_STATE_ACTIVE);
405 dlm->name, dlm->reco.dead_node);
406 dlm->reco.state |= DLM_RECO_STATE_ACTIVE;
409 static void dlm_end_recovery(struct dlm_ctxt *dlm)
411 spin_lock(&dlm->spinlock);
412 BUG_ON(!(dlm->reco.state & DLM_RECO_STATE_ACTIVE));
413 dlm->reco.state &= ~DLM_RECO_STATE_ACTIVE;
414 spin_unlock(&dlm->spinlock);
415 printk(KERN_NOTICE "o2dlm: End recovery on domain %s\n", dlm->name);
416 wake_up(&dlm->reco.event);
419 static void dlm_print_recovery_master(struct dlm_ctxt *dlm)
422 "dead node %u in domain %s\n", dlm->reco.new_master,
423 (dlm->node_num == dlm->reco.new_master ? "me" : "he"),
424 dlm->reco.dead_node, dlm->name);
427 static int dlm_do_recovery(struct dlm_ctxt *dlm)
432 spin_lock(&dlm->spinlock);
434 if (dlm->migrate_done) {
436 "lock resources\n", dlm->name);
437 spin_unlock(&dlm->spinlock);
442 if (dlm->reco.new_master != O2NM_INVALID_NODE_NUM &&
443 test_bit(dlm->reco.new_master, dlm->recovery_map)) {
445 dlm->reco.new_master, dlm->reco.dead_node);
447 dlm_set_reco_master(dlm, O2NM_INVALID_NODE_NUM);
451 if (dlm->reco.dead_node == O2NM_INVALID_NODE_NUM) {
454 bit = find_first_bit(dlm->recovery_map, O2NM_MAX_NODES);
456 dlm_set_reco_dead_node(dlm, O2NM_INVALID_NODE_NUM);
458 dlm_set_reco_dead_node(dlm, bit);
459 } else if (!test_bit(dlm->reco.dead_node, dlm->recovery_map)) {
462 dlm->reco.dead_node);
463 dlm_set_reco_dead_node(dlm, O2NM_INVALID_NODE_NUM);
466 if (dlm->reco.dead_node == O2NM_INVALID_NODE_NUM) {
468 spin_unlock(&dlm->spinlock);
473 dlm->name, task_pid_nr(dlm->dlm_reco_thread_task),
474 dlm->reco.dead_node);
478 dlm_begin_recovery(dlm);
480 spin_unlock(&dlm->spinlock);
482 if (dlm->reco.new_master == dlm->node_num)
485 if (dlm->reco.new_master == O2NM_INVALID_NODE_NUM) {
490 ret = dlm_pick_recovery_master(dlm);
498 dlm_print_recovery_master(dlm);
503 dlm_end_recovery(dlm);
509 dlm_print_recovery_master(dlm);
511 status = dlm_remaster_locks(dlm, dlm->reco.dead_node);
515 "retrying.\n", dlm->name, status, dlm->reco.dead_node);
522 dlm->name, dlm->reco.dead_node, dlm->node_num);
523 spin_lock(&dlm->spinlock);
524 __dlm_reset_recovery(dlm);
525 dlm->reco.state &= ~DLM_RECO_STATE_FINALIZE;
526 spin_unlock(&dlm->spinlock);
528 dlm_end_recovery(dlm);
534 static int dlm_remaster_locks(struct dlm_ctxt *dlm, u8 dead_node)
545 status = dlm_init_recovery_area(dlm, dead_node);
548 "retrying\n", dlm->name);
555 list_for_each_entry(ndata, &dlm->reco.node_data, list) {
559 mlog(0, "%s: Requesting lock info from node %u\n", dlm->name,
562 if (ndata->node_num == dlm->node_num) {
568 status = dlm_request_all_locks(dlm, ndata->node_num,
578 wait_event_timeout(dlm->dlm_reco_thread_wq,
579 dlm_is_node_dead(dlm,
584 dlm_is_node_dead(dlm, ndata->node_num) ?
591 dlm->name, ndata->node_num,
632 mlog(0, "%s: Done requesting all lock info\n", dlm->name);
642 list_for_each_entry(ndata, &dlm->reco.node_data, list) {
662 dlm->name, ndata->node_num,
669 dlm->name, ndata->node_num);
673 dlm->name, ndata->node_num);
688 spin_lock(&dlm->spinlock);
689 dlm->reco.state |= DLM_RECO_STATE_FINALIZE;
690 spin_unlock(&dlm->spinlock);
696 ret = dlm_send_finalize_reco_message(dlm);
700 spin_lock(&dlm->spinlock);
701 dlm_finish_local_lockres_recovery(dlm, dead_node,
702 dlm->node_num);
703 spin_unlock(&dlm->spinlock);
707 "dead=%u, this=%u, new=%u\n", dlm->name,
708 jiffies, dlm->reco.dead_node,
709 dlm->node_num, dlm->reco.new_master);
713 dlm_kick_thread(dlm, NULL);
718 wait_event_interruptible_timeout(dlm->dlm_reco_thread_wq,
725 dlm_destroy_recovery_area(dlm);
730 static int dlm_init_recovery_area(struct dlm_ctxt *dlm, u8 dead_node)
735 spin_lock(&dlm->spinlock);
736 bitmap_copy(dlm->reco.node_map, dlm->domain_map, O2NM_MAX_NODES);
739 spin_unlock(&dlm->spinlock);
742 num = find_next_bit (dlm->reco.node_map, O2NM_MAX_NODES, num);
750 dlm_destroy_recovery_area(dlm);
756 list_add_tail(&ndata->list, &dlm->reco.node_data);
764 static void dlm_destroy_recovery_area(struct dlm_ctxt *dlm)
770 list_splice_init(&dlm->reco.node_data, &tmplist);
779 static int dlm_request_all_locks(struct dlm_ctxt *dlm, u8 request_from,
793 lr.node_idx = dlm->node_num;
797 ret = o2net_send_message(DLM_LOCK_REQUEST_MSG, dlm->key,
803 "to recover dead node %u\n", dlm->name, ret,
816 struct dlm_ctxt *dlm = data;
821 if (!dlm_grab(dlm))
824 if (lr->dead_node != dlm->reco.dead_node) {
826 "dead_node is %u\n", dlm->name, lr->node_idx,
827 lr->dead_node, dlm->reco.dead_node);
828 dlm_print_reco_node_status(dlm);
830 dlm_put(dlm);
833 BUG_ON(lr->dead_node != dlm->reco.dead_node);
837 dlm_put(dlm);
845 dlm_put(dlm);
850 dlm_grab(dlm); /* get an extra ref for the work item */
851 dlm_init_work_item(dlm, item, dlm_request_all_locks_worker, buf);
854 spin_lock(&dlm->work_lock);
855 list_add_tail(&item->list, &dlm->work_list);
856 spin_unlock(&dlm->work_lock);
857 queue_work(dlm->dlm_worker, &dlm->dispatched_work);
859 dlm_put(dlm);
867 struct dlm_ctxt *dlm;
873 dlm = item->dlm;
879 dlm->name, dead_node, reco_master);
881 if (dead_node != dlm->reco.dead_node ||
882 reco_master != dlm->reco.new_master) {
885 if (dlm->reco.new_master == O2NM_INVALID_NODE_NUM) {
888 " current=(dead=%u,mas=%u)\n", dlm->name,
890 dlm->reco.dead_node, dlm->reco.new_master);
894 dlm->name, dlm->reco.dead_node,
895 dlm->reco.new_master, dead_node, reco_master);
901 * dlm->reco.resources list. now move items from that list
906 dlm_move_reco_locks_to_list(dlm, &resources, dead_node);
908 /* now we can begin blasting lockreses without the dlm lock */
913 ret = dlm_send_one_lockres(dlm, res, mres, reco_master,
917 "recovery state for dead node %u, ret=%d\n", dlm->name,
925 spin_lock(&dlm->spinlock);
926 list_splice_init(&resources, &dlm->reco.resources);
927 spin_unlock(&dlm->spinlock);
930 ret = dlm_send_all_done_msg(dlm, dead_node, reco_master);
934 dlm->name, reco_master, dead_node, ret);
942 static int dlm_send_all_done_msg(struct dlm_ctxt *dlm, u8 dead_node, u8 send_to)
948 done_msg.node_idx = dlm->node_num;
954 ret = o2net_send_message(DLM_RECO_DATA_DONE_MSG, dlm->key, &done_msg,
958 "to recover dead node %u\n", dlm->name, ret, send_to,
972 struct dlm_ctxt *dlm = data;
977 if (!dlm_grab(dlm))
982 dlm->reco.dead_node, done->node_idx, dlm->node_num);
984 mlog_bug_on_msg((done->dead_node != dlm->reco.dead_node),
987 dlm->reco.dead_node, done->node_idx, dlm->node_num);
990 list_for_each_entry(ndata, &dlm->reco.node_data, list) {
1023 dlm_kick_recovery_thread(dlm);
1028 dlm_put(dlm);
1034 static void dlm_move_reco_locks_to_list(struct dlm_ctxt *dlm,
1041 spin_lock(&dlm->spinlock);
1042 list_for_each_entry_safe(res, next, &dlm->reco.resources, recovering) {
1053 dead_node, dlm->name);
1077 spin_unlock(&dlm->spinlock);
1095 static int dlm_send_mig_lockres_msg(struct dlm_ctxt *dlm,
1118 dlm->name, res->lockname.len, res->lockname.name,
1123 ret = o2net_send_message(DLM_MIG_LOCKRES_MSG, dlm->key, mres,
1130 "node %u (%s)\n", dlm->name, mres->lockname_len,
1231 static void dlm_add_dummy_lock(struct dlm_ctxt *dlm,
1241 dummy.ml.node = dlm->node_num;
1245 static inline int dlm_is_dummy_lock(struct dlm_ctxt *dlm,
1260 int dlm_send_one_lockres(struct dlm_ctxt *dlm, struct dlm_lock_resource *res,
1298 ret = dlm_send_mig_lockres_msg(dlm, mres, send_to,
1307 dlm->name, res->lockname.len, res->lockname.name,
1310 dlm_add_dummy_lock(dlm, mres);
1313 ret = dlm_send_mig_lockres_msg(dlm, mres, send_to, res, total_locks);
1320 dlm->name, ret);
1324 "lockres %.*s\n", dlm->name, send_to,
1348 struct dlm_ctxt *dlm = data;
1359 if (!dlm_grab(dlm))
1362 if (!dlm_joined(dlm)) {
1365 dlm->name, mres->lockname_len,
1367 dlm_put(dlm);
1395 spin_lock(&dlm->spinlock);
1396 res = __dlm_lookup_lockres_full(dlm, mres->lockname, mres->lockname_len,
1405 " ref!\n", dlm->name,
1409 spin_unlock(&dlm->spinlock);
1430 spin_unlock(&dlm->spinlock);
1437 spin_unlock(&dlm->spinlock);
1439 spin_unlock(&dlm->spinlock);
1442 res = dlm_new_lockres(dlm, mres->lockname, mres->lockname_len);
1456 spin_lock(&dlm->spinlock);
1457 __dlm_insert_lockres(dlm, res);
1458 spin_unlock(&dlm->spinlock);
1491 dlm_lockres_grab_inflight_ref(dlm, res);
1501 dlm_change_lockres_owner(dlm, res, dlm->node_num);
1506 dlm_grab(dlm); /* get an extra ref for the work item */
1508 dlm_init_work_item(dlm, item, dlm_mig_lockres_worker, buf);
1512 spin_lock(&dlm->work_lock);
1513 list_add_tail(&item->list, &dlm->work_list);
1514 spin_unlock(&dlm->work_lock);
1515 queue_work(dlm->dlm_worker, &dlm->dispatched_work);
1522 dlm_put(dlm);
1535 struct dlm_ctxt *dlm;
1542 dlm = item->dlm;
1553 ret = dlm_lockres_master_requery(dlm, res, &real_master);
1565 dlm_lockres_drop_inflight_ref(dlm, res);
1576 ret = dlm_process_recovery_data(dlm, res, mres);
1584 ret = dlm_finish_migration(dlm, res, mres->master);
1601 static int dlm_lockres_master_requery(struct dlm_ctxt *dlm,
1634 spin_lock(&dlm->spinlock);
1635 dlm_node_iter_init(dlm->domain_map, &iter);
1636 spin_unlock(&dlm->spinlock);
1640 if (nodenum == dlm->node_num)
1642 ret = dlm_do_master_requery(dlm, res, nodenum, real_master);
1659 int dlm_do_master_requery(struct dlm_ctxt *dlm, struct dlm_lock_resource *res,
1667 req.node_idx = dlm->node_num;
1672 ret = o2net_send_message(DLM_MASTER_REQUERY_MSG, dlm->key,
1677 dlm->key, nodenum);
1700 struct dlm_ctxt *dlm = data;
1708 if (!dlm_grab(dlm)) {
1716 spin_lock(&dlm->spinlock);
1717 res = __dlm_lookup_lockres(dlm, req->name, req->namelen, hash);
1721 if (master == dlm->node_num) {
1722 int ret = dlm_dispatch_assert_master(dlm, res,
1728 spin_unlock(&dlm->spinlock);
1729 dlm_put(dlm);
1734 __dlm_lockres_grab_inflight_worker(dlm, res);
1743 spin_unlock(&dlm->spinlock);
1746 dlm_put(dlm);
1787 static int dlm_process_recovery_data(struct dlm_ctxt *dlm,
1806 if (dlm_is_dummy_lock(dlm, ml, &from)) {
1810 dlm->name, mres->lockname_len, mres->lockname,
1813 dlm_lockres_set_refmap_bit(dlm, res, from);
1827 if (ml->node == dlm->node_num) {
1955 "lvb! type=%d\n", dlm->name,
1995 "exists on this lockres!\n", dlm->name,
2024 "setting refmap bit\n", dlm->name,
2026 dlm_lockres_set_refmap_bit(dlm, res, ml->node);
2035 dlm_lockres_drop_inflight_ref(dlm, res);
2044 void dlm_move_lockres_to_recovery_list(struct dlm_ctxt *dlm,
2051 assert_spin_locked(&dlm->spinlock);
2057 dlm->name, res->lockname.len, res->lockname.name);
2063 list_add_tail(&res->recovering, &dlm->reco.resources);
2128 static void dlm_finish_local_lockres_recovery(struct dlm_ctxt *dlm,
2135 assert_spin_locked(&dlm->spinlock);
2137 list_for_each_entry_safe(res, next, &dlm->reco.resources, recovering) {
2140 dlm->name, res->lockname.len, res->lockname.name,
2146 dlm_change_lockres_owner(dlm, res, new_master);
2149 __dlm_dirty_lockres(dlm, res);
2161 bucket = dlm_lockres_hash(dlm, i);
2174 res->owner != dlm->node_num)
2185 dlm->name, res->lockname.len, res->lockname.name,
2188 dlm_change_lockres_owner(dlm, res, new_master);
2191 __dlm_dirty_lockres(dlm, res);
2209 static void dlm_revalidate_lvb(struct dlm_ctxt *dlm,
2218 assert_spin_locked(&dlm->spinlock);
2221 if (res->owner == dlm->node_num)
2228 search_node = dlm->node_num;
2252 static void dlm_free_dead_locks(struct dlm_ctxt *dlm,
2262 assert_spin_locked(&dlm->spinlock);
2299 "dropping ref from lockres\n", dlm->name,
2303 "but ref was not set\n", dlm->name,
2308 dlm_lockres_clear_refmap_bit(dlm, res, dead_node);
2311 "no locks and had not purged before dying\n", dlm->name,
2313 dlm_lockres_clear_refmap_bit(dlm, res, dead_node);
2317 __dlm_dirty_lockres(dlm, res);
2320 static void dlm_do_local_recovery_cleanup(struct dlm_ctxt *dlm, u8 dead_node)
2330 dlm_clean_master_list(dlm, dead_node);
2342 * dead node. once recovery finishes, the dlm thread
2347 bucket = dlm_lockres_hash(dlm, i);
2359 dead_node, dlm->name);
2373 __dlm_do_purge_lockres(dlm, res);
2378 } else if (res->owner == dlm->node_num)
2379 dlm_lockres_clear_refmap_bit(dlm, res, dead_node);
2385 dlm_revalidate_lvb(dlm, res, dead_node);
2392 dlm->name, res->lockname.len,
2395 __dlm_do_purge_lockres(dlm, res);
2401 dlm_move_lockres_to_recovery_list(dlm, res);
2402 } else if (res->owner == dlm->node_num) {
2403 dlm_free_dead_locks(dlm, res, dead_node);
2404 __dlm_lockres_calc_usage(dlm, res);
2409 dlm->name, res->lockname.len,
2411 dlm_lockres_clear_refmap_bit(dlm, res, dead_node);
2420 static void __dlm_hb_node_down(struct dlm_ctxt *dlm, int idx)
2422 assert_spin_locked(&dlm->spinlock);
2424 if (dlm->reco.new_master == idx) {
2426 dlm->name, idx);
2427 if (dlm->reco.state & DLM_RECO_STATE_FINALIZE) {
2432 "finalize1 state, clearing\n", dlm->name, idx);
2433 dlm->reco.state &= ~DLM_RECO_STATE_FINALIZE;
2434 __dlm_reset_recovery(dlm);
2439 if (dlm->joining_node == idx) {
2441 __dlm_set_joining_node(dlm, DLM_LOCK_RES_OWNER_UNKNOWN);
2445 if (!test_bit(idx, dlm->live_nodes_map)) {
2448 dlm->name, idx);
2453 if (!test_bit(idx, dlm->domain_map)) {
2460 clear_bit(idx, dlm->live_nodes_map);
2463 if (!test_bit(idx, dlm->recovery_map))
2464 dlm_do_local_recovery_cleanup(dlm, idx);
2467 dlm_hb_event_notify_attached(dlm, idx, 0);
2470 clear_bit(idx, dlm->domain_map);
2471 clear_bit(idx, dlm->exit_domain_map);
2474 wake_up(&dlm->migration_wq);
2476 set_bit(idx, dlm->recovery_map);
2481 struct dlm_ctxt *dlm = data;
2483 if (!dlm_grab(dlm))
2487 * This will notify any dlm users that a node in our domain
2490 if (test_bit(idx, dlm->domain_map))
2491 dlm_fire_domain_eviction_callbacks(dlm, idx);
2493 spin_lock(&dlm->spinlock);
2494 __dlm_hb_node_down(dlm, idx);
2495 spin_unlock(&dlm->spinlock);
2497 dlm_put(dlm);
2502 struct dlm_ctxt *dlm = data;
2504 if (!dlm_grab(dlm))
2507 spin_lock(&dlm->spinlock);
2508 set_bit(idx, dlm->live_nodes_map);
2511 spin_unlock(&dlm->spinlock);
2513 dlm_put(dlm);
2518 struct dlm_ctxt *dlm = astdata;
2519 mlog(0, "ast for recovery lock fired!, this=%u, dlm=%s\n",
2520 dlm->node_num, dlm->name);
2524 struct dlm_ctxt *dlm = astdata;
2525 mlog(0, "bast for recovery lock fired!, this=%u, dlm=%s\n",
2526 dlm->node_num, dlm->name);
2540 * or b) dlm->reco.new_master gets set to some nodenum
2545 static int dlm_pick_recovery_master(struct dlm_ctxt *dlm)
2552 dlm->name, jiffies, dlm->reco.dead_node, dlm->node_num);
2556 ret = dlmlock(dlm, LKM_EXMODE, &lksb, LKM_NOQUEUE|LKM_RECOVERY,
2558 dlm_reco_ast, dlm, dlm_reco_bast);
2561 dlm->name, ret, lksb.status);
2564 mlog(0, "dlm=%s dlmlock says I got it (this=%u)\n",
2565 dlm->name, dlm->node_num);
2569 if (dlm_reco_master_ready(dlm)) {
2571 "do the recovery\n", dlm->name,
2572 dlm->reco.new_master);
2578 spin_lock(&dlm->spinlock);
2579 if (dlm->reco.dead_node == O2NM_INVALID_NODE_NUM) {
2582 "node got recovered already\n", dlm->name);
2583 if (dlm->reco.new_master != O2NM_INVALID_NODE_NUM) {
2586 dlm->name, dlm->reco.new_master);
2590 spin_unlock(&dlm->spinlock);
2597 "begin_reco now\n", dlm->name,
2598 dlm->reco.dead_node, dlm->node_num);
2599 status = dlm_send_begin_reco_message(dlm,
2600 dlm->reco.dead_node);
2605 spin_lock(&dlm->spinlock);
2606 dlm_set_reco_master(dlm, dlm->node_num);
2607 spin_unlock(&dlm->spinlock);
2612 ret = dlmunlock(dlm, &lksb, 0, dlm_reco_unlock_ast, dlm);
2615 ret = dlmunlock(dlm, &lksb, LKM_CANCEL, dlm_reco_unlock_ast, dlm);
2627 mlog(0, "dlm=%s dlmlock says another node got it (this=%u)\n",
2628 dlm->name, dlm->node_num);
2632 wait_event_timeout(dlm->dlm_reco_thread_wq,
2633 dlm_reco_master_ready(dlm),
2635 if (!dlm_reco_master_ready(dlm)) {
2637 dlm->name);
2642 dlm->name, dlm->reco.new_master, dlm->reco.dead_node);
2645 mlog(0, "dlm=%s dlmlock says master node died (this=%u)\n",
2646 dlm->name, dlm->node_num);
2653 "lksb.status=%s\n", dlm->name, dlm_errname(ret),
2655 res = dlm_lookup_lockres(dlm, DLM_RECOVERY_LOCK_NAME,
2669 static int dlm_send_begin_reco_message(struct dlm_ctxt *dlm, u8 dead_node)
2677 mlog(0, "%s: dead node is %u\n", dlm->name, dead_node);
2679 spin_lock(&dlm->spinlock);
2680 dlm_node_iter_init(dlm->domain_map, &iter);
2681 spin_unlock(&dlm->spinlock);
2686 br.node_idx = dlm->node_num;
2696 if (nodenum == dlm->node_num) {
2703 ret = o2net_send_message(DLM_BEGIN_RECO_MSG, dlm->key,
2712 "begin reco msg (%d)\n", dlm->name, nodenum, ret);
2724 "to complete, backoff for a bit\n", dlm->name,
2735 mlog(ML_ERROR, "begin reco of dlm %s to node %u "
2736 "returned %d\n", dlm->name, nodenum, ret);
2737 res = dlm_lookup_lockres(dlm, DLM_RECOVERY_LOCK_NAME,
2758 struct dlm_ctxt *dlm = data;
2762 if (!dlm_grab(dlm))
2765 spin_lock(&dlm->spinlock);
2766 if (dlm->reco.state & DLM_RECO_STATE_FINALIZE) {
2769 dlm->name, br->node_idx, br->dead_node,
2770 dlm->reco.dead_node, dlm->reco.new_master);
2771 spin_unlock(&dlm->spinlock);
2772 dlm_put(dlm);
2775 spin_unlock(&dlm->spinlock);
2778 dlm->name, br->node_idx, br->dead_node,
2779 dlm->reco.dead_node, dlm->reco.new_master);
2781 dlm_fire_domain_eviction_callbacks(dlm, br->dead_node);
2783 spin_lock(&dlm->spinlock);
2784 if (dlm->reco.new_master != O2NM_INVALID_NODE_NUM) {
2785 if (test_bit(dlm->reco.new_master, dlm->recovery_map)) {
2787 "to %u\n", dlm->name, dlm->reco.new_master,
2791 "to %u\n", dlm->name, dlm->reco.new_master,
2796 if (dlm->reco.dead_node != O2NM_INVALID_NODE_NUM) {
2798 "node %u changing it to %u\n", dlm->name,
2799 dlm->reco.dead_node, br->node_idx, br->dead_node);
2801 dlm_set_reco_master(dlm, br->node_idx);
2802 dlm_set_reco_dead_node(dlm, br->dead_node);
2803 if (!test_bit(br->dead_node, dlm->recovery_map)) {
2807 if (!test_bit(br->dead_node, dlm->domain_map) ||
2808 !test_bit(br->dead_node, dlm->live_nodes_map))
2814 set_bit(br->dead_node, dlm->domain_map);
2815 set_bit(br->dead_node, dlm->live_nodes_map);
2816 __dlm_hb_node_down(dlm, br->dead_node);
2818 spin_unlock(&dlm->spinlock);
2820 dlm_kick_recovery_thread(dlm);
2823 dlm->name, br->node_idx, br->dead_node,
2824 dlm->reco.dead_node, dlm->reco.new_master);
2826 dlm_put(dlm);
2831 static int dlm_send_finalize_reco_message(struct dlm_ctxt *dlm)
2841 "stage %d\n", dlm->name, dlm->reco.dead_node, stage);
2843 spin_lock(&dlm->spinlock);
2844 dlm_node_iter_init(dlm->domain_map, &iter);
2845 spin_unlock(&dlm->spinlock);
2849 fr.node_idx = dlm->node_num;
2850 fr.dead_node = dlm->reco.dead_node;
2855 if (nodenum == dlm->node_num)
2857 ret = o2net_send_message(DLM_FINALIZE_RECO_MSG, dlm->key,
2864 dlm->key, nodenum);
2890 struct dlm_ctxt *dlm = data;
2895 if (!dlm_grab(dlm))
2902 "node %u (%u:%u)\n", dlm->name, fr->node_idx, stage,
2903 fr->dead_node, dlm->reco.dead_node, dlm->reco.new_master);
2905 spin_lock(&dlm->spinlock);
2907 if (dlm->reco.new_master != fr->node_idx) {
2910 fr->node_idx, dlm->reco.new_master, fr->dead_node);
2913 if (dlm->reco.dead_node != fr->dead_node) {
2916 fr->node_idx, fr->dead_node, dlm->reco.dead_node);
2922 dlm_finish_local_lockres_recovery(dlm, fr->dead_node, fr->node_idx);
2923 if (dlm->reco.state & DLM_RECO_STATE_FINALIZE) {
2927 dlm->name, fr->node_idx, fr->dead_node);
2928 dlm_print_reco_node_status(dlm);
2931 dlm->reco.state |= DLM_RECO_STATE_FINALIZE;
2932 spin_unlock(&dlm->spinlock);
2935 if (!(dlm->reco.state & DLM_RECO_STATE_FINALIZE)) {
2939 dlm->name, fr->node_idx, fr->dead_node);
2940 dlm_print_reco_node_status(dlm);
2943 dlm->reco.state &= ~DLM_RECO_STATE_FINALIZE;
2944 __dlm_reset_recovery(dlm);
2945 spin_unlock(&dlm->spinlock);
2946 dlm_kick_recovery_thread(dlm);
2951 dlm->name, fr->node_idx, dlm->reco.dead_node, dlm->reco.new_master);
2953 dlm_put(dlm);