1 /******************************************************************************
2 *******************************************************************************
4 ** Copyright (C) 2005-2008 Red Hat, Inc. All rights reserved.
6 ** This copyrighted material is made available to anyone wishing to use,
7 ** modify, copy, or redistribute it subject to the terms and conditions
8 ** of the GNU General Public License v.2.
10 *******************************************************************************
11 ******************************************************************************/
13 #include "dlm_internal.h"
14 #include "lockspace.h"
/*
 * add_ordered_member() - link @new into ls->ls_nodes based on nodeid.
 *
 * Walks ls->ls_nodes and compares new->nodeid against the nodeid of each
 * existing member.  The visible fragments show two ways of linking the new
 * entry: list_add_tail() onto the list head, and a hand-written update of
 * newlist->prev and tmp->prev->next.
 *
 * NOTE(review): this listing skips source lines (braces, the statement
 * guarded by the nodeid comparison, and the remaining pointer updates of
 * the manual insert are not visible) -- confirm the exact branch structure
 * against the full file.
 */
21 static void add_ordered_member(struct dlm_ls
*ls
, struct dlm_member
*new)
23 struct dlm_member
*memb
= NULL
;
24 struct list_head
*tmp
;
25 struct list_head
*newlist
= &new->list
;
26 struct list_head
*head
= &ls
->ls_nodes
;
28 list_for_each(tmp
, head
) {
29 memb
= list_entry(tmp
, struct dlm_member
, list
);
30 if (new->nodeid
< memb
->nodeid
)
35 list_add_tail(newlist
, head
);
37 /* FIXME: can use list macro here */
38 newlist
->prev
= tmp
->prev
;
40 tmp
->prev
->next
= newlist
;
/*
 * dlm_add_member() - create a member entry for @nodeid and add it to @ls.
 *
 * Allocates a zeroed struct dlm_member with GFP_KERNEL, queries
 * dlm_node_weight() for the lockspace name and nodeid, stores the nodeid in
 * the new entry and hands it to add_ordered_member().
 *
 * NOTE(review): the declaration of w, the handling of a failed allocation
 * or a failed weight lookup, and the return statements are not visible in
 * this listing -- confirm against the full file.
 */
45 static int dlm_add_member(struct dlm_ls
*ls
, int nodeid
)
47 struct dlm_member
*memb
;
50 memb
= kzalloc(sizeof(struct dlm_member
), GFP_KERNEL
);
54 w
= dlm_node_weight(ls
->ls_name
, nodeid
);
60 memb
->nodeid
= nodeid
;
62 add_ordered_member(ls
, memb
);
/*
 * dlm_remove_member() - move @memb onto ls->ls_nodes_gone.
 *
 * The entry is not freed here; list_move() only relinks memb->list onto the
 * ls_nodes_gone list.
 *
 * NOTE(review): any further bookkeeping in this function is not visible in
 * this listing.
 */
67 static void dlm_remove_member(struct dlm_ls
*ls
, struct dlm_member
*memb
)
69 list_move(&memb
->list
, &ls
->ls_nodes_gone
);
/*
 * dlm_is_member() - look for @nodeid among the entries of ls->ls_nodes.
 *
 * Iterates ls->ls_nodes and compares each entry's nodeid with @nodeid.
 *
 * NOTE(review): the return statements are not visible in this listing;
 * presumably non-zero when a match is found and zero otherwise -- confirm
 * against the full file.
 */
73 int dlm_is_member(struct dlm_ls
*ls
, int nodeid
)
75 struct dlm_member
*memb
;
77 list_for_each_entry(memb
, &ls
->ls_nodes
, list
) {
78 if (memb
->nodeid
== nodeid
)
/*
 * dlm_is_removed() - look for @nodeid among the entries of
 * ls->ls_nodes_gone.
 *
 * Iterates ls->ls_nodes_gone and compares each entry's nodeid with @nodeid.
 *
 * NOTE(review): the return statements are not visible in this listing;
 * presumably non-zero when a match is found and zero otherwise -- confirm
 * against the full file.
 */
84 int dlm_is_removed(struct dlm_ls
*ls
, int nodeid
)
86 struct dlm_member
*memb
;
88 list_for_each_entry(memb
, &ls
->ls_nodes_gone
, list
) {
89 if (memb
->nodeid
== nodeid
)
/*
 * clear_memb_list() - empty a list of struct dlm_member entries.
 *
 * Repeatedly takes the first entry of @head and unlinks it with list_del()
 * until the list is empty.
 *
 * NOTE(review): what happens to each unlinked entry afterwards (presumably
 * it is freed) is not visible in this listing -- confirm against the full
 * file.
 */
95 static void clear_memb_list(struct list_head
*head
)
97 struct dlm_member
*memb
;
99 while (!list_empty(head
)) {
100 memb
= list_entry(head
->next
, struct dlm_member
, list
);
101 list_del(&memb
->list
);
/*
 * dlm_clear_members() - drop every entry on ls->ls_nodes via
 * clear_memb_list() and reset ls->ls_num_nodes to 0.
 */
106 void dlm_clear_members(struct dlm_ls
*ls
)
108 clear_memb_list(&ls
->ls_nodes
);
109 ls
->ls_num_nodes
= 0;
/*
 * dlm_clear_members_gone() - drop every entry on ls->ls_nodes_gone via
 * clear_memb_list().
 */
112 void dlm_clear_members_gone(struct dlm_ls
*ls
)
114 clear_memb_list(&ls
->ls_nodes_gone
);
/*
 * make_member_array() - rebuild ls->ls_node_array from the member weights.
 *
 * Frees the previous ls->ls_node_array, sums memb->weight over ls->ls_nodes
 * into total (falling back to ls->ls_num_nodes, per the in-line comment,
 * when every weight is 0), records the result in ls->ls_total_weight, and
 * allocates an int array with total slots.  Each member's nodeid is then
 * written into w consecutive slots, and the array is published in
 * ls->ls_node_array.
 *
 * NOTE(review): the lines that set all_zero and w, the check of the
 * kmalloc() result, and the statement guarded by the
 * "!all_zero && !memb->weight" test are not visible in this listing --
 * confirm against the full file.
 */
117 static void make_member_array(struct dlm_ls
*ls
)
119 struct dlm_member
*memb
;
120 int i
, w
, x
= 0, total
= 0, all_zero
= 0, *array
;
/* the old array is released and the pointer cleared before rebuilding */
122 kfree(ls
->ls_node_array
);
123 ls
->ls_node_array
= NULL
;
125 list_for_each_entry(memb
, &ls
->ls_nodes
, list
) {
127 total
+= memb
->weight
;
130 /* all nodes revert to weight of 1 if all have weight 0 */
133 total
= ls
->ls_num_nodes
;
137 ls
->ls_total_weight
= total
;
/* one int slot per unit of total weight */
139 array
= kmalloc(sizeof(int) * total
, GFP_KERNEL
);
143 list_for_each_entry(memb
, &ls
->ls_nodes
, list
) {
144 if (!all_zero
&& !memb
->weight
)
152 DLM_ASSERT(x
< total
, printk("total %d x %d\n", total
, x
););
/* a member occupies w slots, so its nodeid appears w times */
154 for (i
= 0; i
< w
; i
++)
155 array
[x
++] = memb
->nodeid
;
158 ls
->ls_node_array
= array
;
161 /* send a status request to all members just to establish comms connections */
/*
 * ping_members() - call dlm_rcom_status() for every entry on ls->ls_nodes.
 *
 * For each member the loop first stores the result of
 * dlm_recovery_stopped() in error, then the result of dlm_rcom_status()
 * for that member's nodeid.  A debug message with the error value and
 * ls->ls_recover_nodeid is logged on the abort path.
 *
 * NOTE(review): the declaration of error, the tests that break out of the
 * loop, the condition guarding the log_debug() call, and the return
 * statement are not visible in this listing -- confirm against the full
 * file.
 */
163 static int ping_members(struct dlm_ls
*ls
)
165 struct dlm_member
*memb
;
168 list_for_each_entry(memb
, &ls
->ls_nodes
, list
) {
169 error
= dlm_recovery_stopped(ls
);
172 error
= dlm_rcom_status(ls
, memb
->nodeid
);
177 log_debug(ls
, "ping_members aborted %d last nodeid %d",
178 error
, ls
->ls_recover_nodeid
);
/*
 * dlm_recover_members() - bring the lockspace member lists in line with the
 * node list carried in @rv.
 *
 * Steps visible in this listing, in order:
 *  - log every entry still on ls->ls_nodes_gone;
 *  - for each entry on ls->ls_nodes, search rv->nodeids[0..node_count) for
 *    its nodeid and call dlm_remove_member() for departed entries;
 *  - for each rv->new[] nodeid checked with dlm_is_member(), allocate a
 *    zeroed struct dlm_member and append it to ls->ls_nodes_gone;
 *  - call dlm_add_member() for rv->nodeids[] entries checked with
 *    dlm_is_member();
 *  - compute the lowest nodeid on ls->ls_nodes into ls->ls_low_nodeid;
 *  - call make_member_array(), set DLM_RS_NODES, run ping_members(), and
 *    when its result is 0 or -EPROTO store it in ls->ls_members_result and
 *    complete ls->ls_members_done;
 *  - call dlm_recover_members_wait() and log the member count and error.
 *
 * NOTE(review): many lines are elided here (updates of found/pos/neg, the
 * statements guarded by the dlm_is_member() tests, allocation-failure
 * handling, the store to *neg_out, the return statement).  The visible call
 * to dlm_add_member() does not capture its int return value -- confirm
 * against the full file whether a failure there is handled.
 */
182 int dlm_recover_members(struct dlm_ls
*ls
, struct dlm_recover
*rv
, int *neg_out
)
184 struct dlm_member
*memb
, *safe
;
185 int i
, error
, found
, pos
= 0, neg
= 0, low
= -1;
187 /* previously removed members that we've not finished removing need to
188 count as a negative change so the "neg" recovery steps will happen */
190 list_for_each_entry(memb
, &ls
->ls_nodes_gone
, list
) {
191 log_debug(ls
, "prev removed member %d", memb
->nodeid
);
195 /* move departed members from ls_nodes to ls_nodes_gone */
197 list_for_each_entry_safe(memb
, safe
, &ls
->ls_nodes
, list
) {
199 for (i
= 0; i
< rv
->node_count
; i
++) {
200 if (memb
->nodeid
== rv
->nodeids
[i
]) {
208 dlm_remove_member(ls
, memb
);
209 log_debug(ls
, "remove member %d", memb
->nodeid
);
213 /* Add an entry to ls_nodes_gone for members that were removed and
214 then added again, so that previous state for these nodes will be
215 cleared during recovery. */
217 for (i
= 0; i
< rv
->new_count
; i
++) {
218 if (!dlm_is_member(ls
, rv
->new[i
]))
220 log_debug(ls
, "new nodeid %d is a re-added member", rv
->new[i
]);
222 memb
= kzalloc(sizeof(struct dlm_member
), GFP_KERNEL
);
225 memb
->nodeid
= rv
->new[i
];
226 list_add_tail(&memb
->list
, &ls
->ls_nodes_gone
);
230 /* add new members to ls_nodes */
232 for (i
= 0; i
< rv
->node_count
; i
++) {
233 if (dlm_is_member(ls
, rv
->nodeids
[i
]))
235 dlm_add_member(ls
, rv
->nodeids
[i
]);
237 log_debug(ls
, "add member %d", rv
->nodeids
[i
]);
240 list_for_each_entry(memb
, &ls
->ls_nodes
, list
) {
241 if (low
== -1 || memb
->nodeid
< low
)
244 ls
->ls_low_nodeid
= low
;
246 make_member_array(ls
);
247 dlm_set_recover_status(ls
, DLM_RS_NODES
);
250 error
= ping_members(ls
);
251 if (!error
|| error
== -EPROTO
) {
252 /* new_lockspace() may be waiting to know if the config
254 ls
->ls_members_result
= error
;
255 complete(&ls
->ls_members_done
);
260 error
= dlm_recover_members_wait(ls
);
262 log_debug(ls
, "total members %d error %d", ls
->ls_num_nodes
, error
);
266 /* Userspace guarantees that dlm_ls_stop() has completed on all nodes before
267 dlm_ls_start() is called on any of them to start the new recovery. */
/*
 * dlm_ls_stop() - stop locking activity in @ls ahead of a new recovery.
 *
 * Visible sequence:
 *  - take ls->ls_recv_active for write;
 *  - under ls->ls_recover_lock, set LSFL_RECOVERY_STOP, test-and-clear
 *    LSFL_RUNNING (result kept in "new") and bump ls->ls_recover_seq;
 *  - release ls->ls_recv_active;
 *  - take ls->ls_in_recovery for write;
 *  - suspend dlm_recoverd, zero ls->ls_recover_status, resume it;
 *  - record jiffies in ls->ls_recover_begin if it is not already set.
 *
 * NOTE(review): the declaration of "new", any condition guarding the
 * down_write() on ls_in_recovery, the opening and closing lines of the
 * interior block comments, and the return statement are not visible in this
 * listing -- confirm against the full file.
 */
269 int dlm_ls_stop(struct dlm_ls
*ls
)
274 * Prevent dlm_recv from being in the middle of something when we do
275 * the stop. This includes ensuring dlm_recv isn't processing a
276 * recovery message (rcom), while dlm_recoverd is aborting and
277 * resetting things from an in-progress recovery. i.e. we want
278 * dlm_recoverd to abort its recovery without worrying about dlm_recv
279 * processing an rcom at the same time. Stopping dlm_recv also makes
280 * it easy for dlm_receive_message() to check locking stopped and add a
281 * message to the requestqueue without races.
284 down_write(&ls
->ls_recv_active
);
287 * Abort any recovery that's in progress (see RECOVERY_STOP,
288 * dlm_recovery_stopped()) and tell any other threads running in the
289 * dlm to quit any processing (see RUNNING, dlm_locking_stopped()).
292 spin_lock(&ls
->ls_recover_lock
);
293 set_bit(LSFL_RECOVERY_STOP
, &ls
->ls_flags
);
294 new = test_and_clear_bit(LSFL_RUNNING
, &ls
->ls_flags
);
295 ls
->ls_recover_seq
++;
296 spin_unlock(&ls
->ls_recover_lock
);
299 * Let dlm_recv run again, now any normal messages will be saved on the
300 * requestqueue for later.
303 up_write(&ls
->ls_recv_active
);
306 * This in_recovery lock does two things:
307 * 1) Keeps this function from returning until all threads are out
308 * of locking routines and locking is truely stopped.
309 * 2) Keeps any new requests from being processed until it's unlocked
310 * when recovery is complete.
314 down_write(&ls
->ls_in_recovery
);
317 * The recoverd suspend/resume makes sure that dlm_recoverd (if
318 * running) has noticed RECOVERY_STOP above and quit processing the
322 dlm_recoverd_suspend(ls
);
323 ls
->ls_recover_status
= 0;
324 dlm_recoverd_resume(ls
);
326 if (!ls
->ls_recover_begin
)
327 ls
->ls_recover_begin
= jiffies
;
/*
 * dlm_ls_start() - queue a new recovery for @ls and kick dlm_recoverd.
 *
 * Visible sequence:
 *  - allocate a zeroed struct dlm_recover;
 *  - fetch the node id list for ls->ls_name with dlm_nodeid_list();
 *  - under ls->ls_recover_lock, refuse to start (logging "start ignored:
 *    lockspace running") unless dlm_locking_stopped() reports the lockspace
 *    stopped; otherwise fill in rv->node_count, rv->new_count and rv->seq
 *    (a pre-incremented ls->ls_recover_seq) and swap rv into
 *    ls->ls_recover_args, keeping the previous value in rv_old;
 *  - log and release a previous, unused set of recovery arguments;
 *  - call dlm_recoverd_kick().
 *
 * NOTE(review): allocation and dlm_nodeid_list() failure handling, the
 * assignments of the id arrays into rv, the test guarding the rv_old
 * cleanup, the remaining frees and the return/cleanup path are not visible
 * in this listing -- confirm against the full file.
 */
331 int dlm_ls_start(struct dlm_ls
*ls
)
333 struct dlm_recover
*rv
= NULL
, *rv_old
;
334 int *ids
= NULL
, *new = NULL
;
335 int error
, ids_count
= 0, new_count
= 0;
337 rv
= kzalloc(sizeof(struct dlm_recover
), GFP_KERNEL
);
341 error
= dlm_nodeid_list(ls
->ls_name
, &ids
, &ids_count
,
346 spin_lock(&ls
->ls_recover_lock
);
348 /* the lockspace needs to be stopped before it can be started */
350 if (!dlm_locking_stopped(ls
)) {
351 spin_unlock(&ls
->ls_recover_lock
);
352 log_error(ls
, "start ignored: lockspace running");
358 rv
->node_count
= ids_count
;
360 rv
->new_count
= new_count
;
361 rv
->seq
= ++ls
->ls_recover_seq
;
362 rv_old
= ls
->ls_recover_args
;
363 ls
->ls_recover_args
= rv
;
364 spin_unlock(&ls
->ls_recover_lock
);
367 log_error(ls
, "unused recovery %llx %d",
368 (unsigned long long)rv_old
->seq
, rv_old
->node_count
);
369 kfree(rv_old
->nodeids
);
374 dlm_recoverd_kick(ls
);