Committer: Michael Beasley <mike@snafu.setup>
[mikesnafu-overlay.git] / fs / dlm / member.c
blobfa17f5a278831fa3acf3977930fae7fcc63af2df
1 /******************************************************************************
2 *******************************************************************************
3 **
4 ** Copyright (C) 2005-2008 Red Hat, Inc. All rights reserved.
5 **
6 ** This copyrighted material is made available to anyone wishing to use,
7 ** modify, copy, or redistribute it subject to the terms and conditions
8 ** of the GNU General Public License v.2.
9 **
10 *******************************************************************************
11 ******************************************************************************/
13 #include "dlm_internal.h"
14 #include "lockspace.h"
15 #include "member.h"
16 #include "recoverd.h"
17 #include "recover.h"
18 #include "rcom.h"
19 #include "config.h"
21 static void add_ordered_member(struct dlm_ls *ls, struct dlm_member *new)
23 struct dlm_member *memb = NULL;
24 struct list_head *tmp;
25 struct list_head *newlist = &new->list;
26 struct list_head *head = &ls->ls_nodes;
28 list_for_each(tmp, head) {
29 memb = list_entry(tmp, struct dlm_member, list);
30 if (new->nodeid < memb->nodeid)
31 break;
34 if (!memb)
35 list_add_tail(newlist, head);
36 else {
37 /* FIXME: can use list macro here */
38 newlist->prev = tmp->prev;
39 newlist->next = tmp;
40 tmp->prev->next = newlist;
41 tmp->prev = newlist;
45 static int dlm_add_member(struct dlm_ls *ls, int nodeid)
47 struct dlm_member *memb;
48 int w;
50 memb = kzalloc(sizeof(struct dlm_member), GFP_KERNEL);
51 if (!memb)
52 return -ENOMEM;
54 w = dlm_node_weight(ls->ls_name, nodeid);
55 if (w < 0) {
56 kfree(memb);
57 return w;
60 memb->nodeid = nodeid;
61 memb->weight = w;
62 add_ordered_member(ls, memb);
63 ls->ls_num_nodes++;
64 return 0;
67 static void dlm_remove_member(struct dlm_ls *ls, struct dlm_member *memb)
69 list_move(&memb->list, &ls->ls_nodes_gone);
70 ls->ls_num_nodes--;
73 int dlm_is_member(struct dlm_ls *ls, int nodeid)
75 struct dlm_member *memb;
77 list_for_each_entry(memb, &ls->ls_nodes, list) {
78 if (memb->nodeid == nodeid)
79 return 1;
81 return 0;
84 int dlm_is_removed(struct dlm_ls *ls, int nodeid)
86 struct dlm_member *memb;
88 list_for_each_entry(memb, &ls->ls_nodes_gone, list) {
89 if (memb->nodeid == nodeid)
90 return 1;
92 return 0;
95 static void clear_memb_list(struct list_head *head)
97 struct dlm_member *memb;
99 while (!list_empty(head)) {
100 memb = list_entry(head->next, struct dlm_member, list);
101 list_del(&memb->list);
102 kfree(memb);
106 void dlm_clear_members(struct dlm_ls *ls)
108 clear_memb_list(&ls->ls_nodes);
109 ls->ls_num_nodes = 0;
112 void dlm_clear_members_gone(struct dlm_ls *ls)
114 clear_memb_list(&ls->ls_nodes_gone);
117 static void make_member_array(struct dlm_ls *ls)
119 struct dlm_member *memb;
120 int i, w, x = 0, total = 0, all_zero = 0, *array;
122 kfree(ls->ls_node_array);
123 ls->ls_node_array = NULL;
125 list_for_each_entry(memb, &ls->ls_nodes, list) {
126 if (memb->weight)
127 total += memb->weight;
130 /* all nodes revert to weight of 1 if all have weight 0 */
132 if (!total) {
133 total = ls->ls_num_nodes;
134 all_zero = 1;
137 ls->ls_total_weight = total;
139 array = kmalloc(sizeof(int) * total, GFP_KERNEL);
140 if (!array)
141 return;
143 list_for_each_entry(memb, &ls->ls_nodes, list) {
144 if (!all_zero && !memb->weight)
145 continue;
147 if (all_zero)
148 w = 1;
149 else
150 w = memb->weight;
152 DLM_ASSERT(x < total, printk("total %d x %d\n", total, x););
154 for (i = 0; i < w; i++)
155 array[x++] = memb->nodeid;
158 ls->ls_node_array = array;
161 /* send a status request to all members just to establish comms connections */
163 static int ping_members(struct dlm_ls *ls)
165 struct dlm_member *memb;
166 int error = 0;
168 list_for_each_entry(memb, &ls->ls_nodes, list) {
169 error = dlm_recovery_stopped(ls);
170 if (error)
171 break;
172 error = dlm_rcom_status(ls, memb->nodeid);
173 if (error)
174 break;
176 if (error)
177 log_debug(ls, "ping_members aborted %d last nodeid %d",
178 error, ls->ls_recover_nodeid);
179 return error;
182 int dlm_recover_members(struct dlm_ls *ls, struct dlm_recover *rv, int *neg_out)
184 struct dlm_member *memb, *safe;
185 int i, error, found, pos = 0, neg = 0, low = -1;
187 /* previously removed members that we've not finished removing need to
188 count as a negative change so the "neg" recovery steps will happen */
190 list_for_each_entry(memb, &ls->ls_nodes_gone, list) {
191 log_debug(ls, "prev removed member %d", memb->nodeid);
192 neg++;
195 /* move departed members from ls_nodes to ls_nodes_gone */
197 list_for_each_entry_safe(memb, safe, &ls->ls_nodes, list) {
198 found = 0;
199 for (i = 0; i < rv->node_count; i++) {
200 if (memb->nodeid == rv->nodeids[i]) {
201 found = 1;
202 break;
206 if (!found) {
207 neg++;
208 dlm_remove_member(ls, memb);
209 log_debug(ls, "remove member %d", memb->nodeid);
213 /* add new members to ls_nodes */
215 for (i = 0; i < rv->node_count; i++) {
216 if (dlm_is_member(ls, rv->nodeids[i]))
217 continue;
218 dlm_add_member(ls, rv->nodeids[i]);
219 pos++;
220 log_debug(ls, "add member %d", rv->nodeids[i]);
223 list_for_each_entry(memb, &ls->ls_nodes, list) {
224 if (low == -1 || memb->nodeid < low)
225 low = memb->nodeid;
227 ls->ls_low_nodeid = low;
229 make_member_array(ls);
230 dlm_set_recover_status(ls, DLM_RS_NODES);
231 *neg_out = neg;
233 error = ping_members(ls);
234 if (!error || error == -EPROTO) {
235 /* new_lockspace() may be waiting to know if the config
236 is good or bad */
237 ls->ls_members_result = error;
238 complete(&ls->ls_members_done);
240 if (error)
241 goto out;
243 error = dlm_recover_members_wait(ls);
244 out:
245 log_debug(ls, "total members %d error %d", ls->ls_num_nodes, error);
246 return error;
249 /* Userspace guarantees that dlm_ls_stop() has completed on all nodes before
250 dlm_ls_start() is called on any of them to start the new recovery. */
252 int dlm_ls_stop(struct dlm_ls *ls)
254 int new;
257 * Prevent dlm_recv from being in the middle of something when we do
258 * the stop. This includes ensuring dlm_recv isn't processing a
259 * recovery message (rcom), while dlm_recoverd is aborting and
260 * resetting things from an in-progress recovery. i.e. we want
261 * dlm_recoverd to abort its recovery without worrying about dlm_recv
262 * processing an rcom at the same time. Stopping dlm_recv also makes
263 * it easy for dlm_receive_message() to check locking stopped and add a
264 * message to the requestqueue without races.
267 down_write(&ls->ls_recv_active);
270 * Abort any recovery that's in progress (see RECOVERY_STOP,
271 * dlm_recovery_stopped()) and tell any other threads running in the
272 * dlm to quit any processing (see RUNNING, dlm_locking_stopped()).
275 spin_lock(&ls->ls_recover_lock);
276 set_bit(LSFL_RECOVERY_STOP, &ls->ls_flags);
277 new = test_and_clear_bit(LSFL_RUNNING, &ls->ls_flags);
278 ls->ls_recover_seq++;
279 spin_unlock(&ls->ls_recover_lock);
282 * Let dlm_recv run again, now any normal messages will be saved on the
283 * requestqueue for later.
286 up_write(&ls->ls_recv_active);
289 * This in_recovery lock does two things:
290 * 1) Keeps this function from returning until all threads are out
291 * of locking routines and locking is truely stopped.
292 * 2) Keeps any new requests from being processed until it's unlocked
293 * when recovery is complete.
296 if (new)
297 down_write(&ls->ls_in_recovery);
300 * The recoverd suspend/resume makes sure that dlm_recoverd (if
301 * running) has noticed RECOVERY_STOP above and quit processing the
302 * previous recovery.
305 dlm_recoverd_suspend(ls);
306 ls->ls_recover_status = 0;
307 dlm_recoverd_resume(ls);
309 if (!ls->ls_recover_begin)
310 ls->ls_recover_begin = jiffies;
311 return 0;
314 int dlm_ls_start(struct dlm_ls *ls)
316 struct dlm_recover *rv = NULL, *rv_old;
317 int *ids = NULL;
318 int error, count;
320 rv = kzalloc(sizeof(struct dlm_recover), GFP_KERNEL);
321 if (!rv)
322 return -ENOMEM;
324 error = count = dlm_nodeid_list(ls->ls_name, &ids);
325 if (error <= 0)
326 goto fail;
328 spin_lock(&ls->ls_recover_lock);
330 /* the lockspace needs to be stopped before it can be started */
332 if (!dlm_locking_stopped(ls)) {
333 spin_unlock(&ls->ls_recover_lock);
334 log_error(ls, "start ignored: lockspace running");
335 error = -EINVAL;
336 goto fail;
339 rv->nodeids = ids;
340 rv->node_count = count;
341 rv->seq = ++ls->ls_recover_seq;
342 rv_old = ls->ls_recover_args;
343 ls->ls_recover_args = rv;
344 spin_unlock(&ls->ls_recover_lock);
346 if (rv_old) {
347 kfree(rv_old->nodeids);
348 kfree(rv_old);
351 dlm_recoverd_kick(ls);
352 return 0;
354 fail:
355 kfree(rv);
356 kfree(ids);
357 return error;