fs: dlm: fix return -EINTR on recovery stopped
[linux-block.git] / fs / dlm / lockspace.c
CommitLineData
2522fe45 1// SPDX-License-Identifier: GPL-2.0-only
e7fd4179
DT
2/******************************************************************************
3*******************************************************************************
4**
5** Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
60f98d18 6** Copyright (C) 2004-2011 Red Hat, Inc. All rights reserved.
e7fd4179 7**
e7fd4179
DT
8**
9*******************************************************************************
10******************************************************************************/
11
7963b8a5
PG
12#include <linux/module.h>
13
e7fd4179
DT
14#include "dlm_internal.h"
15#include "lockspace.h"
16#include "member.h"
17#include "recoverd.h"
e7fd4179 18#include "dir.h"
a070a91c 19#include "midcomms.h"
e7fd4179
DT
20#include "lowcomms.h"
21#include "config.h"
22#include "memory.h"
23#include "lock.h"
c56b39cd 24#include "recover.h"
2896ee37 25#include "requestqueue.h"
0f8e0d9a 26#include "user.h"
23e8e1aa 27#include "ast.h"
e7fd4179 28
e7fd4179 29static int ls_count;
90135925 30static struct mutex ls_lock;
e7fd4179
DT
31static struct list_head lslist;
32static spinlock_t lslist_lock;
33static struct task_struct * scand_task;
34
35
36static ssize_t dlm_control_store(struct dlm_ls *ls, const char *buf, size_t len)
37{
38 ssize_t ret = len;
6edb5687
FF
39 int n;
40 int rc = kstrtoint(buf, 0, &n);
e7fd4179 41
6edb5687
FF
42 if (rc)
43 return rc;
e2de7f56
PC
44 ls = dlm_find_lockspace_local(ls->ls_local_handle);
45 if (!ls)
46 return -EINVAL;
47
e7fd4179
DT
48 switch (n) {
49 case 0:
50 dlm_ls_stop(ls);
51 break;
52 case 1:
53 dlm_ls_start(ls);
54 break;
55 default:
56 ret = -EINVAL;
57 }
e2de7f56 58 dlm_put_lockspace(ls);
e7fd4179
DT
59 return ret;
60}
61
62static ssize_t dlm_event_store(struct dlm_ls *ls, const char *buf, size_t len)
63{
6edb5687
FF
64 int rc = kstrtoint(buf, 0, &ls->ls_uevent_result);
65
66 if (rc)
67 return rc;
e7fd4179
DT
68 set_bit(LSFL_UEVENT_WAIT, &ls->ls_flags);
69 wake_up(&ls->ls_uevent_wait);
70 return len;
71}
72
73static ssize_t dlm_id_show(struct dlm_ls *ls, char *buf)
74{
a1d144c7 75 return snprintf(buf, PAGE_SIZE, "%u\n", ls->ls_global_id);
e7fd4179
DT
76}
77
78static ssize_t dlm_id_store(struct dlm_ls *ls, const char *buf, size_t len)
79{
6edb5687
FF
80 int rc = kstrtouint(buf, 0, &ls->ls_global_id);
81
82 if (rc)
83 return rc;
e7fd4179
DT
84 return len;
85}
86
4875647a
DT
87static ssize_t dlm_nodir_show(struct dlm_ls *ls, char *buf)
88{
89 return snprintf(buf, PAGE_SIZE, "%u\n", dlm_no_directory(ls));
90}
91
92static ssize_t dlm_nodir_store(struct dlm_ls *ls, const char *buf, size_t len)
93{
6edb5687
FF
94 int val;
95 int rc = kstrtoint(buf, 0, &val);
96
97 if (rc)
98 return rc;
4875647a
DT
99 if (val == 1)
100 set_bit(LSFL_NODIR, &ls->ls_flags);
101 return len;
102}
103
c56b39cd
DT
104static ssize_t dlm_recover_status_show(struct dlm_ls *ls, char *buf)
105{
106 uint32_t status = dlm_recover_status(ls);
a1d144c7 107 return snprintf(buf, PAGE_SIZE, "%x\n", status);
c56b39cd
DT
108}
109
faa0f267
DT
110static ssize_t dlm_recover_nodeid_show(struct dlm_ls *ls, char *buf)
111{
a1d144c7 112 return snprintf(buf, PAGE_SIZE, "%d\n", ls->ls_recover_nodeid);
faa0f267
DT
113}
114
e7fd4179
DT
115struct dlm_attr {
116 struct attribute attr;
117 ssize_t (*show)(struct dlm_ls *, char *);
118 ssize_t (*store)(struct dlm_ls *, const char *, size_t);
119};
120
121static struct dlm_attr dlm_attr_control = {
122 .attr = {.name = "control", .mode = S_IWUSR},
123 .store = dlm_control_store
124};
125
126static struct dlm_attr dlm_attr_event = {
127 .attr = {.name = "event_done", .mode = S_IWUSR},
128 .store = dlm_event_store
129};
130
131static struct dlm_attr dlm_attr_id = {
132 .attr = {.name = "id", .mode = S_IRUGO | S_IWUSR},
133 .show = dlm_id_show,
134 .store = dlm_id_store
135};
136
4875647a
DT
137static struct dlm_attr dlm_attr_nodir = {
138 .attr = {.name = "nodir", .mode = S_IRUGO | S_IWUSR},
139 .show = dlm_nodir_show,
140 .store = dlm_nodir_store
141};
142
c56b39cd
DT
143static struct dlm_attr dlm_attr_recover_status = {
144 .attr = {.name = "recover_status", .mode = S_IRUGO},
145 .show = dlm_recover_status_show
146};
147
faa0f267
DT
148static struct dlm_attr dlm_attr_recover_nodeid = {
149 .attr = {.name = "recover_nodeid", .mode = S_IRUGO},
150 .show = dlm_recover_nodeid_show
151};
152
e7fd4179
DT
153static struct attribute *dlm_attrs[] = {
154 &dlm_attr_control.attr,
155 &dlm_attr_event.attr,
156 &dlm_attr_id.attr,
4875647a 157 &dlm_attr_nodir.attr,
c56b39cd 158 &dlm_attr_recover_status.attr,
faa0f267 159 &dlm_attr_recover_nodeid.attr,
e7fd4179
DT
160 NULL,
161};
c9c5b5e1 162ATTRIBUTE_GROUPS(dlm);
e7fd4179
DT
163
164static ssize_t dlm_attr_show(struct kobject *kobj, struct attribute *attr,
165 char *buf)
166{
167 struct dlm_ls *ls = container_of(kobj, struct dlm_ls, ls_kobj);
168 struct dlm_attr *a = container_of(attr, struct dlm_attr, attr);
169 return a->show ? a->show(ls, buf) : 0;
170}
171
172static ssize_t dlm_attr_store(struct kobject *kobj, struct attribute *attr,
173 const char *buf, size_t len)
174{
175 struct dlm_ls *ls = container_of(kobj, struct dlm_ls, ls_kobj);
176 struct dlm_attr *a = container_of(attr, struct dlm_attr, attr);
177 return a->store ? a->store(ls, buf, len) : len;
178}
179
ba542e3b
PC
180static void lockspace_kobj_release(struct kobject *k)
181{
182 struct dlm_ls *ls = container_of(k, struct dlm_ls, ls_kobj);
183 kfree(ls);
184}
185
52cf25d0 186static const struct sysfs_ops dlm_attr_ops = {
e7fd4179
DT
187 .show = dlm_attr_show,
188 .store = dlm_attr_store,
189};
190
191static struct kobj_type dlm_ktype = {
c9c5b5e1 192 .default_groups = dlm_groups,
e7fd4179 193 .sysfs_ops = &dlm_attr_ops,
ba542e3b 194 .release = lockspace_kobj_release,
e7fd4179
DT
195};
196
d405936b 197static struct kset *dlm_kset;
e7fd4179 198
e7fd4179
DT
199static int do_uevent(struct dlm_ls *ls, int in)
200{
e7fd4179
DT
201 if (in)
202 kobject_uevent(&ls->ls_kobj, KOBJ_ONLINE);
203 else
204 kobject_uevent(&ls->ls_kobj, KOBJ_OFFLINE);
205
075f0177 206 log_rinfo(ls, "%s the lockspace group...", in ? "joining" : "leaving");
8b0e7b2c
DT
207
208 /* dlm_controld will see the uevent, do the necessary group management
209 and then write to sysfs to wake us */
210
f084a4f4
RL
211 wait_event(ls->ls_uevent_wait,
212 test_and_clear_bit(LSFL_UEVENT_WAIT, &ls->ls_flags));
8b0e7b2c 213
f084a4f4 214 log_rinfo(ls, "group event done %d", ls->ls_uevent_result);
e7fd4179 215
f084a4f4 216 return ls->ls_uevent_result;
e7fd4179
DT
217}
218
b4a5d4bc
SW
219static int dlm_uevent(struct kset *kset, struct kobject *kobj,
220 struct kobj_uevent_env *env)
221{
222 struct dlm_ls *ls = container_of(kobj, struct dlm_ls, ls_kobj);
223
224 add_uevent_var(env, "LOCKSPACE=%s", ls->ls_name);
225 return 0;
226}
227
417f7c59 228static const struct kset_uevent_ops dlm_uevent_ops = {
b4a5d4bc
SW
229 .uevent = dlm_uevent,
230};
e7fd4179 231
30727174 232int __init dlm_lockspace_init(void)
e7fd4179 233{
e7fd4179 234 ls_count = 0;
90135925 235 mutex_init(&ls_lock);
e7fd4179
DT
236 INIT_LIST_HEAD(&lslist);
237 spin_lock_init(&lslist_lock);
238
b4a5d4bc 239 dlm_kset = kset_create_and_add("dlm", &dlm_uevent_ops, kernel_kobj);
d405936b 240 if (!dlm_kset) {
8e24eea7 241 printk(KERN_WARNING "%s: can not create kset\n", __func__);
d405936b
GKH
242 return -ENOMEM;
243 }
244 return 0;
e7fd4179
DT
245}
246
247void dlm_lockspace_exit(void)
248{
d405936b 249 kset_unregister(dlm_kset);
e7fd4179
DT
250}
251
c1dcf65f
DT
252static struct dlm_ls *find_ls_to_scan(void)
253{
254 struct dlm_ls *ls;
255
256 spin_lock(&lslist_lock);
257 list_for_each_entry(ls, &lslist, ls_list) {
258 if (time_after_eq(jiffies, ls->ls_scan_time +
259 dlm_config.ci_scan_secs * HZ)) {
260 spin_unlock(&lslist_lock);
261 return ls;
262 }
263 }
264 spin_unlock(&lslist_lock);
265 return NULL;
266}
267
e7fd4179
DT
268static int dlm_scand(void *data)
269{
270 struct dlm_ls *ls;
271
272 while (!kthread_should_stop()) {
c1dcf65f
DT
273 ls = find_ls_to_scan();
274 if (ls) {
85e86edf 275 if (dlm_lock_recovery_try(ls)) {
c1dcf65f 276 ls->ls_scan_time = jiffies;
85e86edf 277 dlm_scan_rsbs(ls);
3ae1acf9 278 dlm_scan_timeout(ls);
c6ff669b 279 dlm_scan_waiters(ls);
85e86edf 280 dlm_unlock_recovery(ls);
c1dcf65f
DT
281 } else {
282 ls->ls_scan_time += HZ;
85e86edf 283 }
c6ff669b 284 continue;
85e86edf 285 }
c6ff669b 286 schedule_timeout_interruptible(dlm_config.ci_scan_secs * HZ);
e7fd4179
DT
287 }
288 return 0;
289}
290
291static int dlm_scand_start(void)
292{
293 struct task_struct *p;
294 int error = 0;
295
296 p = kthread_run(dlm_scand, NULL, "dlm_scand");
297 if (IS_ERR(p))
298 error = PTR_ERR(p);
299 else
300 scand_task = p;
301 return error;
302}
303
304static void dlm_scand_stop(void)
305{
306 kthread_stop(scand_task);
307}
308
e7fd4179
DT
309struct dlm_ls *dlm_find_lockspace_global(uint32_t id)
310{
311 struct dlm_ls *ls;
312
313 spin_lock(&lslist_lock);
314
315 list_for_each_entry(ls, &lslist, ls_list) {
316 if (ls->ls_global_id == id) {
317 ls->ls_count++;
318 goto out;
319 }
320 }
321 ls = NULL;
322 out:
323 spin_unlock(&lslist_lock);
324 return ls;
325}
326
597d0cae 327struct dlm_ls *dlm_find_lockspace_local(dlm_lockspace_t *lockspace)
e7fd4179 328{
597d0cae 329 struct dlm_ls *ls;
e7fd4179
DT
330
331 spin_lock(&lslist_lock);
597d0cae
DT
332 list_for_each_entry(ls, &lslist, ls_list) {
333 if (ls->ls_local_handle == lockspace) {
334 ls->ls_count++;
335 goto out;
336 }
337 }
338 ls = NULL;
339 out:
340 spin_unlock(&lslist_lock);
341 return ls;
342}
343
344struct dlm_ls *dlm_find_lockspace_device(int minor)
345{
346 struct dlm_ls *ls;
347
348 spin_lock(&lslist_lock);
349 list_for_each_entry(ls, &lslist, ls_list) {
350 if (ls->ls_device.minor == minor) {
351 ls->ls_count++;
352 goto out;
353 }
354 }
355 ls = NULL;
356 out:
e7fd4179
DT
357 spin_unlock(&lslist_lock);
358 return ls;
359}
360
361void dlm_put_lockspace(struct dlm_ls *ls)
362{
363 spin_lock(&lslist_lock);
364 ls->ls_count--;
365 spin_unlock(&lslist_lock);
366}
367
368static void remove_lockspace(struct dlm_ls *ls)
369{
370 for (;;) {
371 spin_lock(&lslist_lock);
372 if (ls->ls_count == 0) {
0f8e0d9a 373 WARN_ON(ls->ls_create_count != 0);
e7fd4179
DT
374 list_del(&ls->ls_list);
375 spin_unlock(&lslist_lock);
376 return;
377 }
378 spin_unlock(&lslist_lock);
379 ssleep(1);
380 }
381}
382
/*
 * Start the threads shared by all lockspaces: dlm_scand first, then the
 * midcomms layer.  If midcomms fails to start, dlm_scand is stopped again so
 * nothing is left running.
 *
 * Returns 0 on success or the error from whichever start call failed.
 */
static int threads_start(void)
{
	int error;

	error = dlm_scand_start();
	if (error) {
		log_print("cannot start dlm_scand thread %d", error);
		goto fail;
	}

	/* Thread for sending/receiving messages for all lockspace's */
	error = dlm_midcomms_start();
	if (error) {
		/* name the layer that actually failed (was "lowcomms") */
		log_print("cannot start dlm midcomms %d", error);
		goto scand_fail;
	}

	return 0;

 scand_fail:
	dlm_scand_stop();
 fail:
	return error;
}
407
60f98d18
DT
408static int new_lockspace(const char *name, const char *cluster,
409 uint32_t flags, int lvblen,
410 const struct dlm_lockspace_ops *ops, void *ops_arg,
411 int *ops_result, dlm_lockspace_t **lockspace)
e7fd4179
DT
412{
413 struct dlm_ls *ls;
0f8e0d9a 414 int i, size, error;
79d72b54 415 int do_unreg = 0;
60f98d18 416 int namelen = strlen(name);
e7fd4179 417
3f0806d2 418 if (namelen > DLM_LOCKSPACE_LEN || namelen == 0)
e7fd4179
DT
419 return -EINVAL;
420
421 if (!lvblen || (lvblen % 8))
422 return -EINVAL;
423
424 if (!try_module_get(THIS_MODULE))
425 return -EINVAL;
426
dc68c7ed 427 if (!dlm_user_daemon_available()) {
60f98d18
DT
428 log_print("dlm user daemon not available");
429 error = -EUNATCH;
430 goto out;
431 }
432
433 if (ops && ops_result) {
434 if (!dlm_config.ci_recover_callbacks)
435 *ops_result = -EOPNOTSUPP;
436 else
437 *ops_result = 0;
438 }
439
3b0e761b
ZL
440 if (!cluster)
441 log_print("dlm cluster name '%s' is being used without an application provided cluster name",
442 dlm_config.ci_cluster_name);
443
60f98d18
DT
444 if (dlm_config.ci_recover_callbacks && cluster &&
445 strncmp(cluster, dlm_config.ci_cluster_name, DLM_LOCKSPACE_LEN)) {
8e174374
GH
446 log_print("dlm cluster name '%s' does not match "
447 "the application cluster name '%s'",
60f98d18
DT
448 dlm_config.ci_cluster_name, cluster);
449 error = -EBADR;
450 goto out;
dc68c7ed
DT
451 }
452
0f8e0d9a
DT
453 error = 0;
454
455 spin_lock(&lslist_lock);
456 list_for_each_entry(ls, &lslist, ls_list) {
457 WARN_ON(ls->ls_create_count <= 0);
458 if (ls->ls_namelen != namelen)
459 continue;
460 if (memcmp(ls->ls_name, name, namelen))
461 continue;
462 if (flags & DLM_LSFL_NEWEXCL) {
463 error = -EEXIST;
464 break;
465 }
466 ls->ls_create_count++;
8511a272
DT
467 *lockspace = ls;
468 error = 1;
0f8e0d9a 469 break;
e7fd4179 470 }
0f8e0d9a
DT
471 spin_unlock(&lslist_lock);
472
0f8e0d9a 473 if (error)
8511a272 474 goto out;
0f8e0d9a
DT
475
476 error = -ENOMEM;
e7fd4179 477
573c24c4 478 ls = kzalloc(sizeof(struct dlm_ls) + namelen, GFP_NOFS);
e7fd4179
DT
479 if (!ls)
480 goto out;
e7fd4179
DT
481 memcpy(ls->ls_name, name, namelen);
482 ls->ls_namelen = namelen;
e7fd4179
DT
483 ls->ls_lvblen = lvblen;
484 ls->ls_count = 0;
485 ls->ls_flags = 0;
c1dcf65f 486 ls->ls_scan_time = jiffies;
e7fd4179 487
60f98d18
DT
488 if (ops && dlm_config.ci_recover_callbacks) {
489 ls->ls_ops = ops;
490 ls->ls_ops_arg = ops_arg;
491 }
492
3ae1acf9
DT
493 if (flags & DLM_LSFL_TIMEWARN)
494 set_bit(LSFL_TIMEWARN, &ls->ls_flags);
3ae1acf9 495
fad59c13 496 /* ls_exflags are forced to match among nodes, and we don't
0f8e0d9a
DT
497 need to require all nodes to have some flags set */
498 ls->ls_exflags = (flags & ~(DLM_LSFL_TIMEWARN | DLM_LSFL_FS |
499 DLM_LSFL_NEWEXCL));
fad59c13 500
d921a23f 501 size = READ_ONCE(dlm_config.ci_rsbtbl_size);
e7fd4179
DT
502 ls->ls_rsbtbl_size = size;
503
42bc47b3 504 ls->ls_rsbtbl = vmalloc(array_size(size, sizeof(struct dlm_rsbtable)));
e7fd4179
DT
505 if (!ls->ls_rsbtbl)
506 goto out_lsfree;
507 for (i = 0; i < size; i++) {
9beb3bf5
BP
508 ls->ls_rsbtbl[i].keep.rb_node = NULL;
509 ls->ls_rsbtbl[i].toss.rb_node = NULL;
c7be761a 510 spin_lock_init(&ls->ls_rsbtbl[i].lock);
e7fd4179
DT
511 }
512
05c32f47
DT
513 spin_lock_init(&ls->ls_remove_spin);
514
515 for (i = 0; i < DLM_REMOVE_NAMES_MAX; i++) {
516 ls->ls_remove_names[i] = kzalloc(DLM_RESNAME_MAXLEN+1,
517 GFP_KERNEL);
518 if (!ls->ls_remove_names[i])
519 goto out_rsbtbl;
520 }
521
3d6aa675
DT
522 idr_init(&ls->ls_lkbidr);
523 spin_lock_init(&ls->ls_lkbidr_spin);
e7fd4179 524
e7fd4179 525 INIT_LIST_HEAD(&ls->ls_waiters);
90135925 526 mutex_init(&ls->ls_waiters_mutex);
ef0c2bb0
DT
527 INIT_LIST_HEAD(&ls->ls_orphans);
528 mutex_init(&ls->ls_orphans_mutex);
3ae1acf9
DT
529 INIT_LIST_HEAD(&ls->ls_timeout);
530 mutex_init(&ls->ls_timeout_mutex);
e7fd4179 531
3881ac04
DT
532 INIT_LIST_HEAD(&ls->ls_new_rsb);
533 spin_lock_init(&ls->ls_new_rsb_spin);
534
e7fd4179
DT
535 INIT_LIST_HEAD(&ls->ls_nodes);
536 INIT_LIST_HEAD(&ls->ls_nodes_gone);
537 ls->ls_num_nodes = 0;
538 ls->ls_low_nodeid = 0;
539 ls->ls_total_weight = 0;
540 ls->ls_node_array = NULL;
541
542 memset(&ls->ls_stub_rsb, 0, sizeof(struct dlm_rsb));
543 ls->ls_stub_rsb.res_ls = ls;
544
5de6319b
DT
545 ls->ls_debug_rsb_dentry = NULL;
546 ls->ls_debug_waiters_dentry = NULL;
e7fd4179
DT
547
548 init_waitqueue_head(&ls->ls_uevent_wait);
549 ls->ls_uevent_result = 0;
8b0e7b2c
DT
550 init_completion(&ls->ls_members_done);
551 ls->ls_members_result = -1;
e7fd4179 552
23e8e1aa
DT
553 mutex_init(&ls->ls_cb_mutex);
554 INIT_LIST_HEAD(&ls->ls_cb_delay);
555
e7fd4179 556 ls->ls_recoverd_task = NULL;
90135925 557 mutex_init(&ls->ls_recoverd_active);
e7fd4179 558 spin_lock_init(&ls->ls_recover_lock);
98f176fb
DT
559 spin_lock_init(&ls->ls_rcom_spin);
560 get_random_bytes(&ls->ls_rcom_seq, sizeof(uint64_t));
e7fd4179
DT
561 ls->ls_recover_status = 0;
562 ls->ls_recover_seq = 0;
563 ls->ls_recover_args = NULL;
564 init_rwsem(&ls->ls_in_recovery);
c36258b5 565 init_rwsem(&ls->ls_recv_active);
e7fd4179 566 INIT_LIST_HEAD(&ls->ls_requestqueue);
90135925 567 mutex_init(&ls->ls_requestqueue_mutex);
597d0cae 568 mutex_init(&ls->ls_clear_proc_locks);
e7fd4179 569
489d8e55
AA
570 /* Due backwards compatibility with 3.1 we need to use maximum
571 * possible dlm message size to be sure the message will fit and
572 * not having out of bounds issues. However on sending side 3.2
573 * might send less.
574 */
d10a0b88 575 ls->ls_recover_buf = kmalloc(DLM_MAX_SOCKET_BUFSIZE, GFP_NOFS);
e7fd4179 576 if (!ls->ls_recover_buf)
05c32f47 577 goto out_lkbidr;
e7fd4179 578
757a4271
DT
579 ls->ls_slot = 0;
580 ls->ls_num_slots = 0;
581 ls->ls_slots_size = 0;
582 ls->ls_slots = NULL;
583
e7fd4179
DT
584 INIT_LIST_HEAD(&ls->ls_recover_list);
585 spin_lock_init(&ls->ls_recover_list_lock);
1d7c484e
DT
586 idr_init(&ls->ls_recover_idr);
587 spin_lock_init(&ls->ls_recover_idr_lock);
e7fd4179 588 ls->ls_recover_list_count = 0;
597d0cae 589 ls->ls_local_handle = ls;
e7fd4179
DT
590 init_waitqueue_head(&ls->ls_wait_general);
591 INIT_LIST_HEAD(&ls->ls_root_list);
592 init_rwsem(&ls->ls_root_sem);
593
5f88f1ea 594 spin_lock(&lslist_lock);
0f8e0d9a 595 ls->ls_create_count = 1;
5f88f1ea
DT
596 list_add(&ls->ls_list, &lslist);
597 spin_unlock(&lslist_lock);
598
23e8e1aa
DT
599 if (flags & DLM_LSFL_FS) {
600 error = dlm_callback_start(ls);
601 if (error) {
602 log_error(ls, "can't start dlm_callback %d", error);
603 goto out_delist;
604 }
605 }
606
475f230c
DT
607 init_waitqueue_head(&ls->ls_recover_lock_wait);
608
609 /*
610 * Once started, dlm_recoverd first looks for ls in lslist, then
611 * initializes ls_in_recovery as locked in "down" mode. We need
612 * to wait for the wakeup from dlm_recoverd because in_recovery
613 * has to start out in down mode.
614 */
615
e7fd4179
DT
616 error = dlm_recoverd_start(ls);
617 if (error) {
618 log_error(ls, "can't start dlm_recoverd %d", error);
23e8e1aa 619 goto out_callback;
e7fd4179
DT
620 }
621
475f230c
DT
622 wait_event(ls->ls_recover_lock_wait,
623 test_bit(LSFL_RECOVER_LOCK, &ls->ls_flags));
624
0ffddafc
WH
625 /* let kobject handle freeing of ls if there's an error */
626 do_unreg = 1;
627
901195ed
GKH
628 ls->ls_kobj.kset = dlm_kset;
629 error = kobject_init_and_add(&ls->ls_kobj, &dlm_ktype, NULL,
630 "%s", ls->ls_name);
e7fd4179 631 if (error)
23e8e1aa 632 goto out_recoverd;
901195ed 633 kobject_uevent(&ls->ls_kobj, KOBJ_ADD);
79d72b54 634
8b0e7b2c
DT
635 /* This uevent triggers dlm_controld in userspace to add us to the
636 group of nodes that are members of this lockspace (managed by the
637 cluster infrastructure.) Once it's done that, it tells us who the
638 current lockspace members are (via configfs) and then tells the
639 lockspace to start running (via sysfs) in dlm_ls_start(). */
640
e7fd4179
DT
641 error = do_uevent(ls, 1);
642 if (error)
23e8e1aa 643 goto out_recoverd;
79d72b54 644
8b0e7b2c
DT
645 wait_for_completion(&ls->ls_members_done);
646 error = ls->ls_members_result;
647 if (error)
648 goto out_members;
649
79d72b54
DT
650 dlm_create_debug_file(ls);
651
075f0177 652 log_rinfo(ls, "join complete");
e7fd4179
DT
653 *lockspace = ls;
654 return 0;
655
8b0e7b2c
DT
656 out_members:
657 do_uevent(ls, 0);
658 dlm_clear_members(ls);
659 kfree(ls->ls_node_array);
23e8e1aa 660 out_recoverd:
5f88f1ea 661 dlm_recoverd_stop(ls);
23e8e1aa
DT
662 out_callback:
663 dlm_callback_stop(ls);
79d72b54 664 out_delist:
e7fd4179
DT
665 spin_lock(&lslist_lock);
666 list_del(&ls->ls_list);
667 spin_unlock(&lslist_lock);
1d7c484e 668 idr_destroy(&ls->ls_recover_idr);
e7fd4179 669 kfree(ls->ls_recover_buf);
05c32f47 670 out_lkbidr:
3d6aa675 671 idr_destroy(&ls->ls_lkbidr);
b982896c 672 out_rsbtbl:
3456880f
TM
673 for (i = 0; i < DLM_REMOVE_NAMES_MAX; i++)
674 kfree(ls->ls_remove_names[i]);
c282af49 675 vfree(ls->ls_rsbtbl);
e7fd4179 676 out_lsfree:
79d72b54 677 if (do_unreg)
197b12d6 678 kobject_put(&ls->ls_kobj);
79d72b54
DT
679 else
680 kfree(ls);
e7fd4179
DT
681 out:
682 module_put(THIS_MODULE);
683 return error;
684}
685
60f98d18
DT
686int dlm_new_lockspace(const char *name, const char *cluster,
687 uint32_t flags, int lvblen,
688 const struct dlm_lockspace_ops *ops, void *ops_arg,
689 int *ops_result, dlm_lockspace_t **lockspace)
e7fd4179
DT
690{
691 int error = 0;
692
90135925 693 mutex_lock(&ls_lock);
e7fd4179
DT
694 if (!ls_count)
695 error = threads_start();
696 if (error)
697 goto out;
698
60f98d18
DT
699 error = new_lockspace(name, cluster, flags, lvblen, ops, ops_arg,
700 ops_result, lockspace);
e7fd4179
DT
701 if (!error)
702 ls_count++;
8511a272
DT
703 if (error > 0)
704 error = 0;
9d232469
AA
705 if (!ls_count) {
706 dlm_scand_stop();
a070a91c 707 dlm_midcomms_shutdown();
9d232469
AA
708 dlm_lowcomms_stop();
709 }
e7fd4179 710 out:
90135925 711 mutex_unlock(&ls_lock);
e7fd4179
DT
712 return error;
713}
714
3d6aa675 715static int lkb_idr_is_local(int id, void *p, void *data)
e7fd4179 716{
3d6aa675
DT
717 struct dlm_lkb *lkb = p;
718
a97f4a66 719 return lkb->lkb_nodeid == 0 && lkb->lkb_grmode != DLM_LOCK_IV;
3d6aa675
DT
720}
721
/*
 * idr_for_each() callback that matches every entry: always returns 1, so the
 * iteration stops at the first lkb, if there is one.  All arguments are
 * ignored.
 */
static int lkb_idr_is_any(int id, void *p, void *data)
{
	(void)id;
	(void)p;
	(void)data;

	return 1;
}
726
727static int lkb_idr_free(int id, void *p, void *data)
728{
729 struct dlm_lkb *lkb = p;
730
3d6aa675
DT
731 if (lkb->lkb_lvbptr && lkb->lkb_flags & DLM_IFL_MSTCPY)
732 dlm_free_lvb(lkb->lkb_lvbptr);
733
734 dlm_free_lkb(lkb);
735 return 0;
736}
737
738/* NOTE: We check the lkbidr here rather than the resource table.
739 This is because there may be LKBs queued as ASTs that have been unlinked
740 from their RSBs and are pending deletion once the AST has been delivered */
741
742static int lockspace_busy(struct dlm_ls *ls, int force)
743{
744 int rv;
745
746 spin_lock(&ls->ls_lkbidr_spin);
747 if (force == 0) {
748 rv = idr_for_each(&ls->ls_lkbidr, lkb_idr_is_any, ls);
749 } else if (force == 1) {
750 rv = idr_for_each(&ls->ls_lkbidr, lkb_idr_is_local, ls);
751 } else {
752 rv = 0;
e7fd4179 753 }
3d6aa675
DT
754 spin_unlock(&ls->ls_lkbidr_spin);
755 return rv;
e7fd4179
DT
756}
757
758static int release_lockspace(struct dlm_ls *ls, int force)
759{
e7fd4179 760 struct dlm_rsb *rsb;
9beb3bf5 761 struct rb_node *n;
0f8e0d9a
DT
762 int i, busy, rv;
763
3d6aa675 764 busy = lockspace_busy(ls, force);
0f8e0d9a
DT
765
766 spin_lock(&lslist_lock);
767 if (ls->ls_create_count == 1) {
3d6aa675 768 if (busy) {
0f8e0d9a 769 rv = -EBUSY;
3d6aa675 770 } else {
0f8e0d9a
DT
771 /* remove_lockspace takes ls off lslist */
772 ls->ls_create_count = 0;
773 rv = 0;
774 }
775 } else if (ls->ls_create_count > 1) {
776 rv = --ls->ls_create_count;
777 } else {
778 rv = -EINVAL;
779 }
780 spin_unlock(&lslist_lock);
781
782 if (rv) {
783 log_debug(ls, "release_lockspace no remove %d", rv);
784 return rv;
785 }
e7fd4179 786
0f8e0d9a 787 dlm_device_deregister(ls);
e7fd4179 788
dc68c7ed 789 if (force < 3 && dlm_user_daemon_available())
e7fd4179
DT
790 do_uevent(ls, 0);
791
792 dlm_recoverd_stop(ls);
793
9d232469
AA
794 if (ls_count == 1) {
795 dlm_scand_stop();
a070a91c 796 dlm_midcomms_shutdown();
9d232469
AA
797 }
798
23e8e1aa
DT
799 dlm_callback_stop(ls);
800
e7fd4179
DT
801 remove_lockspace(ls);
802
803 dlm_delete_debug_file(ls);
804
8fc6ed9a 805 idr_destroy(&ls->ls_recover_idr);
e7fd4179
DT
806 kfree(ls->ls_recover_buf);
807
e7fd4179 808 /*
3d6aa675 809 * Free all lkb's in idr
e7fd4179
DT
810 */
811
3d6aa675 812 idr_for_each(&ls->ls_lkbidr, lkb_idr_free, ls);
3d6aa675 813 idr_destroy(&ls->ls_lkbidr);
e7fd4179 814
e7fd4179
DT
815 /*
816 * Free all rsb's on rsbtbl[] lists
817 */
818
819 for (i = 0; i < ls->ls_rsbtbl_size; i++) {
9beb3bf5
BP
820 while ((n = rb_first(&ls->ls_rsbtbl[i].keep))) {
821 rsb = rb_entry(n, struct dlm_rsb, res_hashnode);
822 rb_erase(n, &ls->ls_rsbtbl[i].keep);
52bda2b5 823 dlm_free_rsb(rsb);
e7fd4179
DT
824 }
825
9beb3bf5
BP
826 while ((n = rb_first(&ls->ls_rsbtbl[i].toss))) {
827 rsb = rb_entry(n, struct dlm_rsb, res_hashnode);
828 rb_erase(n, &ls->ls_rsbtbl[i].toss);
52bda2b5 829 dlm_free_rsb(rsb);
e7fd4179
DT
830 }
831 }
832
c282af49 833 vfree(ls->ls_rsbtbl);
e7fd4179 834
05c32f47
DT
835 for (i = 0; i < DLM_REMOVE_NAMES_MAX; i++)
836 kfree(ls->ls_remove_names[i]);
837
3881ac04
DT
838 while (!list_empty(&ls->ls_new_rsb)) {
839 rsb = list_first_entry(&ls->ls_new_rsb, struct dlm_rsb,
840 res_hashchain);
841 list_del(&rsb->res_hashchain);
842 dlm_free_rsb(rsb);
843 }
844
e7fd4179
DT
845 /*
846 * Free structures on any other lists
847 */
848
2896ee37 849 dlm_purge_requestqueue(ls);
e7fd4179 850 kfree(ls->ls_recover_args);
e7fd4179
DT
851 dlm_clear_members(ls);
852 dlm_clear_members_gone(ls);
853 kfree(ls->ls_node_array);
075f0177 854 log_rinfo(ls, "release_lockspace final free");
197b12d6 855 kobject_put(&ls->ls_kobj);
79d72b54 856 /* The ls structure will be freed when the kobject is done with */
e7fd4179 857
e7fd4179
DT
858 module_put(THIS_MODULE);
859 return 0;
860}
861
862/*
863 * Called when a system has released all its locks and is not going to use the
864 * lockspace any longer. We free everything we're managing for this lockspace.
865 * Remaining nodes will go through the recovery process as if we'd died. The
866 * lockspace must continue to function as usual, participating in recoveries,
867 * until this returns.
868 *
869 * Force has 4 possible values:
870 * 0 - don't destroy lockspace if it has any LKBs
871 * 1 - destroy lockspace if it has remote LKBs but not if it has local LKBs
872 * 2 - destroy lockspace regardless of LKBs
873 * 3 - destroy lockspace as part of a forced shutdown
874 */
875
876int dlm_release_lockspace(void *lockspace, int force)
877{
878 struct dlm_ls *ls;
0f8e0d9a 879 int error;
e7fd4179
DT
880
881 ls = dlm_find_lockspace_local(lockspace);
882 if (!ls)
883 return -EINVAL;
884 dlm_put_lockspace(ls);
0f8e0d9a
DT
885
886 mutex_lock(&ls_lock);
887 error = release_lockspace(ls, force);
888 if (!error)
889 ls_count--;
278afcbf 890 if (!ls_count)
9d232469 891 dlm_lowcomms_stop();
0f8e0d9a
DT
892 mutex_unlock(&ls_lock);
893
894 return error;
e7fd4179
DT
895}
896
dc68c7ed
DT
897void dlm_stop_lockspaces(void)
898{
899 struct dlm_ls *ls;
696b3d84 900 int count;
dc68c7ed
DT
901
902 restart:
696b3d84 903 count = 0;
dc68c7ed
DT
904 spin_lock(&lslist_lock);
905 list_for_each_entry(ls, &lslist, ls_list) {
696b3d84
DT
906 if (!test_bit(LSFL_RUNNING, &ls->ls_flags)) {
907 count++;
dc68c7ed 908 continue;
696b3d84 909 }
dc68c7ed
DT
910 spin_unlock(&lslist_lock);
911 log_error(ls, "no userland control daemon, stopping lockspace");
912 dlm_ls_stop(ls);
913 goto restart;
914 }
915 spin_unlock(&lslist_lock);
696b3d84
DT
916
917 if (count)
918 log_print("dlm user daemon left %d lockspaces", count);
dc68c7ed
DT
919}
920