Merge tag 'trace-v6.3-rc1' of git://git.kernel.org/pub/scm/linux/kernel/git/trace...
[linux-block.git] / fs / dlm / lockspace.c
CommitLineData
2522fe45 1// SPDX-License-Identifier: GPL-2.0-only
e7fd4179
DT
2/******************************************************************************
3*******************************************************************************
4**
5** Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
60f98d18 6** Copyright (C) 2004-2011 Red Hat, Inc. All rights reserved.
e7fd4179 7**
e7fd4179
DT
8**
9*******************************************************************************
10******************************************************************************/
11
7963b8a5
PG
12#include <linux/module.h>
13
e7fd4179
DT
14#include "dlm_internal.h"
15#include "lockspace.h"
16#include "member.h"
17#include "recoverd.h"
e7fd4179 18#include "dir.h"
a070a91c 19#include "midcomms.h"
e7fd4179
DT
20#include "config.h"
21#include "memory.h"
22#include "lock.h"
c56b39cd 23#include "recover.h"
2896ee37 24#include "requestqueue.h"
0f8e0d9a 25#include "user.h"
23e8e1aa 26#include "ast.h"
e7fd4179 27
e7fd4179 28static int ls_count;
90135925 29static struct mutex ls_lock;
e7fd4179
DT
30static struct list_head lslist;
31static spinlock_t lslist_lock;
32static struct task_struct * scand_task;
33
34
35static ssize_t dlm_control_store(struct dlm_ls *ls, const char *buf, size_t len)
36{
37 ssize_t ret = len;
6edb5687
FF
38 int n;
39 int rc = kstrtoint(buf, 0, &n);
e7fd4179 40
6edb5687
FF
41 if (rc)
42 return rc;
e2de7f56
PC
43 ls = dlm_find_lockspace_local(ls->ls_local_handle);
44 if (!ls)
45 return -EINVAL;
46
e7fd4179
DT
47 switch (n) {
48 case 0:
49 dlm_ls_stop(ls);
50 break;
51 case 1:
52 dlm_ls_start(ls);
53 break;
54 default:
55 ret = -EINVAL;
56 }
e2de7f56 57 dlm_put_lockspace(ls);
e7fd4179
DT
58 return ret;
59}
60
61static ssize_t dlm_event_store(struct dlm_ls *ls, const char *buf, size_t len)
62{
6edb5687
FF
63 int rc = kstrtoint(buf, 0, &ls->ls_uevent_result);
64
65 if (rc)
66 return rc;
e7fd4179
DT
67 set_bit(LSFL_UEVENT_WAIT, &ls->ls_flags);
68 wake_up(&ls->ls_uevent_wait);
69 return len;
70}
71
72static ssize_t dlm_id_show(struct dlm_ls *ls, char *buf)
73{
a1d144c7 74 return snprintf(buf, PAGE_SIZE, "%u\n", ls->ls_global_id);
e7fd4179
DT
75}
76
77static ssize_t dlm_id_store(struct dlm_ls *ls, const char *buf, size_t len)
78{
6edb5687
FF
79 int rc = kstrtouint(buf, 0, &ls->ls_global_id);
80
81 if (rc)
82 return rc;
e7fd4179
DT
83 return len;
84}
85
4875647a
DT
86static ssize_t dlm_nodir_show(struct dlm_ls *ls, char *buf)
87{
88 return snprintf(buf, PAGE_SIZE, "%u\n", dlm_no_directory(ls));
89}
90
91static ssize_t dlm_nodir_store(struct dlm_ls *ls, const char *buf, size_t len)
92{
6edb5687
FF
93 int val;
94 int rc = kstrtoint(buf, 0, &val);
95
96 if (rc)
97 return rc;
4875647a
DT
98 if (val == 1)
99 set_bit(LSFL_NODIR, &ls->ls_flags);
100 return len;
101}
102
c56b39cd
DT
103static ssize_t dlm_recover_status_show(struct dlm_ls *ls, char *buf)
104{
105 uint32_t status = dlm_recover_status(ls);
a1d144c7 106 return snprintf(buf, PAGE_SIZE, "%x\n", status);
c56b39cd
DT
107}
108
faa0f267
DT
109static ssize_t dlm_recover_nodeid_show(struct dlm_ls *ls, char *buf)
110{
a1d144c7 111 return snprintf(buf, PAGE_SIZE, "%d\n", ls->ls_recover_nodeid);
faa0f267
DT
112}
113
e7fd4179
DT
114struct dlm_attr {
115 struct attribute attr;
116 ssize_t (*show)(struct dlm_ls *, char *);
117 ssize_t (*store)(struct dlm_ls *, const char *, size_t);
118};
119
120static struct dlm_attr dlm_attr_control = {
121 .attr = {.name = "control", .mode = S_IWUSR},
122 .store = dlm_control_store
123};
124
125static struct dlm_attr dlm_attr_event = {
126 .attr = {.name = "event_done", .mode = S_IWUSR},
127 .store = dlm_event_store
128};
129
130static struct dlm_attr dlm_attr_id = {
131 .attr = {.name = "id", .mode = S_IRUGO | S_IWUSR},
132 .show = dlm_id_show,
133 .store = dlm_id_store
134};
135
4875647a
DT
136static struct dlm_attr dlm_attr_nodir = {
137 .attr = {.name = "nodir", .mode = S_IRUGO | S_IWUSR},
138 .show = dlm_nodir_show,
139 .store = dlm_nodir_store
140};
141
c56b39cd
DT
142static struct dlm_attr dlm_attr_recover_status = {
143 .attr = {.name = "recover_status", .mode = S_IRUGO},
144 .show = dlm_recover_status_show
145};
146
faa0f267
DT
147static struct dlm_attr dlm_attr_recover_nodeid = {
148 .attr = {.name = "recover_nodeid", .mode = S_IRUGO},
149 .show = dlm_recover_nodeid_show
150};
151
e7fd4179
DT
152static struct attribute *dlm_attrs[] = {
153 &dlm_attr_control.attr,
154 &dlm_attr_event.attr,
155 &dlm_attr_id.attr,
4875647a 156 &dlm_attr_nodir.attr,
c56b39cd 157 &dlm_attr_recover_status.attr,
faa0f267 158 &dlm_attr_recover_nodeid.attr,
e7fd4179
DT
159 NULL,
160};
c9c5b5e1 161ATTRIBUTE_GROUPS(dlm);
e7fd4179
DT
162
163static ssize_t dlm_attr_show(struct kobject *kobj, struct attribute *attr,
164 char *buf)
165{
166 struct dlm_ls *ls = container_of(kobj, struct dlm_ls, ls_kobj);
167 struct dlm_attr *a = container_of(attr, struct dlm_attr, attr);
168 return a->show ? a->show(ls, buf) : 0;
169}
170
171static ssize_t dlm_attr_store(struct kobject *kobj, struct attribute *attr,
172 const char *buf, size_t len)
173{
174 struct dlm_ls *ls = container_of(kobj, struct dlm_ls, ls_kobj);
175 struct dlm_attr *a = container_of(attr, struct dlm_attr, attr);
176 return a->store ? a->store(ls, buf, len) : len;
177}
178
ba542e3b
PC
179static void lockspace_kobj_release(struct kobject *k)
180{
181 struct dlm_ls *ls = container_of(k, struct dlm_ls, ls_kobj);
182 kfree(ls);
183}
184
52cf25d0 185static const struct sysfs_ops dlm_attr_ops = {
e7fd4179
DT
186 .show = dlm_attr_show,
187 .store = dlm_attr_store,
188};
189
190static struct kobj_type dlm_ktype = {
c9c5b5e1 191 .default_groups = dlm_groups,
e7fd4179 192 .sysfs_ops = &dlm_attr_ops,
ba542e3b 193 .release = lockspace_kobj_release,
e7fd4179
DT
194};
195
/* The "dlm" kset; created in dlm_lockspace_init(), parent of lockspaces. */
static struct kset *dlm_kset;
e7fd4179 197
e7fd4179
DT
198static int do_uevent(struct dlm_ls *ls, int in)
199{
e7fd4179
DT
200 if (in)
201 kobject_uevent(&ls->ls_kobj, KOBJ_ONLINE);
202 else
203 kobject_uevent(&ls->ls_kobj, KOBJ_OFFLINE);
204
075f0177 205 log_rinfo(ls, "%s the lockspace group...", in ? "joining" : "leaving");
8b0e7b2c
DT
206
207 /* dlm_controld will see the uevent, do the necessary group management
208 and then write to sysfs to wake us */
209
f084a4f4
RL
210 wait_event(ls->ls_uevent_wait,
211 test_and_clear_bit(LSFL_UEVENT_WAIT, &ls->ls_flags));
8b0e7b2c 212
f084a4f4 213 log_rinfo(ls, "group event done %d", ls->ls_uevent_result);
e7fd4179 214
f084a4f4 215 return ls->ls_uevent_result;
e7fd4179
DT
216}
217
56d5f362 218static int dlm_uevent(const struct kobject *kobj, struct kobj_uevent_env *env)
b4a5d4bc 219{
56d5f362 220 const struct dlm_ls *ls = container_of(kobj, struct dlm_ls, ls_kobj);
b4a5d4bc
SW
221
222 add_uevent_var(env, "LOCKSPACE=%s", ls->ls_name);
223 return 0;
224}
225
417f7c59 226static const struct kset_uevent_ops dlm_uevent_ops = {
b4a5d4bc
SW
227 .uevent = dlm_uevent,
228};
e7fd4179 229
30727174 230int __init dlm_lockspace_init(void)
e7fd4179 231{
e7fd4179 232 ls_count = 0;
90135925 233 mutex_init(&ls_lock);
e7fd4179
DT
234 INIT_LIST_HEAD(&lslist);
235 spin_lock_init(&lslist_lock);
236
b4a5d4bc 237 dlm_kset = kset_create_and_add("dlm", &dlm_uevent_ops, kernel_kobj);
d405936b 238 if (!dlm_kset) {
8e24eea7 239 printk(KERN_WARNING "%s: can not create kset\n", __func__);
d405936b
GKH
240 return -ENOMEM;
241 }
242 return 0;
e7fd4179
DT
243}
244
245void dlm_lockspace_exit(void)
246{
d405936b 247 kset_unregister(dlm_kset);
e7fd4179
DT
248}
249
c1dcf65f
DT
250static struct dlm_ls *find_ls_to_scan(void)
251{
252 struct dlm_ls *ls;
253
254 spin_lock(&lslist_lock);
255 list_for_each_entry(ls, &lslist, ls_list) {
256 if (time_after_eq(jiffies, ls->ls_scan_time +
257 dlm_config.ci_scan_secs * HZ)) {
258 spin_unlock(&lslist_lock);
259 return ls;
260 }
261 }
262 spin_unlock(&lslist_lock);
263 return NULL;
264}
265
e7fd4179
DT
266static int dlm_scand(void *data)
267{
268 struct dlm_ls *ls;
269
270 while (!kthread_should_stop()) {
c1dcf65f
DT
271 ls = find_ls_to_scan();
272 if (ls) {
85e86edf 273 if (dlm_lock_recovery_try(ls)) {
c1dcf65f 274 ls->ls_scan_time = jiffies;
85e86edf 275 dlm_scan_rsbs(ls);
3ae1acf9 276 dlm_scan_timeout(ls);
85e86edf 277 dlm_unlock_recovery(ls);
c1dcf65f
DT
278 } else {
279 ls->ls_scan_time += HZ;
85e86edf 280 }
c6ff669b 281 continue;
85e86edf 282 }
c6ff669b 283 schedule_timeout_interruptible(dlm_config.ci_scan_secs * HZ);
e7fd4179
DT
284 }
285 return 0;
286}
287
288static int dlm_scand_start(void)
289{
290 struct task_struct *p;
291 int error = 0;
292
293 p = kthread_run(dlm_scand, NULL, "dlm_scand");
294 if (IS_ERR(p))
295 error = PTR_ERR(p);
296 else
297 scand_task = p;
298 return error;
299}
300
301static void dlm_scand_stop(void)
302{
303 kthread_stop(scand_task);
304}
305
e7fd4179
DT
306struct dlm_ls *dlm_find_lockspace_global(uint32_t id)
307{
308 struct dlm_ls *ls;
309
310 spin_lock(&lslist_lock);
311
312 list_for_each_entry(ls, &lslist, ls_list) {
313 if (ls->ls_global_id == id) {
3cb5977c 314 atomic_inc(&ls->ls_count);
e7fd4179
DT
315 goto out;
316 }
317 }
318 ls = NULL;
319 out:
320 spin_unlock(&lslist_lock);
321 return ls;
322}
323
597d0cae 324struct dlm_ls *dlm_find_lockspace_local(dlm_lockspace_t *lockspace)
e7fd4179 325{
597d0cae 326 struct dlm_ls *ls;
e7fd4179
DT
327
328 spin_lock(&lslist_lock);
597d0cae
DT
329 list_for_each_entry(ls, &lslist, ls_list) {
330 if (ls->ls_local_handle == lockspace) {
3cb5977c 331 atomic_inc(&ls->ls_count);
597d0cae
DT
332 goto out;
333 }
334 }
335 ls = NULL;
336 out:
337 spin_unlock(&lslist_lock);
338 return ls;
339}
340
341struct dlm_ls *dlm_find_lockspace_device(int minor)
342{
343 struct dlm_ls *ls;
344
345 spin_lock(&lslist_lock);
346 list_for_each_entry(ls, &lslist, ls_list) {
347 if (ls->ls_device.minor == minor) {
3cb5977c 348 atomic_inc(&ls->ls_count);
597d0cae
DT
349 goto out;
350 }
351 }
352 ls = NULL;
353 out:
e7fd4179
DT
354 spin_unlock(&lslist_lock);
355 return ls;
356}
357
358void dlm_put_lockspace(struct dlm_ls *ls)
359{
3cb5977c
AA
360 if (atomic_dec_and_test(&ls->ls_count))
361 wake_up(&ls->ls_count_wait);
e7fd4179
DT
362}
363
364static void remove_lockspace(struct dlm_ls *ls)
365{
3cb5977c
AA
366retry:
367 wait_event(ls->ls_count_wait, atomic_read(&ls->ls_count) == 0);
368
369 spin_lock(&lslist_lock);
370 if (atomic_read(&ls->ls_count) != 0) {
e7fd4179 371 spin_unlock(&lslist_lock);
3cb5977c 372 goto retry;
e7fd4179 373 }
3cb5977c
AA
374
375 WARN_ON(ls->ls_create_count != 0);
376 list_del(&ls->ls_list);
377 spin_unlock(&lslist_lock);
e7fd4179
DT
378}
379
/*
 * Start the services shared by all lockspaces: midcomms first, then the
 * dlm_scand thread.  If dlm_scand cannot be started, midcomms is stopped
 * again.
 *
 * Returns 0 on success or the error from the step that failed.
 */
static int threads_start(void)
{
	int error;

	/* Thread for sending/receiving messages for all lockspaces */
	error = dlm_midcomms_start();
	if (error) {
		log_print("cannot start dlm midcomms %d", error);
		return error;
	}

	error = dlm_scand_start();
	if (error) {
		log_print("cannot start dlm_scand thread %d", error);
		dlm_midcomms_stop();
		return error;
	}

	return 0;
}
404
60f98d18
DT
405static int new_lockspace(const char *name, const char *cluster,
406 uint32_t flags, int lvblen,
407 const struct dlm_lockspace_ops *ops, void *ops_arg,
408 int *ops_result, dlm_lockspace_t **lockspace)
e7fd4179
DT
409{
410 struct dlm_ls *ls;
0f8e0d9a 411 int i, size, error;
79d72b54 412 int do_unreg = 0;
60f98d18 413 int namelen = strlen(name);
e7fd4179 414
3f0806d2 415 if (namelen > DLM_LOCKSPACE_LEN || namelen == 0)
e7fd4179
DT
416 return -EINVAL;
417
b5c9d37c 418 if (lvblen % 8)
e7fd4179
DT
419 return -EINVAL;
420
421 if (!try_module_get(THIS_MODULE))
422 return -EINVAL;
423
dc68c7ed 424 if (!dlm_user_daemon_available()) {
60f98d18
DT
425 log_print("dlm user daemon not available");
426 error = -EUNATCH;
427 goto out;
428 }
429
430 if (ops && ops_result) {
431 if (!dlm_config.ci_recover_callbacks)
432 *ops_result = -EOPNOTSUPP;
433 else
434 *ops_result = 0;
435 }
436
3b0e761b
ZL
437 if (!cluster)
438 log_print("dlm cluster name '%s' is being used without an application provided cluster name",
439 dlm_config.ci_cluster_name);
440
60f98d18
DT
441 if (dlm_config.ci_recover_callbacks && cluster &&
442 strncmp(cluster, dlm_config.ci_cluster_name, DLM_LOCKSPACE_LEN)) {
8e174374
GH
443 log_print("dlm cluster name '%s' does not match "
444 "the application cluster name '%s'",
60f98d18
DT
445 dlm_config.ci_cluster_name, cluster);
446 error = -EBADR;
447 goto out;
dc68c7ed
DT
448 }
449
0f8e0d9a
DT
450 error = 0;
451
452 spin_lock(&lslist_lock);
453 list_for_each_entry(ls, &lslist, ls_list) {
454 WARN_ON(ls->ls_create_count <= 0);
455 if (ls->ls_namelen != namelen)
456 continue;
457 if (memcmp(ls->ls_name, name, namelen))
458 continue;
459 if (flags & DLM_LSFL_NEWEXCL) {
460 error = -EEXIST;
461 break;
462 }
463 ls->ls_create_count++;
8511a272
DT
464 *lockspace = ls;
465 error = 1;
0f8e0d9a 466 break;
e7fd4179 467 }
0f8e0d9a
DT
468 spin_unlock(&lslist_lock);
469
0f8e0d9a 470 if (error)
8511a272 471 goto out;
0f8e0d9a
DT
472
473 error = -ENOMEM;
e7fd4179 474
d96d0f96 475 ls = kzalloc(sizeof(*ls), GFP_NOFS);
e7fd4179
DT
476 if (!ls)
477 goto out;
e7fd4179
DT
478 memcpy(ls->ls_name, name, namelen);
479 ls->ls_namelen = namelen;
e7fd4179 480 ls->ls_lvblen = lvblen;
3cb5977c
AA
481 atomic_set(&ls->ls_count, 0);
482 init_waitqueue_head(&ls->ls_count_wait);
e7fd4179 483 ls->ls_flags = 0;
c1dcf65f 484 ls->ls_scan_time = jiffies;
e7fd4179 485
60f98d18
DT
486 if (ops && dlm_config.ci_recover_callbacks) {
487 ls->ls_ops = ops;
488 ls->ls_ops_arg = ops_arg;
489 }
490
81eeb82f 491#ifdef CONFIG_DLM_DEPRECATED_API
6b0afc0c 492 if (flags & DLM_LSFL_TIMEWARN) {
81eeb82f
AA
493 pr_warn_once("===============================================================\n"
494 "WARNING: the dlm DLM_LSFL_TIMEWARN flag is being deprecated and\n"
495 " will be removed in v6.2!\n"
496 " Inclusive DLM_LSFL_TIMEWARN define in UAPI header!\n"
497 "===============================================================\n");
81eeb82f 498
3ae1acf9 499 set_bit(LSFL_TIMEWARN, &ls->ls_flags);
81eeb82f 500 }
3ae1acf9 501
fad59c13 502 /* ls_exflags are forced to match among nodes, and we don't
6b0afc0c
AA
503 * need to require all nodes to have some flags set
504 */
0f8e0d9a
DT
505 ls->ls_exflags = (flags & ~(DLM_LSFL_TIMEWARN | DLM_LSFL_FS |
506 DLM_LSFL_NEWEXCL));
6b0afc0c
AA
507#else
508 /* ls_exflags are forced to match among nodes, and we don't
509 * need to require all nodes to have some flags set
510 */
511 ls->ls_exflags = (flags & ~(DLM_LSFL_FS | DLM_LSFL_NEWEXCL));
512#endif
fad59c13 513
d921a23f 514 size = READ_ONCE(dlm_config.ci_rsbtbl_size);
e7fd4179
DT
515 ls->ls_rsbtbl_size = size;
516
42bc47b3 517 ls->ls_rsbtbl = vmalloc(array_size(size, sizeof(struct dlm_rsbtable)));
e7fd4179
DT
518 if (!ls->ls_rsbtbl)
519 goto out_lsfree;
520 for (i = 0; i < size; i++) {
9beb3bf5
BP
521 ls->ls_rsbtbl[i].keep.rb_node = NULL;
522 ls->ls_rsbtbl[i].toss.rb_node = NULL;
c7be761a 523 spin_lock_init(&ls->ls_rsbtbl[i].lock);
e7fd4179
DT
524 }
525
05c32f47
DT
526 for (i = 0; i < DLM_REMOVE_NAMES_MAX; i++) {
527 ls->ls_remove_names[i] = kzalloc(DLM_RESNAME_MAXLEN+1,
528 GFP_KERNEL);
529 if (!ls->ls_remove_names[i])
530 goto out_rsbtbl;
531 }
532
3d6aa675
DT
533 idr_init(&ls->ls_lkbidr);
534 spin_lock_init(&ls->ls_lkbidr_spin);
e7fd4179 535
e7fd4179 536 INIT_LIST_HEAD(&ls->ls_waiters);
90135925 537 mutex_init(&ls->ls_waiters_mutex);
ef0c2bb0
DT
538 INIT_LIST_HEAD(&ls->ls_orphans);
539 mutex_init(&ls->ls_orphans_mutex);
6b0afc0c 540#ifdef CONFIG_DLM_DEPRECATED_API
3ae1acf9
DT
541 INIT_LIST_HEAD(&ls->ls_timeout);
542 mutex_init(&ls->ls_timeout_mutex);
6b0afc0c 543#endif
e7fd4179 544
3881ac04
DT
545 INIT_LIST_HEAD(&ls->ls_new_rsb);
546 spin_lock_init(&ls->ls_new_rsb_spin);
547
e7fd4179
DT
548 INIT_LIST_HEAD(&ls->ls_nodes);
549 INIT_LIST_HEAD(&ls->ls_nodes_gone);
550 ls->ls_num_nodes = 0;
551 ls->ls_low_nodeid = 0;
552 ls->ls_total_weight = 0;
553 ls->ls_node_array = NULL;
554
555 memset(&ls->ls_stub_rsb, 0, sizeof(struct dlm_rsb));
556 ls->ls_stub_rsb.res_ls = ls;
557
5de6319b
DT
558 ls->ls_debug_rsb_dentry = NULL;
559 ls->ls_debug_waiters_dentry = NULL;
e7fd4179
DT
560
561 init_waitqueue_head(&ls->ls_uevent_wait);
562 ls->ls_uevent_result = 0;
682bb91b
AA
563 init_completion(&ls->ls_recovery_done);
564 ls->ls_recovery_result = -1;
e7fd4179 565
a4c0352b 566 spin_lock_init(&ls->ls_cb_lock);
23e8e1aa
DT
567 INIT_LIST_HEAD(&ls->ls_cb_delay);
568
e7fd4179 569 ls->ls_recoverd_task = NULL;
90135925 570 mutex_init(&ls->ls_recoverd_active);
e7fd4179 571 spin_lock_init(&ls->ls_recover_lock);
98f176fb
DT
572 spin_lock_init(&ls->ls_rcom_spin);
573 get_random_bytes(&ls->ls_rcom_seq, sizeof(uint64_t));
e7fd4179 574 ls->ls_recover_status = 0;
317dd6ba 575 ls->ls_recover_seq = get_random_u64();
e7fd4179
DT
576 ls->ls_recover_args = NULL;
577 init_rwsem(&ls->ls_in_recovery);
c36258b5 578 init_rwsem(&ls->ls_recv_active);
e7fd4179 579 INIT_LIST_HEAD(&ls->ls_requestqueue);
164d88ab
AA
580 atomic_set(&ls->ls_requestqueue_cnt, 0);
581 init_waitqueue_head(&ls->ls_requestqueue_wait);
90135925 582 mutex_init(&ls->ls_requestqueue_mutex);
296d9d1e 583 spin_lock_init(&ls->ls_clear_proc_locks);
e7fd4179 584
489d8e55
AA
585 /* Due backwards compatibility with 3.1 we need to use maximum
586 * possible dlm message size to be sure the message will fit and
587 * not having out of bounds issues. However on sending side 3.2
588 * might send less.
589 */
d10a0b88 590 ls->ls_recover_buf = kmalloc(DLM_MAX_SOCKET_BUFSIZE, GFP_NOFS);
e7fd4179 591 if (!ls->ls_recover_buf)
05c32f47 592 goto out_lkbidr;
e7fd4179 593
757a4271
DT
594 ls->ls_slot = 0;
595 ls->ls_num_slots = 0;
596 ls->ls_slots_size = 0;
597 ls->ls_slots = NULL;
598
e7fd4179
DT
599 INIT_LIST_HEAD(&ls->ls_recover_list);
600 spin_lock_init(&ls->ls_recover_list_lock);
1d7c484e
DT
601 idr_init(&ls->ls_recover_idr);
602 spin_lock_init(&ls->ls_recover_idr_lock);
e7fd4179 603 ls->ls_recover_list_count = 0;
597d0cae 604 ls->ls_local_handle = ls;
e7fd4179
DT
605 init_waitqueue_head(&ls->ls_wait_general);
606 INIT_LIST_HEAD(&ls->ls_root_list);
607 init_rwsem(&ls->ls_root_sem);
608
5f88f1ea 609 spin_lock(&lslist_lock);
0f8e0d9a 610 ls->ls_create_count = 1;
5f88f1ea
DT
611 list_add(&ls->ls_list, &lslist);
612 spin_unlock(&lslist_lock);
613
23e8e1aa
DT
614 if (flags & DLM_LSFL_FS) {
615 error = dlm_callback_start(ls);
616 if (error) {
617 log_error(ls, "can't start dlm_callback %d", error);
618 goto out_delist;
619 }
620 }
621
475f230c
DT
622 init_waitqueue_head(&ls->ls_recover_lock_wait);
623
624 /*
625 * Once started, dlm_recoverd first looks for ls in lslist, then
626 * initializes ls_in_recovery as locked in "down" mode. We need
627 * to wait for the wakeup from dlm_recoverd because in_recovery
628 * has to start out in down mode.
629 */
630
e7fd4179
DT
631 error = dlm_recoverd_start(ls);
632 if (error) {
633 log_error(ls, "can't start dlm_recoverd %d", error);
23e8e1aa 634 goto out_callback;
e7fd4179
DT
635 }
636
475f230c
DT
637 wait_event(ls->ls_recover_lock_wait,
638 test_bit(LSFL_RECOVER_LOCK, &ls->ls_flags));
639
0ffddafc
WH
640 /* let kobject handle freeing of ls if there's an error */
641 do_unreg = 1;
642
901195ed
GKH
643 ls->ls_kobj.kset = dlm_kset;
644 error = kobject_init_and_add(&ls->ls_kobj, &dlm_ktype, NULL,
645 "%s", ls->ls_name);
e7fd4179 646 if (error)
23e8e1aa 647 goto out_recoverd;
901195ed 648 kobject_uevent(&ls->ls_kobj, KOBJ_ADD);
79d72b54 649
8b0e7b2c
DT
650 /* This uevent triggers dlm_controld in userspace to add us to the
651 group of nodes that are members of this lockspace (managed by the
652 cluster infrastructure.) Once it's done that, it tells us who the
653 current lockspace members are (via configfs) and then tells the
654 lockspace to start running (via sysfs) in dlm_ls_start(). */
655
e7fd4179
DT
656 error = do_uevent(ls, 1);
657 if (error)
23e8e1aa 658 goto out_recoverd;
79d72b54 659
682bb91b
AA
660 /* wait until recovery is successful or failed */
661 wait_for_completion(&ls->ls_recovery_done);
662 error = ls->ls_recovery_result;
8b0e7b2c
DT
663 if (error)
664 goto out_members;
665
79d72b54
DT
666 dlm_create_debug_file(ls);
667
075f0177 668 log_rinfo(ls, "join complete");
e7fd4179
DT
669 *lockspace = ls;
670 return 0;
671
8b0e7b2c
DT
672 out_members:
673 do_uevent(ls, 0);
674 dlm_clear_members(ls);
675 kfree(ls->ls_node_array);
23e8e1aa 676 out_recoverd:
5f88f1ea 677 dlm_recoverd_stop(ls);
23e8e1aa
DT
678 out_callback:
679 dlm_callback_stop(ls);
79d72b54 680 out_delist:
e7fd4179
DT
681 spin_lock(&lslist_lock);
682 list_del(&ls->ls_list);
683 spin_unlock(&lslist_lock);
1d7c484e 684 idr_destroy(&ls->ls_recover_idr);
e7fd4179 685 kfree(ls->ls_recover_buf);
05c32f47 686 out_lkbidr:
3d6aa675 687 idr_destroy(&ls->ls_lkbidr);
b982896c 688 out_rsbtbl:
3456880f
TM
689 for (i = 0; i < DLM_REMOVE_NAMES_MAX; i++)
690 kfree(ls->ls_remove_names[i]);
c282af49 691 vfree(ls->ls_rsbtbl);
e7fd4179 692 out_lsfree:
79d72b54 693 if (do_unreg)
197b12d6 694 kobject_put(&ls->ls_kobj);
79d72b54
DT
695 else
696 kfree(ls);
e7fd4179
DT
697 out:
698 module_put(THIS_MODULE);
699 return error;
700}
701
12cda13c
AA
702static int __dlm_new_lockspace(const char *name, const char *cluster,
703 uint32_t flags, int lvblen,
704 const struct dlm_lockspace_ops *ops,
705 void *ops_arg, int *ops_result,
706 dlm_lockspace_t **lockspace)
e7fd4179
DT
707{
708 int error = 0;
709
90135925 710 mutex_lock(&ls_lock);
e7fd4179
DT
711 if (!ls_count)
712 error = threads_start();
713 if (error)
714 goto out;
715
60f98d18
DT
716 error = new_lockspace(name, cluster, flags, lvblen, ops, ops_arg,
717 ops_result, lockspace);
e7fd4179
DT
718 if (!error)
719 ls_count++;
8511a272
DT
720 if (error > 0)
721 error = 0;
9d232469
AA
722 if (!ls_count) {
723 dlm_scand_stop();
a070a91c 724 dlm_midcomms_shutdown();
8b0188b0 725 dlm_midcomms_stop();
9d232469 726 }
e7fd4179 727 out:
90135925 728 mutex_unlock(&ls_lock);
e7fd4179
DT
729 return error;
730}
731
12cda13c
AA
732int dlm_new_lockspace(const char *name, const char *cluster, uint32_t flags,
733 int lvblen, const struct dlm_lockspace_ops *ops,
734 void *ops_arg, int *ops_result,
735 dlm_lockspace_t **lockspace)
736{
737 return __dlm_new_lockspace(name, cluster, flags | DLM_LSFL_FS, lvblen,
738 ops, ops_arg, ops_result, lockspace);
739}
740
741int dlm_new_user_lockspace(const char *name, const char *cluster,
742 uint32_t flags, int lvblen,
743 const struct dlm_lockspace_ops *ops,
744 void *ops_arg, int *ops_result,
745 dlm_lockspace_t **lockspace)
746{
747 return __dlm_new_lockspace(name, cluster, flags, lvblen, ops,
748 ops_arg, ops_result, lockspace);
749}
750
3d6aa675 751static int lkb_idr_is_local(int id, void *p, void *data)
e7fd4179 752{
3d6aa675
DT
753 struct dlm_lkb *lkb = p;
754
a97f4a66 755 return lkb->lkb_nodeid == 0 && lkb->lkb_grmode != DLM_LOCK_IV;
3d6aa675
DT
756}
757
/*
 * idr_for_each() predicate that matches every entry: always returns 1,
 * so the walk reports non-zero as soon as the idr holds anything.
 */
static int lkb_idr_is_any(int id, void *p, void *data)
{
	const int match = 1;

	return match;
}
762
763static int lkb_idr_free(int id, void *p, void *data)
764{
765 struct dlm_lkb *lkb = p;
766
3d6aa675
DT
767 if (lkb->lkb_lvbptr && lkb->lkb_flags & DLM_IFL_MSTCPY)
768 dlm_free_lvb(lkb->lkb_lvbptr);
769
770 dlm_free_lkb(lkb);
771 return 0;
772}
773
774/* NOTE: We check the lkbidr here rather than the resource table.
775 This is because there may be LKBs queued as ASTs that have been unlinked
776 from their RSBs and are pending deletion once the AST has been delivered */
777
778static int lockspace_busy(struct dlm_ls *ls, int force)
779{
780 int rv;
781
782 spin_lock(&ls->ls_lkbidr_spin);
783 if (force == 0) {
784 rv = idr_for_each(&ls->ls_lkbidr, lkb_idr_is_any, ls);
785 } else if (force == 1) {
786 rv = idr_for_each(&ls->ls_lkbidr, lkb_idr_is_local, ls);
787 } else {
788 rv = 0;
e7fd4179 789 }
3d6aa675
DT
790 spin_unlock(&ls->ls_lkbidr_spin);
791 return rv;
e7fd4179
DT
792}
793
794static int release_lockspace(struct dlm_ls *ls, int force)
795{
e7fd4179 796 struct dlm_rsb *rsb;
9beb3bf5 797 struct rb_node *n;
0f8e0d9a
DT
798 int i, busy, rv;
799
3d6aa675 800 busy = lockspace_busy(ls, force);
0f8e0d9a
DT
801
802 spin_lock(&lslist_lock);
803 if (ls->ls_create_count == 1) {
3d6aa675 804 if (busy) {
0f8e0d9a 805 rv = -EBUSY;
3d6aa675 806 } else {
0f8e0d9a
DT
807 /* remove_lockspace takes ls off lslist */
808 ls->ls_create_count = 0;
809 rv = 0;
810 }
811 } else if (ls->ls_create_count > 1) {
812 rv = --ls->ls_create_count;
813 } else {
814 rv = -EINVAL;
815 }
816 spin_unlock(&lslist_lock);
817
818 if (rv) {
819 log_debug(ls, "release_lockspace no remove %d", rv);
820 return rv;
821 }
e7fd4179 822
b8b750e0
AA
823 if (ls_count == 1)
824 dlm_midcomms_version_wait();
825
0f8e0d9a 826 dlm_device_deregister(ls);
e7fd4179 827
dc68c7ed 828 if (force < 3 && dlm_user_daemon_available())
e7fd4179
DT
829 do_uevent(ls, 0);
830
831 dlm_recoverd_stop(ls);
832
9d232469
AA
833 if (ls_count == 1) {
834 dlm_scand_stop();
ecd95673 835 dlm_clear_members(ls);
a070a91c 836 dlm_midcomms_shutdown();
9d232469
AA
837 }
838
23e8e1aa
DT
839 dlm_callback_stop(ls);
840
e7fd4179
DT
841 remove_lockspace(ls);
842
843 dlm_delete_debug_file(ls);
844
8fc6ed9a 845 idr_destroy(&ls->ls_recover_idr);
e7fd4179
DT
846 kfree(ls->ls_recover_buf);
847
e7fd4179 848 /*
3d6aa675 849 * Free all lkb's in idr
e7fd4179
DT
850 */
851
3d6aa675 852 idr_for_each(&ls->ls_lkbidr, lkb_idr_free, ls);
3d6aa675 853 idr_destroy(&ls->ls_lkbidr);
e7fd4179 854
e7fd4179
DT
855 /*
856 * Free all rsb's on rsbtbl[] lists
857 */
858
859 for (i = 0; i < ls->ls_rsbtbl_size; i++) {
9beb3bf5
BP
860 while ((n = rb_first(&ls->ls_rsbtbl[i].keep))) {
861 rsb = rb_entry(n, struct dlm_rsb, res_hashnode);
862 rb_erase(n, &ls->ls_rsbtbl[i].keep);
52bda2b5 863 dlm_free_rsb(rsb);
e7fd4179
DT
864 }
865
9beb3bf5
BP
866 while ((n = rb_first(&ls->ls_rsbtbl[i].toss))) {
867 rsb = rb_entry(n, struct dlm_rsb, res_hashnode);
868 rb_erase(n, &ls->ls_rsbtbl[i].toss);
52bda2b5 869 dlm_free_rsb(rsb);
e7fd4179
DT
870 }
871 }
872
c282af49 873 vfree(ls->ls_rsbtbl);
e7fd4179 874
05c32f47
DT
875 for (i = 0; i < DLM_REMOVE_NAMES_MAX; i++)
876 kfree(ls->ls_remove_names[i]);
877
3881ac04
DT
878 while (!list_empty(&ls->ls_new_rsb)) {
879 rsb = list_first_entry(&ls->ls_new_rsb, struct dlm_rsb,
880 res_hashchain);
881 list_del(&rsb->res_hashchain);
882 dlm_free_rsb(rsb);
883 }
884
e7fd4179
DT
885 /*
886 * Free structures on any other lists
887 */
888
2896ee37 889 dlm_purge_requestqueue(ls);
e7fd4179 890 kfree(ls->ls_recover_args);
e7fd4179
DT
891 dlm_clear_members(ls);
892 dlm_clear_members_gone(ls);
893 kfree(ls->ls_node_array);
075f0177 894 log_rinfo(ls, "release_lockspace final free");
197b12d6 895 kobject_put(&ls->ls_kobj);
79d72b54 896 /* The ls structure will be freed when the kobject is done with */
e7fd4179 897
e7fd4179
DT
898 module_put(THIS_MODULE);
899 return 0;
900}
901
902/*
903 * Called when a system has released all its locks and is not going to use the
904 * lockspace any longer. We free everything we're managing for this lockspace.
905 * Remaining nodes will go through the recovery process as if we'd died. The
906 * lockspace must continue to function as usual, participating in recoveries,
907 * until this returns.
908 *
909 * Force has 4 possible values:
bb6866a5 910 * 0 - don't destroy lockspace if it has any LKBs
e7fd4179
DT
911 * 1 - destroy lockspace if it has remote LKBs but not if it has local LKBs
912 * 2 - destroy lockspace regardless of LKBs
913 * 3 - destroy lockspace as part of a forced shutdown
914 */
915
916int dlm_release_lockspace(void *lockspace, int force)
917{
918 struct dlm_ls *ls;
0f8e0d9a 919 int error;
e7fd4179
DT
920
921 ls = dlm_find_lockspace_local(lockspace);
922 if (!ls)
923 return -EINVAL;
924 dlm_put_lockspace(ls);
0f8e0d9a
DT
925
926 mutex_lock(&ls_lock);
927 error = release_lockspace(ls, force);
928 if (!error)
929 ls_count--;
278afcbf 930 if (!ls_count)
8b0188b0 931 dlm_midcomms_stop();
0f8e0d9a
DT
932 mutex_unlock(&ls_lock);
933
934 return error;
e7fd4179
DT
935}
936
dc68c7ed
DT
937void dlm_stop_lockspaces(void)
938{
939 struct dlm_ls *ls;
696b3d84 940 int count;
dc68c7ed
DT
941
942 restart:
696b3d84 943 count = 0;
dc68c7ed
DT
944 spin_lock(&lslist_lock);
945 list_for_each_entry(ls, &lslist, ls_list) {
696b3d84
DT
946 if (!test_bit(LSFL_RUNNING, &ls->ls_flags)) {
947 count++;
dc68c7ed 948 continue;
696b3d84 949 }
dc68c7ed
DT
950 spin_unlock(&lslist_lock);
951 log_error(ls, "no userland control daemon, stopping lockspace");
952 dlm_ls_stop(ls);
953 goto restart;
954 }
955 spin_unlock(&lslist_lock);
696b3d84
DT
956
957 if (count)
958 log_print("dlm user daemon left %d lockspaces", count);
dc68c7ed
DT
959}
960
2c3fa6ae
AA
961void dlm_stop_lockspaces_check(void)
962{
963 struct dlm_ls *ls;
964
965 spin_lock(&lslist_lock);
966 list_for_each_entry(ls, &lslist, ls_list) {
967 if (WARN_ON(!rwsem_is_locked(&ls->ls_in_recovery) ||
968 !dlm_locking_stopped(ls)))
969 break;
970 }
971 spin_unlock(&lslist_lock);
972}