fs: replace NIPQUAD()
[linux-2.6-block.git] / fs / ocfs2 / cluster / nodemanager.c
CommitLineData
0c83ed8e
KH
1/* -*- mode: c; c-basic-offset: 8; -*-
2 * vim: noexpandtab sw=8 ts=8 sts=0:
3 *
4 * Copyright (C) 2004, 2005 Oracle. All rights reserved.
5 *
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public
8 * License as published by the Free Software Foundation; either
9 * version 2 of the License, or (at your option) any later version.
10 *
11 * This program is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * General Public License for more details.
15 *
16 * You should have received a copy of the GNU General Public
17 * License along with this program; if not, write to the
18 * Free Software Foundation, Inc., 59 Temple Place - Suite 330,
19 * Boston, MA 02111-1307, USA.
20 */
21
22#include <linux/kernel.h>
23#include <linux/module.h>
0c83ed8e
KH
24#include <linux/configfs.h>
25
0c83ed8e
KH
26#include "tcp.h"
27#include "nodemanager.h"
28#include "heartbeat.h"
29#include "masklog.h"
30#include "sys.h"
31#include "ver.h"
32
/*
 * The node manager currently assumes that at most one cluster is active at
 * any time.  Lifting that restriction means threading a cluster reference
 * through every place that looks up nodes.
 */
struct o2nm_cluster *o2nm_single_cluster;
0c83ed8e 37
0c83ed8e 38
0c83ed8e
KH
39struct o2nm_node *o2nm_get_node_by_num(u8 node_num)
40{
41 struct o2nm_node *node = NULL;
42
43 if (node_num >= O2NM_MAX_NODES || o2nm_single_cluster == NULL)
44 goto out;
45
46 read_lock(&o2nm_single_cluster->cl_nodes_lock);
47 node = o2nm_single_cluster->cl_nodes[node_num];
48 if (node)
49 config_item_get(&node->nd_item);
50 read_unlock(&o2nm_single_cluster->cl_nodes_lock);
51out:
52 return node;
53}
54EXPORT_SYMBOL_GPL(o2nm_get_node_by_num);
55
56int o2nm_configured_node_map(unsigned long *map, unsigned bytes)
57{
58 struct o2nm_cluster *cluster = o2nm_single_cluster;
59
60 BUG_ON(bytes < (sizeof(cluster->cl_nodes_bitmap)));
61
62 if (cluster == NULL)
63 return -EINVAL;
64
65 read_lock(&cluster->cl_nodes_lock);
66 memcpy(map, cluster->cl_nodes_bitmap, sizeof(cluster->cl_nodes_bitmap));
67 read_unlock(&cluster->cl_nodes_lock);
68
69 return 0;
70}
71EXPORT_SYMBOL_GPL(o2nm_configured_node_map);
72
73static struct o2nm_node *o2nm_node_ip_tree_lookup(struct o2nm_cluster *cluster,
74 __be32 ip_needle,
75 struct rb_node ***ret_p,
76 struct rb_node **ret_parent)
77{
78 struct rb_node **p = &cluster->cl_node_ip_tree.rb_node;
79 struct rb_node *parent = NULL;
80 struct o2nm_node *node, *ret = NULL;
81
82 while (*p) {
79cd22d3
AM
83 int cmp;
84
0c83ed8e
KH
85 parent = *p;
86 node = rb_entry(parent, struct o2nm_node, nd_ip_node);
87
79cd22d3
AM
88 cmp = memcmp(&ip_needle, &node->nd_ipv4_address,
89 sizeof(ip_needle));
90 if (cmp < 0)
0c83ed8e 91 p = &(*p)->rb_left;
79cd22d3 92 else if (cmp > 0)
0c83ed8e
KH
93 p = &(*p)->rb_right;
94 else {
95 ret = node;
96 break;
97 }
98 }
99
100 if (ret_p != NULL)
101 *ret_p = p;
102 if (ret_parent != NULL)
103 *ret_parent = parent;
104
105 return ret;
106}
107
108struct o2nm_node *o2nm_get_node_by_ip(__be32 addr)
109{
110 struct o2nm_node *node = NULL;
111 struct o2nm_cluster *cluster = o2nm_single_cluster;
112
113 if (cluster == NULL)
114 goto out;
115
116 read_lock(&cluster->cl_nodes_lock);
117 node = o2nm_node_ip_tree_lookup(cluster, addr, NULL, NULL);
118 if (node)
119 config_item_get(&node->nd_item);
120 read_unlock(&cluster->cl_nodes_lock);
121
122out:
123 return node;
124}
125EXPORT_SYMBOL_GPL(o2nm_get_node_by_ip);
126
127void o2nm_node_put(struct o2nm_node *node)
128{
129 config_item_put(&node->nd_item);
130}
131EXPORT_SYMBOL_GPL(o2nm_node_put);
132
133void o2nm_node_get(struct o2nm_node *node)
134{
135 config_item_get(&node->nd_item);
136}
137EXPORT_SYMBOL_GPL(o2nm_node_get);
138
139u8 o2nm_this_node(void)
140{
141 u8 node_num = O2NM_MAX_NODES;
142
143 if (o2nm_single_cluster && o2nm_single_cluster->cl_has_local)
144 node_num = o2nm_single_cluster->cl_local_node;
145
146 return node_num;
147}
148EXPORT_SYMBOL_GPL(o2nm_this_node);
149
150/* node configfs bits */
151
152static struct o2nm_cluster *to_o2nm_cluster(struct config_item *item)
153{
154 return item ?
155 container_of(to_config_group(item), struct o2nm_cluster,
156 cl_group)
157 : NULL;
158}
159
160static struct o2nm_node *to_o2nm_node(struct config_item *item)
161{
162 return item ? container_of(item, struct o2nm_node, nd_item) : NULL;
163}
164
/* configfs ->release hook: free the node that embeds this item. */
static void o2nm_node_release(struct config_item *item)
{
	kfree(to_o2nm_node(item));
}
170
171static ssize_t o2nm_node_num_read(struct o2nm_node *node, char *page)
172{
173 return sprintf(page, "%d\n", node->nd_num);
174}
175
176static struct o2nm_cluster *to_o2nm_cluster_from_node(struct o2nm_node *node)
177{
178 /* through the first node_set .parent
179 * mycluster/nodes/mynode == o2nm_cluster->o2nm_node_group->o2nm_node */
180 return to_o2nm_cluster(node->nd_item.ci_parent->ci_parent);
181}
182
/*
 * Indices of the per-node attributes.  They are used both as slots in
 * o2nm_node_attrs[] and as bit numbers in o2nm_node.nd_set_attributes.
 */
enum {
	O2NM_NODE_ATTR_NUM	= 0,
	O2NM_NODE_ATTR_PORT	= 1,
	O2NM_NODE_ATTR_ADDRESS	= 2,
	O2NM_NODE_ATTR_LOCAL	= 3,
};
189
190static ssize_t o2nm_node_num_write(struct o2nm_node *node, const char *page,
191 size_t count)
192{
193 struct o2nm_cluster *cluster = to_o2nm_cluster_from_node(node);
194 unsigned long tmp;
195 char *p = (char *)page;
196
197 tmp = simple_strtoul(p, &p, 0);
198 if (!p || (*p && (*p != '\n')))
199 return -EINVAL;
200
201 if (tmp >= O2NM_MAX_NODES)
202 return -ERANGE;
203
204 /* once we're in the cl_nodes tree networking can look us up by
205 * node number and try to use our address and port attributes
206 * to connect to this node.. make sure that they've been set
207 * before writing the node attribute? */
208 if (!test_bit(O2NM_NODE_ATTR_ADDRESS, &node->nd_set_attributes) ||
209 !test_bit(O2NM_NODE_ATTR_PORT, &node->nd_set_attributes))
210 return -EINVAL; /* XXX */
211
212 write_lock(&cluster->cl_nodes_lock);
213 if (cluster->cl_nodes[tmp])
214 p = NULL;
215 else {
216 cluster->cl_nodes[tmp] = node;
217 node->nd_num = tmp;
218 set_bit(tmp, cluster->cl_nodes_bitmap);
219 }
220 write_unlock(&cluster->cl_nodes_lock);
221 if (p == NULL)
222 return -EEXIST;
223
224 return count;
225}
226static ssize_t o2nm_node_ipv4_port_read(struct o2nm_node *node, char *page)
227{
228 return sprintf(page, "%u\n", ntohs(node->nd_ipv4_port));
229}
230
231static ssize_t o2nm_node_ipv4_port_write(struct o2nm_node *node,
232 const char *page, size_t count)
233{
234 unsigned long tmp;
235 char *p = (char *)page;
236
237 tmp = simple_strtoul(p, &p, 0);
238 if (!p || (*p && (*p != '\n')))
239 return -EINVAL;
240
241 if (tmp == 0)
242 return -EINVAL;
243 if (tmp >= (u16)-1)
244 return -ERANGE;
245
246 node->nd_ipv4_port = htons(tmp);
247
248 return count;
249}
250
251static ssize_t o2nm_node_ipv4_address_read(struct o2nm_node *node, char *page)
252{
be859405 253 return sprintf(page, "%pI4\n", &node->nd_ipv4_address);
0c83ed8e
KH
254}
255
256static ssize_t o2nm_node_ipv4_address_write(struct o2nm_node *node,
257 const char *page,
258 size_t count)
259{
260 struct o2nm_cluster *cluster = to_o2nm_cluster_from_node(node);
261 int ret, i;
262 struct rb_node **p, *parent;
263 unsigned int octets[4];
264 __be32 ipv4_addr = 0;
265
266 ret = sscanf(page, "%3u.%3u.%3u.%3u", &octets[3], &octets[2],
267 &octets[1], &octets[0]);
268 if (ret != 4)
269 return -EINVAL;
270
271 for (i = 0; i < ARRAY_SIZE(octets); i++) {
272 if (octets[i] > 255)
273 return -ERANGE;
274 be32_add_cpu(&ipv4_addr, octets[i] << (i * 8));
275 }
276
277 ret = 0;
278 write_lock(&cluster->cl_nodes_lock);
279 if (o2nm_node_ip_tree_lookup(cluster, ipv4_addr, &p, &parent))
280 ret = -EEXIST;
281 else {
282 rb_link_node(&node->nd_ip_node, parent, p);
283 rb_insert_color(&node->nd_ip_node, &cluster->cl_node_ip_tree);
284 }
285 write_unlock(&cluster->cl_nodes_lock);
286 if (ret)
287 return ret;
288
289 memcpy(&node->nd_ipv4_address, &ipv4_addr, sizeof(ipv4_addr));
290
291 return count;
292}
293
294static ssize_t o2nm_node_local_read(struct o2nm_node *node, char *page)
295{
296 return sprintf(page, "%d\n", node->nd_local);
297}
298
299static ssize_t o2nm_node_local_write(struct o2nm_node *node, const char *page,
300 size_t count)
301{
302 struct o2nm_cluster *cluster = to_o2nm_cluster_from_node(node);
303 unsigned long tmp;
304 char *p = (char *)page;
305 ssize_t ret;
306
307 tmp = simple_strtoul(p, &p, 0);
308 if (!p || (*p && (*p != '\n')))
309 return -EINVAL;
310
311 tmp = !!tmp; /* boolean of whether this node wants to be local */
312
313 /* setting local turns on networking rx for now so we require having
314 * set everything else first */
315 if (!test_bit(O2NM_NODE_ATTR_ADDRESS, &node->nd_set_attributes) ||
316 !test_bit(O2NM_NODE_ATTR_NUM, &node->nd_set_attributes) ||
317 !test_bit(O2NM_NODE_ATTR_PORT, &node->nd_set_attributes))
318 return -EINVAL; /* XXX */
319
320 /* the only failure case is trying to set a new local node
321 * when a different one is already set */
322 if (tmp && tmp == cluster->cl_has_local &&
323 cluster->cl_local_node != node->nd_num)
324 return -EBUSY;
325
326 /* bring up the rx thread if we're setting the new local node. */
327 if (tmp && !cluster->cl_has_local) {
328 ret = o2net_start_listening(node);
329 if (ret)
330 return ret;
331 }
332
333 if (!tmp && cluster->cl_has_local &&
334 cluster->cl_local_node == node->nd_num) {
335 o2net_stop_listening(node);
336 cluster->cl_local_node = O2NM_INVALID_NODE_NUM;
337 }
338
339 node->nd_local = tmp;
340 if (node->nd_local) {
341 cluster->cl_has_local = tmp;
342 cluster->cl_local_node = node->nd_num;
343 }
344
345 return count;
346}
347
348struct o2nm_node_attribute {
349 struct configfs_attribute attr;
350 ssize_t (*show)(struct o2nm_node *, char *);
351 ssize_t (*store)(struct o2nm_node *, const char *, size_t);
352};
353
354static struct o2nm_node_attribute o2nm_node_attr_num = {
355 .attr = { .ca_owner = THIS_MODULE,
356 .ca_name = "num",
357 .ca_mode = S_IRUGO | S_IWUSR },
358 .show = o2nm_node_num_read,
359 .store = o2nm_node_num_write,
360};
361
362static struct o2nm_node_attribute o2nm_node_attr_ipv4_port = {
363 .attr = { .ca_owner = THIS_MODULE,
364 .ca_name = "ipv4_port",
365 .ca_mode = S_IRUGO | S_IWUSR },
366 .show = o2nm_node_ipv4_port_read,
367 .store = o2nm_node_ipv4_port_write,
368};
369
370static struct o2nm_node_attribute o2nm_node_attr_ipv4_address = {
371 .attr = { .ca_owner = THIS_MODULE,
372 .ca_name = "ipv4_address",
373 .ca_mode = S_IRUGO | S_IWUSR },
374 .show = o2nm_node_ipv4_address_read,
375 .store = o2nm_node_ipv4_address_write,
376};
377
378static struct o2nm_node_attribute o2nm_node_attr_local = {
379 .attr = { .ca_owner = THIS_MODULE,
380 .ca_name = "local",
381 .ca_mode = S_IRUGO | S_IWUSR },
382 .show = o2nm_node_local_read,
383 .store = o2nm_node_local_write,
384};
385
386static struct configfs_attribute *o2nm_node_attrs[] = {
387 [O2NM_NODE_ATTR_NUM] = &o2nm_node_attr_num.attr,
388 [O2NM_NODE_ATTR_PORT] = &o2nm_node_attr_ipv4_port.attr,
389 [O2NM_NODE_ATTR_ADDRESS] = &o2nm_node_attr_ipv4_address.attr,
390 [O2NM_NODE_ATTR_LOCAL] = &o2nm_node_attr_local.attr,
391 NULL,
392};
393
394static int o2nm_attr_index(struct configfs_attribute *attr)
395{
396 int i;
397 for (i = 0; i < ARRAY_SIZE(o2nm_node_attrs); i++) {
398 if (attr == o2nm_node_attrs[i])
399 return i;
400 }
401 BUG();
402 return 0;
403}
404
405static ssize_t o2nm_node_show(struct config_item *item,
406 struct configfs_attribute *attr,
407 char *page)
408{
409 struct o2nm_node *node = to_o2nm_node(item);
410 struct o2nm_node_attribute *o2nm_node_attr =
411 container_of(attr, struct o2nm_node_attribute, attr);
412 ssize_t ret = 0;
413
414 if (o2nm_node_attr->show)
415 ret = o2nm_node_attr->show(node, page);
416 return ret;
417}
418
419static ssize_t o2nm_node_store(struct config_item *item,
420 struct configfs_attribute *attr,
421 const char *page, size_t count)
422{
423 struct o2nm_node *node = to_o2nm_node(item);
424 struct o2nm_node_attribute *o2nm_node_attr =
425 container_of(attr, struct o2nm_node_attribute, attr);
426 ssize_t ret;
427 int attr_index = o2nm_attr_index(attr);
428
429 if (o2nm_node_attr->store == NULL) {
430 ret = -EINVAL;
431 goto out;
432 }
433
434 if (test_bit(attr_index, &node->nd_set_attributes))
435 return -EBUSY;
436
437 ret = o2nm_node_attr->store(node, page, count);
438 if (ret < count)
439 goto out;
440
441 set_bit(attr_index, &node->nd_set_attributes);
442out:
443 return ret;
444}
445
446static struct configfs_item_operations o2nm_node_item_ops = {
447 .release = o2nm_node_release,
448 .show_attribute = o2nm_node_show,
449 .store_attribute = o2nm_node_store,
450};
451
452static struct config_item_type o2nm_node_type = {
453 .ct_item_ops = &o2nm_node_item_ops,
454 .ct_attrs = o2nm_node_attrs,
455 .ct_owner = THIS_MODULE,
456};
457
458/* node set */
459
460struct o2nm_node_group {
461 struct config_group ns_group;
462 /* some stuff? */
463};
464
#if 0
/* Currently compiled out: map a config_group to its o2nm_node_group. */
static struct o2nm_node_group *to_o2nm_node_group(struct config_group *group)
{
	if (!group)
		return NULL;

	return container_of(group, struct o2nm_node_group, ns_group);
}
#endif
473
b5dd8030
JM
474struct o2nm_cluster_attribute {
475 struct configfs_attribute attr;
476 ssize_t (*show)(struct o2nm_cluster *, char *);
477 ssize_t (*store)(struct o2nm_cluster *, const char *, size_t);
478};
479
480static ssize_t o2nm_cluster_attr_write(const char *page, ssize_t count,
481 unsigned int *val)
482{
483 unsigned long tmp;
484 char *p = (char *)page;
485
486 tmp = simple_strtoul(p, &p, 0);
487 if (!p || (*p && (*p != '\n')))
488 return -EINVAL;
489
490 if (tmp == 0)
491 return -EINVAL;
492 if (tmp >= (u32)-1)
493 return -ERANGE;
494
495 *val = tmp;
496
497 return count;
498}
499
500static ssize_t o2nm_cluster_attr_idle_timeout_ms_read(
501 struct o2nm_cluster *cluster, char *page)
502{
503 return sprintf(page, "%u\n", cluster->cl_idle_timeout_ms);
504}
505
506static ssize_t o2nm_cluster_attr_idle_timeout_ms_write(
507 struct o2nm_cluster *cluster, const char *page, size_t count)
508{
509 ssize_t ret;
510 unsigned int val;
511
512 ret = o2nm_cluster_attr_write(page, count, &val);
513
514 if (ret > 0) {
828ae6af
AB
515 if (cluster->cl_idle_timeout_ms != val
516 && o2net_num_connected_peers()) {
517 mlog(ML_NOTICE,
518 "o2net: cannot change idle timeout after "
519 "the first peer has agreed to it."
520 " %d connected peers\n",
521 o2net_num_connected_peers());
522 ret = -EINVAL;
523 } else if (val <= cluster->cl_keepalive_delay_ms) {
b5dd8030
JM
524 mlog(ML_NOTICE, "o2net: idle timeout must be larger "
525 "than keepalive delay\n");
828ae6af
AB
526 ret = -EINVAL;
527 } else {
528 cluster->cl_idle_timeout_ms = val;
b5dd8030 529 }
b5dd8030
JM
530 }
531
532 return ret;
533}
534
535static ssize_t o2nm_cluster_attr_keepalive_delay_ms_read(
536 struct o2nm_cluster *cluster, char *page)
537{
538 return sprintf(page, "%u\n", cluster->cl_keepalive_delay_ms);
539}
540
541static ssize_t o2nm_cluster_attr_keepalive_delay_ms_write(
542 struct o2nm_cluster *cluster, const char *page, size_t count)
543{
544 ssize_t ret;
545 unsigned int val;
546
547 ret = o2nm_cluster_attr_write(page, count, &val);
548
549 if (ret > 0) {
828ae6af
AB
550 if (cluster->cl_keepalive_delay_ms != val
551 && o2net_num_connected_peers()) {
552 mlog(ML_NOTICE,
553 "o2net: cannot change keepalive delay after"
554 " the first peer has agreed to it."
555 " %d connected peers\n",
556 o2net_num_connected_peers());
557 ret = -EINVAL;
558 } else if (val >= cluster->cl_idle_timeout_ms) {
b5dd8030
JM
559 mlog(ML_NOTICE, "o2net: keepalive delay must be "
560 "smaller than idle timeout\n");
828ae6af
AB
561 ret = -EINVAL;
562 } else {
563 cluster->cl_keepalive_delay_ms = val;
b5dd8030 564 }
b5dd8030
JM
565 }
566
567 return ret;
568}
569
570static ssize_t o2nm_cluster_attr_reconnect_delay_ms_read(
571 struct o2nm_cluster *cluster, char *page)
572{
573 return sprintf(page, "%u\n", cluster->cl_reconnect_delay_ms);
574}
575
576static ssize_t o2nm_cluster_attr_reconnect_delay_ms_write(
577 struct o2nm_cluster *cluster, const char *page, size_t count)
578{
579 return o2nm_cluster_attr_write(page, count,
580 &cluster->cl_reconnect_delay_ms);
581}
582static struct o2nm_cluster_attribute o2nm_cluster_attr_idle_timeout_ms = {
583 .attr = { .ca_owner = THIS_MODULE,
584 .ca_name = "idle_timeout_ms",
585 .ca_mode = S_IRUGO | S_IWUSR },
586 .show = o2nm_cluster_attr_idle_timeout_ms_read,
587 .store = o2nm_cluster_attr_idle_timeout_ms_write,
588};
589
590static struct o2nm_cluster_attribute o2nm_cluster_attr_keepalive_delay_ms = {
591 .attr = { .ca_owner = THIS_MODULE,
592 .ca_name = "keepalive_delay_ms",
593 .ca_mode = S_IRUGO | S_IWUSR },
594 .show = o2nm_cluster_attr_keepalive_delay_ms_read,
595 .store = o2nm_cluster_attr_keepalive_delay_ms_write,
596};
597
598static struct o2nm_cluster_attribute o2nm_cluster_attr_reconnect_delay_ms = {
599 .attr = { .ca_owner = THIS_MODULE,
600 .ca_name = "reconnect_delay_ms",
601 .ca_mode = S_IRUGO | S_IWUSR },
602 .show = o2nm_cluster_attr_reconnect_delay_ms_read,
603 .store = o2nm_cluster_attr_reconnect_delay_ms_write,
604};
605
606static struct configfs_attribute *o2nm_cluster_attrs[] = {
607 &o2nm_cluster_attr_idle_timeout_ms.attr,
608 &o2nm_cluster_attr_keepalive_delay_ms.attr,
609 &o2nm_cluster_attr_reconnect_delay_ms.attr,
610 NULL,
611};
612static ssize_t o2nm_cluster_show(struct config_item *item,
613 struct configfs_attribute *attr,
614 char *page)
615{
616 struct o2nm_cluster *cluster = to_o2nm_cluster(item);
617 struct o2nm_cluster_attribute *o2nm_cluster_attr =
618 container_of(attr, struct o2nm_cluster_attribute, attr);
619 ssize_t ret = 0;
620
621 if (o2nm_cluster_attr->show)
622 ret = o2nm_cluster_attr->show(cluster, page);
623 return ret;
624}
625
626static ssize_t o2nm_cluster_store(struct config_item *item,
627 struct configfs_attribute *attr,
628 const char *page, size_t count)
629{
630 struct o2nm_cluster *cluster = to_o2nm_cluster(item);
631 struct o2nm_cluster_attribute *o2nm_cluster_attr =
632 container_of(attr, struct o2nm_cluster_attribute, attr);
633 ssize_t ret;
634
635 if (o2nm_cluster_attr->store == NULL) {
636 ret = -EINVAL;
637 goto out;
638 }
639
640 ret = o2nm_cluster_attr->store(cluster, page, count);
641 if (ret < count)
642 goto out;
643out:
644 return ret;
645}
646
f89ab861
JB
647static struct config_item *o2nm_node_group_make_item(struct config_group *group,
648 const char *name)
0c83ed8e
KH
649{
650 struct o2nm_node *node = NULL;
0c83ed8e 651
f89ab861 652 if (strlen(name) > O2NM_MAX_NAME_LEN)
a6795e9e 653 return ERR_PTR(-ENAMETOOLONG);
0c83ed8e 654
cd861280 655 node = kzalloc(sizeof(struct o2nm_node), GFP_KERNEL);
f89ab861 656 if (node == NULL)
a6795e9e 657 return ERR_PTR(-ENOMEM);
0c83ed8e
KH
658
659 strcpy(node->nd_name, name); /* use item.ci_namebuf instead? */
660 config_item_init_type_name(&node->nd_item, name, &o2nm_node_type);
661 spin_lock_init(&node->nd_lock);
662
a6795e9e 663 return &node->nd_item;
0c83ed8e
KH
664}
665
666static void o2nm_node_group_drop_item(struct config_group *group,
667 struct config_item *item)
668{
669 struct o2nm_node *node = to_o2nm_node(item);
670 struct o2nm_cluster *cluster = to_o2nm_cluster(group->cg_item.ci_parent);
671
672 o2net_disconnect_node(node);
673
674 if (cluster->cl_has_local &&
675 (cluster->cl_local_node == node->nd_num)) {
676 cluster->cl_has_local = 0;
677 cluster->cl_local_node = O2NM_INVALID_NODE_NUM;
678 o2net_stop_listening(node);
679 }
680
681 /* XXX call into net to stop this node from trading messages */
682
683 write_lock(&cluster->cl_nodes_lock);
684
685 /* XXX sloppy */
686 if (node->nd_ipv4_address)
687 rb_erase(&node->nd_ip_node, &cluster->cl_node_ip_tree);
688
689 /* nd_num might be 0 if the node number hasn't been set.. */
690 if (cluster->cl_nodes[node->nd_num] == node) {
691 cluster->cl_nodes[node->nd_num] = NULL;
692 clear_bit(node->nd_num, cluster->cl_nodes_bitmap);
693 }
694 write_unlock(&cluster->cl_nodes_lock);
695
696 config_item_put(item);
697}
698
699static struct configfs_group_operations o2nm_node_group_group_ops = {
700 .make_item = o2nm_node_group_make_item,
701 .drop_item = o2nm_node_group_drop_item,
702};
703
704static struct config_item_type o2nm_node_group_type = {
705 .ct_group_ops = &o2nm_node_group_group_ops,
706 .ct_owner = THIS_MODULE,
707};
708
709/* cluster */
710
711static void o2nm_cluster_release(struct config_item *item)
712{
713 struct o2nm_cluster *cluster = to_o2nm_cluster(item);
714
715 kfree(cluster->cl_group.default_groups);
716 kfree(cluster);
717}
718
719static struct configfs_item_operations o2nm_cluster_item_ops = {
720 .release = o2nm_cluster_release,
b5dd8030
JM
721 .show_attribute = o2nm_cluster_show,
722 .store_attribute = o2nm_cluster_store,
0c83ed8e
KH
723};
724
725static struct config_item_type o2nm_cluster_type = {
726 .ct_item_ops = &o2nm_cluster_item_ops,
b5dd8030 727 .ct_attrs = o2nm_cluster_attrs,
0c83ed8e
KH
728 .ct_owner = THIS_MODULE,
729};
730
731/* cluster set */
732
733struct o2nm_cluster_group {
734 struct configfs_subsystem cs_subsys;
735 /* some stuff? */
736};
737
#if 0
/* Currently compiled out: map a config_group to its o2nm_cluster_group. */
static struct o2nm_cluster_group *to_o2nm_cluster_group(struct config_group *group)
{
	if (!group)
		return NULL;

	return container_of(to_configfs_subsystem(group),
			    struct o2nm_cluster_group, cs_subsys);
}
#endif
746
f89ab861
JB
747static struct config_group *o2nm_cluster_group_make_group(struct config_group *group,
748 const char *name)
0c83ed8e
KH
749{
750 struct o2nm_cluster *cluster = NULL;
751 struct o2nm_node_group *ns = NULL;
f89ab861 752 struct config_group *o2hb_group = NULL, *ret = NULL;
0c83ed8e
KH
753 void *defs = NULL;
754
1b1dcc1b 755 /* this runs under the parent dir's i_mutex; there can be only
0c83ed8e 756 * one caller in here at a time */
f89ab861 757 if (o2nm_single_cluster)
a6795e9e 758 return ERR_PTR(-ENOSPC);
0c83ed8e 759
cd861280
RD
760 cluster = kzalloc(sizeof(struct o2nm_cluster), GFP_KERNEL);
761 ns = kzalloc(sizeof(struct o2nm_node_group), GFP_KERNEL);
0c83ed8e
KH
762 defs = kcalloc(3, sizeof(struct config_group *), GFP_KERNEL);
763 o2hb_group = o2hb_alloc_hb_set();
f89ab861 764 if (cluster == NULL || ns == NULL || o2hb_group == NULL || defs == NULL)
0c83ed8e
KH
765 goto out;
766
767 config_group_init_type_name(&cluster->cl_group, name,
768 &o2nm_cluster_type);
769 config_group_init_type_name(&ns->ns_group, "node",
770 &o2nm_node_group_type);
771
772 cluster->cl_group.default_groups = defs;
773 cluster->cl_group.default_groups[0] = &ns->ns_group;
774 cluster->cl_group.default_groups[1] = o2hb_group;
775 cluster->cl_group.default_groups[2] = NULL;
776 rwlock_init(&cluster->cl_nodes_lock);
777 cluster->cl_node_ip_tree = RB_ROOT;
b5dd8030
JM
778 cluster->cl_reconnect_delay_ms = O2NET_RECONNECT_DELAY_MS_DEFAULT;
779 cluster->cl_idle_timeout_ms = O2NET_IDLE_TIMEOUT_MS_DEFAULT;
780 cluster->cl_keepalive_delay_ms = O2NET_KEEPALIVE_DELAY_MS_DEFAULT;
0c83ed8e 781
f89ab861 782 ret = &cluster->cl_group;
0c83ed8e
KH
783 o2nm_single_cluster = cluster;
784
785out:
f89ab861 786 if (ret == NULL) {
0c83ed8e
KH
787 kfree(cluster);
788 kfree(ns);
789 o2hb_free_hb_set(o2hb_group);
790 kfree(defs);
a6795e9e 791 ret = ERR_PTR(-ENOMEM);
0c83ed8e
KH
792 }
793
794 return ret;
795}
796
797static void o2nm_cluster_group_drop_item(struct config_group *group, struct config_item *item)
798{
799 struct o2nm_cluster *cluster = to_o2nm_cluster(item);
800 int i;
801 struct config_item *killme;
802
803 BUG_ON(o2nm_single_cluster != cluster);
804 o2nm_single_cluster = NULL;
805
806 for (i = 0; cluster->cl_group.default_groups[i]; i++) {
807 killme = &cluster->cl_group.default_groups[i]->cg_item;
808 cluster->cl_group.default_groups[i] = NULL;
809 config_item_put(killme);
810 }
811
812 config_item_put(item);
813}
814
815static struct configfs_group_operations o2nm_cluster_group_group_ops = {
816 .make_group = o2nm_cluster_group_make_group,
817 .drop_item = o2nm_cluster_group_drop_item,
818};
819
820static struct config_item_type o2nm_cluster_group_type = {
821 .ct_group_ops = &o2nm_cluster_group_group_ops,
822 .ct_owner = THIS_MODULE,
823};
824
825static struct o2nm_cluster_group o2nm_cluster_group = {
826 .cs_subsys = {
827 .su_group = {
828 .cg_item = {
829 .ci_namebuf = "cluster",
830 .ci_type = &o2nm_cluster_group_type,
831 },
832 },
833 },
834};
835
14829422
JB
836int o2nm_depend_item(struct config_item *item)
837{
838 return configfs_depend_item(&o2nm_cluster_group.cs_subsys, item);
839}
840
841void o2nm_undepend_item(struct config_item *item)
842{
843 configfs_undepend_item(&o2nm_cluster_group.cs_subsys, item);
844}
845
16c6a4f2
JB
846int o2nm_depend_this_node(void)
847{
848 int ret = 0;
849 struct o2nm_node *local_node;
850
851 local_node = o2nm_get_node_by_num(o2nm_this_node());
852 if (!local_node) {
853 ret = -EINVAL;
854 goto out;
855 }
856
857 ret = o2nm_depend_item(&local_node->nd_item);
858 o2nm_node_put(local_node);
859
860out:
861 return ret;
862}
863
864void o2nm_undepend_this_node(void)
865{
866 struct o2nm_node *local_node;
867
868 local_node = o2nm_get_node_by_num(o2nm_this_node());
869 BUG_ON(!local_node);
870
871 o2nm_undepend_item(&local_node->nd_item);
872 o2nm_node_put(local_node);
873}
874
875
0c83ed8e
KH
876static void __exit exit_o2nm(void)
877{
0c83ed8e
KH
878 /* XXX sync with hb callbacks and shut down hb? */
879 o2net_unregister_hb_callbacks();
880 configfs_unregister_subsystem(&o2nm_cluster_group.cs_subsys);
881 o2cb_sys_shutdown();
882
883 o2net_exit();
884}
885
886static int __init init_o2nm(void)
887{
888 int ret = -1;
889
890 cluster_print_version();
891
892 o2hb_init();
2309e9e0
SM
893
894 ret = o2net_init();
895 if (ret)
896 goto out;
0c83ed8e 897
0c83ed8e
KH
898 ret = o2net_register_hb_callbacks();
899 if (ret)
3878f110 900 goto out_o2net;
0c83ed8e
KH
901
902 config_group_init(&o2nm_cluster_group.cs_subsys.su_group);
e6bd07ae 903 mutex_init(&o2nm_cluster_group.cs_subsys.su_mutex);
0c83ed8e
KH
904 ret = configfs_register_subsystem(&o2nm_cluster_group.cs_subsys);
905 if (ret) {
906 printk(KERN_ERR "nodemanager: Registration returned %d\n", ret);
907 goto out_callbacks;
908 }
909
910 ret = o2cb_sys_init();
911 if (!ret)
912 goto out;
913
914 configfs_unregister_subsystem(&o2nm_cluster_group.cs_subsys);
915out_callbacks:
916 o2net_unregister_hb_callbacks();
895928b8
JM
917out_o2net:
918 o2net_exit();
0c83ed8e
KH
919out:
920 return ret;
921}
922
923MODULE_AUTHOR("Oracle");
924MODULE_LICENSE("GPL");
925
926module_init(init_o2nm)
927module_exit(exit_o2nm)