On Tue, Nov 06, 2007 at 02:33:53AM -0800, akpm@linux-foundation.org wrote:
[mmotm.git] / fs / ocfs2 / cluster / nodemanager.c
blob7ee6188bc79a76ebc939b738bcfc3914c99b3ef6
1 /* -*- mode: c; c-basic-offset: 8; -*-
2 * vim: noexpandtab sw=8 ts=8 sts=0:
4 * Copyright (C) 2004, 2005 Oracle. All rights reserved.
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public
8 * License as published by the Free Software Foundation; either
9 * version 2 of the License, or (at your option) any later version.
11 * This program is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * General Public License for more details.
16 * You should have received a copy of the GNU General Public
17 * License along with this program; if not, write to the
18 * Free Software Foundation, Inc., 59 Temple Place - Suite 330,
19 * Boston, MA 02111-1307, USA.
22 #include <linux/kernel.h>
23 #include <linux/module.h>
24 #include <linux/configfs.h>
26 #include "tcp.h"
27 #include "nodemanager.h"
28 #include "heartbeat.h"
29 #include "masklog.h"
30 #include "sys.h"
31 #include "ver.h"
33 /* for now we operate under the assertion that there can be only one
34 * cluster active at a time. Changing this will require trickling
35 * cluster references throughout where nodes are looked up */
36 struct o2nm_cluster *o2nm_single_cluster = NULL;
39 struct o2nm_node *o2nm_get_node_by_num(u8 node_num)
41 struct o2nm_node *node = NULL;
43 if (node_num >= O2NM_MAX_NODES || o2nm_single_cluster == NULL)
44 goto out;
46 read_lock(&o2nm_single_cluster->cl_nodes_lock);
47 node = o2nm_single_cluster->cl_nodes[node_num];
48 if (node)
49 config_item_get(&node->nd_item);
50 read_unlock(&o2nm_single_cluster->cl_nodes_lock);
51 out:
52 return node;
54 EXPORT_SYMBOL_GPL(o2nm_get_node_by_num);
56 int o2nm_configured_node_map(unsigned long *map, unsigned bytes)
58 struct o2nm_cluster *cluster = o2nm_single_cluster;
60 BUG_ON(bytes < (sizeof(cluster->cl_nodes_bitmap)));
62 if (cluster == NULL)
63 return -EINVAL;
65 read_lock(&cluster->cl_nodes_lock);
66 memcpy(map, cluster->cl_nodes_bitmap, sizeof(cluster->cl_nodes_bitmap));
67 read_unlock(&cluster->cl_nodes_lock);
69 return 0;
71 EXPORT_SYMBOL_GPL(o2nm_configured_node_map);
73 static struct o2nm_node *o2nm_node_ip_tree_lookup(struct o2nm_cluster *cluster,
74 __be32 ip_needle,
75 struct rb_node ***ret_p,
76 struct rb_node **ret_parent)
78 struct rb_node **p = &cluster->cl_node_ip_tree.rb_node;
79 struct rb_node *parent = NULL;
80 struct o2nm_node *node, *ret = NULL;
82 while (*p) {
83 int cmp;
85 parent = *p;
86 node = rb_entry(parent, struct o2nm_node, nd_ip_node);
88 cmp = memcmp(&ip_needle, &node->nd_ipv4_address,
89 sizeof(ip_needle));
90 if (cmp < 0)
91 p = &(*p)->rb_left;
92 else if (cmp > 0)
93 p = &(*p)->rb_right;
94 else {
95 ret = node;
96 break;
100 if (ret_p != NULL)
101 *ret_p = p;
102 if (ret_parent != NULL)
103 *ret_parent = parent;
105 return ret;
108 struct o2nm_node *o2nm_get_node_by_ip(__be32 addr)
110 struct o2nm_node *node = NULL;
111 struct o2nm_cluster *cluster = o2nm_single_cluster;
113 if (cluster == NULL)
114 goto out;
116 read_lock(&cluster->cl_nodes_lock);
117 node = o2nm_node_ip_tree_lookup(cluster, addr, NULL, NULL);
118 if (node)
119 config_item_get(&node->nd_item);
120 read_unlock(&cluster->cl_nodes_lock);
122 out:
123 return node;
125 EXPORT_SYMBOL_GPL(o2nm_get_node_by_ip);
127 void o2nm_node_put(struct o2nm_node *node)
129 config_item_put(&node->nd_item);
131 EXPORT_SYMBOL_GPL(o2nm_node_put);
133 void o2nm_node_get(struct o2nm_node *node)
135 config_item_get(&node->nd_item);
137 EXPORT_SYMBOL_GPL(o2nm_node_get);
139 u8 o2nm_this_node(void)
141 u8 node_num = O2NM_MAX_NODES;
143 if (o2nm_single_cluster && o2nm_single_cluster->cl_has_local)
144 node_num = o2nm_single_cluster->cl_local_node;
146 return node_num;
148 EXPORT_SYMBOL_GPL(o2nm_this_node);
150 /* node configfs bits */
152 static struct o2nm_cluster *to_o2nm_cluster(struct config_item *item)
154 return item ?
155 container_of(to_config_group(item), struct o2nm_cluster,
156 cl_group)
157 : NULL;
160 static struct o2nm_node *to_o2nm_node(struct config_item *item)
162 return item ? container_of(item, struct o2nm_node, nd_item) : NULL;
/* configfs release callback: free the node that embeds @item. */
static void o2nm_node_release(struct config_item *item)
{
	kfree(to_o2nm_node(item));
}
171 static ssize_t o2nm_node_num_read(struct o2nm_node *node, char *page)
173 return sprintf(page, "%d\n", node->nd_num);
176 static struct o2nm_cluster *to_o2nm_cluster_from_node(struct o2nm_node *node)
178 /* through the first node_set .parent
179 * mycluster/nodes/mynode == o2nm_cluster->o2nm_node_group->o2nm_node */
180 return to_o2nm_cluster(node->nd_item.ci_parent->ci_parent);
/*
 * Indices of the per-node attributes.  They are used both as slots in
 * o2nm_node_attrs[] and as bit numbers in nd_set_attributes.
 */
enum {
	O2NM_NODE_ATTR_NUM = 0,		/* "num" */
	O2NM_NODE_ATTR_PORT,		/* "ipv4_port" */
	O2NM_NODE_ATTR_ADDRESS,		/* "ipv4_address" */
	O2NM_NODE_ATTR_LOCAL,		/* "local" */
};
190 static ssize_t o2nm_node_num_write(struct o2nm_node *node, const char *page,
191 size_t count)
193 struct o2nm_cluster *cluster = to_o2nm_cluster_from_node(node);
194 unsigned long tmp;
195 char *p = (char *)page;
197 tmp = simple_strtoul(p, &p, 0);
198 if (!p || (*p && (*p != '\n')))
199 return -EINVAL;
201 if (tmp >= O2NM_MAX_NODES)
202 return -ERANGE;
204 /* once we're in the cl_nodes tree networking can look us up by
205 * node number and try to use our address and port attributes
206 * to connect to this node.. make sure that they've been set
207 * before writing the node attribute? */
208 if (!test_bit(O2NM_NODE_ATTR_ADDRESS, &node->nd_set_attributes) ||
209 !test_bit(O2NM_NODE_ATTR_PORT, &node->nd_set_attributes))
210 return -EINVAL; /* XXX */
212 write_lock(&cluster->cl_nodes_lock);
213 if (cluster->cl_nodes[tmp])
214 p = NULL;
215 else {
216 cluster->cl_nodes[tmp] = node;
217 node->nd_num = tmp;
218 set_bit(tmp, cluster->cl_nodes_bitmap);
220 write_unlock(&cluster->cl_nodes_lock);
221 if (p == NULL)
222 return -EEXIST;
224 return count;
226 static ssize_t o2nm_node_ipv4_port_read(struct o2nm_node *node, char *page)
228 return sprintf(page, "%u\n", ntohs(node->nd_ipv4_port));
231 static ssize_t o2nm_node_ipv4_port_write(struct o2nm_node *node,
232 const char *page, size_t count)
234 unsigned long tmp;
235 char *p = (char *)page;
237 tmp = simple_strtoul(p, &p, 0);
238 if (!p || (*p && (*p != '\n')))
239 return -EINVAL;
241 if (tmp == 0)
242 return -EINVAL;
243 if (tmp >= (u16)-1)
244 return -ERANGE;
246 node->nd_ipv4_port = htons(tmp);
248 return count;
251 static ssize_t o2nm_node_ipv4_address_read(struct o2nm_node *node, char *page)
253 return sprintf(page, "%pI4\n", &node->nd_ipv4_address);
256 static ssize_t o2nm_node_ipv4_address_write(struct o2nm_node *node,
257 const char *page,
258 size_t count)
260 struct o2nm_cluster *cluster = to_o2nm_cluster_from_node(node);
261 int ret, i;
262 struct rb_node **p, *parent;
263 unsigned int octets[4];
264 __be32 ipv4_addr = 0;
266 ret = sscanf(page, "%3u.%3u.%3u.%3u", &octets[3], &octets[2],
267 &octets[1], &octets[0]);
268 if (ret != 4)
269 return -EINVAL;
271 for (i = 0; i < ARRAY_SIZE(octets); i++) {
272 if (octets[i] > 255)
273 return -ERANGE;
274 be32_add_cpu(&ipv4_addr, octets[i] << (i * 8));
277 ret = 0;
278 write_lock(&cluster->cl_nodes_lock);
279 if (o2nm_node_ip_tree_lookup(cluster, ipv4_addr, &p, &parent))
280 ret = -EEXIST;
281 else {
282 rb_link_node(&node->nd_ip_node, parent, p);
283 rb_insert_color(&node->nd_ip_node, &cluster->cl_node_ip_tree);
285 write_unlock(&cluster->cl_nodes_lock);
286 if (ret)
287 return ret;
289 memcpy(&node->nd_ipv4_address, &ipv4_addr, sizeof(ipv4_addr));
291 return count;
294 static ssize_t o2nm_node_local_read(struct o2nm_node *node, char *page)
296 return sprintf(page, "%d\n", node->nd_local);
299 static ssize_t o2nm_node_local_write(struct o2nm_node *node, const char *page,
300 size_t count)
302 struct o2nm_cluster *cluster = to_o2nm_cluster_from_node(node);
303 unsigned long tmp;
304 char *p = (char *)page;
305 ssize_t ret;
307 tmp = simple_strtoul(p, &p, 0);
308 if (!p || (*p && (*p != '\n')))
309 return -EINVAL;
311 tmp = !!tmp; /* boolean of whether this node wants to be local */
313 /* setting local turns on networking rx for now so we require having
314 * set everything else first */
315 if (!test_bit(O2NM_NODE_ATTR_ADDRESS, &node->nd_set_attributes) ||
316 !test_bit(O2NM_NODE_ATTR_NUM, &node->nd_set_attributes) ||
317 !test_bit(O2NM_NODE_ATTR_PORT, &node->nd_set_attributes))
318 return -EINVAL; /* XXX */
320 /* the only failure case is trying to set a new local node
321 * when a different one is already set */
322 if (tmp && tmp == cluster->cl_has_local &&
323 cluster->cl_local_node != node->nd_num)
324 return -EBUSY;
326 /* bring up the rx thread if we're setting the new local node. */
327 if (tmp && !cluster->cl_has_local) {
328 ret = o2net_start_listening(node);
329 if (ret)
330 return ret;
333 if (!tmp && cluster->cl_has_local &&
334 cluster->cl_local_node == node->nd_num) {
335 o2net_stop_listening(node);
336 cluster->cl_local_node = O2NM_INVALID_NODE_NUM;
339 node->nd_local = tmp;
340 if (node->nd_local) {
341 cluster->cl_has_local = tmp;
342 cluster->cl_local_node = node->nd_num;
345 return count;
348 struct o2nm_node_attribute {
349 struct configfs_attribute attr;
350 ssize_t (*show)(struct o2nm_node *, char *);
351 ssize_t (*store)(struct o2nm_node *, const char *, size_t);
354 static struct o2nm_node_attribute o2nm_node_attr_num = {
355 .attr = { .ca_owner = THIS_MODULE,
356 .ca_name = "num",
357 .ca_mode = S_IRUGO | S_IWUSR },
358 .show = o2nm_node_num_read,
359 .store = o2nm_node_num_write,
362 static struct o2nm_node_attribute o2nm_node_attr_ipv4_port = {
363 .attr = { .ca_owner = THIS_MODULE,
364 .ca_name = "ipv4_port",
365 .ca_mode = S_IRUGO | S_IWUSR },
366 .show = o2nm_node_ipv4_port_read,
367 .store = o2nm_node_ipv4_port_write,
370 static struct o2nm_node_attribute o2nm_node_attr_ipv4_address = {
371 .attr = { .ca_owner = THIS_MODULE,
372 .ca_name = "ipv4_address",
373 .ca_mode = S_IRUGO | S_IWUSR },
374 .show = o2nm_node_ipv4_address_read,
375 .store = o2nm_node_ipv4_address_write,
378 static struct o2nm_node_attribute o2nm_node_attr_local = {
379 .attr = { .ca_owner = THIS_MODULE,
380 .ca_name = "local",
381 .ca_mode = S_IRUGO | S_IWUSR },
382 .show = o2nm_node_local_read,
383 .store = o2nm_node_local_write,
386 static struct configfs_attribute *o2nm_node_attrs[] = {
387 [O2NM_NODE_ATTR_NUM] = &o2nm_node_attr_num.attr,
388 [O2NM_NODE_ATTR_PORT] = &o2nm_node_attr_ipv4_port.attr,
389 [O2NM_NODE_ATTR_ADDRESS] = &o2nm_node_attr_ipv4_address.attr,
390 [O2NM_NODE_ATTR_LOCAL] = &o2nm_node_attr_local.attr,
391 NULL,
394 static int o2nm_attr_index(struct configfs_attribute *attr)
396 int i;
397 for (i = 0; i < ARRAY_SIZE(o2nm_node_attrs); i++) {
398 if (attr == o2nm_node_attrs[i])
399 return i;
401 BUG();
402 return 0;
405 static ssize_t o2nm_node_show(struct config_item *item,
406 struct configfs_attribute *attr,
407 char *page)
409 struct o2nm_node *node = to_o2nm_node(item);
410 struct o2nm_node_attribute *o2nm_node_attr =
411 container_of(attr, struct o2nm_node_attribute, attr);
412 ssize_t ret = 0;
414 if (o2nm_node_attr->show)
415 ret = o2nm_node_attr->show(node, page);
416 return ret;
419 static ssize_t o2nm_node_store(struct config_item *item,
420 struct configfs_attribute *attr,
421 const char *page, size_t count)
423 struct o2nm_node *node = to_o2nm_node(item);
424 struct o2nm_node_attribute *o2nm_node_attr =
425 container_of(attr, struct o2nm_node_attribute, attr);
426 ssize_t ret;
427 int attr_index = o2nm_attr_index(attr);
429 if (o2nm_node_attr->store == NULL) {
430 ret = -EINVAL;
431 goto out;
434 if (test_bit(attr_index, &node->nd_set_attributes))
435 return -EBUSY;
437 ret = o2nm_node_attr->store(node, page, count);
438 if (ret < count)
439 goto out;
441 set_bit(attr_index, &node->nd_set_attributes);
442 out:
443 return ret;
446 static struct configfs_item_operations o2nm_node_item_ops = {
447 .release = o2nm_node_release,
448 .show_attribute = o2nm_node_show,
449 .store_attribute = o2nm_node_store,
452 static struct config_item_type o2nm_node_type = {
453 .ct_item_ops = &o2nm_node_item_ops,
454 .ct_attrs = o2nm_node_attrs,
455 .ct_owner = THIS_MODULE,
458 /* node set */
460 struct o2nm_node_group {
461 struct config_group ns_group;
462 /* some stuff? */
#if 0
/* Map a config_group to its enclosing o2nm_node_group; NULL maps to NULL. */
static struct o2nm_node_group *to_o2nm_node_group(struct config_group *group)
{
	if (!group)
		return NULL;

	return container_of(group, struct o2nm_node_group, ns_group);
}
#endif
474 struct o2nm_cluster_attribute {
475 struct configfs_attribute attr;
476 ssize_t (*show)(struct o2nm_cluster *, char *);
477 ssize_t (*store)(struct o2nm_cluster *, const char *, size_t);
480 static ssize_t o2nm_cluster_attr_write(const char *page, ssize_t count,
481 unsigned int *val)
483 unsigned long tmp;
484 char *p = (char *)page;
486 tmp = simple_strtoul(p, &p, 0);
487 if (!p || (*p && (*p != '\n')))
488 return -EINVAL;
490 if (tmp == 0)
491 return -EINVAL;
492 if (tmp >= (u32)-1)
493 return -ERANGE;
495 *val = tmp;
497 return count;
500 static ssize_t o2nm_cluster_attr_idle_timeout_ms_read(
501 struct o2nm_cluster *cluster, char *page)
503 return sprintf(page, "%u\n", cluster->cl_idle_timeout_ms);
506 static ssize_t o2nm_cluster_attr_idle_timeout_ms_write(
507 struct o2nm_cluster *cluster, const char *page, size_t count)
509 ssize_t ret;
510 unsigned int val;
512 ret = o2nm_cluster_attr_write(page, count, &val);
514 if (ret > 0) {
515 if (cluster->cl_idle_timeout_ms != val
516 && o2net_num_connected_peers()) {
517 mlog(ML_NOTICE,
518 "o2net: cannot change idle timeout after "
519 "the first peer has agreed to it."
520 " %d connected peers\n",
521 o2net_num_connected_peers());
522 ret = -EINVAL;
523 } else if (val <= cluster->cl_keepalive_delay_ms) {
524 mlog(ML_NOTICE, "o2net: idle timeout must be larger "
525 "than keepalive delay\n");
526 ret = -EINVAL;
527 } else {
528 cluster->cl_idle_timeout_ms = val;
532 return ret;
535 static ssize_t o2nm_cluster_attr_keepalive_delay_ms_read(
536 struct o2nm_cluster *cluster, char *page)
538 return sprintf(page, "%u\n", cluster->cl_keepalive_delay_ms);
541 static ssize_t o2nm_cluster_attr_keepalive_delay_ms_write(
542 struct o2nm_cluster *cluster, const char *page, size_t count)
544 ssize_t ret;
545 unsigned int val;
547 ret = o2nm_cluster_attr_write(page, count, &val);
549 if (ret > 0) {
550 if (cluster->cl_keepalive_delay_ms != val
551 && o2net_num_connected_peers()) {
552 mlog(ML_NOTICE,
553 "o2net: cannot change keepalive delay after"
554 " the first peer has agreed to it."
555 " %d connected peers\n",
556 o2net_num_connected_peers());
557 ret = -EINVAL;
558 } else if (val >= cluster->cl_idle_timeout_ms) {
559 mlog(ML_NOTICE, "o2net: keepalive delay must be "
560 "smaller than idle timeout\n");
561 ret = -EINVAL;
562 } else {
563 cluster->cl_keepalive_delay_ms = val;
567 return ret;
570 static ssize_t o2nm_cluster_attr_reconnect_delay_ms_read(
571 struct o2nm_cluster *cluster, char *page)
573 return sprintf(page, "%u\n", cluster->cl_reconnect_delay_ms);
576 static ssize_t o2nm_cluster_attr_reconnect_delay_ms_write(
577 struct o2nm_cluster *cluster, const char *page, size_t count)
579 return o2nm_cluster_attr_write(page, count,
580 &cluster->cl_reconnect_delay_ms);
582 static struct o2nm_cluster_attribute o2nm_cluster_attr_idle_timeout_ms = {
583 .attr = { .ca_owner = THIS_MODULE,
584 .ca_name = "idle_timeout_ms",
585 .ca_mode = S_IRUGO | S_IWUSR },
586 .show = o2nm_cluster_attr_idle_timeout_ms_read,
587 .store = o2nm_cluster_attr_idle_timeout_ms_write,
590 static struct o2nm_cluster_attribute o2nm_cluster_attr_keepalive_delay_ms = {
591 .attr = { .ca_owner = THIS_MODULE,
592 .ca_name = "keepalive_delay_ms",
593 .ca_mode = S_IRUGO | S_IWUSR },
594 .show = o2nm_cluster_attr_keepalive_delay_ms_read,
595 .store = o2nm_cluster_attr_keepalive_delay_ms_write,
598 static struct o2nm_cluster_attribute o2nm_cluster_attr_reconnect_delay_ms = {
599 .attr = { .ca_owner = THIS_MODULE,
600 .ca_name = "reconnect_delay_ms",
601 .ca_mode = S_IRUGO | S_IWUSR },
602 .show = o2nm_cluster_attr_reconnect_delay_ms_read,
603 .store = o2nm_cluster_attr_reconnect_delay_ms_write,
606 static struct configfs_attribute *o2nm_cluster_attrs[] = {
607 &o2nm_cluster_attr_idle_timeout_ms.attr,
608 &o2nm_cluster_attr_keepalive_delay_ms.attr,
609 &o2nm_cluster_attr_reconnect_delay_ms.attr,
610 NULL,
612 static ssize_t o2nm_cluster_show(struct config_item *item,
613 struct configfs_attribute *attr,
614 char *page)
616 struct o2nm_cluster *cluster = to_o2nm_cluster(item);
617 struct o2nm_cluster_attribute *o2nm_cluster_attr =
618 container_of(attr, struct o2nm_cluster_attribute, attr);
619 ssize_t ret = 0;
621 if (o2nm_cluster_attr->show)
622 ret = o2nm_cluster_attr->show(cluster, page);
623 return ret;
626 static ssize_t o2nm_cluster_store(struct config_item *item,
627 struct configfs_attribute *attr,
628 const char *page, size_t count)
630 struct o2nm_cluster *cluster = to_o2nm_cluster(item);
631 struct o2nm_cluster_attribute *o2nm_cluster_attr =
632 container_of(attr, struct o2nm_cluster_attribute, attr);
633 ssize_t ret;
635 if (o2nm_cluster_attr->store == NULL) {
636 ret = -EINVAL;
637 goto out;
640 ret = o2nm_cluster_attr->store(cluster, page, count);
641 if (ret < count)
642 goto out;
643 out:
644 return ret;
647 static struct config_item *o2nm_node_group_make_item(struct config_group *group,
648 const char *name)
650 struct o2nm_node *node = NULL;
652 if (strlen(name) > O2NM_MAX_NAME_LEN)
653 return ERR_PTR(-ENAMETOOLONG);
655 node = kzalloc(sizeof(struct o2nm_node), GFP_KERNEL);
656 if (node == NULL)
657 return ERR_PTR(-ENOMEM);
659 strcpy(node->nd_name, name); /* use item.ci_namebuf instead? */
660 config_item_init_type_name(&node->nd_item, name, &o2nm_node_type);
661 spin_lock_init(&node->nd_lock);
663 return &node->nd_item;
666 static void o2nm_node_group_drop_item(struct config_group *group,
667 struct config_item *item)
669 struct o2nm_node *node = to_o2nm_node(item);
670 struct o2nm_cluster *cluster = to_o2nm_cluster(group->cg_item.ci_parent);
672 o2net_disconnect_node(node);
674 if (cluster->cl_has_local &&
675 (cluster->cl_local_node == node->nd_num)) {
676 cluster->cl_has_local = 0;
677 cluster->cl_local_node = O2NM_INVALID_NODE_NUM;
678 o2net_stop_listening(node);
681 /* XXX call into net to stop this node from trading messages */
683 write_lock(&cluster->cl_nodes_lock);
685 /* XXX sloppy */
686 if (node->nd_ipv4_address)
687 rb_erase(&node->nd_ip_node, &cluster->cl_node_ip_tree);
689 /* nd_num might be 0 if the node number hasn't been set.. */
690 if (cluster->cl_nodes[node->nd_num] == node) {
691 cluster->cl_nodes[node->nd_num] = NULL;
692 clear_bit(node->nd_num, cluster->cl_nodes_bitmap);
694 write_unlock(&cluster->cl_nodes_lock);
696 config_item_put(item);
699 static struct configfs_group_operations o2nm_node_group_group_ops = {
700 .make_item = o2nm_node_group_make_item,
701 .drop_item = o2nm_node_group_drop_item,
704 static struct config_item_type o2nm_node_group_type = {
705 .ct_group_ops = &o2nm_node_group_group_ops,
706 .ct_owner = THIS_MODULE,
709 /* cluster */
711 static void o2nm_cluster_release(struct config_item *item)
713 struct o2nm_cluster *cluster = to_o2nm_cluster(item);
715 kfree(cluster->cl_group.default_groups);
716 kfree(cluster);
719 static struct configfs_item_operations o2nm_cluster_item_ops = {
720 .release = o2nm_cluster_release,
721 .show_attribute = o2nm_cluster_show,
722 .store_attribute = o2nm_cluster_store,
725 static struct config_item_type o2nm_cluster_type = {
726 .ct_item_ops = &o2nm_cluster_item_ops,
727 .ct_attrs = o2nm_cluster_attrs,
728 .ct_owner = THIS_MODULE,
731 /* cluster set */
733 struct o2nm_cluster_group {
734 struct configfs_subsystem cs_subsys;
735 /* some stuff? */
#if 0
/* Map a config_group to its enclosing o2nm_cluster_group; NULL maps to NULL. */
static struct o2nm_cluster_group *to_o2nm_cluster_group(struct config_group *group)
{
	if (!group)
		return NULL;

	return container_of(to_configfs_subsystem(group),
			    struct o2nm_cluster_group, cs_subsys);
}
#endif
747 static struct config_group *o2nm_cluster_group_make_group(struct config_group *group,
748 const char *name)
750 struct o2nm_cluster *cluster = NULL;
751 struct o2nm_node_group *ns = NULL;
752 struct config_group *o2hb_group = NULL, *ret = NULL;
753 void *defs = NULL;
755 /* this runs under the parent dir's i_mutex; there can be only
756 * one caller in here at a time */
757 if (o2nm_single_cluster)
758 return ERR_PTR(-ENOSPC);
760 cluster = kzalloc(sizeof(struct o2nm_cluster), GFP_KERNEL);
761 ns = kzalloc(sizeof(struct o2nm_node_group), GFP_KERNEL);
762 defs = kcalloc(3, sizeof(struct config_group *), GFP_KERNEL);
763 o2hb_group = o2hb_alloc_hb_set();
764 if (cluster == NULL || ns == NULL || o2hb_group == NULL || defs == NULL)
765 goto out;
767 config_group_init_type_name(&cluster->cl_group, name,
768 &o2nm_cluster_type);
769 config_group_init_type_name(&ns->ns_group, "node",
770 &o2nm_node_group_type);
772 cluster->cl_group.default_groups = defs;
773 cluster->cl_group.default_groups[0] = &ns->ns_group;
774 cluster->cl_group.default_groups[1] = o2hb_group;
775 cluster->cl_group.default_groups[2] = NULL;
776 rwlock_init(&cluster->cl_nodes_lock);
777 cluster->cl_node_ip_tree = RB_ROOT;
778 cluster->cl_reconnect_delay_ms = O2NET_RECONNECT_DELAY_MS_DEFAULT;
779 cluster->cl_idle_timeout_ms = O2NET_IDLE_TIMEOUT_MS_DEFAULT;
780 cluster->cl_keepalive_delay_ms = O2NET_KEEPALIVE_DELAY_MS_DEFAULT;
782 ret = &cluster->cl_group;
783 o2nm_single_cluster = cluster;
785 out:
786 if (ret == NULL) {
787 kfree(cluster);
788 kfree(ns);
789 o2hb_free_hb_set(o2hb_group);
790 kfree(defs);
791 ret = ERR_PTR(-ENOMEM);
794 return ret;
797 static void o2nm_cluster_group_drop_item(struct config_group *group, struct config_item *item)
799 struct o2nm_cluster *cluster = to_o2nm_cluster(item);
800 int i;
801 struct config_item *killme;
803 BUG_ON(o2nm_single_cluster != cluster);
804 o2nm_single_cluster = NULL;
806 for (i = 0; cluster->cl_group.default_groups[i]; i++) {
807 killme = &cluster->cl_group.default_groups[i]->cg_item;
808 cluster->cl_group.default_groups[i] = NULL;
809 config_item_put(killme);
812 config_item_put(item);
815 static struct configfs_group_operations o2nm_cluster_group_group_ops = {
816 .make_group = o2nm_cluster_group_make_group,
817 .drop_item = o2nm_cluster_group_drop_item,
820 static struct config_item_type o2nm_cluster_group_type = {
821 .ct_group_ops = &o2nm_cluster_group_group_ops,
822 .ct_owner = THIS_MODULE,
825 static struct o2nm_cluster_group o2nm_cluster_group = {
826 .cs_subsys = {
827 .su_group = {
828 .cg_item = {
829 .ci_namebuf = "cluster",
830 .ci_type = &o2nm_cluster_group_type,
836 int o2nm_depend_item(struct config_item *item)
838 return configfs_depend_item(&o2nm_cluster_group.cs_subsys, item);
841 void o2nm_undepend_item(struct config_item *item)
843 configfs_undepend_item(&o2nm_cluster_group.cs_subsys, item);
846 int o2nm_depend_this_node(void)
848 int ret = 0;
849 struct o2nm_node *local_node;
851 local_node = o2nm_get_node_by_num(o2nm_this_node());
852 if (!local_node) {
853 ret = -EINVAL;
854 goto out;
857 ret = o2nm_depend_item(&local_node->nd_item);
858 o2nm_node_put(local_node);
860 out:
861 return ret;
864 void o2nm_undepend_this_node(void)
866 struct o2nm_node *local_node;
868 local_node = o2nm_get_node_by_num(o2nm_this_node());
869 BUG_ON(!local_node);
871 o2nm_undepend_item(&local_node->nd_item);
872 o2nm_node_put(local_node);
876 static void __exit exit_o2nm(void)
878 /* XXX sync with hb callbacks and shut down hb? */
879 o2net_unregister_hb_callbacks();
880 configfs_unregister_subsystem(&o2nm_cluster_group.cs_subsys);
881 o2cb_sys_shutdown();
883 o2net_exit();
884 o2hb_exit();
887 static int __init init_o2nm(void)
889 int ret = -1;
891 cluster_print_version();
893 ret = o2hb_init();
894 if (ret)
895 goto out;
897 ret = o2net_init();
898 if (ret)
899 goto out_o2hb;
901 ret = o2net_register_hb_callbacks();
902 if (ret)
903 goto out_o2net;
905 config_group_init(&o2nm_cluster_group.cs_subsys.su_group);
906 mutex_init(&o2nm_cluster_group.cs_subsys.su_mutex);
907 ret = configfs_register_subsystem(&o2nm_cluster_group.cs_subsys);
908 if (ret) {
909 printk(KERN_ERR "nodemanager: Registration returned %d\n", ret);
910 goto out_callbacks;
913 ret = o2cb_sys_init();
914 if (!ret)
915 goto out;
917 configfs_unregister_subsystem(&o2nm_cluster_group.cs_subsys);
918 out_callbacks:
919 o2net_unregister_hb_callbacks();
920 out_o2net:
921 o2net_exit();
922 out_o2hb:
923 o2hb_exit();
924 out:
925 return ret;
928 MODULE_AUTHOR("Oracle");
929 MODULE_LICENSE("GPL");
931 module_init(init_o2nm)
932 module_exit(exit_o2nm)