close_port, kpacket_gen kmalloc oom, formard.c wake_sender/skb receive oom handling...
[cor_2_6_31.git] / net / cor / cor.h
blob9f3ca04ec8d12de6370e835cd5f1368ad655626b
1 /*
2 * Connection oriented routing
3 * Copyright (C) 2007-2008 Michael Blizek
5 * This program is free software; you can redistribute it and/or
6 * modify it under the terms of the GNU General Public License
7 * as published by the Free Software Foundation; either version 2
8 * of the License, or (at your option) any later version.
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License for more details.
15 * You should have received a copy of the GNU General Public License
16 * along with this program; if not, write to the Free Software
17 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
18 * 02110-1301, USA.
21 #include <asm/atomic.h>
23 #include <linux/types.h>
24 #include <linux/netdevice.h>
25 #include <linux/skbuff.h>
26 #include <linux/spinlock.h>
27 #include <linux/workqueue.h>
29 #include "settings.h"
32 /* options */
33 #define PIDOUT_NEWCONN 16
34 #define PIDOUT_SENDDEF_THRES 8
35 #define PIDOUT_SENDDEF_COUNT 16
39 #define ETH_P_COR 0x1022
40 #define AF_COR 37
41 #define PF_COR AF_COR
43 #define SOCKADDRTYPE_PORT 1
44 struct cor_sockaddr {
45 int type;
47 union {
48 __be64 port;
49 } addr;
52 #define MAX_CONN_CMD_LEN 4096
55 #define PACKET_TYPE_ANNOUNCE 1
56 #define PACKET_TYPE_DATA 2
59 * Kernel packet data - these commands are sent by the neighbor
60 * The end nodes may cause these commands to be sent, but they see them beyond
61 * the first hop.
64 /* KP_PADDING[1] */
65 #define KP_PADDING 1
67 /* KP_[N]ACK[1] sent_conn_id[4] seqno[4]
69 * sent_conn_id means that this is *not* the conn_id we use if we sent something
70 * through this conn, but the conn_id that the neighbor used to send us the
71 * packet
73 #define KP_ACK 2
74 #define KP_NACK 3
77 * KP_SPEED[1] conn_id[4] speedinfo[2]
79 * speedinfo[2] =
80 * buffer_state_value = speedinfo % 181
81 * speed_value = speedinfo / 181
83 * buffer_state = 1024 * pow(2, buffer_state_value/3.0)
84 * speed = 1024 * pow(2, speed_value/12.0)
85 * see the .0 ...
87 * This has to be done either with floating points (which is no so nice) or
88 * you can calculate:
89 * buffer_state = pow(2, value/3) *
90 * 1024 * pow(pow(2, 1.0/3), buffer_state_value%3)
91 * where 1024 * pow(pow(2, 1.0/4), value%3) can be just a table lookup
92 * (the "1024" should be part of the value in the table, because it increases
93 * the accuracy)
95 * you can do the same with the speed
98 * Some values have special meanings:
99 * if speedinfo is the highest possible value(65535), it means both values
100 * are inifinite
101 * if buffer_state_value if > 91, you have to subtract 90 and make the
102 * resulting buffer_state negative
104 #define KP_SPEED 5
106 /* NOTE on connection ids:
107 * connection ids we send are used for the receive channel
108 * connection ids we receive are used for the send channel
112 * incoming connection
113 * KP_CONNECT[1] conn_id[4]
115 #define KP_CONNECT 10
118 * incoming connection successful,
119 * the first conn_id is the same as previously sent/received in KP_CONNECT
120 * the second conn_id is generated by us and used for the other direction
121 * KP_CONNECT_SUCCESS[1] conn_id[4] conn_id[4]
123 #define KP_CONNECT_SUCCESS 11
125 /* KP_CONNECT_FAILED_*[1] conn_id[4] */
126 #define KP_CONNECT_FAILED_TEMP 12
127 #define KP_CONNECT_FAILED_PERM 13
129 /* KP_CONN_DATA[1] conn_id[4] seqno[4] length[4] data[length] */
130 #define KP_CONN_DATA 14
133 * { KP_RESET_CONN[1] conn_id[4] }
134 * We send this, if there is an established connection we want to close.
136 #define KP_RESET_CONN 15
140 * Connection data which in interpreted when connection has no target yet
141 * These commands are sent by the end node.
143 * Format:
144 * cmd[2] length[4] parameter[length]
145 * unrecogniced commands are ignored
146 * parameters which are longer than expected are ignored as well
149 /* outgoing connection: CD_CONNECT_NB[2] length[4]
150 * addrtypelen[2] addrlen[2] addrtype[addrtypelen] addr[addrlen] */
151 #define CD_CONNECT_NB 1
153 /* connection to local open part: CD_CONNECT_PORT[2] length[4] port[8] */
154 #define CD_CONNECT_PORT 2
157 * CD_LIST_NEIGH sends CDR_BINDATA if the command was successful. The response
158 * format is:
160 * totalneighs[4] response_rows[4]
161 * for every row:
162 * numaddr[2] (addrtypelen[2] addrlen[2] addrtype[addrtypelen] addr[addrlen]
163 * )[numaddr]
165 * Neighbors have to be sorted by uptime, new neighbors first. This is so that
166 * the routing daemon can easily find out whether there are new neighbors. It
167 * only needs to send a query with offset 0. If the totalneighs stays the same
168 * while new were added, a connection to another neighbor was lost.
171 /* list connected neighbors: CD_LIST_NEIGH[2] length[4] limit[4] offset[4] */
172 #define CD_LIST_NEIGH 3
175 * Connection data response
176 * Format is the same as with connection data
180 * {CDR_EXECOK[2] || CDR_EXECFAILED[2]}
181 * reasoncode[2] reasontextlength[2] reasontext[reasontextlength]
182 * reasontextlength may be 0
184 #define CDR_EXECOK 32768
185 #define CDR_EXECOK_OK 33024
187 #define CDR_EXECFAILED 32769
188 #define CDR_EXECFAILED_UNKNOWN_COMMAND 33280
189 #define CDR_EXECFAILED_PERMISSION_DENIED 33281
190 #define CDR_EXECFAILED_TEMPORARILY_OUT_OF_RESSOURCES 33282
191 #define CDR_EXECFAILED_CMD_TOO_SHORT 33283
192 #define CDR_EXECFAILED_CMD_TOO_LONG 33284
193 #define CDR_EXECFAILED_TARGETADDRTYPE_UNKNOWN 33285
194 #define CDR_EXECFAILED_TARGETADDR_DOESNTEXIST 33286
195 #define CDR_EXECFAILED_TARGETADDR_PORTCLOSED 33287
196 #define CDR_EXECFAILED_LISTENERQUEUE_FULL 33288
199 * must be sent after CDR_EXEC{OK|FAILED}
200 * CDR_EXEOK_BINDATA[2] bindatalen[4] bindata[bindatalen] */
201 #define CDR_BINDATA 32770
204 /* result codes for rcv.c/proc_packet */
205 #define RC_DROP 0
206 #define RC_FINISHED 1
208 #define RC_RCV1_ANNOUNCE 2
209 #define RC_RCV1_KERNEL 3
210 #define RC_RCV1_CONN 4
212 struct ref_counter;
214 struct ref_counter_def{
216 * implemented by user, frees struct containing the mem_counter when
217 * refs == 0
219 void (*free)(struct ref_counter *cnt);
222 struct ref_counter{
223 spinlock_t lock;
225 /* initialised with 1 */
226 int refs;
228 /* initialised with 1, if 0 deny mem_counter_incr */
229 int is_active;
231 /* should be a pointer to a global variable */
232 struct ref_counter_def *def;
235 struct htab_entry{
236 struct htab_entry *next;
239 struct htable{
240 struct htab_entry **htable;
241 __u32 htable_size;
242 __u32 cell_size;
243 __u32 num_elements;
245 int (*matches)(void *htentry, void *searcheditem);
246 __u32 key_offset;
247 __u32 entry_offset;
248 __u32 ref_counter_offset;
251 struct neighbor{
252 struct list_head nb_list;
254 struct ref_counter refs;
256 struct net_device *dev;
257 char mac[MAX_ADDR_LEN];
259 char *addr;
260 __u16 addrlen;
262 struct delayed_work cmsg_timer;
263 struct mutex cmsg_lock;
264 struct list_head control_msgs_out;
265 __u64 timeout;
266 __u32 length;
268 atomic_t ooo_packets;
270 __u32 latency;
273 * connecions which receive data from/send data to this node
274 * used when terminating all connections of a neighbor
276 struct mutex conn_list_lock;
277 struct list_head rcv_conn_list;
278 struct list_head snd_conn_list;
281 * the timer has to be inited when adding the neighbor
282 * init_timer(struct timer_list * timer);
283 * add_timer(struct timer_list * timer);
285 spinlock_t retrans_lock;
286 struct timer_list retrans_timer;
289 * next_retransmit are linked with
290 * skb_procstate->funcstate.retransmit_queue
291 * because the sk_buff next/prev fields are needed by the hashtable
293 struct sk_buff_head retrans_list;
295 struct conn *firstboundconn;
298 struct cor_sched_data{
299 spinlock_t lock;
300 struct list_head conn_list;
301 struct sk_buff_head requeue_queue;
304 #define TYPE_BUF 0
305 #define TYPE_SKB 1
307 struct data_buf_item{
308 struct list_head buf_list;
310 union {
311 struct {
312 char *buf;
313 __u32 datalen;
315 }buf;
317 struct sk_buff *skb;
318 }data;
320 __u8 type;
323 struct data_buf{
324 struct list_head items;
325 struct data_buf_item *lastread;
326 __u64 first_offset;
327 __u64 read_offset;
329 __u32 totalsize;
330 __u32 read_remaining;
332 __u32 last_read_offset;
334 __u32 last_buflen;
337 struct connlistener;
339 struct bindnode{
340 struct list_head lh;
341 struct connlistener *owner;
342 __be64 port;
345 #define SOCKSTATE_LISTENER 1
346 #define SOCKSTATE_CONN 2
348 struct sock_hdr {
349 /* The first member of connlistener/conn (see sock.c) */
350 __u8 sockstate;
353 struct connlistener {
354 /* The first member has to be the same as in conn (see sock.c) */
355 __u8 sockstate;
356 struct bindnode *bn;
357 struct mutex lock;
358 int queue_maxlen;
359 int queue_len;
360 struct list_head conn_queue;
361 wait_queue_head_t wait;
366 * There are 2 conn objects per bi-directional connection. They refer to each
367 * other with in the reversedir field. To distinguish them, the variables on
368 * the stack are usually called rconn and sconn. rconn refers to the conn object
369 * which has received a command. sconn is the other conn object. This means that
370 * in send functions rconn means the connection we want to send the command to.
373 struct conn{
374 /* The first member has to be the same as in connlistener (see sock.c)*/
375 __u8 sockstate;
377 #define SOURCE_NONE 0
378 #define SOURCE_IN 1
379 #define SOURCE_SOCK 2
381 #define TARGET_UNCONNECTED 0
382 #define TARGET_OUT 1
383 #define TARGET_SOCK 2
385 __u8 sourcetype:4,
386 targettype:4;
387 __u8 isreset;
388 __u8 qdisc_active;
389 struct list_head queue_list;
391 /* todo: convert to kref */
392 struct ref_counter refs;
394 struct mutex rcv_lock;
396 /* state */
397 __u32 credits;
398 /* credit rate */
399 __s32 sender_crate;
400 __s32 resp_crate;
402 union{
403 struct{
404 struct neighbor *nb;
405 /* list of all connections from this neighbor */
406 struct list_head nb_list;
408 struct sk_buff_head reorder_queue;
410 struct htab_entry htab_entry;
411 __u32 conn_id;
412 __u32 next_seqno;
413 __u32 ooo_packets;
414 }in;
416 struct{
417 struct list_head cl_list;
418 wait_queue_head_t wait;
419 struct socket *sock;
420 int flags;
421 }sock;
422 }source;
424 union{
425 struct{
426 __u32 paramlen;
427 __u32 cmdread;
428 __u16 cmd;
429 __u8 *cmdparams;
430 }unconnected;
432 struct{
433 /* has to be first (because it is first in target
434 * kernel too)
436 struct neighbor *nb;
437 /* list of all connections to this neighbor */
438 struct list_head nb_list;
440 __u32 conn_id;
441 __u32 seqno;
442 }out;
444 struct{
445 wait_queue_head_t wait;
446 }sock;
447 }target;
449 struct data_buf buf;
451 struct conn *reversedir;
454 /* inside skb->cb */
455 struct skb_procstate{
456 struct conn *rconn;
458 union{
459 struct{
460 struct work_struct work;
461 }rcv;
463 struct{
464 __u32 offset;
465 }announce;
467 struct{
468 __u32 conn_id;
469 __u32 seqno;
470 }rcv2;
472 struct{
473 struct htab_entry htab_entry;
474 struct ref_counter refs;
475 unsigned long timeout;
476 __u32 conn_id;
477 __u32 seqno;
478 }retransmit_queue;
479 }funcstate;
483 /* common.c */
484 extern void ref_counter_decr(struct ref_counter *cnt);
486 extern int ref_counter_incr(struct ref_counter *cnt);
488 extern void ref_counter_init(struct ref_counter *cnt,
489 struct ref_counter_def *def);
491 extern char *htable_get(struct htable *ht, __u32 key, void *searcheditem);
493 extern int htable_delete(struct htable *ht, char *oldelement, __u32 key,
494 void *searcheditem);
496 extern void htable_insert(struct htable *ht, char *newelement, __u32 key);
498 extern void htable_init(struct htable *ht, int (*matches)(void *htentry,
499 void *searcheditem), __u32 entry_offset,
500 __u32 ref_counter_offset);
502 extern struct conn *get_conn(__u32 conn_id);
504 extern int conn_init_out(struct conn *rconn, struct neighbor *nb);
506 extern void conn_init_sock_source(struct conn *conn);
507 extern void conn_init_sock_target(struct conn *conn);
509 extern void close_port(struct connlistener *listener);
511 extern struct connlistener *open_port(__be64 port);
513 extern int connect_port(struct conn *rconn, __be64 port);
515 extern int connect_neigh(struct conn *rconn,
516 __u16 addrtypelen, __u8 *addrtype,
517 __u16 addrlen, __u8 *addr);
519 extern struct conn* alloc_conn(gfp_t allocflags);
521 extern void reset_conn(struct conn *conn);
523 /* neighbor.c */
524 extern struct neighbor *find_neigh(__u16 addrtypelen, __u8 *addrtype,
525 __u16 addrlen, __u8 *addr);
527 extern __u32 generate_neigh_list(char *buf, __u32 buflen, __u32 limit,
528 __u32 offset);
530 extern void rcv_announce(struct sk_buff *skb);
532 extern int __init cor_neighbor_init(void);
534 /* rcv.c */
535 extern void drain_ooo_queue(struct conn *rconn);
537 extern void conn_rcv_buildskb(char *data, __u32 datalen, __u32 conn_id,
538 __u32 seqno);
540 extern int __init cor_rcv_init(void);
542 /* kpacket_parse.c */
543 extern void kernel_packet(struct neighbor *nb, struct sk_buff *skb, __u32 seqno);
545 /* kpacket_gen.c */
546 extern void schedule_controlmsg_timerfunc(struct neighbor *nb);
548 struct control_msg_out;
550 extern struct control_msg_out *alloc_control_msg(void);
552 extern void send_reset_conn(struct control_msg_out *cm, struct neighbor *nb,
553 __u32 conn_id);
555 extern void send_ack(struct control_msg_out *cm, struct neighbor *nb,
556 __u32 conn_id, __u32 seqno);
558 extern void send_connect_failed_temp(struct control_msg_out *cm,
559 struct neighbor *nb, __u32 conn_id);
561 extern void send_connect_success(struct control_msg_out *cm,
562 struct conn *rconn);
564 extern void send_connect_nb(struct control_msg_out *cm, struct conn *rconn);
566 extern void send_conndata(struct control_msg_out *cm, struct neighbor *nb,
567 __u32 connid, __u32 seqno, char *data_orig, char *data,
568 __u32 datalen);
570 /* cpacket_parse.c */
571 extern void parse(struct conn *rconn);
573 /* snd.c */
574 extern void retransmit_timerfunc(unsigned long arg);
576 extern struct sk_buff *create_packet_conn(struct conn *target, int size,
577 gfp_t alloc_flags);
579 extern struct sk_buff *create_packet_kernel(struct neighbor *nb, int size,
580 gfp_t alloc_flags);
582 extern void send_conn_flushdata(struct conn *rconn, char *data, __u32 datalen);
584 extern void send_packet(struct sk_buff *skb, struct neighbor *nb);
586 extern void ack_received(struct neighbor *nb, __u32 conn_id, __u32 seqno,
587 int nack);
589 extern void flush_out(struct conn *rconn);
591 extern int __init cor_snd_init(void);
593 /* forward.c */
594 extern void databuf_pull(struct data_buf *data, char *dst, int len);
596 extern size_t databuf_pulluser(struct conn *sconn, struct msghdr *msg);
598 extern void databuf_ack(struct data_buf *buf, __u64 pos);
600 extern void databuf_ackread(struct data_buf *buf);
602 extern int databuf_maypush(struct data_buf *buf);
604 extern void databuf_free(struct data_buf *data);
606 extern void databuf_init(struct data_buf *data);
608 extern int receive_userbuf(struct conn *rconn, struct msghdr *msg);
610 extern void receive_buf(struct conn *rconn, char *buf, int len);
612 extern int receive_skb(struct conn *rconn, struct sk_buff *skb);
614 extern void wake_sender(struct conn *rconn);
616 extern void forward_init(void);
619 static inline struct skb_procstate *skb_pstate(struct sk_buff *skb)
621 return (struct skb_procstate *) &(skb->cb[0]);
624 static inline struct sk_buff *skb_from_pstate(struct skb_procstate *ps)
626 return (struct sk_buff *) (((char *)ps) - offsetof(struct sk_buff,cb));
630 static inline __u32 mss(struct neighbor *nb)
632 return nb->dev->mtu - LL_RESERVED_SPACE(nb->dev) - 17;
636 static inline void put_u64(char *dst, __u64 value, int convbo)
638 char *p_value = (char *) &value;
640 if (convbo)
641 value = cpu_to_be64(value);
643 dst[0] = p_value[0];
644 dst[1] = p_value[1];
645 dst[2] = p_value[2];
646 dst[3] = p_value[3];
647 dst[4] = p_value[4];
648 dst[5] = p_value[5];
649 dst[6] = p_value[6];
650 dst[7] = p_value[7];
653 static inline void put_u32(char *dst, __u32 value, int convbo)
655 char *p_value = (char *) &value;
657 if (convbo)
658 value = cpu_to_be32(value);
660 dst[0] = p_value[0];
661 dst[1] = p_value[1];
662 dst[2] = p_value[2];
663 dst[3] = p_value[3];
666 static inline void put_u16(char *dst, __u16 value, int convbo)
668 char *p_value = (char *) &value;
670 if (convbo)
671 value = cpu_to_be16(value);
673 dst[0] = p_value[0];
674 dst[1] = p_value[1];
677 static inline char *cor_pull_skb(struct sk_buff *skb, unsigned int len)
679 char *ptr = skb_pull(skb, len);
681 if(ptr == 0)
682 return 0;
684 return ptr - len;