2 * INET An implementation of the TCP/IP protocol suite for the LINUX
3 * operating system. INET is implemented using the BSD Socket
4 * interface as the means of communication with the user level.
6 * The options processing module for ip.c
8 * Authors: A.N.Kuznetsov
12 #include <linux/capability.h>
13 #include <linux/module.h>
14 #include <linux/slab.h>
15 #include <linux/types.h>
16 #include <asm/uaccess.h>
17 #include <linux/skbuff.h>
19 #include <linux/icmp.h>
20 #include <linux/netdevice.h>
21 #include <linux/rtnetlink.h>
25 #include <net/route.h>
26 #include <net/cipso_ipv4.h>
29 * Write options to the IP header; record the destination address in
30 * the source route option, and the address of the outgoing interface
31 * (we should already know it, so this function may only be
32 * called after the routing decision) and the timestamp,
33 * if we originate this datagram.
35 * daddr is the real destination address; the next hop is recorded in the IP header.
36 * There is no saddr parameter: the address of the outgoing interface is written by ip_rt_get_source() using rt.
39 void ip_options_build(struct sk_buff
* skb
, struct ip_options
* opt
,
40 __be32 daddr
, struct rtable
*rt
, int is_frag
)
42 unsigned char *iph
= skb_network_header(skb
);
44 memcpy(&(IPCB(skb
)->opt
), opt
, sizeof(struct ip_options
));
45 memcpy(iph
+sizeof(struct iphdr
), opt
->__data
, opt
->optlen
);
46 opt
= &(IPCB(skb
)->opt
);
49 memcpy(iph
+opt
->srr
+iph
[opt
->srr
+1]-4, &daddr
, 4);
53 ip_rt_get_source(iph
+opt
->rr
+iph
[opt
->rr
+2]-5, rt
);
55 ip_rt_get_source(iph
+opt
->ts
+iph
[opt
->ts
+2]-9, rt
);
56 if (opt
->ts_needtime
) {
60 midtime
= htonl((tv
.tv_sec
% 86400) * MSEC_PER_SEC
+ tv
.tv_nsec
/ NSEC_PER_MSEC
);
61 memcpy(iph
+opt
->ts
+iph
[opt
->ts
+2]-5, &midtime
, 4);
66 memset(iph
+opt
->rr
, IPOPT_NOP
, iph
[opt
->rr
+1]);
71 memset(iph
+opt
->ts
, IPOPT_NOP
, iph
[opt
->ts
+1]);
73 opt
->ts_needaddr
= opt
->ts_needtime
= 0;
78 * Given that skb carries the received options (sopt is IPCB(skb)->opt),
79 * build in dopt a compiled option set appropriate for answering,
80 * i.e. invert the SRR option, copy the others,
81 * and reserve room in the RR/TS options.
83 * NOTE: dopt must not point into skb; dopt is zeroed before the options in skb are read.
86 int ip_options_echo(struct ip_options
* dopt
, struct sk_buff
* skb
)
88 struct ip_options
*sopt
;
89 unsigned char *sptr
, *dptr
;
94 memset(dopt
, 0, sizeof(struct ip_options
));
96 sopt
= &(IPCB(skb
)->opt
);
98 if (sopt
->optlen
== 0) {
103 sptr
= skb_network_header(skb
);
106 daddr
= skb_rtable(skb
)->rt_spec_dst
;
109 optlen
= sptr
[sopt
->rr
+1];
110 soffset
= sptr
[sopt
->rr
+2];
111 dopt
->rr
= dopt
->optlen
+ sizeof(struct iphdr
);
112 memcpy(dptr
, sptr
+sopt
->rr
, optlen
);
113 if (sopt
->rr_needaddr
&& soffset
<= optlen
) {
114 if (soffset
+ 3 > optlen
)
116 dptr
[2] = soffset
+ 4;
117 dopt
->rr_needaddr
= 1;
120 dopt
->optlen
+= optlen
;
123 optlen
= sptr
[sopt
->ts
+1];
124 soffset
= sptr
[sopt
->ts
+2];
125 dopt
->ts
= dopt
->optlen
+ sizeof(struct iphdr
);
126 memcpy(dptr
, sptr
+sopt
->ts
, optlen
);
127 if (soffset
<= optlen
) {
128 if (sopt
->ts_needaddr
) {
129 if (soffset
+ 3 > optlen
)
131 dopt
->ts_needaddr
= 1;
134 if (sopt
->ts_needtime
) {
135 if (soffset
+ 3 > optlen
)
137 if ((dptr
[3]&0xF) != IPOPT_TS_PRESPEC
) {
138 dopt
->ts_needtime
= 1;
141 dopt
->ts_needtime
= 0;
143 if (soffset
+ 8 <= optlen
) {
146 memcpy(&addr
, sptr
+soffset
-1, 4);
147 if (inet_addr_type(dev_net(skb_dst(skb
)->dev
), addr
) != RTN_LOCAL
) {
148 dopt
->ts_needtime
= 1;
157 dopt
->optlen
+= optlen
;
160 unsigned char * start
= sptr
+sopt
->srr
;
166 if (soffset
> optlen
)
167 soffset
= optlen
+ 1;
170 memcpy(&faddr
, &start
[soffset
-1], 4);
171 for (soffset
-=4, doffset
=4; soffset
> 3; soffset
-=4, doffset
+=4)
172 memcpy(&dptr
[doffset
-1], &start
[soffset
-1], 4);
174 * RFC 1812 requires us to fix illegal source routes.
176 if (memcmp(&ip_hdr(skb
)->saddr
,
177 &start
[soffset
+ 3], 4) == 0)
181 memcpy(&start
[doffset
-1], &daddr
, 4);
187 dopt
->srr
= dopt
->optlen
+ sizeof(struct iphdr
);
188 dopt
->optlen
+= doffset
+3;
189 dopt
->is_strictroute
= sopt
->is_strictroute
;
193 optlen
= sptr
[sopt
->cipso
+1];
194 dopt
->cipso
= dopt
->optlen
+sizeof(struct iphdr
);
195 memcpy(dptr
, sptr
+sopt
->cipso
, optlen
);
197 dopt
->optlen
+= optlen
;
199 while (dopt
->optlen
& 3) {
207 * Options "fragmenting": just fill the options that are not
208 * allowed in fragments with NOOPs.
209 * Simple and stupid 8), but the most efficient way.
212 void ip_options_fragment(struct sk_buff
* skb
)
214 unsigned char *optptr
= skb_network_header(skb
) + sizeof(struct iphdr
);
215 struct ip_options
* opt
= &(IPCB(skb
)->opt
);
229 if (optlen
<2 || optlen
>l
)
231 if (!IPOPT_COPIED(*optptr
))
232 memset(optptr
, IPOPT_NOOP
, optlen
);
238 opt
->rr_needaddr
= 0;
239 opt
->ts_needaddr
= 0;
240 opt
->ts_needtime
= 0;
244 * Verify options and fill in the pointers in struct ip_options.
245 * The caller should clear *opt and set opt->__data.
246 * If opt == NULL, then skb->data should point to the IP header.
249 int ip_options_compile(struct net
*net
,
250 struct ip_options
* opt
, struct sk_buff
* skb
)
254 unsigned char * optptr
;
256 unsigned char * pp_ptr
= NULL
;
257 struct rtable
*rt
= NULL
;
260 rt
= skb_rtable(skb
);
261 optptr
= (unsigned char *)&(ip_hdr(skb
)[1]);
263 optptr
= opt
->__data
;
264 iph
= optptr
- sizeof(struct iphdr
);
266 for (l
= opt
->optlen
; l
> 0; ) {
269 for (optptr
++, l
--; l
>0; optptr
++, l
--) {
270 if (*optptr
!= IPOPT_END
) {
282 if (optlen
<2 || optlen
>l
) {
297 /* NB: cf RFC-1812 5.2.4.1 */
303 if (optptr
[2] != 4 || optlen
< 7 || ((optlen
-3) & 3)) {
307 memcpy(&opt
->faddr
, &optptr
[3], 4);
309 memmove(&optptr
[3], &optptr
[7], optlen
-7);
311 opt
->is_strictroute
= (optptr
[0] == IPOPT_SSRR
);
312 opt
->srr
= optptr
- iph
;
327 if (optptr
[2] <= optlen
) {
328 if (optptr
[2]+3 > optlen
) {
333 memcpy(&optptr
[optptr
[2]-1], &rt
->rt_spec_dst
, 4);
337 opt
->rr_needaddr
= 1;
339 opt
->rr
= optptr
- iph
;
341 case IPOPT_TIMESTAMP
:
354 if (optptr
[2] <= optlen
) {
355 __be32
*timeptr
= NULL
;
356 if (optptr
[2]+3 > optptr
[1]) {
360 switch (optptr
[3]&0xF) {
361 case IPOPT_TS_TSONLY
:
362 opt
->ts
= optptr
- iph
;
364 timeptr
= (__be32
*)&optptr
[optptr
[2]-1];
365 opt
->ts_needtime
= 1;
368 case IPOPT_TS_TSANDADDR
:
369 if (optptr
[2]+7 > optptr
[1]) {
373 opt
->ts
= optptr
- iph
;
375 memcpy(&optptr
[optptr
[2]-1], &rt
->rt_spec_dst
, 4);
376 timeptr
= (__be32
*)&optptr
[optptr
[2]+3];
378 opt
->ts_needaddr
= 1;
379 opt
->ts_needtime
= 1;
382 case IPOPT_TS_PRESPEC
:
383 if (optptr
[2]+7 > optptr
[1]) {
387 opt
->ts
= optptr
- iph
;
390 memcpy(&addr
, &optptr
[optptr
[2]-1], 4);
391 if (inet_addr_type(net
, addr
) == RTN_UNICAST
)
394 timeptr
= (__be32
*)&optptr
[optptr
[2]+3];
396 opt
->ts_needtime
= 1;
400 if (!skb
&& !capable(CAP_NET_RAW
)) {
410 midtime
= htonl((tv
.tv_sec
% 86400) * MSEC_PER_SEC
+ tv
.tv_nsec
/ NSEC_PER_MSEC
);
411 memcpy(timeptr
, &midtime
, sizeof(__be32
));
415 unsigned overflow
= optptr
[3]>>4;
416 if (overflow
== 15) {
420 opt
->ts
= optptr
- iph
;
422 optptr
[3] = (optptr
[3]&0xF)|((overflow
+1)<<4);
432 if (optptr
[2] == 0 && optptr
[3] == 0)
433 opt
->router_alert
= optptr
- iph
;
436 if ((!skb
&& !capable(CAP_NET_RAW
)) || opt
->cipso
) {
440 opt
->cipso
= optptr
- iph
;
441 if (cipso_v4_validate(skb
, &optptr
)) {
449 if (!skb
&& !capable(CAP_NET_RAW
)) {
465 icmp_send(skb
, ICMP_PARAMETERPROB
, 0, htonl((pp_ptr
-iph
)<<24));
472 * Undo all the changes done by ip_options_compile().
475 void ip_options_undo(struct ip_options
* opt
)
478 unsigned char * optptr
= opt
->__data
+opt
->srr
-sizeof(struct iphdr
);
479 memmove(optptr
+7, optptr
+3, optptr
[1]-7);
480 memcpy(optptr
+3, &opt
->faddr
, 4);
482 if (opt
->rr_needaddr
) {
483 unsigned char * optptr
= opt
->__data
+opt
->rr
-sizeof(struct iphdr
);
485 memset(&optptr
[optptr
[2]-1], 0, 4);
488 unsigned char * optptr
= opt
->__data
+opt
->ts
-sizeof(struct iphdr
);
489 if (opt
->ts_needtime
) {
491 memset(&optptr
[optptr
[2]-1], 0, 4);
492 if ((optptr
[3]&0xF) == IPOPT_TS_PRESPEC
)
495 if (opt
->ts_needaddr
) {
497 memset(&optptr
[optptr
[2]-1], 0, 4);
502 static struct ip_options
*ip_options_get_alloc(const int optlen
)
504 return kzalloc(sizeof(struct ip_options
) + ((optlen
+ 3) & ~3),
508 static int ip_options_get_finish(struct net
*net
, struct ip_options
**optp
,
509 struct ip_options
*opt
, int optlen
)
512 opt
->__data
[optlen
++] = IPOPT_END
;
513 opt
->optlen
= optlen
;
514 if (optlen
&& ip_options_compile(net
, opt
, NULL
)) {
523 int ip_options_get_from_user(struct net
*net
, struct ip_options
**optp
,
524 unsigned char __user
*data
, int optlen
)
526 struct ip_options
*opt
= ip_options_get_alloc(optlen
);
530 if (optlen
&& copy_from_user(opt
->__data
, data
, optlen
)) {
534 return ip_options_get_finish(net
, optp
, opt
, optlen
);
537 int ip_options_get(struct net
*net
, struct ip_options
**optp
,
538 unsigned char *data
, int optlen
)
540 struct ip_options
*opt
= ip_options_get_alloc(optlen
);
545 memcpy(opt
->__data
, data
, optlen
);
546 return ip_options_get_finish(net
, optp
, opt
, optlen
);
549 void ip_forward_options(struct sk_buff
*skb
)
551 struct ip_options
* opt
= &(IPCB(skb
)->opt
);
552 unsigned char * optptr
;
553 struct rtable
*rt
= skb_rtable(skb
);
554 unsigned char *raw
= skb_network_header(skb
);
556 if (opt
->rr_needaddr
) {
557 optptr
= (unsigned char *)raw
+ opt
->rr
;
558 ip_rt_get_source(&optptr
[optptr
[2]-5], rt
);
561 if (opt
->srr_is_hit
) {
562 int srrptr
, srrspace
;
564 optptr
= raw
+ opt
->srr
;
566 for ( srrptr
=optptr
[2], srrspace
= optptr
[1];
570 if (srrptr
+ 3 > srrspace
)
572 if (memcmp(&rt
->rt_dst
, &optptr
[srrptr
-1], 4) == 0)
575 if (srrptr
+ 3 <= srrspace
) {
577 ip_rt_get_source(&optptr
[srrptr
-1], rt
);
578 ip_hdr(skb
)->daddr
= rt
->rt_dst
;
579 optptr
[2] = srrptr
+4;
580 } else if (net_ratelimit())
581 printk(KERN_CRIT
"ip_forward(): Argh! Destination lost!\n");
582 if (opt
->ts_needaddr
) {
583 optptr
= raw
+ opt
->ts
;
584 ip_rt_get_source(&optptr
[optptr
[2]-9], rt
);
588 if (opt
->is_changed
) {
590 ip_send_check(ip_hdr(skb
));
594 int ip_options_rcv_srr(struct sk_buff
*skb
)
596 struct ip_options
*opt
= &(IPCB(skb
)->opt
);
597 int srrspace
, srrptr
;
599 struct iphdr
*iph
= ip_hdr(skb
);
600 unsigned char *optptr
= skb_network_header(skb
) + opt
->srr
;
601 struct rtable
*rt
= skb_rtable(skb
);
603 unsigned long orefdst
;
609 if (skb
->pkt_type
!= PACKET_HOST
)
611 if (rt
->rt_type
== RTN_UNICAST
) {
612 if (!opt
->is_strictroute
)
614 icmp_send(skb
, ICMP_PARAMETERPROB
, 0, htonl(16<<24));
617 if (rt
->rt_type
!= RTN_LOCAL
)
620 for (srrptr
=optptr
[2], srrspace
= optptr
[1]; srrptr
<= srrspace
; srrptr
+= 4) {
621 if (srrptr
+ 3 > srrspace
) {
622 icmp_send(skb
, ICMP_PARAMETERPROB
, 0, htonl((opt
->srr
+2)<<24));
625 memcpy(&nexthop
, &optptr
[srrptr
-1], 4);
627 orefdst
= skb
->_skb_refdst
;
628 skb_dst_set(skb
, NULL
);
629 err
= ip_route_input(skb
, nexthop
, iph
->saddr
, iph
->tos
, skb
->dev
);
630 rt2
= skb_rtable(skb
);
631 if (err
|| (rt2
->rt_type
!= RTN_UNICAST
&& rt2
->rt_type
!= RTN_LOCAL
)) {
633 skb
->_skb_refdst
= orefdst
;
636 refdst_drop(orefdst
);
637 if (rt2
->rt_type
!= RTN_LOCAL
)
639 /* Superfast 8) loopback forward */
640 memcpy(&iph
->daddr
, &optptr
[srrptr
-1], 4);
643 if (srrptr
<= srrspace
) {