2 * INET An implementation of the TCP/IP protocol suite for the LINUX
3 * operating system. INET is implemented using the BSD Socket
4 * interface as the means of communication with the user level.
6 * The options processing module for ip.c
8 * Version: $Id: ip_options.c,v 1.21 2001/09/01 00:31:50 davem Exp $
10 * Authors: A.N.Kuznetsov
14 #include <linux/capability.h>
15 #include <linux/module.h>
16 #include <linux/types.h>
17 #include <asm/uaccess.h>
18 #include <linux/skbuff.h>
20 #include <linux/icmp.h>
21 #include <linux/netdevice.h>
22 #include <linux/rtnetlink.h>
26 #include <net/route.h>
27 #include <net/cipso_ipv4.h>
30 * Write options to IP header, record destination address to
31 * source route option, address of outgoing interface
32 * (we should already know it, so this function may only be
33 * called after the routing decision) and timestamp,
34 * if we originate this datagram.
36 * daddr is real destination address, next hop is recorded in IP header.
37 * saddr is address of outgoing interface.
40 void ip_options_build(struct sk_buff
* skb
, struct ip_options
* opt
,
41 __be32 daddr
, struct rtable
*rt
, int is_frag
)
43 unsigned char * iph
= skb
->nh
.raw
;
45 memcpy(&(IPCB(skb
)->opt
), opt
, sizeof(struct ip_options
));
46 memcpy(iph
+sizeof(struct iphdr
), opt
->__data
, opt
->optlen
);
47 opt
= &(IPCB(skb
)->opt
);
51 memcpy(iph
+opt
->srr
+iph
[opt
->srr
+1]-4, &daddr
, 4);
55 ip_rt_get_source(iph
+opt
->rr
+iph
[opt
->rr
+2]-5, rt
);
57 ip_rt_get_source(iph
+opt
->ts
+iph
[opt
->ts
+2]-9, rt
);
58 if (opt
->ts_needtime
) {
62 midtime
= htonl((tv
.tv_sec
% 86400) * 1000 + tv
.tv_usec
/ 1000);
63 memcpy(iph
+opt
->ts
+iph
[opt
->ts
+2]-5, &midtime
, 4);
68 memset(iph
+opt
->rr
, IPOPT_NOP
, iph
[opt
->rr
+1]);
73 memset(iph
+opt
->ts
, IPOPT_NOP
, iph
[opt
->ts
+1]);
75 opt
->ts_needaddr
= opt
->ts_needtime
= 0;
80 * Provided skb carries the received options (IPCB(skb)->opt),
81 * build in dopt a compiled option set appropriate for answering,
82 * i.e. invert the SRR option, copy the others,
83 * and grab room in the RR/TS options.
85 * NOTE: dopt cannot point to skb.
88 int ip_options_echo(struct ip_options
* dopt
, struct sk_buff
* skb
)
90 struct ip_options
*sopt
;
91 unsigned char *sptr
, *dptr
;
96 memset(dopt
, 0, sizeof(struct ip_options
));
100 sopt
= &(IPCB(skb
)->opt
);
102 if (sopt
->optlen
== 0) {
111 daddr
= ((struct rtable
*)skb
->dst
)->rt_spec_dst
;
113 daddr
= skb
->nh
.iph
->daddr
;
116 optlen
= sptr
[sopt
->rr
+1];
117 soffset
= sptr
[sopt
->rr
+2];
118 dopt
->rr
= dopt
->optlen
+ sizeof(struct iphdr
);
119 memcpy(dptr
, sptr
+sopt
->rr
, optlen
);
120 if (sopt
->rr_needaddr
&& soffset
<= optlen
) {
121 if (soffset
+ 3 > optlen
)
123 dptr
[2] = soffset
+ 4;
124 dopt
->rr_needaddr
= 1;
127 dopt
->optlen
+= optlen
;
130 optlen
= sptr
[sopt
->ts
+1];
131 soffset
= sptr
[sopt
->ts
+2];
132 dopt
->ts
= dopt
->optlen
+ sizeof(struct iphdr
);
133 memcpy(dptr
, sptr
+sopt
->ts
, optlen
);
134 if (soffset
<= optlen
) {
135 if (sopt
->ts_needaddr
) {
136 if (soffset
+ 3 > optlen
)
138 dopt
->ts_needaddr
= 1;
141 if (sopt
->ts_needtime
) {
142 if (soffset
+ 3 > optlen
)
144 if ((dptr
[3]&0xF) != IPOPT_TS_PRESPEC
) {
145 dopt
->ts_needtime
= 1;
148 dopt
->ts_needtime
= 0;
150 if (soffset
+ 8 <= optlen
) {
153 memcpy(&addr
, sptr
+soffset
-1, 4);
154 if (inet_addr_type(addr
) != RTN_LOCAL
) {
155 dopt
->ts_needtime
= 1;
164 dopt
->optlen
+= optlen
;
167 unsigned char * start
= sptr
+sopt
->srr
;
173 if (soffset
> optlen
)
174 soffset
= optlen
+ 1;
177 memcpy(&faddr
, &start
[soffset
-1], 4);
178 for (soffset
-=4, doffset
=4; soffset
> 3; soffset
-=4, doffset
+=4)
179 memcpy(&dptr
[doffset
-1], &start
[soffset
-1], 4);
181 * RFC 1812 requires us to fix illegal source routes.
183 if (memcmp(&skb
->nh
.iph
->saddr
, &start
[soffset
+3], 4) == 0)
187 memcpy(&start
[doffset
-1], &daddr
, 4);
193 dopt
->srr
= dopt
->optlen
+ sizeof(struct iphdr
);
194 dopt
->optlen
+= doffset
+3;
195 dopt
->is_strictroute
= sopt
->is_strictroute
;
199 optlen
= sptr
[sopt
->cipso
+1];
200 dopt
->cipso
= dopt
->optlen
+sizeof(struct iphdr
);
201 memcpy(dptr
, sptr
+sopt
->cipso
, optlen
);
203 dopt
->optlen
+= optlen
;
205 while (dopt
->optlen
& 3) {
213 * Options "fragmenting", just fill options not
214 * allowed in fragments with NOOPs.
215 * Simple and stupid 8), but the most efficient way.
218 void ip_options_fragment(struct sk_buff
* skb
)
220 unsigned char * optptr
= skb
->nh
.raw
+ sizeof(struct iphdr
);
221 struct ip_options
* opt
= &(IPCB(skb
)->opt
);
235 if (optlen
<2 || optlen
>l
)
237 if (!IPOPT_COPIED(*optptr
))
238 memset(optptr
, IPOPT_NOOP
, optlen
);
244 opt
->rr_needaddr
= 0;
245 opt
->ts_needaddr
= 0;
246 opt
->ts_needtime
= 0;
251 * Verify options and fill pointers in struct options.
252 * Caller should clear *opt and fill in opt->__data.
253 * If opt == NULL, then skb->data should point to IP header.
256 int ip_options_compile(struct ip_options
* opt
, struct sk_buff
* skb
)
260 unsigned char * optptr
;
262 unsigned char * pp_ptr
= NULL
;
263 struct rtable
*rt
= skb
? (struct rtable
*)skb
->dst
: NULL
;
266 opt
= &(IPCB(skb
)->opt
);
268 opt
->optlen
= ((struct iphdr
*)iph
)->ihl
*4 - sizeof(struct iphdr
);
269 optptr
= iph
+ sizeof(struct iphdr
);
272 optptr
= opt
->is_data
? opt
->__data
: (unsigned char*)&(skb
->nh
.iph
[1]);
273 iph
= optptr
- sizeof(struct iphdr
);
276 for (l
= opt
->optlen
; l
> 0; ) {
279 for (optptr
++, l
--; l
>0; optptr
++, l
--) {
280 if (*optptr
!= IPOPT_END
) {
292 if (optlen
<2 || optlen
>l
) {
307 /* NB: cf RFC-1812 5.2.4.1 */
313 if (optptr
[2] != 4 || optlen
< 7 || ((optlen
-3) & 3)) {
317 memcpy(&opt
->faddr
, &optptr
[3], 4);
319 memmove(&optptr
[3], &optptr
[7], optlen
-7);
321 opt
->is_strictroute
= (optptr
[0] == IPOPT_SSRR
);
322 opt
->srr
= optptr
- iph
;
337 if (optptr
[2] <= optlen
) {
338 if (optptr
[2]+3 > optlen
) {
343 memcpy(&optptr
[optptr
[2]-1], &rt
->rt_spec_dst
, 4);
347 opt
->rr_needaddr
= 1;
349 opt
->rr
= optptr
- iph
;
351 case IPOPT_TIMESTAMP
:
364 if (optptr
[2] <= optlen
) {
365 __be32
*timeptr
= NULL
;
366 if (optptr
[2]+3 > optptr
[1]) {
370 switch (optptr
[3]&0xF) {
371 case IPOPT_TS_TSONLY
:
372 opt
->ts
= optptr
- iph
;
374 timeptr
= (__be32
*)&optptr
[optptr
[2]-1];
375 opt
->ts_needtime
= 1;
378 case IPOPT_TS_TSANDADDR
:
379 if (optptr
[2]+7 > optptr
[1]) {
383 opt
->ts
= optptr
- iph
;
385 memcpy(&optptr
[optptr
[2]-1], &rt
->rt_spec_dst
, 4);
386 timeptr
= (__be32
*)&optptr
[optptr
[2]+3];
388 opt
->ts_needaddr
= 1;
389 opt
->ts_needtime
= 1;
392 case IPOPT_TS_PRESPEC
:
393 if (optptr
[2]+7 > optptr
[1]) {
397 opt
->ts
= optptr
- iph
;
400 memcpy(&addr
, &optptr
[optptr
[2]-1], 4);
401 if (inet_addr_type(addr
) == RTN_UNICAST
)
404 timeptr
= (__be32
*)&optptr
[optptr
[2]+3];
406 opt
->ts_needtime
= 1;
410 if (!skb
&& !capable(CAP_NET_RAW
)) {
419 do_gettimeofday(&tv
);
420 midtime
= htonl((tv
.tv_sec
% 86400) * 1000 + tv
.tv_usec
/ 1000);
421 memcpy(timeptr
, &midtime
, sizeof(__be32
));
425 unsigned overflow
= optptr
[3]>>4;
426 if (overflow
== 15) {
430 opt
->ts
= optptr
- iph
;
432 optptr
[3] = (optptr
[3]&0xF)|((overflow
+1)<<4);
442 if (optptr
[2] == 0 && optptr
[3] == 0)
443 opt
->router_alert
= optptr
- iph
;
446 if ((!skb
&& !capable(CAP_NET_RAW
)) || opt
->cipso
) {
450 opt
->cipso
= optptr
- iph
;
451 if (cipso_v4_validate(&optptr
)) {
459 if (!skb
&& !capable(CAP_NET_RAW
)) {
475 icmp_send(skb
, ICMP_PARAMETERPROB
, 0, htonl((pp_ptr
-iph
)<<24));
482 * Undo all the changes done by ip_options_compile().
485 void ip_options_undo(struct ip_options
* opt
)
488 unsigned char * optptr
= opt
->__data
+opt
->srr
-sizeof(struct iphdr
);
489 memmove(optptr
+7, optptr
+3, optptr
[1]-7);
490 memcpy(optptr
+3, &opt
->faddr
, 4);
492 if (opt
->rr_needaddr
) {
493 unsigned char * optptr
= opt
->__data
+opt
->rr
-sizeof(struct iphdr
);
495 memset(&optptr
[optptr
[2]-1], 0, 4);
498 unsigned char * optptr
= opt
->__data
+opt
->ts
-sizeof(struct iphdr
);
499 if (opt
->ts_needtime
) {
501 memset(&optptr
[optptr
[2]-1], 0, 4);
502 if ((optptr
[3]&0xF) == IPOPT_TS_PRESPEC
)
505 if (opt
->ts_needaddr
) {
507 memset(&optptr
[optptr
[2]-1], 0, 4);
512 static struct ip_options
*ip_options_get_alloc(const int optlen
)
514 struct ip_options
*opt
= kmalloc(sizeof(*opt
) + ((optlen
+ 3) & ~3),
517 memset(opt
, 0, sizeof(*opt
));
521 static int ip_options_get_finish(struct ip_options
**optp
,
522 struct ip_options
*opt
, int optlen
)
525 opt
->__data
[optlen
++] = IPOPT_END
;
526 opt
->optlen
= optlen
;
528 if (optlen
&& ip_options_compile(opt
, NULL
)) {
537 int ip_options_get_from_user(struct ip_options
**optp
, unsigned char __user
*data
, int optlen
)
539 struct ip_options
*opt
= ip_options_get_alloc(optlen
);
543 if (optlen
&& copy_from_user(opt
->__data
, data
, optlen
)) {
547 return ip_options_get_finish(optp
, opt
, optlen
);
550 int ip_options_get(struct ip_options
**optp
, unsigned char *data
, int optlen
)
552 struct ip_options
*opt
= ip_options_get_alloc(optlen
);
557 memcpy(opt
->__data
, data
, optlen
);
558 return ip_options_get_finish(optp
, opt
, optlen
);
561 void ip_forward_options(struct sk_buff
*skb
)
563 struct ip_options
* opt
= &(IPCB(skb
)->opt
);
564 unsigned char * optptr
;
565 struct rtable
*rt
= (struct rtable
*)skb
->dst
;
566 unsigned char *raw
= skb
->nh
.raw
;
568 if (opt
->rr_needaddr
) {
569 optptr
= (unsigned char *)raw
+ opt
->rr
;
570 ip_rt_get_source(&optptr
[optptr
[2]-5], rt
);
573 if (opt
->srr_is_hit
) {
574 int srrptr
, srrspace
;
576 optptr
= raw
+ opt
->srr
;
578 for ( srrptr
=optptr
[2], srrspace
= optptr
[1];
582 if (srrptr
+ 3 > srrspace
)
584 if (memcmp(&rt
->rt_dst
, &optptr
[srrptr
-1], 4) == 0)
587 if (srrptr
+ 3 <= srrspace
) {
589 ip_rt_get_source(&optptr
[srrptr
-1], rt
);
590 skb
->nh
.iph
->daddr
= rt
->rt_dst
;
591 optptr
[2] = srrptr
+4;
592 } else if (net_ratelimit())
593 printk(KERN_CRIT
"ip_forward(): Argh! Destination lost!\n");
594 if (opt
->ts_needaddr
) {
595 optptr
= raw
+ opt
->ts
;
596 ip_rt_get_source(&optptr
[optptr
[2]-9], rt
);
600 if (opt
->is_changed
) {
602 ip_send_check(skb
->nh
.iph
);
606 int ip_options_rcv_srr(struct sk_buff
*skb
)
608 struct ip_options
*opt
= &(IPCB(skb
)->opt
);
609 int srrspace
, srrptr
;
611 struct iphdr
*iph
= skb
->nh
.iph
;
612 unsigned char * optptr
= skb
->nh
.raw
+ opt
->srr
;
613 struct rtable
*rt
= (struct rtable
*)skb
->dst
;
620 if (skb
->pkt_type
!= PACKET_HOST
)
622 if (rt
->rt_type
== RTN_UNICAST
) {
623 if (!opt
->is_strictroute
)
625 icmp_send(skb
, ICMP_PARAMETERPROB
, 0, htonl(16<<24));
628 if (rt
->rt_type
!= RTN_LOCAL
)
631 for (srrptr
=optptr
[2], srrspace
= optptr
[1]; srrptr
<= srrspace
; srrptr
+= 4) {
632 if (srrptr
+ 3 > srrspace
) {
633 icmp_send(skb
, ICMP_PARAMETERPROB
, 0, htonl((opt
->srr
+2)<<24));
636 memcpy(&nexthop
, &optptr
[srrptr
-1], 4);
638 rt
= (struct rtable
*)skb
->dst
;
640 err
= ip_route_input(skb
, nexthop
, iph
->saddr
, iph
->tos
, skb
->dev
);
641 rt2
= (struct rtable
*)skb
->dst
;
642 if (err
|| (rt2
->rt_type
!= RTN_UNICAST
&& rt2
->rt_type
!= RTN_LOCAL
)) {
644 skb
->dst
= &rt
->u
.dst
;
648 if (rt2
->rt_type
!= RTN_LOCAL
)
650 /* Superfast 8) loopback forward */
651 memcpy(&iph
->daddr
, &optptr
[srrptr
-1], 4);
654 if (srrptr
<= srrspace
) {