2 * Linux INET6 implementation
5 * Pedro Roque <roque@di.fc.ul.pt>
7 * This program is free software; you can redistribute it and/or
8 * modify it under the terms of the GNU General Public License
9 * as published by the Free Software Foundation; either version
10 * 2 of the License, or (at your option) any later version.
16 #include <linux/ipv6.h>
17 #include <linux/hardirq.h>
18 #include <net/if_inet6.h>
19 #include <net/ndisc.h>
/* Length constant named after RFC 2133 — presumably a byte count; confirm against users. */
#define SIN6_LEN_RFC2133	24

/* NOTE(review): name suggests the maximum IPv6 payload length (16-bit limit). */
#define IPV6_MAXPLEN		65535
28 * NextHeader field of IPv6 header
#define NEXTHDR_HOP		0	/* Hop-by-hop option header. */
#define NEXTHDR_TCP		6	/* TCP segment. */
#define NEXTHDR_UDP		17	/* UDP message. */
#define NEXTHDR_IPV6		41	/* IPv6 in IPv6 */
#define NEXTHDR_ROUTING		43	/* Routing header. */
#define NEXTHDR_FRAGMENT	44	/* Fragmentation/reassembly header. */
#define NEXTHDR_ESP		50	/* Encapsulating security payload. */
#define NEXTHDR_AUTH		51	/* Authentication header. */
#define NEXTHDR_ICMP		58	/* ICMP for IPv6. */
#define NEXTHDR_NONE		59	/* No next header */
#define NEXTHDR_DEST		60	/* Destination options header. */
#define NEXTHDR_MOBILITY	135	/* Mobility header. */

#define NEXTHDR_MAX		255	/* Upper bound of the NEXTHDR_* value space. */
/* Default hop counts; the multicast default is 1. */
#define IPV6_DEFAULT_HOPLIMIT	64
#define IPV6_DEFAULT_MCASTHOPS	1
54 * type - unicast | multicast
55 * scope - local | site | global
/* Address-type flag bits (all unsigned constants). */
#define IPV6_ADDR_ANY		0x0000U

#define IPV6_ADDR_UNICAST	0x0001U
#define IPV6_ADDR_MULTICAST	0x0002U

#define IPV6_ADDR_LOOPBACK	0x0010U
#define IPV6_ADDR_LINKLOCAL	0x0020U
#define IPV6_ADDR_SITELOCAL	0x0040U

#define IPV6_ADDR_COMPATv4	0x0080U

/* Covers exactly the four bits 0x0010..0x0080 defined above. */
#define IPV6_ADDR_SCOPE_MASK	0x00f0U

#define IPV6_ADDR_MAPPED	0x1000U
/* Extract the low nibble of the second address byte of @a. */
#define IPV6_ADDR_MC_SCOPE(a)	\
	((a)->s6_addr[1] & 0x0f)	/* nonstandard */
#define __IPV6_ADDR_SCOPE_INVALID	-1

/* Values comparable against IPV6_ADDR_MC_SCOPE(). */
#define IPV6_ADDR_SCOPE_NODELOCAL	0x01
#define IPV6_ADDR_SCOPE_LINKLOCAL	0x02
#define IPV6_ADDR_SCOPE_SITELOCAL	0x05
#define IPV6_ADDR_SCOPE_ORGLOCAL	0x08
#define IPV6_ADDR_SCOPE_GLOBAL		0x0e
/*
 * Flag tests on the high nibble of the second address byte of @a.
 * Each yields the masked bit (non-zero when set), not a normalised 0/1.
 */
#define IPV6_ADDR_MC_FLAG_TRANSIENT(a)	\
	((a)->s6_addr[1] & 0x10)
#define IPV6_ADDR_MC_FLAG_PREFIX(a)	\
	((a)->s6_addr[1] & 0x20)
#define IPV6_ADDR_MC_FLAG_RENDEZVOUS(a)	\
	((a)->s6_addr[1] & 0x40)
104 * fragmentation header
111 __be32 identification
;
/* NOTE(review): presumably the "more fragments" bit of the fragment header — confirm. */
#define IP6_MF	0x0001
118 #include <net/sock.h>
121 extern int sysctl_mld_max_msf
;
122 extern struct ctl_path net_ipv6_ctl_path
[];
124 #define _DEVINC(net, statname, modifier, idev, field) \
126 struct inet6_dev *_idev = (idev); \
127 if (likely(_idev != NULL)) \
128 SNMP_INC_STATS##modifier((_idev)->stats.statname, (field)); \
129 SNMP_INC_STATS##modifier((net)->mib.statname##_statistics, (field));\
132 #define _DEVADD(net, statname, modifier, idev, field, val) \
134 struct inet6_dev *_idev = (idev); \
135 if (likely(_idev != NULL)) \
136 SNMP_ADD_STATS##modifier((_idev)->stats.statname, (field), (val)); \
137 SNMP_ADD_STATS##modifier((net)->mib.statname##_statistics, (field), (val));\
140 #define _DEVUPD(net, statname, modifier, idev, field, val) \
142 struct inet6_dev *_idev = (idev); \
143 if (likely(_idev != NULL)) \
144 SNMP_UPD_PO_STATS##modifier((_idev)->stats.statname, field, (val)); \
145 SNMP_UPD_PO_STATS##modifier((net)->mib.statname##_statistics, field, (val));\
/*
 * IPv6 statistics wrappers.  Each forwards its arguments unchanged to
 * _DEVINC / _DEVADD / _DEVUPD with statname "ipv6" and modifier "64"
 * ("64_BH" for the _BH variants).
 */
#define IP6_INC_STATS(net, idev,field)		\
		_DEVINC(net, ipv6, 64, idev, field)
#define IP6_INC_STATS_BH(net, idev,field)	\
		_DEVINC(net, ipv6, 64_BH, idev, field)
#define IP6_ADD_STATS(net, idev,field,val)	\
		_DEVADD(net, ipv6, 64, idev, field, val)
#define IP6_ADD_STATS_BH(net, idev,field,val)	\
		_DEVADD(net, ipv6, 64_BH, idev, field, val)
#define IP6_UPD_PO_STATS(net, idev,field,val)   \
		_DEVUPD(net, ipv6, 64, idev, field, val)
#define IP6_UPD_PO_STATS_BH(net, idev,field,val)   \
		_DEVUPD(net, ipv6, 64_BH, idev, field, val)
/*
 * ICMPv6 statistics wrappers around _DEVINC.
 *
 * ICMP6_INC_STATS{,_BH} use statname "icmpv6"; the ICMP6MSG* variants use
 * statname "icmpv6msg".  The MSGOUT variants add 256 to @field before
 * forwarding it, while MSGIN forwards @field unchanged.
 */
#define ICMP6_INC_STATS(net, idev, field)	\
		_DEVINC(net, icmpv6, , idev, field)
#define ICMP6_INC_STATS_BH(net, idev, field)	\
		_DEVINC(net, icmpv6, _BH, idev, field)

/*
 * @field is parenthesised so that an expression argument (for example a
 * conditional) is offset as a whole rather than having "+ 256" bind to
 * its last operand only.
 */
#define ICMP6MSGOUT_INC_STATS(net, idev, field)		\
	_DEVINC(net, icmpv6msg, , idev, (field) + 256)
#define ICMP6MSGOUT_INC_STATS_BH(net, idev, field)	\
	_DEVINC(net, icmpv6msg, _BH, idev, (field) + 256)
#define ICMP6MSGIN_INC_STATS_BH(net, idev, field)	\
	_DEVINC(net, icmpv6msg, _BH, idev, field)
174 struct ip6_ra_chain
{
175 struct ip6_ra_chain
*next
;
178 void (*destructor
)(struct sock
*);
181 extern struct ip6_ra_chain
*ip6_ra_chain
;
182 extern rwlock_t ip6_ra_lock
;
185 This structure is prepared by protocol, when parsing
186 ancillary data and passed to IPv6.
189 struct ipv6_txoptions
{
190 /* Length of this structure */
193 /* length of extension headers */
195 __u16 opt_flen
; /* after fragment hdr */
196 __u16 opt_nflen
; /* before fragment hdr */
198 struct ipv6_opt_hdr
*hopopt
;
199 struct ipv6_opt_hdr
*dst0opt
;
200 struct ipv6_rt_hdr
*srcrt
; /* Routing Header */
201 struct ipv6_opt_hdr
*dst1opt
;
203 /* Option buffer, as read by IPV6_PKTOPTIONS, starts here. */
206 struct ip6_flowlabel
{
207 struct ip6_flowlabel
*next
;
211 struct ipv6_txoptions
*opt
;
212 unsigned long linger
;
215 unsigned long lastuse
;
216 unsigned long expires
;
/*
 * Masks built with cpu_to_be32(): the low 28 bits (FLOWINFO) and the
 * low 20 bits (FLOWLABEL) of the host-order constant.
 */
#define IPV6_FLOWINFO_MASK	cpu_to_be32(0x0FFFFFFF)
#define IPV6_FLOWLABEL_MASK	cpu_to_be32(0x000FFFFF)
223 struct ipv6_fl_socklist
{
224 struct ipv6_fl_socklist
*next
;
225 struct ip6_flowlabel
*fl
;
228 extern struct ip6_flowlabel
*fl6_sock_lookup(struct sock
*sk
, __be32 label
);
229 extern struct ipv6_txoptions
*fl6_merge_options(struct ipv6_txoptions
* opt_space
,
230 struct ip6_flowlabel
* fl
,
231 struct ipv6_txoptions
* fopt
);
232 extern void fl6_free_socklist(struct sock
*sk
);
233 extern int ipv6_flowlabel_opt(struct sock
*sk
, char __user
*optval
, int optlen
);
234 extern int ip6_flowlabel_init(void);
235 extern void ip6_flowlabel_cleanup(void);
237 static inline void fl6_sock_release(struct ip6_flowlabel
*fl
)
240 atomic_dec(&fl
->users
);
243 extern int ip6_ra_control(struct sock
*sk
, int sel
);
245 extern int ipv6_parse_hopopts(struct sk_buff
*skb
);
247 extern struct ipv6_txoptions
* ipv6_dup_options(struct sock
*sk
, struct ipv6_txoptions
*opt
);
248 extern struct ipv6_txoptions
* ipv6_renew_options(struct sock
*sk
, struct ipv6_txoptions
*opt
,
250 struct ipv6_opt_hdr __user
*newopt
,
252 struct ipv6_txoptions
*ipv6_fixup_options(struct ipv6_txoptions
*opt_space
,
253 struct ipv6_txoptions
*opt
);
255 extern int ipv6_opt_accepted(struct sock
*sk
, struct sk_buff
*skb
);
257 int ip6_frag_nqueues(struct net
*net
);
258 int ip6_frag_mem(struct net
*net
);
/* Fragment thresholds and timeout; the timeout is expressed in units of HZ. */
#define IPV6_FRAG_HIGH_THRESH	(256 * 1024)	/* 262144 */
#define IPV6_FRAG_LOW_THRESH	(192 * 1024)	/* 196608 */
#define IPV6_FRAG_TIMEOUT	(60 * HZ)	/* 60 seconds */
264 extern int __ipv6_addr_type(const struct in6_addr
*addr
);
/*
 * Return the low 16 bits of the value __ipv6_addr_type() computes for @addr.
 */
static inline int ipv6_addr_type(const struct in6_addr *addr)
{
	return __ipv6_addr_type(addr) & 0xffff;
}
270 static inline int ipv6_addr_scope(const struct in6_addr
*addr
)
272 return __ipv6_addr_type(addr
) & IPV6_ADDR_SCOPE_MASK
;
275 static inline int __ipv6_addr_src_scope(int type
)
277 return (type
== IPV6_ADDR_ANY
) ? __IPV6_ADDR_SCOPE_INVALID
: (type
>> 16);
/*
 * Source scope of @addr: feeds the full __ipv6_addr_type() result into
 * __ipv6_addr_src_scope().
 */
static inline int ipv6_addr_src_scope(const struct in6_addr *addr)
{
	return __ipv6_addr_src_scope(__ipv6_addr_type(addr));
}
/*
 * Byte-wise comparison of two addresses.
 *
 * Returns the memcmp() result over sizeof(struct in6_addr) bytes:
 * zero when equal, otherwise negative or positive.
 */
static inline int ipv6_addr_cmp(const struct in6_addr *a1, const struct in6_addr *a2)
{
	return memcmp(a1, a2, sizeof(struct in6_addr));
}
291 ipv6_masked_addr_cmp(const struct in6_addr
*a1
, const struct in6_addr
*m
,
292 const struct in6_addr
*a2
)
294 return !!(((a1
->s6_addr32
[0] ^ a2
->s6_addr32
[0]) & m
->s6_addr32
[0]) |
295 ((a1
->s6_addr32
[1] ^ a2
->s6_addr32
[1]) & m
->s6_addr32
[1]) |
296 ((a1
->s6_addr32
[2] ^ a2
->s6_addr32
[2]) & m
->s6_addr32
[2]) |
297 ((a1
->s6_addr32
[3] ^ a2
->s6_addr32
[3]) & m
->s6_addr32
[3]));
/*
 * Copy the address at @a2 into @a1 (memcpy of one struct in6_addr, so the
 * two must not overlap).
 */
static inline void ipv6_addr_copy(struct in6_addr *a1, const struct in6_addr *a2)
{
	memcpy(a1, a2, sizeof(struct in6_addr));
}
305 static inline void ipv6_addr_prefix(struct in6_addr
*pfx
,
306 const struct in6_addr
*addr
,
309 /* caller must guarantee 0 <= plen <= 128 */
313 memset(pfx
->s6_addr
, 0, sizeof(pfx
->s6_addr
));
314 memcpy(pfx
->s6_addr
, addr
, o
);
316 pfx
->s6_addr
[o
] = addr
->s6_addr
[o
] & (0xff00 >> b
);
319 static inline void ipv6_addr_set(struct in6_addr
*addr
,
320 __be32 w1
, __be32 w2
,
321 __be32 w3
, __be32 w4
)
323 addr
->s6_addr32
[0] = w1
;
324 addr
->s6_addr32
[1] = w2
;
325 addr
->s6_addr32
[2] = w3
;
326 addr
->s6_addr32
[3] = w4
;
329 static inline int ipv6_addr_equal(const struct in6_addr
*a1
,
330 const struct in6_addr
*a2
)
332 return ((a1
->s6_addr32
[0] ^ a2
->s6_addr32
[0]) |
333 (a1
->s6_addr32
[1] ^ a2
->s6_addr32
[1]) |
334 (a1
->s6_addr32
[2] ^ a2
->s6_addr32
[2]) |
335 (a1
->s6_addr32
[3] ^ a2
->s6_addr32
[3])) == 0;
338 static inline int __ipv6_prefix_equal(const __be32
*a1
, const __be32
*a2
,
339 unsigned int prefixlen
)
343 /* check complete u32 in prefix */
344 pdw
= prefixlen
>> 5;
345 if (pdw
&& memcmp(a1
, a2
, pdw
<< 2))
348 /* check incomplete u32 in prefix */
349 pbi
= prefixlen
& 0x1f;
350 if (pbi
&& ((a1
[pdw
] ^ a2
[pdw
]) & htonl((0xffffffff) << (32 - pbi
))))
356 static inline int ipv6_prefix_equal(const struct in6_addr
*a1
,
357 const struct in6_addr
*a2
,
358 unsigned int prefixlen
)
360 return __ipv6_prefix_equal(a1
->s6_addr32
, a2
->s6_addr32
,
364 struct inet_frag_queue
;
/*
 * Identifiers for users of IPv6 defragmentation.
 *
 * Each __X enumerator equals X + USHRT_MAX, so the enumerator that follows
 * it starts just past that range.
 * NOTE(review): presumably this leaves USHRT_MAX values per conntrack user
 * for an added offset — confirm against the callers.
 */
enum ip6_defrag_users {
	IP6_DEFRAG_LOCAL_DELIVER,
	IP6_DEFRAG_CONNTRACK_IN,
	__IP6_DEFRAG_CONNTRACK_IN	= IP6_DEFRAG_CONNTRACK_IN + USHRT_MAX,
	IP6_DEFRAG_CONNTRACK_OUT,
	__IP6_DEFRAG_CONNTRACK_OUT	= IP6_DEFRAG_CONNTRACK_OUT + USHRT_MAX,
	IP6_DEFRAG_CONNTRACK_BRIDGE_IN,
	__IP6_DEFRAG_CONNTRACK_BRIDGE_IN = IP6_DEFRAG_CONNTRACK_BRIDGE_IN + USHRT_MAX,
};
376 struct ip6_create_arg
{
379 struct in6_addr
*src
;
380 struct in6_addr
*dst
;
383 void ip6_frag_init(struct inet_frag_queue
*q
, void *a
);
384 int ip6_frag_match(struct inet_frag_queue
*q
, void *a
);
386 static inline int ipv6_addr_any(const struct in6_addr
*a
)
388 return (a
->s6_addr32
[0] | a
->s6_addr32
[1] |
389 a
->s6_addr32
[2] | a
->s6_addr32
[3]) == 0;
392 static inline int ipv6_addr_loopback(const struct in6_addr
*a
)
394 return (a
->s6_addr32
[0] | a
->s6_addr32
[1] |
395 a
->s6_addr32
[2] | (a
->s6_addr32
[3] ^ htonl(1))) == 0;
398 static inline int ipv6_addr_v4mapped(const struct in6_addr
*a
)
400 return (a
->s6_addr32
[0] | a
->s6_addr32
[1] |
401 (a
->s6_addr32
[2] ^ htonl(0x0000ffff))) == 0;
405 * Check for a RFC 4843 ORCHID address
406 * (Overlay Routable Cryptographic Hash Identifiers)
408 static inline int ipv6_addr_orchid(const struct in6_addr
*a
)
410 return (a
->s6_addr32
[0] & htonl(0xfffffff0)) == htonl(0x20010010);
413 static inline void ipv6_addr_set_v4mapped(const __be32 addr
,
414 struct in6_addr
*v4mapped
)
416 ipv6_addr_set(v4mapped
,
423 * find the first different bit between two addresses
424 * length of address must be a multiple of 32bits
426 static inline int __ipv6_addr_diff(const void *token1
, const void *token2
, int addrlen
)
428 const __be32
*a1
= token1
, *a2
= token2
;
433 for (i
= 0; i
< addrlen
; i
++) {
434 __be32 xb
= a1
[i
] ^ a2
[i
];
436 return i
* 32 + 31 - __fls(ntohl(xb
));
440 * we should *never* get to this point since that
441 * would mean the addrs are equal
443 * However, we do get to it 8) And exactly, when
444 * addresses are equal 8)
446 * ip route add 1111::/128 via ...
447 * ip route add 1111::/64 via ...
450 * Ideally, this function should stop comparison
451 * at prefix length. It does not, but it is still OK,
452 * if returned value is greater than prefix length.
458 static inline int ipv6_addr_diff(const struct in6_addr
*a1
, const struct in6_addr
*a2
)
460 return __ipv6_addr_diff(a1
, a2
, sizeof(struct in6_addr
));
463 static __inline__
void ipv6_select_ident(struct frag_hdr
*fhdr
)
465 static u32 ipv6_fragmentation_id
= 1;
466 static DEFINE_SPINLOCK(ip6_id_lock
);
468 spin_lock_bh(&ip6_id_lock
);
469 fhdr
->identification
= htonl(ipv6_fragmentation_id
);
470 if (++ipv6_fragmentation_id
== 0)
471 ipv6_fragmentation_id
= 1;
472 spin_unlock_bh(&ip6_id_lock
);
476 * Prototypes exported by ipv6
480 * rcv function (called from netdevice level)
483 extern int ipv6_rcv(struct sk_buff
*skb
,
484 struct net_device
*dev
,
485 struct packet_type
*pt
,
486 struct net_device
*orig_dev
);
488 extern int ip6_rcv_finish(struct sk_buff
*skb
);
491 * upper-layer output functions
493 extern int ip6_xmit(struct sock
*sk
,
496 struct ipv6_txoptions
*opt
);
498 extern int ip6_nd_hdr(struct sock
*sk
,
500 struct net_device
*dev
,
501 const struct in6_addr
*saddr
,
502 const struct in6_addr
*daddr
,
505 extern int ip6_find_1stfragopt(struct sk_buff
*skb
, u8
**nexthdr
);
507 extern int ip6_append_data(struct sock
*sk
,
508 int getfrag(void *from
, char *to
, int offset
, int len
, int odd
, struct sk_buff
*skb
),
514 struct ipv6_txoptions
*opt
,
520 extern int ip6_push_pending_frames(struct sock
*sk
);
522 extern void ip6_flush_pending_frames(struct sock
*sk
);
524 extern int ip6_dst_lookup(struct sock
*sk
,
525 struct dst_entry
**dst
,
527 extern struct dst_entry
* ip6_dst_lookup_flow(struct sock
*sk
,
529 const struct in6_addr
*final_dst
,
531 extern struct dst_entry
* ip6_sk_dst_lookup_flow(struct sock
*sk
,
533 const struct in6_addr
*final_dst
,
535 extern struct dst_entry
* ip6_blackhole_route(struct net
*net
,
536 struct dst_entry
*orig_dst
);
539 * skb processing functions
542 extern int ip6_output(struct sk_buff
*skb
);
543 extern int ip6_forward(struct sk_buff
*skb
);
544 extern int ip6_input(struct sk_buff
*skb
);
545 extern int ip6_mc_input(struct sk_buff
*skb
);
547 extern int __ip6_local_out(struct sk_buff
*skb
);
548 extern int ip6_local_out(struct sk_buff
*skb
);
551 * Extension header (options) processing
554 extern void ipv6_push_nfrag_opts(struct sk_buff
*skb
,
555 struct ipv6_txoptions
*opt
,
557 struct in6_addr
**daddr_p
);
558 extern void ipv6_push_frag_opts(struct sk_buff
*skb
,
559 struct ipv6_txoptions
*opt
,
562 extern int ipv6_skip_exthdr(const struct sk_buff
*, int start
,
565 extern int ipv6_ext_hdr(u8 nexthdr
);
567 extern int ipv6_find_tlv(struct sk_buff
*skb
, int offset
, int type
);
569 extern struct in6_addr
*fl6_update_dst(struct flowi6
*fl6
,
570 const struct ipv6_txoptions
*opt
,
571 struct in6_addr
*orig
);
574 * socket options (ipv6_sockglue.c)
577 extern int ipv6_setsockopt(struct sock
*sk
, int level
,
580 unsigned int optlen
);
581 extern int ipv6_getsockopt(struct sock
*sk
, int level
,
585 extern int compat_ipv6_setsockopt(struct sock
*sk
,
589 unsigned int optlen
);
590 extern int compat_ipv6_getsockopt(struct sock
*sk
,
596 extern int ip6_datagram_connect(struct sock
*sk
,
597 struct sockaddr
*addr
, int addr_len
);
599 extern int ipv6_recv_error(struct sock
*sk
, struct msghdr
*msg
, int len
);
600 extern int ipv6_recv_rxpmtu(struct sock
*sk
, struct msghdr
*msg
, int len
);
601 extern void ipv6_icmp_error(struct sock
*sk
, struct sk_buff
*skb
, int err
, __be16 port
,
602 u32 info
, u8
*payload
);
603 extern void ipv6_local_error(struct sock
*sk
, int err
, struct flowi6
*fl6
, u32 info
);
604 extern void ipv6_local_rxpmtu(struct sock
*sk
, struct flowi6
*fl6
, u32 mtu
);
606 extern int inet6_release(struct socket
*sock
);
607 extern int inet6_bind(struct socket
*sock
, struct sockaddr
*uaddr
,
609 extern int inet6_getname(struct socket
*sock
, struct sockaddr
*uaddr
,
610 int *uaddr_len
, int peer
);
611 extern int inet6_ioctl(struct socket
*sock
, unsigned int cmd
,
614 extern int inet6_hash_connect(struct inet_timewait_death_row
*death_row
,
620 extern const struct proto_ops inet6_stream_ops
;
621 extern const struct proto_ops inet6_dgram_ops
;
623 struct group_source_req
;
626 extern int ip6_mc_source(int add
, int omode
, struct sock
*sk
,
627 struct group_source_req
*pgsr
);
628 extern int ip6_mc_msfilter(struct sock
*sk
, struct group_filter
*gsf
);
629 extern int ip6_mc_msfget(struct sock
*sk
, struct group_filter
*gsf
,
630 struct group_filter __user
*optval
,
632 extern unsigned int inet6_hash_frag(__be32 id
, const struct in6_addr
*saddr
,
633 const struct in6_addr
*daddr
, u32 rnd
);
635 #ifdef CONFIG_PROC_FS
636 extern int ac6_proc_init(struct net
*net
);
637 extern void ac6_proc_exit(struct net
*net
);
638 extern int raw6_proc_init(void);
639 extern void raw6_proc_exit(void);
640 extern int tcp6_proc_init(struct net
*net
);
641 extern void tcp6_proc_exit(struct net
*net
);
642 extern int udp6_proc_init(struct net
*net
);
643 extern void udp6_proc_exit(struct net
*net
);
644 extern int udplite6_proc_init(void);
645 extern void udplite6_proc_exit(void);
646 extern int ipv6_misc_proc_init(void);
647 extern void ipv6_misc_proc_exit(void);
648 extern int snmp6_register_dev(struct inet6_dev
*idev
);
649 extern int snmp6_unregister_dev(struct inet6_dev
*idev
);
/*
 * No-op fallbacks: the init/register variants report success (0) and the
 * exit variant does nothing.
 * NOTE(review): presumably the !CONFIG_PROC_FS branch — the matching
 * #else/#endif lines are not visible in this view.
 */
static inline int ac6_proc_init(struct net *net) { return 0; }
static inline void ac6_proc_exit(struct net *net) { }
static inline int snmp6_register_dev(struct inet6_dev *idev) { return 0; }
static inline int snmp6_unregister_dev(struct inet6_dev *idev) { return 0; }
659 extern ctl_table ipv6_route_table_template
[];
660 extern ctl_table ipv6_icmp_table_template
[];
662 extern struct ctl_table
*ipv6_icmp_sysctl_init(struct net
*net
);
663 extern struct ctl_table
*ipv6_route_sysctl_init(struct net
*net
);
664 extern int ipv6_sysctl_register(void);
665 extern void ipv6_sysctl_unregister(void);
666 extern int ipv6_static_sysctl_register(void);
667 extern void ipv6_static_sysctl_unregister(void);
670 #endif /* __KERNEL__ */
671 #endif /* _NET_IPV6_H */