2 * Copyright (c) 1980, 1986, 1993
3 * The Regents of the University of California. All rights reserved.
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions
8 * 1. Redistributions of source code must retain the above copyright
9 * notice, this list of conditions and the following disclaimer.
10 * 2. Redistributions in binary form must reproduce the above copyright
11 * notice, this list of conditions and the following disclaimer in the
12 * documentation and/or other materials provided with the distribution.
13 * 3. All advertising materials mentioning features or use of this software
14 * must display the following acknowledgement:
15 * This product includes software developed by the University of
16 * California, Berkeley and its contributors.
17 * 4. Neither the name of the University nor the names of its contributors
18 * may be used to endorse or promote products derived from this software
19 * without specific prior written permission.
21 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
22 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
23 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
24 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
25 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
26 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
27 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
28 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
29 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
30 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
33 * @(#)if.c 8.3 (Berkeley) 1/4/94
34 * $FreeBSD: src/sys/net/if.c,v 1.185 2004/03/13 02:35:03 brooks Exp $
35 * $DragonFly: src/sys/net/if.c,v 1.74 2008/06/15 12:15:08 sephe Exp $
38 #include "opt_compat.h"
39 #include "opt_inet6.h"
41 #include "opt_polling.h"
43 #include <sys/param.h>
44 #include <sys/malloc.h>
46 #include <sys/systm.h>
48 #include <sys/protosw.h>
49 #include <sys/socket.h>
50 #include <sys/socketvar.h>
51 #include <sys/socketops.h>
52 #include <sys/protosw.h>
53 #include <sys/kernel.h>
55 #include <sys/sockio.h>
56 #include <sys/syslog.h>
57 #include <sys/sysctl.h>
58 #include <sys/domain.h>
59 #include <sys/thread.h>
60 #include <sys/thread2.h>
61 #include <sys/serialize.h>
62 #include <sys/msgport2.h>
65 #include <net/if_arp.h>
66 #include <net/if_dl.h>
67 #include <net/if_types.h>
68 #include <net/if_var.h>
69 #include <net/ifq_var.h>
70 #include <net/radix.h>
71 #include <net/route.h>
72 #include <net/if_clone.h>
73 #include <net/netisr.h>
74 #include <net/netmsg2.h>
76 #include <machine/stdarg.h>
77 #include <machine/smp.h>
79 #if defined(INET) || defined(INET6)
81 #include <netinet/in.h>
82 #include <netinet/in_var.h>
83 #include <netinet/if_ether.h>
85 #include <netinet6/in6_var.h>
86 #include <netinet6/in6_ifattach.h>
90 #if defined(COMPAT_43)
91 #include <emulation/43bsd/43bsd_socket.h>
92 #endif /* COMPAT_43 */
94 struct netmsg_ifaddr
{
102 * System initialization
104 static void if_attachdomain(void *);
105 static void if_attachdomain1(struct ifnet
*);
106 static int ifconf(u_long
, caddr_t
, struct ucred
*);
107 static void ifinit(void *);
108 static void ifnetinit(void *);
109 static void if_slowtimo(void *);
110 static void link_rtrequest(int, struct rtentry
*, struct rt_addrinfo
*);
111 static int if_rtdel(struct radix_node
*, void *);
115 * XXX: declared here to avoid including many inet6-related files;
116 * should be more generalized?
118 extern void nd6_setmtu(struct ifnet
*);
121 SYSCTL_NODE(_net
, PF_LINK
, link
, CTLFLAG_RW
, 0, "Link layers");
122 SYSCTL_NODE(_net_link
, 0, generic
, CTLFLAG_RW
, 0, "Generic link-management");
124 SYSINIT(interfaces
, SI_SUB_PROTO_IF
, SI_ORDER_FIRST
, ifinit
, NULL
)
125 /* Must be after netisr_init */
126 SYSINIT(ifnet
, SI_SUB_PRE_DRIVERS
, SI_ORDER_SECOND
, ifnetinit
, NULL
)
128 MALLOC_DEFINE(M_IFADDR
, "ifaddr", "interface address");
129 MALLOC_DEFINE(M_IFMADDR
, "ether_multi", "link-level multicast address");
131 int ifqmaxlen
= IFQ_MAXLEN
;
132 struct ifnethead ifnet
= TAILQ_HEAD_INITIALIZER(ifnet
);
134 /* In ifq_dispatch(), try to do direct ifnet.if_start first */
135 static int ifq_dispatch_schedonly
= 0;
136 SYSCTL_INT(_net_link_generic
, OID_AUTO
, ifq_dispatch_schedonly
, CTLFLAG_RW
,
137 &ifq_dispatch_schedonly
, 0, "");
139 /* In ifq_dispatch(), schedule ifnet.if_start without checking ifnet.if_snd */
140 static int ifq_dispatch_schednochk
= 0;
141 SYSCTL_INT(_net_link_generic
, OID_AUTO
, ifq_dispatch_schednochk
, CTLFLAG_RW
,
142 &ifq_dispatch_schednochk
, 0, "");
144 /* In if_devstart(): if set, always schedule ifnet.if_start rather than trying a direct call first */
145 static int if_devstart_schedonly
= 0;
146 SYSCTL_INT(_net_link_generic
, OID_AUTO
, if_devstart_schedonly
, CTLFLAG_RW
,
147 &if_devstart_schedonly
, 0, "");
149 /* In if_devstart(), schedule ifnet.if_start without checking ifnet.if_snd */
150 static int if_devstart_schednochk
= 0;
151 SYSCTL_INT(_net_link_generic
, OID_AUTO
, if_devstart_schednochk
, CTLFLAG_RW
,
152 &if_devstart_schednochk
, 0, "");
155 /* Schedule ifnet.if_start on the current CPU */
156 static int if_start_oncpu_sched
= 0;
157 SYSCTL_INT(_net_link_generic
, OID_AUTO
, if_start_oncpu_sched
, CTLFLAG_RW
,
158 &if_start_oncpu_sched
, 0, "");
161 struct callout if_slowtimo_timer
;
164 struct ifnet
**ifindex2ifnet
= NULL
;
165 static struct thread ifnet_threads
[MAXCPU
];
167 #define IFQ_KTR_STRING "ifq=%p"
168 #define IFQ_KTR_ARG_SIZE (sizeof(void *))
170 #define KTR_IFQ KTR_ALL
172 KTR_INFO_MASTER(ifq
);
173 KTR_INFO(KTR_IFQ
, ifq
, enqueue
, 0, IFQ_KTR_STRING
, IFQ_KTR_ARG_SIZE
);
174 KTR_INFO(KTR_IFQ
, ifq
, dequeue
, 1, IFQ_KTR_STRING
, IFQ_KTR_ARG_SIZE
);
175 #define logifq(name, arg) KTR_LOG(ifq_ ## name, arg)
177 #define IF_START_KTR_STRING "ifp=%p"
178 #define IF_START_KTR_ARG_SIZE (sizeof(void *))
180 #define KTR_IF_START KTR_ALL
182 KTR_INFO_MASTER(if_start
);
183 KTR_INFO(KTR_IF_START
, if_start
, run
, 0,
184 IF_START_KTR_STRING
, IF_START_KTR_ARG_SIZE
);
185 KTR_INFO(KTR_IF_START
, if_start
, sched
, 1,
186 IF_START_KTR_STRING
, IF_START_KTR_ARG_SIZE
);
187 KTR_INFO(KTR_IF_START
, if_start
, avoid
, 2,
188 IF_START_KTR_STRING
, IF_START_KTR_ARG_SIZE
);
189 KTR_INFO(KTR_IF_START
, if_start
, contend_sched
, 3,
190 IF_START_KTR_STRING
, IF_START_KTR_ARG_SIZE
);
191 KTR_INFO(KTR_IF_START
, if_start
, chase_sched
, 4,
192 IF_START_KTR_STRING
, IF_START_KTR_ARG_SIZE
);
193 #define logifstart(name, arg) KTR_LOG(if_start_ ## name, arg)
196 * Network interface utility routines.
198 * Routines with ifa_ifwith* names take sockaddr *'s as
207 callout_init(&if_slowtimo_timer
);
210 TAILQ_FOREACH(ifp
, &ifnet
, if_link
) {
211 if (ifp
->if_snd
.ifq_maxlen
== 0) {
212 if_printf(ifp
, "XXX: driver didn't set ifq_maxlen\n");
213 ifp
->if_snd
.ifq_maxlen
= ifqmaxlen
;
222 if_start_cpuid(struct ifnet
*ifp
)
224 return ifp
->if_cpuid
;
227 #ifdef DEVICE_POLLING
229 if_start_cpuid_poll(struct ifnet
*ifp
)
231 int poll_cpuid
= ifp
->if_poll_cpuid
;
236 return ifp
->if_cpuid
;
241 if_start_ipifunc(void *arg
)
243 struct ifnet
*ifp
= arg
;
244 struct lwkt_msg
*lmsg
= &ifp
->if_start_nmsg
[mycpuid
].nm_lmsg
;
247 if (lmsg
->ms_flags
& MSGF_DONE
)
248 lwkt_sendmsg(ifnet_portfn(mycpuid
), lmsg
);
253 * Schedule ifnet.if_start on ifnet's CPU
256 if_start_schedule(struct ifnet
*ifp
)
261 if (if_start_oncpu_sched
)
264 cpu
= ifp
->if_start_cpuid(ifp
);
267 lwkt_send_ipiq(globaldata_find(cpu
), if_start_ipifunc
, ifp
);
270 if_start_ipifunc(ifp
);
275 * This function will release ifnet.if_start interlock,
276 * if ifnet.if_start does not need to be scheduled
279 if_start_need_schedule(struct ifaltq
*ifq
, int running
)
281 if (!running
|| ifq_is_empty(ifq
)
283 || ifq
->altq_tbr
!= NULL
288 * ifnet.if_start interlock is released, if:
289 * 1) Hardware can not take any packets, due to
290 * o interface is marked down
291 * o hardware queue is full (IFF_OACTIVE)
292 * Under the second situation, hardware interrupt
293 * or polling(4) will call/schedule ifnet.if_start
294 * when hardware queue is ready
295 * 2) There is no packet in the ifnet.if_snd.
296 * Further ifq_dispatch or ifq_handoff will call/
297 * schedule ifnet.if_start
298 * 3) TBR is used and it does not allow further
300 * TBR callout will call ifnet.if_start
302 if (!running
|| !ifq_data_ready(ifq
)) {
303 ifq
->altq_started
= 0;
313 if_start_dispatch(struct netmsg
*nmsg
)
315 struct lwkt_msg
*lmsg
= &nmsg
->nm_lmsg
;
316 struct ifnet
*ifp
= lmsg
->u
.ms_resultp
;
317 struct ifaltq
*ifq
= &ifp
->if_snd
;
321 lwkt_replymsg(lmsg
, 0); /* reply ASAP */
325 if (!if_start_oncpu_sched
&& mycpuid
!= ifp
->if_start_cpuid(ifp
)) {
327 * If the ifnet is still up, we need to
328 * chase its CPU change.
330 if (ifp
->if_flags
& IFF_UP
) {
331 logifstart(chase_sched
, ifp
);
332 if_start_schedule(ifp
);
340 if (ifp
->if_flags
& IFF_UP
) {
341 lwkt_serialize_enter(ifp
->if_serializer
); /* XXX try? */
342 if ((ifp
->if_flags
& IFF_OACTIVE
) == 0) {
343 logifstart(run
, ifp
);
346 (IFF_OACTIVE
| IFF_RUNNING
)) == IFF_RUNNING
)
349 lwkt_serialize_exit(ifp
->if_serializer
);
354 if (if_start_need_schedule(ifq
, running
)) {
356 if (lmsg
->ms_flags
& MSGF_DONE
) { /* XXX necessary? */
357 logifstart(sched
, ifp
);
358 lwkt_sendmsg(ifnet_portfn(mycpuid
), lmsg
);
364 /* Device driver ifnet.if_start helper function */
366 if_devstart(struct ifnet
*ifp
)
368 struct ifaltq
*ifq
= &ifp
->if_snd
;
371 ASSERT_SERIALIZED(ifp
->if_serializer
);
374 if (ifq
->altq_started
|| !ifq_data_ready(ifq
)) {
375 logifstart(avoid
, ifp
);
379 ifq
->altq_started
= 1;
382 if (if_devstart_schedonly
) {
384 * Always schedule ifnet.if_start on ifnet's CPU,
385 * short circuit the rest of this function.
387 logifstart(sched
, ifp
);
388 if_start_schedule(ifp
);
392 logifstart(run
, ifp
);
395 if ((ifp
->if_flags
& (IFF_OACTIVE
| IFF_RUNNING
)) == IFF_RUNNING
)
398 if (if_devstart_schednochk
|| if_start_need_schedule(ifq
, running
)) {
400 * More data need to be transmitted, ifnet.if_start is
401 * scheduled on ifnet's CPU, and we keep going.
402 * NOTE: ifnet.if_start interlock is not released.
404 logifstart(sched
, ifp
);
405 if_start_schedule(ifp
);
410 * Attach an interface to the list of "active" interfaces.
412 * The serializer is optional. If non-NULL access to the interface
416 if_attach(struct ifnet
*ifp
, lwkt_serialize_t serializer
)
418 unsigned socksize
, ifasize
;
419 int namelen
, masklen
;
420 struct sockaddr_dl
*sdl
;
425 static int if_indexlim
= 8;
428 * The serializer can be passed in from the device, allowing the
429 * same serializer to be used for both the interrupt interlock and
430 * the device queue. If not specified, the netif structure will
431 * use an embedded serializer.
433 if (serializer
== NULL
) {
434 serializer
= &ifp
->if_default_serializer
;
435 lwkt_serialize_init(serializer
);
437 ifp
->if_serializer
= serializer
;
439 ifp
->if_start_cpuid
= if_start_cpuid
;
442 #ifdef DEVICE_POLLING
443 /* Device is not in polling mode by default */
444 ifp
->if_poll_cpuid
= -1;
445 if (ifp
->if_poll
!= NULL
)
446 ifp
->if_start_cpuid
= if_start_cpuid_poll
;
449 ifp
->if_start_nmsg
= kmalloc(ncpus
* sizeof(struct netmsg
),
450 M_IFADDR
/* XXX */, M_WAITOK
);
451 for (i
= 0; i
< ncpus
; ++i
) {
452 netmsg_init(&ifp
->if_start_nmsg
[i
], &netisr_adone_rport
, 0,
454 ifp
->if_start_nmsg
[i
].nm_lmsg
.u
.ms_resultp
= ifp
;
457 TAILQ_INSERT_TAIL(&ifnet
, ifp
, if_link
);
458 ifp
->if_index
= ++if_index
;
462 * The old code would work if the interface passed a pre-existing
463 * chain of ifaddrs to this code. We don't trust our callers to
464 * properly initialize the tailq, however, so we no longer allow
465 * this unlikely case.
467 ifp
->if_addrheads
= kmalloc(ncpus
* sizeof(struct ifaddrhead
),
468 M_IFADDR
, M_WAITOK
| M_ZERO
);
469 for (i
= 0; i
< ncpus
; ++i
)
470 TAILQ_INIT(&ifp
->if_addrheads
[i
]);
472 TAILQ_INIT(&ifp
->if_prefixhead
);
473 LIST_INIT(&ifp
->if_multiaddrs
);
474 getmicrotime(&ifp
->if_lastchange
);
475 if (ifindex2ifnet
== NULL
|| if_index
>= if_indexlim
) {
481 /* grow ifindex2ifnet */
482 n
= if_indexlim
* sizeof(*q
);
483 q
= kmalloc(n
, M_IFADDR
, M_WAITOK
| M_ZERO
);
485 bcopy(ifindex2ifnet
, q
, n
/2);
486 kfree(ifindex2ifnet
, M_IFADDR
);
491 ifindex2ifnet
[if_index
] = ifp
;
494 * create a Link Level name for this device
496 namelen
= strlen(ifp
->if_xname
);
497 #define _offsetof(t, m) ((int)((caddr_t)&((t *)0)->m))
498 masklen
= _offsetof(struct sockaddr_dl
, sdl_data
[0]) + namelen
;
499 socksize
= masklen
+ ifp
->if_addrlen
;
500 #define ROUNDUP(a) (1 + (((a) - 1) | (sizeof(long) - 1)))
501 if (socksize
< sizeof(*sdl
))
502 socksize
= sizeof(*sdl
);
503 socksize
= ROUNDUP(socksize
);
504 ifasize
= sizeof(struct ifaddr
) + 2 * socksize
;
505 ifa
= ifa_create(ifasize
, M_WAITOK
);
506 sdl
= (struct sockaddr_dl
*)(ifa
+ 1);
507 sdl
->sdl_len
= socksize
;
508 sdl
->sdl_family
= AF_LINK
;
509 bcopy(ifp
->if_xname
, sdl
->sdl_data
, namelen
);
510 sdl
->sdl_nlen
= namelen
;
511 sdl
->sdl_index
= ifp
->if_index
;
512 sdl
->sdl_type
= ifp
->if_type
;
513 ifp
->if_lladdr
= ifa
;
515 ifa
->ifa_rtrequest
= link_rtrequest
;
516 ifa
->ifa_addr
= (struct sockaddr
*)sdl
;
517 sdl
= (struct sockaddr_dl
*)(socksize
+ (caddr_t
)sdl
);
518 ifa
->ifa_netmask
= (struct sockaddr
*)sdl
;
519 sdl
->sdl_len
= masklen
;
521 sdl
->sdl_data
[--namelen
] = 0xff;
522 ifa_iflink(ifa
, ifp
, 0 /* Insert head */);
524 EVENTHANDLER_INVOKE(ifnet_attach_event
, ifp
);
528 ifq
->altq_disc
= NULL
;
529 ifq
->altq_flags
&= ALTQF_CANTCHANGE
;
530 ifq
->altq_tbr
= NULL
;
532 ifq
->altq_started
= 0;
533 ifq
->altq_prepended
= NULL
;
535 ifq_set_classic(ifq
);
537 if (!SLIST_EMPTY(&domains
))
538 if_attachdomain1(ifp
);
540 /* Announce the interface. */
541 rt_ifannouncemsg(ifp
, IFAN_ARRIVAL
);
545 if_attachdomain(void *dummy
)
550 TAILQ_FOREACH(ifp
, &ifnet
, if_list
)
551 if_attachdomain1(ifp
);
554 SYSINIT(domainifattach
, SI_SUB_PROTO_IFATTACHDOMAIN
, SI_ORDER_FIRST
,
555 if_attachdomain
, NULL
);
558 if_attachdomain1(struct ifnet
*ifp
)
564 /* address family dependent data region */
565 bzero(ifp
->if_afdata
, sizeof(ifp
->if_afdata
));
566 SLIST_FOREACH(dp
, &domains
, dom_next
)
567 if (dp
->dom_ifattach
)
568 ifp
->if_afdata
[dp
->dom_family
] =
569 (*dp
->dom_ifattach
)(ifp
);
574 * Purge all addresses whose type is _not_ AF_LINK
577 if_purgeaddrs_nolink(struct ifnet
*ifp
)
579 struct ifaddr_container
*ifac
, *next
;
581 TAILQ_FOREACH_MUTABLE(ifac
, &ifp
->if_addrheads
[mycpuid
],
583 struct ifaddr
*ifa
= ifac
->ifa
;
585 /* Leave link ifaddr as it is */
586 if (ifa
->ifa_addr
->sa_family
== AF_LINK
)
589 /* XXX: Ugly!! ad hoc just for INET */
590 if (ifa
->ifa_addr
&& ifa
->ifa_addr
->sa_family
== AF_INET
) {
591 struct ifaliasreq ifr
;
592 #ifdef IFADDR_DEBUG_VERBOSE
595 kprintf("purge in4 addr %p: ", ifa
);
596 for (i
= 0; i
< ncpus
; ++i
)
597 kprintf("%d ", ifa
->ifa_containers
[i
].ifa_refcnt
);
601 bzero(&ifr
, sizeof ifr
);
602 ifr
.ifra_addr
= *ifa
->ifa_addr
;
603 if (ifa
->ifa_dstaddr
)
604 ifr
.ifra_broadaddr
= *ifa
->ifa_dstaddr
;
605 if (in_control(NULL
, SIOCDIFADDR
, (caddr_t
)&ifr
, ifp
,
611 if (ifa
->ifa_addr
&& ifa
->ifa_addr
->sa_family
== AF_INET6
) {
612 #ifdef IFADDR_DEBUG_VERBOSE
615 kprintf("purge in6 addr %p: ", ifa
);
616 for (i
= 0; i
< ncpus
; ++i
)
617 kprintf("%d ", ifa
->ifa_containers
[i
].ifa_refcnt
);
622 /* ifp_addrhead is already updated */
626 ifa_ifunlink(ifa
, ifp
);
632 * Detach an interface, removing it from the
633 * list of "active" interfaces.
636 if_detach(struct ifnet
*ifp
)
638 struct radix_node_head
*rnh
;
643 EVENTHANDLER_INVOKE(ifnet_detach_event
, ifp
);
646 * Remove routes and flush queues.
649 #ifdef DEVICE_POLLING
650 if (ifp
->if_flags
& IFF_POLLING
)
651 ether_poll_deregister(ifp
);
655 if (ifq_is_enabled(&ifp
->if_snd
))
656 altq_disable(&ifp
->if_snd
);
657 if (ifq_is_attached(&ifp
->if_snd
))
658 altq_detach(&ifp
->if_snd
);
661 * Clean up all addresses.
663 ifp
->if_lladdr
= NULL
;
665 if_purgeaddrs_nolink(ifp
);
666 if (!TAILQ_EMPTY(&ifp
->if_addrheads
[mycpuid
])) {
669 ifa
= TAILQ_FIRST(&ifp
->if_addrheads
[mycpuid
])->ifa
;
670 KASSERT(ifa
->ifa_addr
->sa_family
== AF_LINK
,
671 ("non-link ifaddr is left on if_addrheads"));
673 ifa_ifunlink(ifa
, ifp
);
675 KASSERT(TAILQ_EMPTY(&ifp
->if_addrheads
[mycpuid
]),
676 ("there are still ifaddrs left on if_addrheads"));
681 * Remove all IPv4 kernel structures related to ifp.
688 * Remove all IPv6 kernel structs related to ifp. This should be done
689 * before removing routing entries below, since IPv6 interface direct
690 * routes are expected to be removed by the IPv6-specific kernel API.
691 * Otherwise, the kernel will detect some inconsistency and complain about it.
697 * Delete all remaining routes using this interface
698 * Unfortunately the only way to do this is to slog through
699 * the entire routing table looking for routes which point
700 * to this interface...oh well...
703 for (cpu
= 0; cpu
< ncpus2
; cpu
++) {
704 lwkt_migratecpu(cpu
);
705 for (i
= 1; i
<= AF_MAX
; i
++) {
706 if ((rnh
= rt_tables
[cpu
][i
]) == NULL
)
708 rnh
->rnh_walktree(rnh
, if_rtdel
, ifp
);
711 lwkt_migratecpu(origcpu
);
713 /* Announce that the interface is gone. */
714 rt_ifannouncemsg(ifp
, IFAN_DEPARTURE
);
716 SLIST_FOREACH(dp
, &domains
, dom_next
)
717 if (dp
->dom_ifdetach
&& ifp
->if_afdata
[dp
->dom_family
])
718 (*dp
->dom_ifdetach
)(ifp
,
719 ifp
->if_afdata
[dp
->dom_family
]);
722 * Remove interface from ifindex2ifnet[] and maybe decrement if_index.
724 ifindex2ifnet
[ifp
->if_index
] = NULL
;
725 while (if_index
> 0 && ifindex2ifnet
[if_index
] == NULL
)
728 TAILQ_REMOVE(&ifnet
, ifp
, if_link
);
729 kfree(ifp
->if_addrheads
, M_IFADDR
);
730 kfree(ifp
->if_start_nmsg
, M_IFADDR
);
735 * Delete Routes for a Network Interface
737 * Called for each routing entry via the rnh->rnh_walktree() call above
738 * to delete all route entries referencing a detaching network interface.
741 * rn pointer to node in the routing table
742 * arg argument passed to rnh->rnh_walktree() - detaching interface
746 * errno failed - reason indicated
750 if_rtdel(struct radix_node
*rn
, void *arg
)
752 struct rtentry
*rt
= (struct rtentry
*)rn
;
753 struct ifnet
*ifp
= arg
;
756 if (rt
->rt_ifp
== ifp
) {
759 * Protect (sorta) against walktree recursion problems
762 if (!(rt
->rt_flags
& RTF_UP
))
765 err
= rtrequest(RTM_DELETE
, rt_key(rt
), rt
->rt_gateway
,
766 rt_mask(rt
), rt
->rt_flags
,
767 (struct rtentry
**) NULL
);
769 log(LOG_WARNING
, "if_rtdel: error %d\n", err
);
777 * Locate an interface based on a complete address.
780 ifa_ifwithaddr(struct sockaddr
*addr
)
784 TAILQ_FOREACH(ifp
, &ifnet
, if_link
) {
785 struct ifaddr_container
*ifac
;
787 TAILQ_FOREACH(ifac
, &ifp
->if_addrheads
[mycpuid
], ifa_link
) {
788 struct ifaddr
*ifa
= ifac
->ifa
;
790 if (ifa
->ifa_addr
->sa_family
!= addr
->sa_family
)
792 if (sa_equal(addr
, ifa
->ifa_addr
))
794 if ((ifp
->if_flags
& IFF_BROADCAST
) &&
795 ifa
->ifa_broadaddr
&&
796 /* IPv6 doesn't have broadcast */
797 ifa
->ifa_broadaddr
->sa_len
!= 0 &&
798 sa_equal(ifa
->ifa_broadaddr
, addr
))
805 * Locate the point to point interface with a given destination address.
808 ifa_ifwithdstaddr(struct sockaddr
*addr
)
812 TAILQ_FOREACH(ifp
, &ifnet
, if_link
) {
813 struct ifaddr_container
*ifac
;
815 if (!(ifp
->if_flags
& IFF_POINTOPOINT
))
818 TAILQ_FOREACH(ifac
, &ifp
->if_addrheads
[mycpuid
], ifa_link
) {
819 struct ifaddr
*ifa
= ifac
->ifa
;
821 if (ifa
->ifa_addr
->sa_family
!= addr
->sa_family
)
823 if (ifa
->ifa_dstaddr
&&
824 sa_equal(addr
, ifa
->ifa_dstaddr
))
832 * Find an interface on a specific network. If many, choice
833 * is most specific found.
836 ifa_ifwithnet(struct sockaddr
*addr
)
839 struct ifaddr
*ifa_maybe
= NULL
;
840 u_int af
= addr
->sa_family
;
841 char *addr_data
= addr
->sa_data
, *cplim
;
844 * AF_LINK addresses can be looked up directly by their index number,
845 * so do that if we can.
848 struct sockaddr_dl
*sdl
= (struct sockaddr_dl
*)addr
;
850 if (sdl
->sdl_index
&& sdl
->sdl_index
<= if_index
)
851 return (ifindex2ifnet
[sdl
->sdl_index
]->if_lladdr
);
855 * Scan through each interface, looking for ones that have
856 * addresses in this address family.
858 TAILQ_FOREACH(ifp
, &ifnet
, if_link
) {
859 struct ifaddr_container
*ifac
;
861 TAILQ_FOREACH(ifac
, &ifp
->if_addrheads
[mycpuid
], ifa_link
) {
862 struct ifaddr
*ifa
= ifac
->ifa
;
863 char *cp
, *cp2
, *cp3
;
865 if (ifa
->ifa_addr
->sa_family
!= af
)
867 if (af
== AF_INET
&& ifp
->if_flags
& IFF_POINTOPOINT
) {
869 * This is a bit broken as it doesn't
870 * take into account that the remote end may
871 * be a single node in the network we are
873 * The trouble is that we don't know the
874 * netmask for the remote end.
876 if (ifa
->ifa_dstaddr
!= NULL
&&
877 sa_equal(addr
, ifa
->ifa_dstaddr
))
881 * if we have a special address handler,
882 * then use it instead of the generic one.
884 if (ifa
->ifa_claim_addr
) {
885 if ((*ifa
->ifa_claim_addr
)(ifa
, addr
)) {
893 * Scan all the bits in the ifa's address.
894 * If a bit disagrees with what we are
895 * looking for, mask it with the netmask
896 * to see if it really matters.
899 if (ifa
->ifa_netmask
== 0)
902 cp2
= ifa
->ifa_addr
->sa_data
;
903 cp3
= ifa
->ifa_netmask
->sa_data
;
904 cplim
= ifa
->ifa_netmask
->sa_len
+
905 (char *)ifa
->ifa_netmask
;
907 if ((*cp
++ ^ *cp2
++) & *cp3
++)
908 goto next
; /* next address! */
910 * If the netmask of what we just found
911 * is more specific than what we had before
912 * (if we had one) then remember the new one
913 * before continuing to search
914 * for an even better one.
916 if (ifa_maybe
== 0 ||
917 rn_refines((char *)ifa
->ifa_netmask
,
918 (char *)ifa_maybe
->ifa_netmask
))
927 * Find an interface address specific to an interface best matching
931 ifaof_ifpforaddr(struct sockaddr
*addr
, struct ifnet
*ifp
)
933 struct ifaddr_container
*ifac
;
934 char *cp
, *cp2
, *cp3
;
936 struct ifaddr
*ifa_maybe
= 0;
937 u_int af
= addr
->sa_family
;
941 TAILQ_FOREACH(ifac
, &ifp
->if_addrheads
[mycpuid
], ifa_link
) {
942 struct ifaddr
*ifa
= ifac
->ifa
;
944 if (ifa
->ifa_addr
->sa_family
!= af
)
948 if (ifa
->ifa_netmask
== NULL
) {
949 if (sa_equal(addr
, ifa
->ifa_addr
) ||
950 (ifa
->ifa_dstaddr
!= NULL
&&
951 sa_equal(addr
, ifa
->ifa_dstaddr
)))
955 if (ifp
->if_flags
& IFF_POINTOPOINT
) {
956 if (sa_equal(addr
, ifa
->ifa_dstaddr
))
960 cp2
= ifa
->ifa_addr
->sa_data
;
961 cp3
= ifa
->ifa_netmask
->sa_data
;
962 cplim
= ifa
->ifa_netmask
->sa_len
+ (char *)ifa
->ifa_netmask
;
963 for (; cp3
< cplim
; cp3
++)
964 if ((*cp
++ ^ *cp2
++) & *cp3
)
974 * Default action when installing a route with a Link Level gateway.
975 * Lookup an appropriate real ifa to point to.
976 * This should be moved to /sys/net/link.c eventually.
979 link_rtrequest(int cmd
, struct rtentry
*rt
, struct rt_addrinfo
*info
)
982 struct sockaddr
*dst
;
985 if (cmd
!= RTM_ADD
|| (ifa
= rt
->rt_ifa
) == NULL
||
986 (ifp
= ifa
->ifa_ifp
) == NULL
|| (dst
= rt_key(rt
)) == NULL
)
988 ifa
= ifaof_ifpforaddr(dst
, ifp
);
993 if (ifa
->ifa_rtrequest
&& ifa
->ifa_rtrequest
!= link_rtrequest
)
994 ifa
->ifa_rtrequest(cmd
, rt
, info
);
999 * Mark an interface down and notify protocols of
1001 * NOTE: must be called at splnet or equivalent.
1004 if_unroute(struct ifnet
*ifp
, int flag
, int fam
)
1006 struct ifaddr_container
*ifac
;
1008 ifp
->if_flags
&= ~flag
;
1009 getmicrotime(&ifp
->if_lastchange
);
1010 TAILQ_FOREACH(ifac
, &ifp
->if_addrheads
[mycpuid
], ifa_link
) {
1011 struct ifaddr
*ifa
= ifac
->ifa
;
1013 if (fam
== PF_UNSPEC
|| (fam
== ifa
->ifa_addr
->sa_family
))
1014 kpfctlinput(PRC_IFDOWN
, ifa
->ifa_addr
);
1016 ifq_purge(&ifp
->if_snd
);
1021 * Mark an interface up and notify protocols of
1023 * NOTE: must be called at splnet or equivalent.
1026 if_route(struct ifnet
*ifp
, int flag
, int fam
)
1028 struct ifaddr_container
*ifac
;
1030 ifq_purge(&ifp
->if_snd
);
1031 ifp
->if_flags
|= flag
;
1032 getmicrotime(&ifp
->if_lastchange
);
1033 TAILQ_FOREACH(ifac
, &ifp
->if_addrheads
[mycpuid
], ifa_link
) {
1034 struct ifaddr
*ifa
= ifac
->ifa
;
1036 if (fam
== PF_UNSPEC
|| (fam
== ifa
->ifa_addr
->sa_family
))
1037 kpfctlinput(PRC_IFUP
, ifa
->ifa_addr
);
1046 * Mark an interface down and notify protocols of the transition. An
1047 * interface going down is also considered to be a synchronizing event.
1048 * We must ensure that all packet processing related to the interface
1049 * has completed before we return so e.g. the caller can free the ifnet
1050 * structure that the mbufs may be referencing.
1052 * NOTE: must be called at splnet or equivalent.
1055 if_down(struct ifnet
*ifp
)
1057 if_unroute(ifp
, IFF_UP
, AF_UNSPEC
);
1058 netmsg_service_sync();
1062 * Mark an interface up and notify protocols of
1064 * NOTE: must be called at splnet or equivalent.
1067 if_up(struct ifnet
*ifp
)
1069 if_route(ifp
, IFF_UP
, AF_UNSPEC
);
1073 * Process a link state change.
1074 * NOTE: must be called at splsoftnet or equivalent.
1077 if_link_state_change(struct ifnet
*ifp
)
1083 * Handle interface watchdog timer routines. Called
1084 * from softclock, we decrement timers (if set) and
1085 * call the appropriate interface routine on expiration.
1088 if_slowtimo(void *arg
)
1094 TAILQ_FOREACH(ifp
, &ifnet
, if_link
) {
1095 if (ifp
->if_timer
== 0 || --ifp
->if_timer
)
1097 if (ifp
->if_watchdog
) {
1098 if (lwkt_serialize_try(ifp
->if_serializer
)) {
1099 (*ifp
->if_watchdog
)(ifp
);
1100 lwkt_serialize_exit(ifp
->if_serializer
);
1102 /* try again next timeout */
1110 callout_reset(&if_slowtimo_timer
, hz
/ IFNET_SLOWHZ
, if_slowtimo
, NULL
);
1114 * Map interface name to
1115 * interface structure pointer.
1118 ifunit(const char *name
)
1123 * Search all the interfaces for this name/number
1126 TAILQ_FOREACH(ifp
, &ifnet
, if_link
) {
1127 if (strncmp(ifp
->if_xname
, name
, IFNAMSIZ
) == 0)
1135 * Map interface name in a sockaddr_dl to
1136 * interface structure pointer.
1139 if_withname(struct sockaddr
*sa
)
1141 char ifname
[IFNAMSIZ
+1];
1142 struct sockaddr_dl
*sdl
= (struct sockaddr_dl
*)sa
;
1144 if ( (sa
->sa_family
!= AF_LINK
) || (sdl
->sdl_nlen
== 0) ||
1145 (sdl
->sdl_nlen
> IFNAMSIZ
) )
1149 * ifunit wants a null-terminated name. It may not be null-terminated
1150 * in the sockaddr. We don't want to change the caller's sockaddr,
1151 * and there might not be room to put the trailing null anyway, so we
1152 * make a local copy that we know we can null terminate safely.
1155 bcopy(sdl
->sdl_data
, ifname
, sdl
->sdl_nlen
);
1156 ifname
[sdl
->sdl_nlen
] = '\0';
1157 return ifunit(ifname
);
1165 ifioctl(struct socket
*so
, u_long cmd
, caddr_t data
, struct ucred
*cred
)
1173 size_t namelen
, onamelen
;
1174 char new_name
[IFNAMSIZ
];
1176 struct sockaddr_dl
*sdl
;
1182 return (ifconf(cmd
, data
, cred
));
1184 ifr
= (struct ifreq
*)data
;
1189 if ((error
= suser_cred(cred
, 0)) != 0)
1191 return ((cmd
== SIOCIFCREATE
) ?
1192 if_clone_create(ifr
->ifr_name
, sizeof(ifr
->ifr_name
)) :
1193 if_clone_destroy(ifr
->ifr_name
));
1195 case SIOCIFGCLONERS
:
1196 return (if_clone_list((struct if_clonereq
*)data
));
1199 ifp
= ifunit(ifr
->ifr_name
);
1205 ifr
->ifr_flags
= ifp
->if_flags
;
1206 ifr
->ifr_flagshigh
= ifp
->if_flags
>> 16;
1210 ifr
->ifr_reqcap
= ifp
->if_capabilities
;
1211 ifr
->ifr_curcap
= ifp
->if_capenable
;
1215 ifr
->ifr_metric
= ifp
->if_metric
;
1219 ifr
->ifr_mtu
= ifp
->if_mtu
;
1223 ifr
->ifr_phys
= ifp
->if_physical
;
1226 case SIOCGIFPOLLCPU
:
1227 #ifdef DEVICE_POLLING
1228 ifr
->ifr_pollcpu
= ifp
->if_poll_cpuid
;
1230 ifr
->ifr_pollcpu
= -1;
1234 case SIOCSIFPOLLCPU
:
1235 #ifdef DEVICE_POLLING
1236 if ((ifp
->if_flags
& IFF_POLLING
) == 0)
1237 ether_pollcpu_register(ifp
, ifr
->ifr_pollcpu
);
1242 error
= suser_cred(cred
, 0);
1245 new_flags
= (ifr
->ifr_flags
& 0xffff) |
1246 (ifr
->ifr_flagshigh
<< 16);
1247 if (ifp
->if_flags
& IFF_SMART
) {
1248 /* Smart drivers twiddle their own routes */
1249 } else if (ifp
->if_flags
& IFF_UP
&&
1250 (new_flags
& IFF_UP
) == 0) {
1254 } else if (new_flags
& IFF_UP
&&
1255 (ifp
->if_flags
& IFF_UP
) == 0) {
1261 #ifdef DEVICE_POLLING
1262 if ((new_flags
^ ifp
->if_flags
) & IFF_POLLING
) {
1263 if (new_flags
& IFF_POLLING
) {
1264 ether_poll_register(ifp
);
1266 ether_poll_deregister(ifp
);
1271 ifp
->if_flags
= (ifp
->if_flags
& IFF_CANTCHANGE
) |
1272 (new_flags
&~ IFF_CANTCHANGE
);
1273 if (new_flags
& IFF_PPROMISC
) {
1274 /* Permanently promiscuous mode requested */
1275 ifp
->if_flags
|= IFF_PROMISC
;
1276 } else if (ifp
->if_pcount
== 0) {
1277 ifp
->if_flags
&= ~IFF_PROMISC
;
1279 if (ifp
->if_ioctl
) {
1280 lwkt_serialize_enter(ifp
->if_serializer
);
1281 ifp
->if_ioctl(ifp
, cmd
, data
, cred
);
1282 lwkt_serialize_exit(ifp
->if_serializer
);
1284 getmicrotime(&ifp
->if_lastchange
);
1288 error
= suser_cred(cred
, 0);
1291 if (ifr
->ifr_reqcap
& ~ifp
->if_capabilities
)
1293 lwkt_serialize_enter(ifp
->if_serializer
);
1294 ifp
->if_ioctl(ifp
, cmd
, data
, cred
);
1295 lwkt_serialize_exit(ifp
->if_serializer
);
1299 error
= suser_cred(cred
, 0);
1302 error
= copyinstr(ifr
->ifr_data
, new_name
, IFNAMSIZ
, NULL
);
1305 if (new_name
[0] == '\0')
1307 if (ifunit(new_name
) != NULL
)
1310 EVENTHANDLER_INVOKE(ifnet_detach_event
, ifp
);
1312 /* Announce the departure of the interface. */
1313 rt_ifannouncemsg(ifp
, IFAN_DEPARTURE
);
1315 strlcpy(ifp
->if_xname
, new_name
, sizeof(ifp
->if_xname
));
1316 ifa
= TAILQ_FIRST(&ifp
->if_addrheads
[mycpuid
])->ifa
;
1317 /* XXX IFA_LOCK(ifa); */
1318 sdl
= (struct sockaddr_dl
*)ifa
->ifa_addr
;
1319 namelen
= strlen(new_name
);
1320 onamelen
= sdl
->sdl_nlen
;
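1322 * Move the address if needed. This is assumed to be safe because we
1323 * allocate space for a name of length IFNAMSIZ when we
1324 * create this in if_attach().
 * NOTE(review): if_attach() appears to size the sockaddr_dl from
 * strlen(if_xname) rather than IFNAMSIZ, so a longer new name may
 * not fit -- confirm before relying on this.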
1326 if (namelen
!= onamelen
) {
1327 bcopy(sdl
->sdl_data
+ onamelen
,
1328 sdl
->sdl_data
+ namelen
, sdl
->sdl_alen
);
1330 bcopy(new_name
, sdl
->sdl_data
, namelen
);
1331 sdl
->sdl_nlen
= namelen
;
1332 sdl
= (struct sockaddr_dl
*)ifa
->ifa_netmask
;
1333 bzero(sdl
->sdl_data
, onamelen
);
1334 while (namelen
!= 0)
1335 sdl
->sdl_data
[--namelen
] = 0xff;
1336 /* XXX IFA_UNLOCK(ifa) */
1338 EVENTHANDLER_INVOKE(ifnet_attach_event
, ifp
);
1340 /* Announce the return of the interface. */
1341 rt_ifannouncemsg(ifp
, IFAN_ARRIVAL
);
1345 error
= suser_cred(cred
, 0);
1348 ifp
->if_metric
= ifr
->ifr_metric
;
1349 getmicrotime(&ifp
->if_lastchange
);
1353 error
= suser_cred(cred
, 0);
1358 lwkt_serialize_enter(ifp
->if_serializer
);
1359 error
= ifp
->if_ioctl(ifp
, cmd
, data
, cred
);
1360 lwkt_serialize_exit(ifp
->if_serializer
);
1362 getmicrotime(&ifp
->if_lastchange
);
1367 u_long oldmtu
= ifp
->if_mtu
;
1369 error
= suser_cred(cred
, 0);
1372 if (ifp
->if_ioctl
== NULL
)
1373 return (EOPNOTSUPP
);
1374 if (ifr
->ifr_mtu
< IF_MINMTU
|| ifr
->ifr_mtu
> IF_MAXMTU
)
1376 lwkt_serialize_enter(ifp
->if_serializer
);
1377 error
= ifp
->if_ioctl(ifp
, cmd
, data
, cred
);
1378 lwkt_serialize_exit(ifp
->if_serializer
);
1380 getmicrotime(&ifp
->if_lastchange
);
1384 * If the link MTU changed, do network layer specific procedure.
1386 if (ifp
->if_mtu
!= oldmtu
) {
1396 error
= suser_cred(cred
, 0);
1400 /* Don't allow group membership on non-multicast interfaces. */
1401 if ((ifp
->if_flags
& IFF_MULTICAST
) == 0)
1404 /* Don't let users screw up protocols' entries. */
1405 if (ifr
->ifr_addr
.sa_family
!= AF_LINK
)
1408 if (cmd
== SIOCADDMULTI
) {
1409 struct ifmultiaddr
*ifma
;
1410 error
= if_addmulti(ifp
, &ifr
->ifr_addr
, &ifma
);
1412 error
= if_delmulti(ifp
, &ifr
->ifr_addr
);
1415 getmicrotime(&ifp
->if_lastchange
);
1418 case SIOCSIFPHYADDR
:
1419 case SIOCDIFPHYADDR
:
1421 case SIOCSIFPHYADDR_IN6
:
1423 case SIOCSLIFPHYADDR
:
1425 case SIOCSIFGENERIC
:
1426 error
= suser_cred(cred
, 0);
1429 if (ifp
->if_ioctl
== 0)
1430 return (EOPNOTSUPP
);
1431 lwkt_serialize_enter(ifp
->if_serializer
);
1432 error
= ifp
->if_ioctl(ifp
, cmd
, data
, cred
);
1433 lwkt_serialize_exit(ifp
->if_serializer
);
1435 getmicrotime(&ifp
->if_lastchange
);
1439 ifs
= (struct ifstat
*)data
;
1440 ifs
->ascii
[0] = '\0';
1442 case SIOCGIFPSRCADDR
:
1443 case SIOCGIFPDSTADDR
:
1444 case SIOCGLIFPHYADDR
:
1446 case SIOCGIFGENERIC
:
1447 if (ifp
->if_ioctl
== NULL
)
1448 return (EOPNOTSUPP
);
1449 lwkt_serialize_enter(ifp
->if_serializer
);
1450 error
= ifp
->if_ioctl(ifp
, cmd
, data
, cred
);
1451 lwkt_serialize_exit(ifp
->if_serializer
);
1455 error
= suser_cred(cred
, 0);
1458 return if_setlladdr(ifp
,
1459 ifr
->ifr_addr
.sa_data
, ifr
->ifr_addr
.sa_len
);
1462 oif_flags
= ifp
->if_flags
;
1463 if (so
->so_proto
== 0)
1464 return (EOPNOTSUPP
);
1466 error
= so_pru_control(so
, cmd
, data
, ifp
);
1473 case SIOCSIFDSTADDR
:
1475 case SIOCSIFBRDADDR
:
1476 case SIOCSIFNETMASK
:
1477 #if BYTE_ORDER != BIG_ENDIAN
1478 if (ifr
->ifr_addr
.sa_family
== 0 &&
1479 ifr
->ifr_addr
.sa_len
< 16) {
1480 ifr
->ifr_addr
.sa_family
= ifr
->ifr_addr
.sa_len
;
1481 ifr
->ifr_addr
.sa_len
= 16;
1484 if (ifr
->ifr_addr
.sa_len
== 0)
1485 ifr
->ifr_addr
.sa_len
= 16;
1493 case OSIOCGIFDSTADDR
:
1494 cmd
= SIOCGIFDSTADDR
;
1497 case OSIOCGIFBRDADDR
:
1498 cmd
= SIOCGIFBRDADDR
;
1501 case OSIOCGIFNETMASK
:
1502 cmd
= SIOCGIFNETMASK
;
1504 error
= so_pru_control(so
, cmd
, data
, ifp
);
1508 case OSIOCGIFDSTADDR
:
1509 case OSIOCGIFBRDADDR
:
1510 case OSIOCGIFNETMASK
:
1511 *(u_short
*)&ifr
->ifr_addr
= ifr
->ifr_addr
.sa_family
;
1515 #endif /* COMPAT_43 */
1517 if ((oif_flags
^ ifp
->if_flags
) & IFF_UP
) {
1519 DELAY(100);/* XXX: temporary workaround for fxp issue*/
1520 if (ifp
->if_flags
& IFF_UP
) {
1534 * Set/clear promiscuous mode on interface ifp based on the truth value
1535 * of pswitch. The calls are reference counted so that only the first
1536 * "on" request actually has an effect, as does the final "off" request.
1537 * Results are undefined if the "off" and "on" requests are not matched.
1540 ifpromisc(struct ifnet
*ifp
, int pswitch
)
1546 oldflags
= ifp
->if_flags
;
1547 if (ifp
->if_flags
& IFF_PPROMISC
) {
1548 /* Do nothing if device is in permanently promiscuous mode */
1549 ifp
->if_pcount
+= pswitch
? 1 : -1;
1554 * If the device is not configured up, we cannot put it in
1557 if ((ifp
->if_flags
& IFF_UP
) == 0)
1559 if (ifp
->if_pcount
++ != 0)
1561 ifp
->if_flags
|= IFF_PROMISC
;
1562 log(LOG_INFO
, "%s: promiscuous mode enabled\n",
1565 if (--ifp
->if_pcount
> 0)
1567 ifp
->if_flags
&= ~IFF_PROMISC
;
1568 log(LOG_INFO
, "%s: promiscuous mode disabled\n",
1571 ifr
.ifr_flags
= ifp
->if_flags
;
1572 ifr
.ifr_flagshigh
= ifp
->if_flags
>> 16;
1573 lwkt_serialize_enter(ifp
->if_serializer
);
1574 error
= ifp
->if_ioctl(ifp
, SIOCSIFFLAGS
, (caddr_t
)&ifr
,
1575 (struct ucred
*)NULL
);
1576 lwkt_serialize_exit(ifp
->if_serializer
);
1580 ifp
->if_flags
= oldflags
;
1585 * Return interface configuration
1586 * of system. List may be used
1587 * in later ioctl's (above) to get
1588 * other information.
1591 ifconf(u_long cmd
, caddr_t data
, struct ucred
*cred
)
1593 struct ifconf
*ifc
= (struct ifconf
*)data
;
1595 struct sockaddr
*sa
;
1596 struct ifreq ifr
, *ifrp
;
1597 int space
= ifc
->ifc_len
, error
= 0;
1599 ifrp
= ifc
->ifc_req
;
1600 TAILQ_FOREACH(ifp
, &ifnet
, if_link
) {
1601 struct ifaddr_container
*ifac
;
1604 if (space
<= sizeof ifr
)
1608 * Zero the stack declared structure first to prevent
1609 * memory disclosure.
1611 bzero(&ifr
, sizeof(ifr
));
1612 if (strlcpy(ifr
.ifr_name
, ifp
->if_xname
, sizeof(ifr
.ifr_name
))
1613 >= sizeof(ifr
.ifr_name
)) {
1614 error
= ENAMETOOLONG
;
1619 TAILQ_FOREACH(ifac
, &ifp
->if_addrheads
[mycpuid
], ifa_link
) {
1620 struct ifaddr
*ifa
= ifac
->ifa
;
1622 if (space
<= sizeof ifr
)
1625 if (cred
->cr_prison
&&
1626 prison_if(cred
, sa
))
1630 if (cmd
== OSIOCGIFCONF
) {
1631 struct osockaddr
*osa
=
1632 (struct osockaddr
*)&ifr
.ifr_addr
;
1634 osa
->sa_family
= sa
->sa_family
;
1635 error
= copyout(&ifr
, ifrp
, sizeof ifr
);
1639 if (sa
->sa_len
<= sizeof(*sa
)) {
1641 error
= copyout(&ifr
, ifrp
, sizeof ifr
);
1644 if (space
< (sizeof ifr
) + sa
->sa_len
-
1647 space
-= sa
->sa_len
- sizeof(*sa
);
1648 error
= copyout(&ifr
, ifrp
,
1649 sizeof ifr
.ifr_name
);
1651 error
= copyout(sa
, &ifrp
->ifr_addr
,
1653 ifrp
= (struct ifreq
*)
1654 (sa
->sa_len
+ (caddr_t
)&ifrp
->ifr_addr
);
1658 space
-= sizeof ifr
;
1663 bzero(&ifr
.ifr_addr
, sizeof ifr
.ifr_addr
);
1664 error
= copyout(&ifr
, ifrp
, sizeof ifr
);
1667 space
-= sizeof ifr
;
1671 ifc
->ifc_len
-= space
;
1676 * Just like if_promisc(), but for all-multicast-reception mode.
1679 if_allmulti(struct ifnet
*ifp
, int onswitch
)
1687 if (ifp
->if_amcount
++ == 0) {
1688 ifp
->if_flags
|= IFF_ALLMULTI
;
1689 ifr
.ifr_flags
= ifp
->if_flags
;
1690 ifr
.ifr_flagshigh
= ifp
->if_flags
>> 16;
1691 lwkt_serialize_enter(ifp
->if_serializer
);
1692 error
= ifp
->if_ioctl(ifp
, SIOCSIFFLAGS
, (caddr_t
)&ifr
,
1693 (struct ucred
*)NULL
);
1694 lwkt_serialize_exit(ifp
->if_serializer
);
1697 if (ifp
->if_amcount
> 1) {
1700 ifp
->if_amcount
= 0;
1701 ifp
->if_flags
&= ~IFF_ALLMULTI
;
1702 ifr
.ifr_flags
= ifp
->if_flags
;
1703 ifr
.ifr_flagshigh
= ifp
->if_flags
>> 16;
1704 lwkt_serialize_enter(ifp
->if_serializer
);
1705 error
= ifp
->if_ioctl(ifp
, SIOCSIFFLAGS
, (caddr_t
)&ifr
,
1706 (struct ucred
*)NULL
);
1707 lwkt_serialize_exit(ifp
->if_serializer
);
1719 * Add a multicast listenership to the interface in question.
1720 * The link layer provides a routine which converts
1724 struct ifnet
*ifp
, /* interface to manipulate */
1725 struct sockaddr
*sa
, /* address to add */
1726 struct ifmultiaddr
**retifma
)
1728 struct sockaddr
*llsa
, *dupsa
;
1730 struct ifmultiaddr
*ifma
;
1733 * If the matching multicast address already exists
1734 * then don't add a new one, just add a reference
1736 LIST_FOREACH(ifma
, &ifp
->if_multiaddrs
, ifma_link
) {
1737 if (sa_equal(sa
, ifma
->ifma_addr
)) {
1738 ifma
->ifma_refcount
++;
1746 * Give the link layer a chance to accept/reject it, and also
1747 * find out which AF_LINK address this maps to, if it isn't one
1750 if (ifp
->if_resolvemulti
) {
1751 lwkt_serialize_enter(ifp
->if_serializer
);
1752 error
= ifp
->if_resolvemulti(ifp
, &llsa
, sa
);
1753 lwkt_serialize_exit(ifp
->if_serializer
);
1760 MALLOC(ifma
, struct ifmultiaddr
*, sizeof *ifma
, M_IFMADDR
, M_WAITOK
);
1761 MALLOC(dupsa
, struct sockaddr
*, sa
->sa_len
, M_IFMADDR
, M_WAITOK
);
1762 bcopy(sa
, dupsa
, sa
->sa_len
);
1764 ifma
->ifma_addr
= dupsa
;
1765 ifma
->ifma_lladdr
= llsa
;
1766 ifma
->ifma_ifp
= ifp
;
1767 ifma
->ifma_refcount
= 1;
1768 ifma
->ifma_protospec
= 0;
1769 rt_newmaddrmsg(RTM_NEWMADDR
, ifma
);
1772 * Some network interfaces can scan the address list at
1773 * interrupt time; lock them out.
1776 LIST_INSERT_HEAD(&ifp
->if_multiaddrs
, ifma
, ifma_link
);
1781 LIST_FOREACH(ifma
, &ifp
->if_multiaddrs
, ifma_link
) {
1782 if (sa_equal(ifma
->ifma_addr
, llsa
))
1786 ifma
->ifma_refcount
++;
1788 MALLOC(ifma
, struct ifmultiaddr
*, sizeof *ifma
,
1789 M_IFMADDR
, M_WAITOK
);
1790 MALLOC(dupsa
, struct sockaddr
*, llsa
->sa_len
,
1791 M_IFMADDR
, M_WAITOK
);
1792 bcopy(llsa
, dupsa
, llsa
->sa_len
);
1793 ifma
->ifma_addr
= dupsa
;
1794 ifma
->ifma_ifp
= ifp
;
1795 ifma
->ifma_refcount
= 1;
1797 LIST_INSERT_HEAD(&ifp
->if_multiaddrs
, ifma
, ifma_link
);
1802 * We are certain we have added something, so call down to the
1803 * interface to let them know about it.
1806 lwkt_serialize_enter(ifp
->if_serializer
);
1807 ifp
->if_ioctl(ifp
, SIOCADDMULTI
, 0, (struct ucred
*)NULL
);
1808 lwkt_serialize_exit(ifp
->if_serializer
);
1815 * Remove a reference to a multicast address on this interface. Yell
1816 * if the request does not match an existing membership.
1819 if_delmulti(struct ifnet
*ifp
, struct sockaddr
*sa
)
1821 struct ifmultiaddr
*ifma
;
1823 LIST_FOREACH(ifma
, &ifp
->if_multiaddrs
, ifma_link
)
1824 if (sa_equal(sa
, ifma
->ifma_addr
))
1829 if (ifma
->ifma_refcount
> 1) {
1830 ifma
->ifma_refcount
--;
1834 rt_newmaddrmsg(RTM_DELMADDR
, ifma
);
1835 sa
= ifma
->ifma_lladdr
;
1837 LIST_REMOVE(ifma
, ifma_link
);
1839 * Make sure the interface driver is notified
1840 * in the case of a link layer mcast group being left.
1842 if (ifma
->ifma_addr
->sa_family
== AF_LINK
&& sa
== 0) {
1843 lwkt_serialize_enter(ifp
->if_serializer
);
1844 ifp
->if_ioctl(ifp
, SIOCDELMULTI
, 0, (struct ucred
*)NULL
);
1845 lwkt_serialize_exit(ifp
->if_serializer
);
1848 kfree(ifma
->ifma_addr
, M_IFMADDR
);
1849 kfree(ifma
, M_IFMADDR
);
1854 * Now look for the link-layer address which corresponds to
1855 * this network address. It had been squirreled away in
1856 * ifma->ifma_lladdr for this purpose (so we don't have
1857 * to call ifp->if_resolvemulti() again), and we saved that
1858 * value in sa above. If some nasty deleted the
1859 * link-layer address out from underneath us, we can deal because
1860 * the address we stored was is not the same as the one which was
1861 * in the record for the link-layer address. (So we don't complain
1864 LIST_FOREACH(ifma
, &ifp
->if_multiaddrs
, ifma_link
)
1865 if (sa_equal(sa
, ifma
->ifma_addr
))
1870 if (ifma
->ifma_refcount
> 1) {
1871 ifma
->ifma_refcount
--;
1876 lwkt_serialize_enter(ifp
->if_serializer
);
1877 LIST_REMOVE(ifma
, ifma_link
);
1878 ifp
->if_ioctl(ifp
, SIOCDELMULTI
, 0, (struct ucred
*)NULL
);
1879 lwkt_serialize_exit(ifp
->if_serializer
);
1881 kfree(ifma
->ifma_addr
, M_IFMADDR
);
1882 kfree(sa
, M_IFMADDR
);
1883 kfree(ifma
, M_IFMADDR
);
/*
 * if_setlladdr: replace the link-layer address of ifp with the len
 * bytes at lladdr.
 *
 * Visible behavior: the interface's link-level sockaddr_dl is fetched
 * with IF_LLSOCKADDR(); len is compared against its sdl_alen; for the
 * IFT_ETHER case the bytes are copied both into the arpcom's ac_enaddr
 * and into LLADDR(sdl).  Then, with the interface serializer held, an
 * interface that is IFF_UP is cycled down and up again through two
 * SIOCSIFFLAGS calls, and arp_ifinit() is invoked for each AF_INET
 * address on this CPU's address list.
 *
 * NOTE(review): the return statements and any further case labels are
 * not present in this listing; confirm the error values against the
 * complete file.
 */
1889 * Set the link layer address on an interface.
1891 * At this time we only support certain types of interfaces,
1892 * and we don't allow the length of the address to change.
1895 if_setlladdr(struct ifnet
*ifp
, const u_char
*lladdr
, int len
)
1897 struct sockaddr_dl
*sdl
;
1900 sdl
= IF_LLSOCKADDR(ifp
);
1903 if (len
!= sdl
->sdl_alen
) /* don't allow length to change */
1905 switch (ifp
->if_type
) {
1906 case IFT_ETHER
: /* these types use struct arpcom */
1909 bcopy(lladdr
, ((struct arpcom
*)ifp
->if_softc
)->ac_enaddr
, len
);
1910 bcopy(lladdr
, LLADDR(sdl
), len
);
1916 * If the interface is already up, we need
1917 * to re-init it in order to reprogram its
1920 lwkt_serialize_enter(ifp
->if_serializer
);
1921 if ((ifp
->if_flags
& IFF_UP
) != 0) {
1922 struct ifaddr_container
*ifac
;
1924 ifp
->if_flags
&= ~IFF_UP
;
1925 ifr
.ifr_flags
= ifp
->if_flags
;
1926 ifr
.ifr_flagshigh
= ifp
->if_flags
>> 16;
1927 ifp
->if_ioctl(ifp
, SIOCSIFFLAGS
, (caddr_t
)&ifr
,
1928 (struct ucred
*)NULL
);
1929 ifp
->if_flags
|= IFF_UP
;
1930 ifr
.ifr_flags
= ifp
->if_flags
;
1931 ifr
.ifr_flagshigh
= ifp
->if_flags
>> 16;
1932 ifp
->if_ioctl(ifp
, SIOCSIFFLAGS
, (caddr_t
)&ifr
,
1933 (struct ucred
*)NULL
);
1936 * Also send gratuitous ARPs to notify other nodes about
1937 * the address change.
1939 TAILQ_FOREACH(ifac
, &ifp
->if_addrheads
[mycpuid
], ifa_link
) {
1940 struct ifaddr
*ifa
= ifac
->ifa
;
1942 if (ifa
->ifa_addr
!= NULL
&&
1943 ifa
->ifa_addr
->sa_family
== AF_INET
)
1944 arp_ifinit(ifp
, ifa
);
1948 lwkt_serialize_exit(ifp
->if_serializer
);
1952 struct ifmultiaddr
*
1953 ifmaof_ifpforaddr(struct sockaddr
*sa
, struct ifnet
*ifp
)
1955 struct ifmultiaddr
*ifma
;
1957 LIST_FOREACH(ifma
, &ifp
->if_multiaddrs
, ifma_link
)
1958 if (sa_equal(ifma
->ifma_addr
, sa
))
1965 * This function locates the first real ethernet MAC from a network
1966 * card and loads it into node, returning 0 on success or ENOENT if
1967 * no suitable interfaces were found. It is used by the uuid code to
1968 * generate a unique 6-byte number.
1971 if_getanyethermac(uint16_t *node
, int minlen
)
1974 struct sockaddr_dl
*sdl
;
1976 TAILQ_FOREACH(ifp
, &ifnet
, if_link
) {
1977 if (ifp
->if_type
!= IFT_ETHER
)
1979 sdl
= IF_LLSOCKADDR(ifp
);
1980 if (sdl
->sdl_alen
< minlen
)
1982 bcopy(((struct arpcom
*)ifp
->if_softc
)->ac_enaddr
, node
,
1990 * The name argument must be a pointer to storage which will last as
1991 * long as the interface does. For physical devices, the result of
1992 * device_get_name(dev) is a good choice and for pseudo-devices a
1993 * static string works well.
1996 if_initname(struct ifnet
*ifp
, const char *name
, int unit
)
1998 ifp
->if_dname
= name
;
1999 ifp
->if_dunit
= unit
;
2000 if (unit
!= IF_DUNIT_NONE
)
2001 ksnprintf(ifp
->if_xname
, IFNAMSIZ
, "%s%d", name
, unit
);
2003 strlcpy(ifp
->if_xname
, name
, IFNAMSIZ
);
2007 if_printf(struct ifnet
*ifp
, const char *fmt
, ...)
2012 retval
= kprintf("%s: ", ifp
->if_xname
);
2013 __va_start(ap
, fmt
);
2014 retval
+= kvprintf(fmt
, ap
);
2020 ifq_set_classic(struct ifaltq
*ifq
)
2022 ifq
->altq_enqueue
= ifq_classic_enqueue
;
2023 ifq
->altq_dequeue
= ifq_classic_dequeue
;
2024 ifq
->altq_request
= ifq_classic_request
;
/*
 * ifq_classic_enqueue: enqueue handler installed by ifq_set_classic().
 * Logs the enqueue and then branches on IF_QFULL(ifq); the packet
 * attribute argument pa is unused.
 *
 * NOTE(review): the bodies of the full / not-full branches are not
 * present in this listing; confirm what happens to m in each case.
 */
2028 ifq_classic_enqueue(struct ifaltq
*ifq
, struct mbuf
*m
,
2029 struct altq_pktattr
*pa __unused
)
2031 logifq(enqueue
, ifq
);
2032 if (IF_QFULL(ifq
)) {
/*
 * ifq_classic_dequeue: dequeue handler installed by ifq_set_classic().
 * op selects the operation; an unsupported op panics.  After the
 * operation the result m must equal mpolled whenever the caller passed
 * a non-NULL mpolled (enforced with KKASSERT).
 *
 * NOTE(review): the individual op cases are not present in this
 * listing; presumably one of them performs the logged dequeue.
 */
2042 ifq_classic_dequeue(struct ifaltq
*ifq
, struct mbuf
*mpolled
, int op
)
2051 logifq(dequeue
, ifq
);
2055 panic("unsupported ALTQ dequeue op: %d", op
);
2057 KKASSERT(mpolled
== NULL
|| mpolled
== m
);
/*
 * ifq_classic_request: request handler installed by ifq_set_classic().
 * A request code that is not handled panics.
 *
 * NOTE(review): the supported request cases are not present in this
 * listing.
 */
2062 ifq_classic_request(struct ifaltq
*ifq
, int req
, void *arg
)
2069 panic("unsupported ALTQ request: %d", req
);
/*
 * ifq_dispatch: queue packet m (with packet attributes pa) on ifp's
 * send queue and make sure the interface's start routine gets run.
 *
 * Must be called without the interface serializer held (asserted).
 * Visible flow:
 *  - the packet is enqueued with ifq_enqueue_locked();
 *  - if altq_started was clear it is set, which the comments below
 *    describe as holding the interlock of ifnet.if_start;
 *  - if_obytes is charged with the packet length, and M_MCAST packets
 *    are tested for separately;
 *  - with ifq_dispatch_schedonly set, if_start is always scheduled on
 *    the interface's CPU;
 *  - otherwise the serializer is tried: on contention if_start is
 *    scheduled instead, on success the IFF_OACTIVE / IFF_RUNNING flags
 *    are examined and the serializer is released;
 *  - finally if_start is scheduled again when ifq_dispatch_schednochk
 *    is set or if_start_need_schedule() says more data is pending.
 *
 * NOTE(review): the queue lock/unlock calls, the direct start call and
 * the return statements are not present in this listing; confirm them
 * against the complete file before relying on ordering details.
 */
2075 ifq_dispatch(struct ifnet
*ifp
, struct mbuf
*m
, struct altq_pktattr
*pa
)
2077 struct ifaltq
*ifq
= &ifp
->if_snd
;
2078 int running
= 0, error
, start
= 0;
2080 ASSERT_NOT_SERIALIZED(ifp
->if_serializer
);
2083 error
= ifq_enqueue_locked(ifq
, m
, pa
);
2088 if (!ifq
->altq_started
) {
2090 * Hold the interlock of ifnet.if_start
2092 ifq
->altq_started
= 1;
2097 ifp
->if_obytes
+= m
->m_pkthdr
.len
;
2098 if (m
->m_flags
& M_MCAST
)
2102 logifstart(avoid
, ifp
);
2106 if (ifq_dispatch_schedonly
) {
2108 * Always schedule ifnet.if_start on ifnet's CPU,
2109 * short circuit the rest of this function.
2111 logifstart(sched
, ifp
);
2112 if_start_schedule(ifp
);
2117 * Try to do direct ifnet.if_start first, if there is
2118 * contention on ifnet's serializer, ifnet.if_start will
2119 * be scheduled on ifnet's CPU.
2121 if (!lwkt_serialize_try(ifp
->if_serializer
)) {
2123 * ifnet serializer contention happened,
2124 * ifnet.if_start is scheduled on ifnet's
2125 * CPU, and we keep going.
2127 logifstart(contend_sched
, ifp
);
2128 if_start_schedule(ifp
);
2132 if ((ifp
->if_flags
& IFF_OACTIVE
) == 0) {
2133 logifstart(run
, ifp
);
2135 if ((ifp
->if_flags
&
2136 (IFF_OACTIVE
| IFF_RUNNING
)) == IFF_RUNNING
)
2140 lwkt_serialize_exit(ifp
->if_serializer
);
2142 if (ifq_dispatch_schednochk
|| if_start_need_schedule(ifq
, running
)) {
2144 * More data need to be transmitted, ifnet.if_start is
2145 * scheduled on ifnet's CPU, and we keep going.
2146 * NOTE: ifnet.if_start interlock is not released.
2148 logifstart(sched
, ifp
);
2149 if_start_schedule(ifp
);
2155 ifa_forwardmsg(struct lwkt_msg
*lmsg
, int next_cpu
)
2157 if (next_cpu
< ncpus
)
2158 lwkt_forwardmsg(ifa_portfn(next_cpu
), lmsg
);
2160 lwkt_replymsg(lmsg
, 0);
/*
 * ifa_domsg: hand lmsg to the ifaddr port of CPU 0 with lwkt_domsg().
 * The dispatch handlers in this file pass the message along to the
 * following CPUs with ifa_forwardmsg().
 */
2164 ifa_domsg(struct lwkt_msg
*lmsg
)
2166 lwkt_domsg(ifa_portfn(0), lmsg
, 0);
/*
 * ifa_create: allocate a zeroed ifaddr of size bytes (asserted to be at
 * least sizeof(struct ifaddr)) with the caller's malloc flags, plus an
 * array of ncpus ifaddr containers.  ifa_cpumask starts out as
 * smp_active_mask, and each container is stamped with
 * IFA_CONTAINER_MAGIC and given a reference count of 1.
 *
 * NOTE(review): the handling of a failed first allocation, the return
 * statement and the guard around the debug kprintf are not present in
 * this listing.
 */
2170 ifa_create(int size
, int flags
)
2175 KASSERT(size
>= sizeof(*ifa
), ("ifaddr size too small\n"));
2177 ifa
= kmalloc(size
, M_IFADDR
, flags
| M_ZERO
);
2181 ifa
->ifa_containers
= kmalloc(ncpus
* sizeof(struct ifaddr_container
),
2182 M_IFADDR
, M_WAITOK
| M_ZERO
);
2183 ifa
->ifa_cpumask
= smp_active_mask
;
2184 for (i
= 0; i
< ncpus
; ++i
) {
2185 struct ifaddr_container
*ifac
= &ifa
->ifa_containers
[i
];
2187 ifac
->ifa_magic
= IFA_CONTAINER_MAGIC
;
2189 ifac
->ifa_refcnt
= 1;
2192 kprintf("alloc ifa %p %d\n", ifa
, size
);
/*
 * Argument block passed from ifac_free() to ifac_free_dispatch() via
 * the message's u.ms_resultp.  The code in this file accesses its
 * members ifa and cpuid.
 */
2197 struct ifac_free_arg
{
/*
 * ifac_free_dispatch: message handler behind ifac_free().
 * Clears bit arg->cpuid in the ifaddr's ifa_cpumask; once the mask is
 * empty the container array and the ifaddr itself are freed.  The
 * message is then replied to with result 0.
 */
2203 ifac_free_dispatch(struct netmsg
*nmsg
)
2205 struct lwkt_msg
*msg
= &nmsg
->nm_lmsg
;
2206 struct ifac_free_arg
*arg
= msg
->u
.ms_resultp
;
2207 struct ifaddr
*ifa
= arg
->ifa
;
2209 ifa
->ifa_cpumask
&= ~(1 << arg
->cpuid
);
2210 if (ifa
->ifa_cpumask
== 0) {
2212 kprintf("free ifa %p\n", ifa
);
2214 kfree(ifa
->ifa_containers
, M_IFADDR
);
2215 kfree(ifa
, M_IFADDR
);
2217 lwkt_replymsg(msg
, 0);
/*
 * ifac_free: retire one per-CPU ifaddr container.
 * The container must still carry IFA_CONTAINER_MAGIC, have a reference
 * count of 0 and be on no list (all asserted).  It is marked
 * IFA_CONTAINER_DEAD, and a message handled by ifac_free_dispatch() is
 * prepared with a zeroed ifac_free_arg that names the owning ifaddr.
 *
 * NOTE(review): the assignment of arg.cpuid (presumably from cpu_id)
 * and the call that sends the message are not present in this listing.
 */
2221 ifac_free(struct ifaddr_container
*ifac
, int cpu_id
)
2223 struct ifac_free_arg arg
;
2225 struct lwkt_msg
*msg
;
2227 KKASSERT(ifac
->ifa_magic
== IFA_CONTAINER_MAGIC
);
2228 KKASSERT(ifac
->ifa_refcnt
== 0);
2229 KASSERT(ifac
->ifa_listmask
== 0,
2230 ("ifa is still on %#x lists\n", ifac
->ifa_listmask
));
2232 ifac
->ifa_magic
= IFA_CONTAINER_DEAD
;
2234 bzero(&arg
, sizeof(arg
));
2235 arg
.ifa
= ifac
->ifa
;
2237 #ifdef IFADDR_DEBUG_VERBOSE
2238 kprintf("try free ifa %p cpu_id %d\n", ifac
->ifa
, arg
.cpuid
);
2241 netmsg_init(&nmsg
, &curthread
->td_msgport
, 0, ifac_free_dispatch
);
2242 msg
= &nmsg
.nm_lmsg
;
2243 msg
->u
.ms_resultp
= &arg
;
/*
 * ifa_iflink_dispatch: per-CPU step of ifa_iflink().
 * Takes the ifaddr's container for index cpu, checks that it is valid
 * and not yet on an if_addrheads list, marks it with
 * IFA_LIST_IFADDRHEAD and links it onto ifp->if_addrheads[cpu] (at the
 * tail or at the head), then forwards the message to cpu + 1.
 *
 * NOTE(review): the definition of cpu and the condition choosing tail
 * versus head insertion are not present in this listing.
 */
2249 ifa_iflink_dispatch(struct netmsg
*nmsg
)
2251 struct netmsg_ifaddr
*msg
= (struct netmsg_ifaddr
*)nmsg
;
2252 struct ifaddr
*ifa
= msg
->ifa
;
2253 struct ifnet
*ifp
= msg
->ifp
;
2255 struct ifaddr_container
*ifac
;
2259 ifac
= &ifa
->ifa_containers
[cpu
];
2260 ASSERT_IFAC_VALID(ifac
);
2261 KASSERT((ifac
->ifa_listmask
& IFA_LIST_IFADDRHEAD
) == 0,
2262 ("ifaddr is on if_addrheads\n"));
2264 ifac
->ifa_listmask
|= IFA_LIST_IFADDRHEAD
;
2266 TAILQ_INSERT_TAIL(&ifp
->if_addrheads
[cpu
], ifac
, ifa_link
);
2268 TAILQ_INSERT_HEAD(&ifp
->if_addrheads
[cpu
], ifac
, ifa_link
);
2272 ifa_forwardmsg(&nmsg
->nm_lmsg
, cpu
+ 1);
/*
 * ifa_iflink: link ifa onto ifp's per-CPU address lists by running
 * ifa_iflink_dispatch() through ifa_domsg().
 *
 * NOTE(review): the lines that fill in the message fields (presumably
 * ifa, ifp and tail) are not present in this listing.
 */
2276 ifa_iflink(struct ifaddr
*ifa
, struct ifnet
*ifp
, int tail
)
2278 struct netmsg_ifaddr msg
;
2280 netmsg_init(&msg
.netmsg
, &curthread
->td_msgport
, 0,
2281 ifa_iflink_dispatch
);
2286 ifa_domsg(&msg
.netmsg
.nm_lmsg
);
/*
 * ifa_ifunlink_dispatch: per-CPU step of ifa_ifunlink().
 * Takes the ifaddr's container for index cpu, checks that it is valid
 * and currently marked IFA_LIST_IFADDRHEAD, removes it from
 * ifp->if_addrheads[cpu], clears the mark and forwards the message to
 * cpu + 1.
 *
 * NOTE(review): the definition of cpu is not present in this listing.
 */
2290 ifa_ifunlink_dispatch(struct netmsg
*nmsg
)
2292 struct netmsg_ifaddr
*msg
= (struct netmsg_ifaddr
*)nmsg
;
2293 struct ifaddr
*ifa
= msg
->ifa
;
2294 struct ifnet
*ifp
= msg
->ifp
;
2296 struct ifaddr_container
*ifac
;
2300 ifac
= &ifa
->ifa_containers
[cpu
];
2301 ASSERT_IFAC_VALID(ifac
);
2302 KASSERT(ifac
->ifa_listmask
& IFA_LIST_IFADDRHEAD
,
2303 ("ifaddr is not on if_addrhead\n"));
2305 TAILQ_REMOVE(&ifp
->if_addrheads
[cpu
], ifac
, ifa_link
);
2306 ifac
->ifa_listmask
&= ~IFA_LIST_IFADDRHEAD
;
2310 ifa_forwardmsg(&nmsg
->nm_lmsg
, cpu
+ 1);
/*
 * ifa_ifunlink: unlink ifa from ifp's per-CPU address lists by running
 * ifa_ifunlink_dispatch() through ifa_domsg().
 *
 * NOTE(review): the lines that fill in the message fields (presumably
 * ifa and ifp) are not present in this listing.
 */
2314 ifa_ifunlink(struct ifaddr
*ifa
, struct ifnet
*ifp
)
2316 struct netmsg_ifaddr msg
;
2318 netmsg_init(&msg
.netmsg
, &curthread
->td_msgport
, 0,
2319 ifa_ifunlink_dispatch
);
2323 ifa_domsg(&msg
.netmsg
.nm_lmsg
);
/*
 * ifa_destroy_dispatch: per-CPU step of ifa_destroy(); after its work
 * on the current CPU it forwards the message to mycpuid + 1.
 *
 * NOTE(review): the statement that acts on the ifaddr carried by msg
 * is not present in this listing.
 */
2327 ifa_destroy_dispatch(struct netmsg
*nmsg
)
2329 struct netmsg_ifaddr
*msg
= (struct netmsg_ifaddr
*)nmsg
;
2332 ifa_forwardmsg(&nmsg
->nm_lmsg
, mycpuid
+ 1);
/*
 * ifa_destroy: run ifa_destroy_dispatch() for ifa through ifa_domsg().
 *
 * NOTE(review): the line that stores ifa in the message is not present
 * in this listing.
 */
2336 ifa_destroy(struct ifaddr
*ifa
)
2338 struct netmsg_ifaddr msg
;
2340 netmsg_init(&msg
.netmsg
, &curthread
->td_msgport
, 0,
2341 ifa_destroy_dispatch
);
2344 ifa_domsg(&msg
.netmsg
.nm_lmsg
);
2348 ifnet_portfn(int cpu
)
2350 return &ifnet_threads
[cpu
].td_msgport
;
2354 ifnetinit(void *dummy __unused
)
2358 for (i
= 0; i
< ncpus
; ++i
) {
2359 struct thread
*thr
= &ifnet_threads
[i
];
2361 lwkt_create(netmsg_service_loop_mpsafe
, NULL
, NULL
, thr
, 0, i
,
2363 netmsg_service_port_init(&thr
->td_msgport
);