tcp: dont drop MTU reduction indications
[linux-2.6/btrfs-unstable.git] / net / ipv4 / inet_diag.c
blob570e61f9611fe9f62bf3513afc9a5abb365544b7
1 /*
2 * inet_diag.c Module for monitoring INET transport protocols sockets.
4 * Authors: Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version
9 * 2 of the License, or (at your option) any later version.
12 #include <linux/kernel.h>
13 #include <linux/module.h>
14 #include <linux/types.h>
15 #include <linux/fcntl.h>
16 #include <linux/random.h>
17 #include <linux/slab.h>
18 #include <linux/cache.h>
19 #include <linux/init.h>
20 #include <linux/time.h>
22 #include <net/icmp.h>
23 #include <net/tcp.h>
24 #include <net/ipv6.h>
25 #include <net/inet_common.h>
26 #include <net/inet_connection_sock.h>
27 #include <net/inet_hashtables.h>
28 #include <net/inet_timewait_sock.h>
29 #include <net/inet6_hashtables.h>
30 #include <net/netlink.h>
32 #include <linux/inet.h>
33 #include <linux/stddef.h>
35 #include <linux/inet_diag.h>
36 #include <linux/sock_diag.h>
38 static const struct inet_diag_handler **inet_diag_table;
40 struct inet_diag_entry {
41 __be32 *saddr;
42 __be32 *daddr;
43 u16 sport;
44 u16 dport;
45 u16 family;
46 u16 userlocks;
49 static DEFINE_MUTEX(inet_diag_table_mutex);
51 static const struct inet_diag_handler *inet_diag_lock_handler(int proto)
53 if (!inet_diag_table[proto])
54 request_module("net-pf-%d-proto-%d-type-%d-%d", PF_NETLINK,
55 NETLINK_SOCK_DIAG, AF_INET, proto);
57 mutex_lock(&inet_diag_table_mutex);
58 if (!inet_diag_table[proto])
59 return ERR_PTR(-ENOENT);
61 return inet_diag_table[proto];
64 static inline void inet_diag_unlock_handler(
65 const struct inet_diag_handler *handler)
67 mutex_unlock(&inet_diag_table_mutex);
70 int inet_sk_diag_fill(struct sock *sk, struct inet_connection_sock *icsk,
71 struct sk_buff *skb, struct inet_diag_req_v2 *req,
72 u32 pid, u32 seq, u16 nlmsg_flags,
73 const struct nlmsghdr *unlh)
75 const struct inet_sock *inet = inet_sk(sk);
76 struct inet_diag_msg *r;
77 struct nlmsghdr *nlh;
78 struct nlattr *attr;
79 void *info = NULL;
80 const struct inet_diag_handler *handler;
81 int ext = req->idiag_ext;
83 handler = inet_diag_table[req->sdiag_protocol];
84 BUG_ON(handler == NULL);
86 nlh = nlmsg_put(skb, pid, seq, unlh->nlmsg_type, sizeof(*r),
87 nlmsg_flags);
88 if (!nlh)
89 return -EMSGSIZE;
91 r = nlmsg_data(nlh);
92 BUG_ON(sk->sk_state == TCP_TIME_WAIT);
94 r->idiag_family = sk->sk_family;
95 r->idiag_state = sk->sk_state;
96 r->idiag_timer = 0;
97 r->idiag_retrans = 0;
99 r->id.idiag_if = sk->sk_bound_dev_if;
100 sock_diag_save_cookie(sk, r->id.idiag_cookie);
102 r->id.idiag_sport = inet->inet_sport;
103 r->id.idiag_dport = inet->inet_dport;
104 r->id.idiag_src[0] = inet->inet_rcv_saddr;
105 r->id.idiag_dst[0] = inet->inet_daddr;
107 /* IPv6 dual-stack sockets use inet->tos for IPv4 connections,
108 * hence this needs to be included regardless of socket family.
110 if (ext & (1 << (INET_DIAG_TOS - 1)))
111 if (nla_put_u8(skb, INET_DIAG_TOS, inet->tos) < 0)
112 goto errout;
114 #if IS_ENABLED(CONFIG_IPV6)
115 if (r->idiag_family == AF_INET6) {
116 const struct ipv6_pinfo *np = inet6_sk(sk);
118 *(struct in6_addr *)r->id.idiag_src = np->rcv_saddr;
119 *(struct in6_addr *)r->id.idiag_dst = np->daddr;
121 if (ext & (1 << (INET_DIAG_TCLASS - 1)))
122 if (nla_put_u8(skb, INET_DIAG_TCLASS, np->tclass) < 0)
123 goto errout;
125 #endif
127 r->idiag_uid = sock_i_uid(sk);
128 r->idiag_inode = sock_i_ino(sk);
130 if (ext & (1 << (INET_DIAG_MEMINFO - 1))) {
131 struct inet_diag_meminfo minfo = {
132 .idiag_rmem = sk_rmem_alloc_get(sk),
133 .idiag_wmem = sk->sk_wmem_queued,
134 .idiag_fmem = sk->sk_forward_alloc,
135 .idiag_tmem = sk_wmem_alloc_get(sk),
138 if (nla_put(skb, INET_DIAG_MEMINFO, sizeof(minfo), &minfo) < 0)
139 goto errout;
142 if (ext & (1 << (INET_DIAG_SKMEMINFO - 1)))
143 if (sock_diag_put_meminfo(sk, skb, INET_DIAG_SKMEMINFO))
144 goto errout;
146 if (icsk == NULL) {
147 handler->idiag_get_info(sk, r, NULL);
148 goto out;
151 #define EXPIRES_IN_MS(tmo) DIV_ROUND_UP((tmo - jiffies) * 1000, HZ)
153 if (icsk->icsk_pending == ICSK_TIME_RETRANS) {
154 r->idiag_timer = 1;
155 r->idiag_retrans = icsk->icsk_retransmits;
156 r->idiag_expires = EXPIRES_IN_MS(icsk->icsk_timeout);
157 } else if (icsk->icsk_pending == ICSK_TIME_PROBE0) {
158 r->idiag_timer = 4;
159 r->idiag_retrans = icsk->icsk_probes_out;
160 r->idiag_expires = EXPIRES_IN_MS(icsk->icsk_timeout);
161 } else if (timer_pending(&sk->sk_timer)) {
162 r->idiag_timer = 2;
163 r->idiag_retrans = icsk->icsk_probes_out;
164 r->idiag_expires = EXPIRES_IN_MS(sk->sk_timer.expires);
165 } else {
166 r->idiag_timer = 0;
167 r->idiag_expires = 0;
169 #undef EXPIRES_IN_MS
171 if (ext & (1 << (INET_DIAG_INFO - 1))) {
172 attr = nla_reserve(skb, INET_DIAG_INFO,
173 sizeof(struct tcp_info));
174 if (!attr)
175 goto errout;
177 info = nla_data(attr);
180 if ((ext & (1 << (INET_DIAG_CONG - 1))) && icsk->icsk_ca_ops)
181 if (nla_put_string(skb, INET_DIAG_CONG,
182 icsk->icsk_ca_ops->name) < 0)
183 goto errout;
185 handler->idiag_get_info(sk, r, info);
187 if (sk->sk_state < TCP_TIME_WAIT &&
188 icsk->icsk_ca_ops && icsk->icsk_ca_ops->get_info)
189 icsk->icsk_ca_ops->get_info(sk, ext, skb);
191 out:
192 return nlmsg_end(skb, nlh);
194 errout:
195 nlmsg_cancel(skb, nlh);
196 return -EMSGSIZE;
198 EXPORT_SYMBOL_GPL(inet_sk_diag_fill);
200 static int inet_csk_diag_fill(struct sock *sk,
201 struct sk_buff *skb, struct inet_diag_req_v2 *req,
202 u32 pid, u32 seq, u16 nlmsg_flags,
203 const struct nlmsghdr *unlh)
205 return inet_sk_diag_fill(sk, inet_csk(sk),
206 skb, req, pid, seq, nlmsg_flags, unlh);
209 static int inet_twsk_diag_fill(struct inet_timewait_sock *tw,
210 struct sk_buff *skb, struct inet_diag_req_v2 *req,
211 u32 pid, u32 seq, u16 nlmsg_flags,
212 const struct nlmsghdr *unlh)
214 long tmo;
215 struct inet_diag_msg *r;
216 struct nlmsghdr *nlh;
218 nlh = nlmsg_put(skb, pid, seq, unlh->nlmsg_type, sizeof(*r),
219 nlmsg_flags);
220 if (!nlh)
221 return -EMSGSIZE;
223 r = nlmsg_data(nlh);
224 BUG_ON(tw->tw_state != TCP_TIME_WAIT);
226 tmo = tw->tw_ttd - jiffies;
227 if (tmo < 0)
228 tmo = 0;
230 r->idiag_family = tw->tw_family;
231 r->idiag_retrans = 0;
232 r->id.idiag_if = tw->tw_bound_dev_if;
233 sock_diag_save_cookie(tw, r->id.idiag_cookie);
234 r->id.idiag_sport = tw->tw_sport;
235 r->id.idiag_dport = tw->tw_dport;
236 r->id.idiag_src[0] = tw->tw_rcv_saddr;
237 r->id.idiag_dst[0] = tw->tw_daddr;
238 r->idiag_state = tw->tw_substate;
239 r->idiag_timer = 3;
240 r->idiag_expires = DIV_ROUND_UP(tmo * 1000, HZ);
241 r->idiag_rqueue = 0;
242 r->idiag_wqueue = 0;
243 r->idiag_uid = 0;
244 r->idiag_inode = 0;
245 #if IS_ENABLED(CONFIG_IPV6)
246 if (tw->tw_family == AF_INET6) {
247 const struct inet6_timewait_sock *tw6 =
248 inet6_twsk((struct sock *)tw);
250 *(struct in6_addr *)r->id.idiag_src = tw6->tw_v6_rcv_saddr;
251 *(struct in6_addr *)r->id.idiag_dst = tw6->tw_v6_daddr;
253 #endif
255 return nlmsg_end(skb, nlh);
258 static int sk_diag_fill(struct sock *sk, struct sk_buff *skb,
259 struct inet_diag_req_v2 *r, u32 pid, u32 seq, u16 nlmsg_flags,
260 const struct nlmsghdr *unlh)
262 if (sk->sk_state == TCP_TIME_WAIT)
263 return inet_twsk_diag_fill((struct inet_timewait_sock *)sk,
264 skb, r, pid, seq, nlmsg_flags,
265 unlh);
266 return inet_csk_diag_fill(sk, skb, r, pid, seq, nlmsg_flags, unlh);
269 int inet_diag_dump_one_icsk(struct inet_hashinfo *hashinfo, struct sk_buff *in_skb,
270 const struct nlmsghdr *nlh, struct inet_diag_req_v2 *req)
272 int err;
273 struct sock *sk;
274 struct sk_buff *rep;
275 struct net *net = sock_net(in_skb->sk);
277 err = -EINVAL;
278 if (req->sdiag_family == AF_INET) {
279 sk = inet_lookup(net, hashinfo, req->id.idiag_dst[0],
280 req->id.idiag_dport, req->id.idiag_src[0],
281 req->id.idiag_sport, req->id.idiag_if);
283 #if IS_ENABLED(CONFIG_IPV6)
284 else if (req->sdiag_family == AF_INET6) {
285 sk = inet6_lookup(net, hashinfo,
286 (struct in6_addr *)req->id.idiag_dst,
287 req->id.idiag_dport,
288 (struct in6_addr *)req->id.idiag_src,
289 req->id.idiag_sport,
290 req->id.idiag_if);
292 #endif
293 else {
294 goto out_nosk;
297 err = -ENOENT;
298 if (sk == NULL)
299 goto out_nosk;
301 err = sock_diag_check_cookie(sk, req->id.idiag_cookie);
302 if (err)
303 goto out;
305 rep = nlmsg_new(sizeof(struct inet_diag_msg) +
306 sizeof(struct inet_diag_meminfo) +
307 sizeof(struct tcp_info) + 64, GFP_KERNEL);
308 if (!rep) {
309 err = -ENOMEM;
310 goto out;
313 err = sk_diag_fill(sk, rep, req,
314 NETLINK_CB(in_skb).pid,
315 nlh->nlmsg_seq, 0, nlh);
316 if (err < 0) {
317 WARN_ON(err == -EMSGSIZE);
318 nlmsg_free(rep);
319 goto out;
321 err = netlink_unicast(net->diag_nlsk, rep, NETLINK_CB(in_skb).pid,
322 MSG_DONTWAIT);
323 if (err > 0)
324 err = 0;
326 out:
327 if (sk) {
328 if (sk->sk_state == TCP_TIME_WAIT)
329 inet_twsk_put((struct inet_timewait_sock *)sk);
330 else
331 sock_put(sk);
333 out_nosk:
334 return err;
336 EXPORT_SYMBOL_GPL(inet_diag_dump_one_icsk);
338 static int inet_diag_get_exact(struct sk_buff *in_skb,
339 const struct nlmsghdr *nlh,
340 struct inet_diag_req_v2 *req)
342 const struct inet_diag_handler *handler;
343 int err;
345 handler = inet_diag_lock_handler(req->sdiag_protocol);
346 if (IS_ERR(handler))
347 err = PTR_ERR(handler);
348 else
349 err = handler->dump_one(in_skb, nlh, req);
350 inet_diag_unlock_handler(handler);
352 return err;
/*
 * Compare the leading @bits bits of two big-endian word arrays.
 *
 * Whole 32-bit words are compared with memcmp(); any remaining bits are
 * compared under a mask covering the most significant bits of the next word.
 * Returns 1 when the prefixes are equal, 0 otherwise.
 */
static int bitstring_match(const __be32 *a1, const __be32 *a2, int bits)
{
	const int full_words = bits >> 5;
	const int tail_bits = bits & 0x1f;

	if (full_words && memcmp(a1, a2, full_words << 2))
		return 0;

	if (tail_bits) {
		const __be32 mask = htonl((0xffffffff) << (32 - tail_bits));
		const __be32 diff = a1[full_words] ^ a2[full_words];

		if (diff & mask)
			return 0;
	}

	return 1;
}
382 static int inet_diag_bc_run(const struct nlattr *_bc,
383 const struct inet_diag_entry *entry)
385 const void *bc = nla_data(_bc);
386 int len = nla_len(_bc);
388 while (len > 0) {
389 int yes = 1;
390 const struct inet_diag_bc_op *op = bc;
392 switch (op->code) {
393 case INET_DIAG_BC_NOP:
394 break;
395 case INET_DIAG_BC_JMP:
396 yes = 0;
397 break;
398 case INET_DIAG_BC_S_GE:
399 yes = entry->sport >= op[1].no;
400 break;
401 case INET_DIAG_BC_S_LE:
402 yes = entry->sport <= op[1].no;
403 break;
404 case INET_DIAG_BC_D_GE:
405 yes = entry->dport >= op[1].no;
406 break;
407 case INET_DIAG_BC_D_LE:
408 yes = entry->dport <= op[1].no;
409 break;
410 case INET_DIAG_BC_AUTO:
411 yes = !(entry->userlocks & SOCK_BINDPORT_LOCK);
412 break;
413 case INET_DIAG_BC_S_COND:
414 case INET_DIAG_BC_D_COND: {
415 struct inet_diag_hostcond *cond;
416 __be32 *addr;
418 cond = (struct inet_diag_hostcond *)(op + 1);
419 if (cond->port != -1 &&
420 cond->port != (op->code == INET_DIAG_BC_S_COND ?
421 entry->sport : entry->dport)) {
422 yes = 0;
423 break;
426 if (cond->prefix_len == 0)
427 break;
429 if (op->code == INET_DIAG_BC_S_COND)
430 addr = entry->saddr;
431 else
432 addr = entry->daddr;
434 if (bitstring_match(addr, cond->addr,
435 cond->prefix_len))
436 break;
437 if (entry->family == AF_INET6 &&
438 cond->family == AF_INET) {
439 if (addr[0] == 0 && addr[1] == 0 &&
440 addr[2] == htonl(0xffff) &&
441 bitstring_match(addr + 3, cond->addr,
442 cond->prefix_len))
443 break;
445 yes = 0;
446 break;
450 if (yes) {
451 len -= op->yes;
452 bc += op->yes;
453 } else {
454 len -= op->no;
455 bc += op->no;
458 return len == 0;
461 int inet_diag_bc_sk(const struct nlattr *bc, struct sock *sk)
463 struct inet_diag_entry entry;
464 struct inet_sock *inet = inet_sk(sk);
466 if (bc == NULL)
467 return 1;
469 entry.family = sk->sk_family;
470 #if IS_ENABLED(CONFIG_IPV6)
471 if (entry.family == AF_INET6) {
472 struct ipv6_pinfo *np = inet6_sk(sk);
474 entry.saddr = np->rcv_saddr.s6_addr32;
475 entry.daddr = np->daddr.s6_addr32;
476 } else
477 #endif
479 entry.saddr = &inet->inet_rcv_saddr;
480 entry.daddr = &inet->inet_daddr;
482 entry.sport = inet->inet_num;
483 entry.dport = ntohs(inet->inet_dport);
484 entry.userlocks = sk->sk_userlocks;
486 return inet_diag_bc_run(bc, &entry);
488 EXPORT_SYMBOL_GPL(inet_diag_bc_sk);
/*
 * Check that a jump target is an instruction boundary.
 *
 * @cc is the target expressed as "bytes remaining", the same unit as @len.
 * The program is walked op by op along the "yes" offsets; the target is
 * valid only if the walk hits exactly @cc remaining bytes.
 * Returns 1 when valid, 0 otherwise.
 */
static int valid_cc(const void *bc, int len, int cc)
{
	while (len >= 0) {
		const struct inet_diag_bc_op *op = bc;

		if (cc > len)
			return 0;
		if (cc == len)
			return 1;
		if (op->yes < 4 || op->yes & 3)
			return 0;
		len -= op->yes;
		bc  += op->yes;
	}
	return 0;
}

/*
 * Validate the inet_diag_hostcond that follows a host-condition op.
 *
 * @len is the number of bytes left from @op onwards; *@min_len is grown to
 * the number of bytes this op and its operand occupy.
 * Returns 1 when the operand fits and is self-consistent, 0 otherwise.
 */
static int valid_hostcond(const struct inet_diag_bc_op *op, int len,
			  int *min_len)
{
	const struct inet_diag_hostcond *cond;
	int addr_len;

	/* The fixed part of the condition must fit. */
	*min_len += sizeof(struct inet_diag_hostcond);
	if (len < *min_len)
		return 0;
	cond = (const struct inet_diag_hostcond *)(op + 1);

	/* The address family determines how many address bytes follow. */
	switch (cond->family) {
	case AF_UNSPEC:
		addr_len = 0;
		break;
	case AF_INET:
		addr_len = sizeof(struct in_addr);
		break;
	case AF_INET6:
		addr_len = sizeof(struct in6_addr);
		break;
	default:
		return 0;
	}
	*min_len += addr_len;
	if (len < *min_len)
		return 0;

	/* Prefix length is in bits and cannot exceed the address size. */
	if (cond->prefix_len > 8 * addr_len)
		return 0;

	return 1;
}

/*
 * Validate a port comparison: the port lives in a follow-on op, which must
 * fit in the remaining @len bytes. Returns 1 when it does, 0 otherwise.
 */
static int valid_port_comparison(const struct inet_diag_bc_op *op,
				 int len, int *min_len)
{
	*min_len += sizeof(struct inet_diag_bc_op);
	return len >= *min_len;
}

/*
 * inet_diag_bc_audit - sanity-check user-supplied filter bytecode
 * @bytecode:     start of the program
 * @bytecode_len: its length in bytes
 *
 * Verifies that every opcode is known, that operands read by the
 * interpreter lie inside the program, that jump offsets are 4-byte
 * multiples no smaller than the instruction itself, and that backward-free
 * "no" jumps land on instruction boundaries.
 *
 * Returns 0 when the program is acceptable, -EINVAL otherwise.
 */
static int inet_diag_bc_audit(const void *bytecode, int bytecode_len)
{
	const void *bc = bytecode;
	int len = bytecode_len;

	while (len > 0) {
		const struct inet_diag_bc_op *op = bc;
		int min_len = sizeof(struct inet_diag_bc_op);

		switch (op->code) {
		case INET_DIAG_BC_S_COND:
		case INET_DIAG_BC_D_COND:
			if (!valid_hostcond(op, len, &min_len))
				return -EINVAL;
			break;
		case INET_DIAG_BC_S_GE:
		case INET_DIAG_BC_S_LE:
		case INET_DIAG_BC_D_GE:
		case INET_DIAG_BC_D_LE:
			if (!valid_port_comparison(op, len, &min_len))
				return -EINVAL;
			break;
		case INET_DIAG_BC_AUTO:
		case INET_DIAG_BC_JMP:
		case INET_DIAG_BC_NOP:
			break;
		default:
			return -EINVAL;
		}

		/* NOP never takes its "no" branch, so only "yes" is checked. */
		if (op->code != INET_DIAG_BC_NOP) {
			if (op->no < min_len || op->no > len + 4 || op->no & 3)
				return -EINVAL;
			if (op->no < len &&
			    !valid_cc(bytecode, bytecode_len, len - op->no))
				return -EINVAL;
		}

		if (op->yes < min_len || op->yes > len + 4 || op->yes & 3)
			return -EINVAL;
		bc  += op->yes;
		len -= op->yes;
	}
	return len == 0 ? 0 : -EINVAL;
}
544 static int inet_csk_diag_dump(struct sock *sk,
545 struct sk_buff *skb,
546 struct netlink_callback *cb,
547 struct inet_diag_req_v2 *r,
548 const struct nlattr *bc)
550 if (!inet_diag_bc_sk(bc, sk))
551 return 0;
553 return inet_csk_diag_fill(sk, skb, r,
554 NETLINK_CB(cb->skb).pid,
555 cb->nlh->nlmsg_seq, NLM_F_MULTI, cb->nlh);
558 static int inet_twsk_diag_dump(struct inet_timewait_sock *tw,
559 struct sk_buff *skb,
560 struct netlink_callback *cb,
561 struct inet_diag_req_v2 *r,
562 const struct nlattr *bc)
564 if (bc != NULL) {
565 struct inet_diag_entry entry;
567 entry.family = tw->tw_family;
568 #if IS_ENABLED(CONFIG_IPV6)
569 if (tw->tw_family == AF_INET6) {
570 struct inet6_timewait_sock *tw6 =
571 inet6_twsk((struct sock *)tw);
572 entry.saddr = tw6->tw_v6_rcv_saddr.s6_addr32;
573 entry.daddr = tw6->tw_v6_daddr.s6_addr32;
574 } else
575 #endif
577 entry.saddr = &tw->tw_rcv_saddr;
578 entry.daddr = &tw->tw_daddr;
580 entry.sport = tw->tw_num;
581 entry.dport = ntohs(tw->tw_dport);
582 entry.userlocks = 0;
584 if (!inet_diag_bc_run(bc, &entry))
585 return 0;
588 return inet_twsk_diag_fill(tw, skb, r,
589 NETLINK_CB(cb->skb).pid,
590 cb->nlh->nlmsg_seq, NLM_F_MULTI, cb->nlh);
593 static int inet_diag_fill_req(struct sk_buff *skb, struct sock *sk,
594 struct request_sock *req, u32 pid, u32 seq,
595 const struct nlmsghdr *unlh)
597 const struct inet_request_sock *ireq = inet_rsk(req);
598 struct inet_sock *inet = inet_sk(sk);
599 struct inet_diag_msg *r;
600 struct nlmsghdr *nlh;
601 long tmo;
603 nlh = nlmsg_put(skb, pid, seq, unlh->nlmsg_type, sizeof(*r),
604 NLM_F_MULTI);
605 if (!nlh)
606 return -EMSGSIZE;
608 r = nlmsg_data(nlh);
609 r->idiag_family = sk->sk_family;
610 r->idiag_state = TCP_SYN_RECV;
611 r->idiag_timer = 1;
612 r->idiag_retrans = req->retrans;
614 r->id.idiag_if = sk->sk_bound_dev_if;
615 sock_diag_save_cookie(req, r->id.idiag_cookie);
617 tmo = req->expires - jiffies;
618 if (tmo < 0)
619 tmo = 0;
621 r->id.idiag_sport = inet->inet_sport;
622 r->id.idiag_dport = ireq->rmt_port;
623 r->id.idiag_src[0] = ireq->loc_addr;
624 r->id.idiag_dst[0] = ireq->rmt_addr;
625 r->idiag_expires = jiffies_to_msecs(tmo);
626 r->idiag_rqueue = 0;
627 r->idiag_wqueue = 0;
628 r->idiag_uid = sock_i_uid(sk);
629 r->idiag_inode = 0;
630 #if IS_ENABLED(CONFIG_IPV6)
631 if (r->idiag_family == AF_INET6) {
632 *(struct in6_addr *)r->id.idiag_src = inet6_rsk(req)->loc_addr;
633 *(struct in6_addr *)r->id.idiag_dst = inet6_rsk(req)->rmt_addr;
635 #endif
637 return nlmsg_end(skb, nlh);
640 static int inet_diag_dump_reqs(struct sk_buff *skb, struct sock *sk,
641 struct netlink_callback *cb,
642 struct inet_diag_req_v2 *r,
643 const struct nlattr *bc)
645 struct inet_diag_entry entry;
646 struct inet_connection_sock *icsk = inet_csk(sk);
647 struct listen_sock *lopt;
648 struct inet_sock *inet = inet_sk(sk);
649 int j, s_j;
650 int reqnum, s_reqnum;
651 int err = 0;
653 s_j = cb->args[3];
654 s_reqnum = cb->args[4];
656 if (s_j > 0)
657 s_j--;
659 entry.family = sk->sk_family;
661 read_lock_bh(&icsk->icsk_accept_queue.syn_wait_lock);
663 lopt = icsk->icsk_accept_queue.listen_opt;
664 if (!lopt || !lopt->qlen)
665 goto out;
667 if (bc != NULL) {
668 entry.sport = inet->inet_num;
669 entry.userlocks = sk->sk_userlocks;
672 for (j = s_j; j < lopt->nr_table_entries; j++) {
673 struct request_sock *req, *head = lopt->syn_table[j];
675 reqnum = 0;
676 for (req = head; req; reqnum++, req = req->dl_next) {
677 struct inet_request_sock *ireq = inet_rsk(req);
679 if (reqnum < s_reqnum)
680 continue;
681 if (r->id.idiag_dport != ireq->rmt_port &&
682 r->id.idiag_dport)
683 continue;
685 if (bc) {
686 entry.saddr =
687 #if IS_ENABLED(CONFIG_IPV6)
688 (entry.family == AF_INET6) ?
689 inet6_rsk(req)->loc_addr.s6_addr32 :
690 #endif
691 &ireq->loc_addr;
692 entry.daddr =
693 #if IS_ENABLED(CONFIG_IPV6)
694 (entry.family == AF_INET6) ?
695 inet6_rsk(req)->rmt_addr.s6_addr32 :
696 #endif
697 &ireq->rmt_addr;
698 entry.dport = ntohs(ireq->rmt_port);
700 if (!inet_diag_bc_run(bc, &entry))
701 continue;
704 err = inet_diag_fill_req(skb, sk, req,
705 NETLINK_CB(cb->skb).pid,
706 cb->nlh->nlmsg_seq, cb->nlh);
707 if (err < 0) {
708 cb->args[3] = j + 1;
709 cb->args[4] = reqnum;
710 goto out;
714 s_reqnum = 0;
717 out:
718 read_unlock_bh(&icsk->icsk_accept_queue.syn_wait_lock);
720 return err;
723 void inet_diag_dump_icsk(struct inet_hashinfo *hashinfo, struct sk_buff *skb,
724 struct netlink_callback *cb, struct inet_diag_req_v2 *r, struct nlattr *bc)
726 int i, num;
727 int s_i, s_num;
728 struct net *net = sock_net(skb->sk);
730 s_i = cb->args[1];
731 s_num = num = cb->args[2];
733 if (cb->args[0] == 0) {
734 if (!(r->idiag_states & (TCPF_LISTEN | TCPF_SYN_RECV)))
735 goto skip_listen_ht;
737 for (i = s_i; i < INET_LHTABLE_SIZE; i++) {
738 struct sock *sk;
739 struct hlist_nulls_node *node;
740 struct inet_listen_hashbucket *ilb;
742 num = 0;
743 ilb = &hashinfo->listening_hash[i];
744 spin_lock_bh(&ilb->lock);
745 sk_nulls_for_each(sk, node, &ilb->head) {
746 struct inet_sock *inet = inet_sk(sk);
748 if (!net_eq(sock_net(sk), net))
749 continue;
751 if (num < s_num) {
752 num++;
753 continue;
756 if (r->sdiag_family != AF_UNSPEC &&
757 sk->sk_family != r->sdiag_family)
758 goto next_listen;
760 if (r->id.idiag_sport != inet->inet_sport &&
761 r->id.idiag_sport)
762 goto next_listen;
764 if (!(r->idiag_states & TCPF_LISTEN) ||
765 r->id.idiag_dport ||
766 cb->args[3] > 0)
767 goto syn_recv;
769 if (inet_csk_diag_dump(sk, skb, cb, r, bc) < 0) {
770 spin_unlock_bh(&ilb->lock);
771 goto done;
774 syn_recv:
775 if (!(r->idiag_states & TCPF_SYN_RECV))
776 goto next_listen;
778 if (inet_diag_dump_reqs(skb, sk, cb, r, bc) < 0) {
779 spin_unlock_bh(&ilb->lock);
780 goto done;
783 next_listen:
784 cb->args[3] = 0;
785 cb->args[4] = 0;
786 ++num;
788 spin_unlock_bh(&ilb->lock);
790 s_num = 0;
791 cb->args[3] = 0;
792 cb->args[4] = 0;
794 skip_listen_ht:
795 cb->args[0] = 1;
796 s_i = num = s_num = 0;
799 if (!(r->idiag_states & ~(TCPF_LISTEN | TCPF_SYN_RECV)))
800 goto out;
802 for (i = s_i; i <= hashinfo->ehash_mask; i++) {
803 struct inet_ehash_bucket *head = &hashinfo->ehash[i];
804 spinlock_t *lock = inet_ehash_lockp(hashinfo, i);
805 struct sock *sk;
806 struct hlist_nulls_node *node;
808 num = 0;
810 if (hlist_nulls_empty(&head->chain) &&
811 hlist_nulls_empty(&head->twchain))
812 continue;
814 if (i > s_i)
815 s_num = 0;
817 spin_lock_bh(lock);
818 sk_nulls_for_each(sk, node, &head->chain) {
819 struct inet_sock *inet = inet_sk(sk);
821 if (!net_eq(sock_net(sk), net))
822 continue;
823 if (num < s_num)
824 goto next_normal;
825 if (!(r->idiag_states & (1 << sk->sk_state)))
826 goto next_normal;
827 if (r->sdiag_family != AF_UNSPEC &&
828 sk->sk_family != r->sdiag_family)
829 goto next_normal;
830 if (r->id.idiag_sport != inet->inet_sport &&
831 r->id.idiag_sport)
832 goto next_normal;
833 if (r->id.idiag_dport != inet->inet_dport &&
834 r->id.idiag_dport)
835 goto next_normal;
836 if (inet_csk_diag_dump(sk, skb, cb, r, bc) < 0) {
837 spin_unlock_bh(lock);
838 goto done;
840 next_normal:
841 ++num;
844 if (r->idiag_states & TCPF_TIME_WAIT) {
845 struct inet_timewait_sock *tw;
847 inet_twsk_for_each(tw, node,
848 &head->twchain) {
849 if (!net_eq(twsk_net(tw), net))
850 continue;
852 if (num < s_num)
853 goto next_dying;
854 if (r->sdiag_family != AF_UNSPEC &&
855 tw->tw_family != r->sdiag_family)
856 goto next_dying;
857 if (r->id.idiag_sport != tw->tw_sport &&
858 r->id.idiag_sport)
859 goto next_dying;
860 if (r->id.idiag_dport != tw->tw_dport &&
861 r->id.idiag_dport)
862 goto next_dying;
863 if (inet_twsk_diag_dump(tw, skb, cb, r, bc) < 0) {
864 spin_unlock_bh(lock);
865 goto done;
867 next_dying:
868 ++num;
871 spin_unlock_bh(lock);
874 done:
875 cb->args[1] = i;
876 cb->args[2] = num;
877 out:
880 EXPORT_SYMBOL_GPL(inet_diag_dump_icsk);
882 static int __inet_diag_dump(struct sk_buff *skb, struct netlink_callback *cb,
883 struct inet_diag_req_v2 *r, struct nlattr *bc)
885 const struct inet_diag_handler *handler;
887 handler = inet_diag_lock_handler(r->sdiag_protocol);
888 if (!IS_ERR(handler))
889 handler->dump(skb, cb, r, bc);
890 inet_diag_unlock_handler(handler);
892 return skb->len;
895 static int inet_diag_dump(struct sk_buff *skb, struct netlink_callback *cb)
897 struct nlattr *bc = NULL;
898 int hdrlen = sizeof(struct inet_diag_req_v2);
900 if (nlmsg_attrlen(cb->nlh, hdrlen))
901 bc = nlmsg_find_attr(cb->nlh, hdrlen, INET_DIAG_REQ_BYTECODE);
903 return __inet_diag_dump(skb, cb, nlmsg_data(cb->nlh), bc);
/*
 * Map a legacy netlink message type to the IP protocol it addresses.
 * Returns 0 for any type other than TCPDIAG_GETSOCK or DCCPDIAG_GETSOCK.
 */
static inline int inet_diag_type2proto(int type)
{
	if (type == TCPDIAG_GETSOCK)
		return IPPROTO_TCP;
	if (type == DCCPDIAG_GETSOCK)
		return IPPROTO_DCCP;
	return 0;
}
918 static int inet_diag_dump_compat(struct sk_buff *skb, struct netlink_callback *cb)
920 struct inet_diag_req *rc = nlmsg_data(cb->nlh);
921 struct inet_diag_req_v2 req;
922 struct nlattr *bc = NULL;
923 int hdrlen = sizeof(struct inet_diag_req);
925 req.sdiag_family = AF_UNSPEC; /* compatibility */
926 req.sdiag_protocol = inet_diag_type2proto(cb->nlh->nlmsg_type);
927 req.idiag_ext = rc->idiag_ext;
928 req.idiag_states = rc->idiag_states;
929 req.id = rc->id;
931 if (nlmsg_attrlen(cb->nlh, hdrlen))
932 bc = nlmsg_find_attr(cb->nlh, hdrlen, INET_DIAG_REQ_BYTECODE);
934 return __inet_diag_dump(skb, cb, &req, bc);
937 static int inet_diag_get_exact_compat(struct sk_buff *in_skb,
938 const struct nlmsghdr *nlh)
940 struct inet_diag_req *rc = nlmsg_data(nlh);
941 struct inet_diag_req_v2 req;
943 req.sdiag_family = rc->idiag_family;
944 req.sdiag_protocol = inet_diag_type2proto(nlh->nlmsg_type);
945 req.idiag_ext = rc->idiag_ext;
946 req.idiag_states = rc->idiag_states;
947 req.id = rc->id;
949 return inet_diag_get_exact(in_skb, nlh, &req);
952 static int inet_diag_rcv_msg_compat(struct sk_buff *skb, struct nlmsghdr *nlh)
954 int hdrlen = sizeof(struct inet_diag_req);
955 struct net *net = sock_net(skb->sk);
957 if (nlh->nlmsg_type >= INET_DIAG_GETSOCK_MAX ||
958 nlmsg_len(nlh) < hdrlen)
959 return -EINVAL;
961 if (nlh->nlmsg_flags & NLM_F_DUMP) {
962 if (nlmsg_attrlen(nlh, hdrlen)) {
963 struct nlattr *attr;
965 attr = nlmsg_find_attr(nlh, hdrlen,
966 INET_DIAG_REQ_BYTECODE);
967 if (attr == NULL ||
968 nla_len(attr) < sizeof(struct inet_diag_bc_op) ||
969 inet_diag_bc_audit(nla_data(attr), nla_len(attr)))
970 return -EINVAL;
973 struct netlink_dump_control c = {
974 .dump = inet_diag_dump_compat,
976 return netlink_dump_start(net->diag_nlsk, skb, nlh, &c);
980 return inet_diag_get_exact_compat(skb, nlh);
983 static int inet_diag_handler_dump(struct sk_buff *skb, struct nlmsghdr *h)
985 int hdrlen = sizeof(struct inet_diag_req_v2);
986 struct net *net = sock_net(skb->sk);
988 if (nlmsg_len(h) < hdrlen)
989 return -EINVAL;
991 if (h->nlmsg_flags & NLM_F_DUMP) {
992 if (nlmsg_attrlen(h, hdrlen)) {
993 struct nlattr *attr;
994 attr = nlmsg_find_attr(h, hdrlen,
995 INET_DIAG_REQ_BYTECODE);
996 if (attr == NULL ||
997 nla_len(attr) < sizeof(struct inet_diag_bc_op) ||
998 inet_diag_bc_audit(nla_data(attr), nla_len(attr)))
999 return -EINVAL;
1002 struct netlink_dump_control c = {
1003 .dump = inet_diag_dump,
1005 return netlink_dump_start(net->diag_nlsk, skb, h, &c);
1009 return inet_diag_get_exact(skb, h, nlmsg_data(h));
1012 static const struct sock_diag_handler inet_diag_handler = {
1013 .family = AF_INET,
1014 .dump = inet_diag_handler_dump,
1017 static const struct sock_diag_handler inet6_diag_handler = {
1018 .family = AF_INET6,
1019 .dump = inet_diag_handler_dump,
1022 int inet_diag_register(const struct inet_diag_handler *h)
1024 const __u16 type = h->idiag_type;
1025 int err = -EINVAL;
1027 if (type >= IPPROTO_MAX)
1028 goto out;
1030 mutex_lock(&inet_diag_table_mutex);
1031 err = -EEXIST;
1032 if (inet_diag_table[type] == NULL) {
1033 inet_diag_table[type] = h;
1034 err = 0;
1036 mutex_unlock(&inet_diag_table_mutex);
1037 out:
1038 return err;
1040 EXPORT_SYMBOL_GPL(inet_diag_register);
1042 void inet_diag_unregister(const struct inet_diag_handler *h)
1044 const __u16 type = h->idiag_type;
1046 if (type >= IPPROTO_MAX)
1047 return;
1049 mutex_lock(&inet_diag_table_mutex);
1050 inet_diag_table[type] = NULL;
1051 mutex_unlock(&inet_diag_table_mutex);
1053 EXPORT_SYMBOL_GPL(inet_diag_unregister);
1055 static int __init inet_diag_init(void)
1057 const int inet_diag_table_size = (IPPROTO_MAX *
1058 sizeof(struct inet_diag_handler *));
1059 int err = -ENOMEM;
1061 inet_diag_table = kzalloc(inet_diag_table_size, GFP_KERNEL);
1062 if (!inet_diag_table)
1063 goto out;
1065 err = sock_diag_register(&inet_diag_handler);
1066 if (err)
1067 goto out_free_nl;
1069 err = sock_diag_register(&inet6_diag_handler);
1070 if (err)
1071 goto out_free_inet;
1073 sock_diag_register_inet_compat(inet_diag_rcv_msg_compat);
1074 out:
1075 return err;
1077 out_free_inet:
1078 sock_diag_unregister(&inet_diag_handler);
1079 out_free_nl:
1080 kfree(inet_diag_table);
1081 goto out;
1084 static void __exit inet_diag_exit(void)
1086 sock_diag_unregister(&inet6_diag_handler);
1087 sock_diag_unregister(&inet_diag_handler);
1088 sock_diag_unregister_inet_compat(inet_diag_rcv_msg_compat);
1089 kfree(inet_diag_table);
1092 module_init(inet_diag_init);
1093 module_exit(inet_diag_exit);
1094 MODULE_LICENSE("GPL");
1095 MODULE_ALIAS_NET_PF_PROTO_TYPE(PF_NETLINK, NETLINK_SOCK_DIAG, 2 /* AF_INET */);
1096 MODULE_ALIAS_NET_PF_PROTO_TYPE(PF_NETLINK, NETLINK_SOCK_DIAG, 10 /* AF_INET6 */);