2 * xt_hashlimit - Netfilter module to limit the number of packets per time
3 * separately for each hashbucket (sourceip/sourceport/dstip/dstport)
5 * (C) 2003-2004 by Harald Welte <laforge@netfilter.org>
6 * Copyright © CC Computer Consultants GmbH, 2007 - 2008
8 * Development of this code was funded by Astaro AG, http://www.astaro.com/
10 #include <linux/module.h>
11 #include <linux/spinlock.h>
12 #include <linux/random.h>
13 #include <linux/jhash.h>
14 #include <linux/slab.h>
15 #include <linux/vmalloc.h>
16 #include <linux/proc_fs.h>
17 #include <linux/seq_file.h>
18 #include <linux/list.h>
19 #include <linux/skbuff.h>
23 #if defined(CONFIG_IP6_NF_IPTABLES) || defined(CONFIG_IP6_NF_IPTABLES_MODULE)
24 #include <linux/ipv6.h>
28 #include <net/net_namespace.h>
30 #include <linux/netfilter/x_tables.h>
31 #include <linux/netfilter_ipv4/ip_tables.h>
32 #include <linux/netfilter_ipv6/ip6_tables.h>
33 #include <linux/netfilter/xt_hashlimit.h>
34 #include <linux/mutex.h>
36 MODULE_LICENSE("GPL");
37 MODULE_AUTHOR("Harald Welte <laforge@netfilter.org>");
38 MODULE_AUTHOR("Jan Engelhardt <jengelh@computergmbh.de>");
39 MODULE_DESCRIPTION("Xtables: per hash-bucket rate-limit match");
40 MODULE_ALIAS("ipt_hashlimit");
41 MODULE_ALIAS("ip6t_hashlimit");
43 /* need to declare this at the top */
44 static struct proc_dir_entry
*hashlimit_procdir4
;
45 static struct proc_dir_entry
*hashlimit_procdir6
;
46 static const struct file_operations dl_file_ops
;
55 #if defined(CONFIG_IP6_NF_IPTABLES) || defined(CONFIG_IP6_NF_IPTABLES_MODULE)
67 /* static / read-only parts in the beginning */
68 struct hlist_node node
;
69 struct dsthash_dst dst
;
71 /* modified structure members in the end */
72 unsigned long expires
; /* precalculated expiry time */
74 unsigned long prev
; /* last modification */
76 u_int32_t credit_cap
, cost
;
80 struct xt_hashlimit_htable
{
81 struct hlist_node node
; /* global list of all htables */
85 struct hashlimit_cfg1 cfg
; /* config */
88 spinlock_t lock
; /* lock for list_head */
89 u_int32_t rnd
; /* random seed for hash */
91 unsigned int count
; /* number entries in table */
92 struct timer_list timer
; /* timer for gc */
95 struct proc_dir_entry
*pde
;
97 struct hlist_head hash
[0]; /* hashtable itself */
100 static DEFINE_SPINLOCK(hashlimit_lock
); /* protects htables list */
101 static DEFINE_MUTEX(hlimit_mutex
); /* additional checkentry protection */
102 static HLIST_HEAD(hashlimit_htables
);
103 static struct kmem_cache
*hashlimit_cachep __read_mostly
;
105 static inline bool dst_cmp(const struct dsthash_ent
*ent
,
106 const struct dsthash_dst
*b
)
108 return !memcmp(&ent
->dst
, b
, sizeof(ent
->dst
));
112 hash_dst(const struct xt_hashlimit_htable
*ht
, const struct dsthash_dst
*dst
)
114 u_int32_t hash
= jhash2((const u32
*)dst
,
115 sizeof(*dst
)/sizeof(u32
),
118 * Instead of returning hash % ht->cfg.size (implying a divide)
119 * we return the high 32 bits of the (hash * ht->cfg.size) that will
120 * give results between [0 and cfg.size-1] and same hash distribution,
121 * but using a multiply, less expensive than a divide
123 return ((u64
)hash
* ht
->cfg
.size
) >> 32;
126 static struct dsthash_ent
*
127 dsthash_find(const struct xt_hashlimit_htable
*ht
,
128 const struct dsthash_dst
*dst
)
130 struct dsthash_ent
*ent
;
131 struct hlist_node
*pos
;
132 u_int32_t hash
= hash_dst(ht
, dst
);
134 if (!hlist_empty(&ht
->hash
[hash
])) {
135 hlist_for_each_entry(ent
, pos
, &ht
->hash
[hash
], node
)
136 if (dst_cmp(ent
, dst
))
142 /* allocate dsthash_ent, initialize dst, put in htable and lock it */
143 static struct dsthash_ent
*
144 dsthash_alloc_init(struct xt_hashlimit_htable
*ht
,
145 const struct dsthash_dst
*dst
)
147 struct dsthash_ent
*ent
;
149 /* initialize hash with random val at the time we allocate
150 * the first hashtable entry */
151 if (!ht
->rnd_initialized
) {
152 get_random_bytes(&ht
->rnd
, 4);
153 ht
->rnd_initialized
= 1;
156 if (ht
->cfg
.max
&& ht
->count
>= ht
->cfg
.max
) {
157 /* FIXME: do something. question is what.. */
160 "xt_hashlimit: max count of %u reached\n",
165 ent
= kmem_cache_alloc(hashlimit_cachep
, GFP_ATOMIC
);
169 "xt_hashlimit: can't allocate dsthash_ent\n");
172 memcpy(&ent
->dst
, dst
, sizeof(ent
->dst
));
174 hlist_add_head(&ent
->node
, &ht
->hash
[hash_dst(ht
, dst
)]);
180 dsthash_free(struct xt_hashlimit_htable
*ht
, struct dsthash_ent
*ent
)
182 hlist_del(&ent
->node
);
183 kmem_cache_free(hashlimit_cachep
, ent
);
186 static void htable_gc(unsigned long htlong
);
188 static int htable_create_v0(struct xt_hashlimit_info
*minfo
, u_int8_t family
)
190 struct xt_hashlimit_htable
*hinfo
;
195 size
= minfo
->cfg
.size
;
197 size
= ((num_physpages
<< PAGE_SHIFT
) / 16384) /
198 sizeof(struct list_head
);
199 if (num_physpages
> (1024 * 1024 * 1024 / PAGE_SIZE
))
204 /* FIXME: don't use vmalloc() here or anywhere else -HW */
205 hinfo
= vmalloc(sizeof(struct xt_hashlimit_htable
) +
206 sizeof(struct list_head
) * size
);
208 printk(KERN_ERR
"xt_hashlimit: unable to create hashtable\n");
211 minfo
->hinfo
= hinfo
;
213 /* copy match config into hashtable config */
214 hinfo
->cfg
.mode
= minfo
->cfg
.mode
;
215 hinfo
->cfg
.avg
= minfo
->cfg
.avg
;
216 hinfo
->cfg
.burst
= minfo
->cfg
.burst
;
217 hinfo
->cfg
.max
= minfo
->cfg
.max
;
218 hinfo
->cfg
.gc_interval
= minfo
->cfg
.gc_interval
;
219 hinfo
->cfg
.expire
= minfo
->cfg
.expire
;
221 if (family
== NFPROTO_IPV4
)
222 hinfo
->cfg
.srcmask
= hinfo
->cfg
.dstmask
= 32;
224 hinfo
->cfg
.srcmask
= hinfo
->cfg
.dstmask
= 128;
226 hinfo
->cfg
.size
= size
;
228 hinfo
->cfg
.max
= 8 * hinfo
->cfg
.size
;
229 else if (hinfo
->cfg
.max
< hinfo
->cfg
.size
)
230 hinfo
->cfg
.max
= hinfo
->cfg
.size
;
232 for (i
= 0; i
< hinfo
->cfg
.size
; i
++)
233 INIT_HLIST_HEAD(&hinfo
->hash
[i
]);
235 atomic_set(&hinfo
->use
, 1);
237 hinfo
->family
= family
;
238 hinfo
->rnd_initialized
= 0;
239 spin_lock_init(&hinfo
->lock
);
240 hinfo
->pde
= proc_create_data(minfo
->name
, 0,
241 (family
== NFPROTO_IPV4
) ?
242 hashlimit_procdir4
: hashlimit_procdir6
,
243 &dl_file_ops
, hinfo
);
249 setup_timer(&hinfo
->timer
, htable_gc
, (unsigned long )hinfo
);
250 hinfo
->timer
.expires
= jiffies
+ msecs_to_jiffies(hinfo
->cfg
.gc_interval
);
251 add_timer(&hinfo
->timer
);
253 spin_lock_bh(&hashlimit_lock
);
254 hlist_add_head(&hinfo
->node
, &hashlimit_htables
);
255 spin_unlock_bh(&hashlimit_lock
);
260 static int htable_create(struct xt_hashlimit_mtinfo1
*minfo
, u_int8_t family
)
262 struct xt_hashlimit_htable
*hinfo
;
266 if (minfo
->cfg
.size
) {
267 size
= minfo
->cfg
.size
;
269 size
= (num_physpages
<< PAGE_SHIFT
) / 16384 /
270 sizeof(struct list_head
);
271 if (num_physpages
> 1024 * 1024 * 1024 / PAGE_SIZE
)
276 /* FIXME: don't use vmalloc() here or anywhere else -HW */
277 hinfo
= vmalloc(sizeof(struct xt_hashlimit_htable
) +
278 sizeof(struct list_head
) * size
);
280 printk(KERN_ERR
"xt_hashlimit: unable to create hashtable\n");
283 minfo
->hinfo
= hinfo
;
285 /* copy match config into hashtable config */
286 memcpy(&hinfo
->cfg
, &minfo
->cfg
, sizeof(hinfo
->cfg
));
287 hinfo
->cfg
.size
= size
;
288 if (hinfo
->cfg
.max
== 0)
289 hinfo
->cfg
.max
= 8 * hinfo
->cfg
.size
;
290 else if (hinfo
->cfg
.max
< hinfo
->cfg
.size
)
291 hinfo
->cfg
.max
= hinfo
->cfg
.size
;
293 for (i
= 0; i
< hinfo
->cfg
.size
; i
++)
294 INIT_HLIST_HEAD(&hinfo
->hash
[i
]);
296 atomic_set(&hinfo
->use
, 1);
298 hinfo
->family
= family
;
299 hinfo
->rnd_initialized
= 0;
300 spin_lock_init(&hinfo
->lock
);
302 hinfo
->pde
= proc_create_data(minfo
->name
, 0,
303 (family
== NFPROTO_IPV4
) ?
304 hashlimit_procdir4
: hashlimit_procdir6
,
305 &dl_file_ops
, hinfo
);
306 if (hinfo
->pde
== NULL
) {
311 setup_timer(&hinfo
->timer
, htable_gc
, (unsigned long)hinfo
);
312 hinfo
->timer
.expires
= jiffies
+ msecs_to_jiffies(hinfo
->cfg
.gc_interval
);
313 add_timer(&hinfo
->timer
);
315 spin_lock_bh(&hashlimit_lock
);
316 hlist_add_head(&hinfo
->node
, &hashlimit_htables
);
317 spin_unlock_bh(&hashlimit_lock
);
322 static bool select_all(const struct xt_hashlimit_htable
*ht
,
323 const struct dsthash_ent
*he
)
328 static bool select_gc(const struct xt_hashlimit_htable
*ht
,
329 const struct dsthash_ent
*he
)
331 return time_after_eq(jiffies
, he
->expires
);
334 static void htable_selective_cleanup(struct xt_hashlimit_htable
*ht
,
335 bool (*select
)(const struct xt_hashlimit_htable
*ht
,
336 const struct dsthash_ent
*he
))
340 /* lock hash table and iterate over it */
341 spin_lock_bh(&ht
->lock
);
342 for (i
= 0; i
< ht
->cfg
.size
; i
++) {
343 struct dsthash_ent
*dh
;
344 struct hlist_node
*pos
, *n
;
345 hlist_for_each_entry_safe(dh
, pos
, n
, &ht
->hash
[i
], node
) {
346 if ((*select
)(ht
, dh
))
347 dsthash_free(ht
, dh
);
350 spin_unlock_bh(&ht
->lock
);
353 /* hash table garbage collector, run by timer */
354 static void htable_gc(unsigned long htlong
)
356 struct xt_hashlimit_htable
*ht
= (struct xt_hashlimit_htable
*)htlong
;
358 htable_selective_cleanup(ht
, select_gc
);
360 /* re-add the timer accordingly */
361 ht
->timer
.expires
= jiffies
+ msecs_to_jiffies(ht
->cfg
.gc_interval
);
362 add_timer(&ht
->timer
);
365 static void htable_destroy(struct xt_hashlimit_htable
*hinfo
)
367 del_timer_sync(&hinfo
->timer
);
369 /* remove proc entry */
370 remove_proc_entry(hinfo
->pde
->name
,
371 hinfo
->family
== NFPROTO_IPV4
? hashlimit_procdir4
:
373 htable_selective_cleanup(hinfo
, select_all
);
377 static struct xt_hashlimit_htable
*htable_find_get(const char *name
,
380 struct xt_hashlimit_htable
*hinfo
;
381 struct hlist_node
*pos
;
383 spin_lock_bh(&hashlimit_lock
);
384 hlist_for_each_entry(hinfo
, pos
, &hashlimit_htables
, node
) {
385 if (!strcmp(name
, hinfo
->pde
->name
) &&
386 hinfo
->family
== family
) {
387 atomic_inc(&hinfo
->use
);
388 spin_unlock_bh(&hashlimit_lock
);
392 spin_unlock_bh(&hashlimit_lock
);
396 static void htable_put(struct xt_hashlimit_htable
*hinfo
)
398 if (atomic_dec_and_test(&hinfo
->use
)) {
399 spin_lock_bh(&hashlimit_lock
);
400 hlist_del(&hinfo
->node
);
401 spin_unlock_bh(&hashlimit_lock
);
402 htable_destroy(hinfo
);
406 /* The algorithm used is the Simple Token Bucket Filter (TBF)
407 * see net/sched/sch_tbf.c in the linux source tree
410 /* Rusty: This is my (non-mathematically-inclined) understanding of
411 this algorithm. The `average rate' in jiffies becomes your initial
412 amount of credit `credit' and the most credit you can ever have
413 `credit_cap'. The `peak rate' becomes the cost of passing the
416 `prev' tracks the last packet hit: you gain one credit per jiffy.
417 If you get credit balance more than this, the extra credit is
418 discarded. Every time the match passes, you lose `cost' credits;
419 if you don't have that many, the test fails.
421 See Alexey's formal explanation in net/sched/sch_tbf.c.
423 To get the maximum range, we multiply by this factor (ie. you get N
424 credits per jiffy). We want to allow a rate as low as 1 per day
425 (slowest userspace tool allows), which means
426 CREDITS_PER_JIFFY*HZ*60*60*24 < 2^32 ie.
/*
 * Largest per-jiffy credit factor for which a full day of credits
 * (factor * HZ * 60 * 60 * 24) still fits into 32 bits.
 */
#define MAX_CPJ (0xFFFFFFFF / (HZ*60*60*24))

/*
 * POW2_BELOW32(x): the largest power of two that does not exceed x.
 *
 * The _POW2_BELOWn helpers OR x with itself shifted right by 0..n-1
 * positions, which sets every bit below the highest set bit.  Shifting
 * that all-ones pattern right by one and adding 1 leaves only the
 * highest bit.  CREDITS_PER_JIFFY is therefore a power of two, so
 * scaling by it amounts to a shift.
 */
#define _POW2_BELOW2(x)  ((x) | ((x) >> 1))
#define _POW2_BELOW4(x)  (_POW2_BELOW2(x) | _POW2_BELOW2((x) >> 2))
#define _POW2_BELOW8(x)  (_POW2_BELOW4(x) | _POW2_BELOW4((x) >> 4))
#define _POW2_BELOW16(x) (_POW2_BELOW8(x) | _POW2_BELOW8((x) >> 8))
#define _POW2_BELOW32(x) (_POW2_BELOW16(x) | _POW2_BELOW16((x) >> 16))
#define POW2_BELOW32(x)  ((_POW2_BELOW32(x) >> 1) + 1)

#define CREDITS_PER_JIFFY POW2_BELOW32(MAX_CPJ)
442 /* Precision saver. */
443 static inline u_int32_t
444 user2credits(u_int32_t user
)
446 /* If multiplying would overflow... */
447 if (user
> 0xFFFFFFFF / (HZ
*CREDITS_PER_JIFFY
))
449 return (user
/ XT_HASHLIMIT_SCALE
) * HZ
* CREDITS_PER_JIFFY
;
451 return (user
* HZ
* CREDITS_PER_JIFFY
) / XT_HASHLIMIT_SCALE
;
454 static inline void rateinfo_recalc(struct dsthash_ent
*dh
, unsigned long now
)
456 dh
->rateinfo
.credit
+= (now
- dh
->rateinfo
.prev
) * CREDITS_PER_JIFFY
;
457 if (dh
->rateinfo
.credit
> dh
->rateinfo
.credit_cap
)
458 dh
->rateinfo
.credit
= dh
->rateinfo
.credit_cap
;
459 dh
->rateinfo
.prev
= now
;
462 static inline __be32
maskl(__be32 a
, unsigned int l
)
464 return l
? htonl(ntohl(a
) & ~0 << (32 - l
)) : 0;
467 #if defined(CONFIG_IP6_NF_IPTABLES) || defined(CONFIG_IP6_NF_IPTABLES_MODULE)
468 static void hashlimit_ipv6_mask(__be32
*i
, unsigned int p
)
472 i
[0] = maskl(i
[0], p
);
473 i
[1] = i
[2] = i
[3] = 0;
476 i
[1] = maskl(i
[1], p
- 32);
480 i
[2] = maskl(i
[2], p
- 64);
483 i
[3] = maskl(i
[3], p
- 96);
492 hashlimit_init_dst(const struct xt_hashlimit_htable
*hinfo
,
493 struct dsthash_dst
*dst
,
494 const struct sk_buff
*skb
, unsigned int protoff
)
496 __be16 _ports
[2], *ports
;
499 memset(dst
, 0, sizeof(*dst
));
501 switch (hinfo
->family
) {
503 if (hinfo
->cfg
.mode
& XT_HASHLIMIT_HASH_DIP
)
504 dst
->ip
.dst
= maskl(ip_hdr(skb
)->daddr
,
506 if (hinfo
->cfg
.mode
& XT_HASHLIMIT_HASH_SIP
)
507 dst
->ip
.src
= maskl(ip_hdr(skb
)->saddr
,
510 if (!(hinfo
->cfg
.mode
&
511 (XT_HASHLIMIT_HASH_DPT
| XT_HASHLIMIT_HASH_SPT
)))
513 nexthdr
= ip_hdr(skb
)->protocol
;
515 #if defined(CONFIG_IP6_NF_IPTABLES) || defined(CONFIG_IP6_NF_IPTABLES_MODULE)
517 if (hinfo
->cfg
.mode
& XT_HASHLIMIT_HASH_DIP
) {
518 memcpy(&dst
->ip6
.dst
, &ipv6_hdr(skb
)->daddr
,
519 sizeof(dst
->ip6
.dst
));
520 hashlimit_ipv6_mask(dst
->ip6
.dst
, hinfo
->cfg
.dstmask
);
522 if (hinfo
->cfg
.mode
& XT_HASHLIMIT_HASH_SIP
) {
523 memcpy(&dst
->ip6
.src
, &ipv6_hdr(skb
)->saddr
,
524 sizeof(dst
->ip6
.src
));
525 hashlimit_ipv6_mask(dst
->ip6
.src
, hinfo
->cfg
.srcmask
);
528 if (!(hinfo
->cfg
.mode
&
529 (XT_HASHLIMIT_HASH_DPT
| XT_HASHLIMIT_HASH_SPT
)))
531 nexthdr
= ipv6_hdr(skb
)->nexthdr
;
532 protoff
= ipv6_skip_exthdr(skb
, sizeof(struct ipv6hdr
), &nexthdr
);
533 if ((int)protoff
< 0)
545 case IPPROTO_UDPLITE
:
548 ports
= skb_header_pointer(skb
, protoff
, sizeof(_ports
),
552 _ports
[0] = _ports
[1] = 0;
558 if (hinfo
->cfg
.mode
& XT_HASHLIMIT_HASH_SPT
)
559 dst
->src_port
= ports
[0];
560 if (hinfo
->cfg
.mode
& XT_HASHLIMIT_HASH_DPT
)
561 dst
->dst_port
= ports
[1];
566 hashlimit_mt_v0(const struct sk_buff
*skb
, const struct xt_match_param
*par
)
568 const struct xt_hashlimit_info
*r
=
569 ((const struct xt_hashlimit_info
*)par
->matchinfo
)->u
.master
;
570 struct xt_hashlimit_htable
*hinfo
= r
->hinfo
;
571 unsigned long now
= jiffies
;
572 struct dsthash_ent
*dh
;
573 struct dsthash_dst dst
;
575 if (hashlimit_init_dst(hinfo
, &dst
, skb
, par
->thoff
) < 0)
578 spin_lock_bh(&hinfo
->lock
);
579 dh
= dsthash_find(hinfo
, &dst
);
581 dh
= dsthash_alloc_init(hinfo
, &dst
);
583 spin_unlock_bh(&hinfo
->lock
);
587 dh
->expires
= jiffies
+ msecs_to_jiffies(hinfo
->cfg
.expire
);
588 dh
->rateinfo
.prev
= jiffies
;
589 dh
->rateinfo
.credit
= user2credits(hinfo
->cfg
.avg
*
591 dh
->rateinfo
.credit_cap
= user2credits(hinfo
->cfg
.avg
*
593 dh
->rateinfo
.cost
= user2credits(hinfo
->cfg
.avg
);
595 /* update expiration timeout */
596 dh
->expires
= now
+ msecs_to_jiffies(hinfo
->cfg
.expire
);
597 rateinfo_recalc(dh
, now
);
600 if (dh
->rateinfo
.credit
>= dh
->rateinfo
.cost
) {
601 /* We're underlimit. */
602 dh
->rateinfo
.credit
-= dh
->rateinfo
.cost
;
603 spin_unlock_bh(&hinfo
->lock
);
607 spin_unlock_bh(&hinfo
->lock
);
609 /* default case: we're overlimit, thus don't match */
613 *par
->hotdrop
= true;
618 hashlimit_mt(const struct sk_buff
*skb
, const struct xt_match_param
*par
)
620 const struct xt_hashlimit_mtinfo1
*info
= par
->matchinfo
;
621 struct xt_hashlimit_htable
*hinfo
= info
->hinfo
;
622 unsigned long now
= jiffies
;
623 struct dsthash_ent
*dh
;
624 struct dsthash_dst dst
;
626 if (hashlimit_init_dst(hinfo
, &dst
, skb
, par
->thoff
) < 0)
629 spin_lock_bh(&hinfo
->lock
);
630 dh
= dsthash_find(hinfo
, &dst
);
632 dh
= dsthash_alloc_init(hinfo
, &dst
);
634 spin_unlock_bh(&hinfo
->lock
);
638 dh
->expires
= jiffies
+ msecs_to_jiffies(hinfo
->cfg
.expire
);
639 dh
->rateinfo
.prev
= jiffies
;
640 dh
->rateinfo
.credit
= user2credits(hinfo
->cfg
.avg
*
642 dh
->rateinfo
.credit_cap
= user2credits(hinfo
->cfg
.avg
*
644 dh
->rateinfo
.cost
= user2credits(hinfo
->cfg
.avg
);
646 /* update expiration timeout */
647 dh
->expires
= now
+ msecs_to_jiffies(hinfo
->cfg
.expire
);
648 rateinfo_recalc(dh
, now
);
651 if (dh
->rateinfo
.credit
>= dh
->rateinfo
.cost
) {
652 /* below the limit */
653 dh
->rateinfo
.credit
-= dh
->rateinfo
.cost
;
654 spin_unlock_bh(&hinfo
->lock
);
655 return !(info
->cfg
.mode
& XT_HASHLIMIT_INVERT
);
658 spin_unlock_bh(&hinfo
->lock
);
659 /* default match is underlimit - so over the limit, we need to invert */
660 return info
->cfg
.mode
& XT_HASHLIMIT_INVERT
;
663 *par
->hotdrop
= true;
667 static bool hashlimit_mt_check_v0(const struct xt_mtchk_param
*par
)
669 struct xt_hashlimit_info
*r
= par
->matchinfo
;
671 /* Check for overflow. */
672 if (r
->cfg
.burst
== 0 ||
673 user2credits(r
->cfg
.avg
* r
->cfg
.burst
) < user2credits(r
->cfg
.avg
)) {
674 printk(KERN_ERR
"xt_hashlimit: overflow, try lower: %u/%u\n",
675 r
->cfg
.avg
, r
->cfg
.burst
);
678 if (r
->cfg
.mode
== 0 ||
679 r
->cfg
.mode
> (XT_HASHLIMIT_HASH_DPT
|
680 XT_HASHLIMIT_HASH_DIP
|
681 XT_HASHLIMIT_HASH_SIP
|
682 XT_HASHLIMIT_HASH_SPT
))
684 if (!r
->cfg
.gc_interval
)
688 if (r
->name
[sizeof(r
->name
) - 1] != '\0')
691 /* This is the best we've got: We cannot release and re-grab lock,
692 * since checkentry() is called before x_tables.c grabs xt_mutex.
693 * We also cannot grab the hashtable spinlock, since htable_create will
694 * call vmalloc, and that can sleep. And we cannot just re-search
695 * the list of htable's in htable_create(), since then we would
696 * create duplicate proc files. -HW */
697 mutex_lock(&hlimit_mutex
);
698 r
->hinfo
= htable_find_get(r
->name
, par
->match
->family
);
699 if (!r
->hinfo
&& htable_create_v0(r
, par
->match
->family
) != 0) {
700 mutex_unlock(&hlimit_mutex
);
703 mutex_unlock(&hlimit_mutex
);
705 /* Ugly hack: For SMP, we only want to use one set */
710 static bool hashlimit_mt_check(const struct xt_mtchk_param
*par
)
712 struct xt_hashlimit_mtinfo1
*info
= par
->matchinfo
;
714 /* Check for overflow. */
715 if (info
->cfg
.burst
== 0 ||
716 user2credits(info
->cfg
.avg
* info
->cfg
.burst
) <
717 user2credits(info
->cfg
.avg
)) {
718 printk(KERN_ERR
"xt_hashlimit: overflow, try lower: %u/%u\n",
719 info
->cfg
.avg
, info
->cfg
.burst
);
722 if (info
->cfg
.gc_interval
== 0 || info
->cfg
.expire
== 0)
724 if (info
->name
[sizeof(info
->name
)-1] != '\0')
726 if (par
->match
->family
== NFPROTO_IPV4
) {
727 if (info
->cfg
.srcmask
> 32 || info
->cfg
.dstmask
> 32)
730 if (info
->cfg
.srcmask
> 128 || info
->cfg
.dstmask
> 128)
734 /* This is the best we've got: We cannot release and re-grab lock,
735 * since checkentry() is called before x_tables.c grabs xt_mutex.
736 * We also cannot grab the hashtable spinlock, since htable_create will
737 * call vmalloc, and that can sleep. And we cannot just re-search
738 * the list of htable's in htable_create(), since then we would
739 * create duplicate proc files. -HW */
740 mutex_lock(&hlimit_mutex
);
741 info
->hinfo
= htable_find_get(info
->name
, par
->match
->family
);
742 if (!info
->hinfo
&& htable_create(info
, par
->match
->family
) != 0) {
743 mutex_unlock(&hlimit_mutex
);
746 mutex_unlock(&hlimit_mutex
);
751 hashlimit_mt_destroy_v0(const struct xt_mtdtor_param
*par
)
753 const struct xt_hashlimit_info
*r
= par
->matchinfo
;
755 htable_put(r
->hinfo
);
758 static void hashlimit_mt_destroy(const struct xt_mtdtor_param
*par
)
760 const struct xt_hashlimit_mtinfo1
*info
= par
->matchinfo
;
762 htable_put(info
->hinfo
);
766 struct compat_xt_hashlimit_info
{
768 struct hashlimit_cfg cfg
;
770 compat_uptr_t master
;
773 static void hashlimit_mt_compat_from_user(void *dst
, void *src
)
775 int off
= offsetof(struct compat_xt_hashlimit_info
, hinfo
);
777 memcpy(dst
, src
, off
);
778 memset(dst
+ off
, 0, sizeof(struct compat_xt_hashlimit_info
) - off
);
781 static int hashlimit_mt_compat_to_user(void __user
*dst
, void *src
)
783 int off
= offsetof(struct compat_xt_hashlimit_info
, hinfo
);
785 return copy_to_user(dst
, src
, off
) ? -EFAULT
: 0;
789 static struct xt_match hashlimit_mt_reg
[] __read_mostly
= {
793 .family
= NFPROTO_IPV4
,
794 .match
= hashlimit_mt_v0
,
795 .matchsize
= sizeof(struct xt_hashlimit_info
),
797 .compatsize
= sizeof(struct compat_xt_hashlimit_info
),
798 .compat_from_user
= hashlimit_mt_compat_from_user
,
799 .compat_to_user
= hashlimit_mt_compat_to_user
,
801 .checkentry
= hashlimit_mt_check_v0
,
802 .destroy
= hashlimit_mt_destroy_v0
,
808 .family
= NFPROTO_IPV4
,
809 .match
= hashlimit_mt
,
810 .matchsize
= sizeof(struct xt_hashlimit_mtinfo1
),
811 .checkentry
= hashlimit_mt_check
,
812 .destroy
= hashlimit_mt_destroy
,
815 #if defined(CONFIG_IP6_NF_IPTABLES) || defined(CONFIG_IP6_NF_IPTABLES_MODULE)
818 .family
= NFPROTO_IPV6
,
819 .match
= hashlimit_mt_v0
,
820 .matchsize
= sizeof(struct xt_hashlimit_info
),
822 .compatsize
= sizeof(struct compat_xt_hashlimit_info
),
823 .compat_from_user
= hashlimit_mt_compat_from_user
,
824 .compat_to_user
= hashlimit_mt_compat_to_user
,
826 .checkentry
= hashlimit_mt_check_v0
,
827 .destroy
= hashlimit_mt_destroy_v0
,
833 .family
= NFPROTO_IPV6
,
834 .match
= hashlimit_mt
,
835 .matchsize
= sizeof(struct xt_hashlimit_mtinfo1
),
836 .checkentry
= hashlimit_mt_check
,
837 .destroy
= hashlimit_mt_destroy
,
844 static void *dl_seq_start(struct seq_file
*s
, loff_t
*pos
)
845 __acquires(htable
->lock
)
847 struct proc_dir_entry
*pde
= s
->private;
848 struct xt_hashlimit_htable
*htable
= pde
->data
;
849 unsigned int *bucket
;
851 spin_lock_bh(&htable
->lock
);
852 if (*pos
>= htable
->cfg
.size
)
855 bucket
= kmalloc(sizeof(unsigned int), GFP_ATOMIC
);
857 return ERR_PTR(-ENOMEM
);
863 static void *dl_seq_next(struct seq_file
*s
, void *v
, loff_t
*pos
)
865 struct proc_dir_entry
*pde
= s
->private;
866 struct xt_hashlimit_htable
*htable
= pde
->data
;
867 unsigned int *bucket
= (unsigned int *)v
;
870 if (*pos
>= htable
->cfg
.size
) {
877 static void dl_seq_stop(struct seq_file
*s
, void *v
)
878 __releases(htable
->lock
)
880 struct proc_dir_entry
*pde
= s
->private;
881 struct xt_hashlimit_htable
*htable
= pde
->data
;
882 unsigned int *bucket
= (unsigned int *)v
;
885 spin_unlock_bh(&htable
->lock
);
888 static int dl_seq_real_show(struct dsthash_ent
*ent
, u_int8_t family
,
891 /* recalculate to show accurate numbers */
892 rateinfo_recalc(ent
, jiffies
);
896 return seq_printf(s
, "%ld %pI4:%u->%pI4:%u %u %u %u\n",
897 (long)(ent
->expires
- jiffies
)/HZ
,
899 ntohs(ent
->dst
.src_port
),
901 ntohs(ent
->dst
.dst_port
),
902 ent
->rateinfo
.credit
, ent
->rateinfo
.credit_cap
,
904 #if defined(CONFIG_IP6_NF_IPTABLES) || defined(CONFIG_IP6_NF_IPTABLES_MODULE)
906 return seq_printf(s
, "%ld %pI6:%u->%pI6:%u %u %u %u\n",
907 (long)(ent
->expires
- jiffies
)/HZ
,
909 ntohs(ent
->dst
.src_port
),
911 ntohs(ent
->dst
.dst_port
),
912 ent
->rateinfo
.credit
, ent
->rateinfo
.credit_cap
,
921 static int dl_seq_show(struct seq_file
*s
, void *v
)
923 struct proc_dir_entry
*pde
= s
->private;
924 struct xt_hashlimit_htable
*htable
= pde
->data
;
925 unsigned int *bucket
= (unsigned int *)v
;
926 struct dsthash_ent
*ent
;
927 struct hlist_node
*pos
;
929 if (!hlist_empty(&htable
->hash
[*bucket
])) {
930 hlist_for_each_entry(ent
, pos
, &htable
->hash
[*bucket
], node
)
931 if (dl_seq_real_show(ent
, htable
->family
, s
))
937 static const struct seq_operations dl_seq_ops
= {
938 .start
= dl_seq_start
,
944 static int dl_proc_open(struct inode
*inode
, struct file
*file
)
946 int ret
= seq_open(file
, &dl_seq_ops
);
949 struct seq_file
*sf
= file
->private_data
;
950 sf
->private = PDE(inode
);
955 static const struct file_operations dl_file_ops
= {
956 .owner
= THIS_MODULE
,
957 .open
= dl_proc_open
,
960 .release
= seq_release
963 static int __init
hashlimit_mt_init(void)
967 err
= xt_register_matches(hashlimit_mt_reg
,
968 ARRAY_SIZE(hashlimit_mt_reg
));
973 hashlimit_cachep
= kmem_cache_create("xt_hashlimit",
974 sizeof(struct dsthash_ent
), 0, 0,
976 if (!hashlimit_cachep
) {
977 printk(KERN_ERR
"xt_hashlimit: unable to create slab cache\n");
980 hashlimit_procdir4
= proc_mkdir("ipt_hashlimit", init_net
.proc_net
);
981 if (!hashlimit_procdir4
) {
982 printk(KERN_ERR
"xt_hashlimit: unable to create proc dir "
987 #if defined(CONFIG_IP6_NF_IPTABLES) || defined(CONFIG_IP6_NF_IPTABLES_MODULE)
988 hashlimit_procdir6
= proc_mkdir("ip6t_hashlimit", init_net
.proc_net
);
989 if (!hashlimit_procdir6
) {
990 printk(KERN_ERR
"xt_hashlimit: unable to create proc dir "
997 remove_proc_entry("ipt_hashlimit", init_net
.proc_net
);
999 kmem_cache_destroy(hashlimit_cachep
);
1001 xt_unregister_matches(hashlimit_mt_reg
, ARRAY_SIZE(hashlimit_mt_reg
));
1007 static void __exit
hashlimit_mt_exit(void)
1009 remove_proc_entry("ipt_hashlimit", init_net
.proc_net
);
1010 #if defined(CONFIG_IP6_NF_IPTABLES) || defined(CONFIG_IP6_NF_IPTABLES_MODULE)
1011 remove_proc_entry("ip6t_hashlimit", init_net
.proc_net
);
1013 kmem_cache_destroy(hashlimit_cachep
);
1014 xt_unregister_matches(hashlimit_mt_reg
, ARRAY_SIZE(hashlimit_mt_reg
));
1017 module_init(hashlimit_mt_init
);
1018 module_exit(hashlimit_mt_exit
);