2 * Checksum updating actions
4 * Copyright (c) 2010 Gregoire Baron <baronchon@n7mm.org>
6 * This program is free software; you can redistribute it and/or modify it
7 * under the terms of the GNU General Public License as published by the Free
8 * Software Foundation; either version 2 of the License, or (at your option)
13 #include <linux/types.h>
14 #include <linux/init.h>
15 #include <linux/kernel.h>
16 #include <linux/module.h>
17 #include <linux/spinlock.h>
19 #include <linux/netlink.h>
20 #include <net/netlink.h>
21 #include <linux/rtnetlink.h>
23 #include <linux/skbuff.h>
28 #include <linux/icmpv6.h>
29 #include <linux/igmp.h>
32 #include <net/ip6_checksum.h>
34 #include <net/act_api.h>
36 #include <linux/tc_act/tc_csum.h>
37 #include <net/tc_act/tc_csum.h>
/*
 * File-scope state of the csum action: CSUM_TAB_MASK is used both to size
 * tcf_csum_ht (CSUM_TAB_MASK + 1 entries) and as csum_hash_info.hmask.
 * csum_idx_gen is handed to tcf_hash_create() by tcf_csum_init().
 */
39 #define CSUM_TAB_MASK 15
40 static struct tcf_common *tcf_csum_ht[CSUM_TAB_MASK + 1];
41 static u32 csum_idx_gen;
42 static DEFINE_RWLOCK(csum_lock);
/* Hash descriptor passed to the tcf_hash_*() helpers and to act_csum_ops.hinfo */
44 static struct tcf_hashinfo csum_hash_info = {
46 .hmask = CSUM_TAB_MASK,
/* Netlink policy: TCA_CSUM_PARMS is sized as a struct tc_csum */
50 static const struct nla_policy csum_policy[TCA_CSUM_MAX + 1] = {
51 [TCA_CSUM_PARMS] = { .len = sizeof(struct tc_csum), },
/*
 * Netlink init handler of the csum action (installed as act_csum_ops.init).
 * Parses the nested attributes against csum_policy, reads the struct tc_csum
 * carried by TCA_CSUM_PARMS and copies its action and update_flags into the
 * action instance while holding tcf_lock.
 */
54 static int tcf_csum_init(struct net *n, struct nlattr *nla, struct nlattr *est,
55 struct tc_action *a, int ovr, int bind)
57 struct nlattr *tb[TCA_CSUM_MAX + 1];
59 struct tcf_common *pc;
66 err = nla_parse_nested(tb, TCA_CSUM_MAX, nla, csum_policy);
/* presence of TCA_CSUM_PARMS is checked before parm is taken from it */
70 if (tb[TCA_CSUM_PARMS] == NULL)
72 parm = nla_data(tb[TCA_CSUM_PARMS]);
/*
 * Look the instance up by parm->index; tcf_hash_create() allocates one of
 * sizeof(*p) (presumably only when the lookup found nothing - confirm).
 */
74 pc = tcf_hash_check(parm->index, a, bind, &csum_hash_info);
76 pc = tcf_hash_create(parm->index, est, a, sizeof(*p), bind,
77 &csum_idx_gen, &csum_hash_info);
85 tcf_hash_release(pc, bind, &csum_hash_info);
/* publish the new parameters atomically with respect to tcf_csum() */
90 spin_lock_bh(&p->tcf_lock);
91 p->tcf_action = parm->action;
92 p->update_flags = parm->update_flags;
93 spin_unlock_bh(&p->tcf_lock);
/* only a freshly created instance is inserted into the hash */
95 if (ret == ACT_P_CREATED)
96 tcf_hash_insert(pc, &csum_hash_info);
/*
 * Cleanup handler (act_csum_ops.cleanup): releases the action's common part
 * through tcf_hash_release() and returns that helper's result.
 */
101 static int tcf_csum_cleanup(struct tc_action *a, int bind)
103 struct tcf_csum *p = a->priv;
104 return tcf_hash_release(&p->common, bind, &csum_hash_info);
108 * tcf_csum_skb_nextlayer - Get next layer pointer
109 * @skb: sk_buff to use
110 * @ihl: previous summed headers length
111 * @ipl: complete packet length
112 * @jhl: next header length
114 * Check the expected next layer availability in the specified sk_buff.
115 * Return the next layer pointer if pass, NULL otherwise.
/*
 * All lengths are relative to the network header; ntkoff converts them to
 * offsets usable with pskb_may_pull() and skb_clone_writable().
 */
117 static void *tcf_csum_skb_nextlayer(struct sk_buff *skb,
118 unsigned int ihl, unsigned int ipl,
121 int ntkoff = skb_network_offset(skb);
/*
 * The check fails when the ipl bytes cannot be pulled, when ipl is smaller
 * than hl, or when the first hl bytes are not writable and
 * pskb_expand_head() cannot provide a private copy.
 */
124 if (!pskb_may_pull(skb, ipl + ntkoff) || (ipl < hl) ||
126 !skb_clone_writable(skb, hl + ntkoff) &&
127 pskb_expand_head(skb, 0, 0, GFP_ATOMIC)))
/* the header is re-read here because the calls above may have moved it */
130 return (void *)(skb_network_header(skb) + ihl);
/*
 * Recompute the ICMP checksum of an IPv4 packet.
 * @ihl: IPv4 header length in bytes, @ipl: total packet length in bytes.
 * The sum covers the ipl - ihl bytes starting at the ICMP header, is folded
 * into icmph->checksum, and the skb is marked CHECKSUM_NONE.
 */
133 static int tcf_csum_ipv4_icmp(struct sk_buff *skb,
134 unsigned int ihl, unsigned int ipl)
136 struct icmphdr *icmph;
138 icmph = tcf_csum_skb_nextlayer(skb, ihl, ipl, sizeof(*icmph));
143 skb->csum = csum_partial(icmph, ipl - ihl, 0);
144 icmph->checksum = csum_fold(skb->csum);
146 skb->ip_summed = CHECKSUM_NONE;
/*
 * Recompute the IGMP checksum of an IPv4 packet.
 * @ihl: IPv4 header length in bytes, @ipl: total packet length in bytes.
 * The sum covers the ipl - ihl bytes starting at the IGMP header, is folded
 * into igmph->csum, and the skb is marked CHECKSUM_NONE.
 */
151 static int tcf_csum_ipv4_igmp(struct sk_buff *skb,
152 unsigned int ihl, unsigned int ipl)
154 struct igmphdr *igmph;
156 igmph = tcf_csum_skb_nextlayer(skb, ihl, ipl, sizeof(*igmph));
161 skb->csum = csum_partial(igmph, ipl - ihl, 0);
162 igmph->csum = csum_fold(skb->csum);
164 skb->ip_summed = CHECKSUM_NONE;
/*
 * Recompute the ICMPv6 checksum.
 * @ip6h supplies the source and destination addresses for the pseudo-header,
 * @ihl is the offset of the ICMPv6 header from the network header and @ipl
 * the packet length, so the checksummed length is ipl - ihl.
 */
169 static int tcf_csum_ipv6_icmp(struct sk_buff *skb, struct ipv6hdr *ip6h,
170 unsigned int ihl, unsigned int ipl)
172 struct icmp6hdr *icmp6h;
174 icmp6h = tcf_csum_skb_nextlayer(skb, ihl, ipl, sizeof(*icmp6h));
/* the checksum field must be zero while the payload is being summed */
178 icmp6h->icmp6_cksum = 0;
179 skb->csum = csum_partial(icmp6h, ipl - ihl, 0);
180 icmp6h->icmp6_cksum = csum_ipv6_magic(&ip6h->saddr, &ip6h->daddr,
181 ipl - ihl, IPPROTO_ICMPV6,
184 skb->ip_summed = CHECKSUM_NONE;
/*
 * Recompute the TCP checksum of an IPv4 packet.
 * The partial sum over the ipl - ihl bytes of the TCP segment is combined
 * with the addresses from @iph by tcp_v4_check() and stored in tcph->check;
 * the skb is then marked CHECKSUM_NONE.
 */
189 static int tcf_csum_ipv4_tcp(struct sk_buff *skb, struct iphdr *iph,
190 unsigned int ihl, unsigned int ipl)
194 tcph = tcf_csum_skb_nextlayer(skb, ihl, ipl, sizeof(*tcph));
199 skb->csum = csum_partial(tcph, ipl - ihl, 0);
200 tcph->check = tcp_v4_check(ipl - ihl,
201 iph->saddr, iph->daddr, skb->csum);
203 skb->ip_summed = CHECKSUM_NONE;
/*
 * Recompute the TCP checksum of an IPv6 packet.
 * The partial sum over the ipl - ihl bytes of the TCP segment is combined
 * with the addresses from @ip6h by csum_ipv6_magic() (protocol IPPROTO_TCP)
 * and stored in tcph->check; the skb is then marked CHECKSUM_NONE.
 */
208 static int tcf_csum_ipv6_tcp(struct sk_buff *skb, struct ipv6hdr *ip6h,
209 unsigned int ihl, unsigned int ipl)
213 tcph = tcf_csum_skb_nextlayer(skb, ihl, ipl, sizeof(*tcph));
218 skb->csum = csum_partial(tcph, ipl - ihl, 0);
219 tcph->check = csum_ipv6_magic(&ip6h->saddr, &ip6h->daddr,
220 ipl - ihl, IPPROTO_TCP,
223 skb->ip_summed = CHECKSUM_NONE;
/*
 * Recompute the UDP or UDP-Lite checksum of an IPv4 packet.
 * @udplite: callers pass 0 for IPPROTO_UDP and 1 for IPPROTO_UDPLITE.
 * ul is the host-order value of udph->len. Depending on the branch the sum
 * covers ipl - ihl bytes or ul bytes; ignore_obscure_skb is the exit for
 * lengths the function does not handle.
 */
228 static int tcf_csum_ipv4_udp(struct sk_buff *skb, struct iphdr *iph,
229 unsigned int ihl, unsigned int ipl, int udplite)
235 * Support both UDP and UDPLITE checksum algorithms, Don't use
236 * udph->len to get the real length without any protocol check,
237 * UDPLITE uses udph->len for another thing,
238 * Use iph->tot_len, or just ipl.
241 udph = tcf_csum_skb_nextlayer(skb, ihl, ipl, sizeof(*udph));
245 ul = ntohs(udph->len);
/* plain UDP with a zero checksum field does not enter this branch */
247 if (udplite || udph->check) {
253 skb->csum = csum_partial(udph, ipl - ihl, 0);
/* a partial-coverage length must fit between the header size and the payload */
254 else if ((ul >= sizeof(*udph)) && (ul <= ipl - ihl))
255 skb->csum = csum_partial(udph, ul, 0);
257 goto ignore_obscure_skb;
260 goto ignore_obscure_skb;
262 skb->csum = csum_partial(udph, ul, 0);
265 udph->check = csum_tcpudp_magic(iph->saddr, iph->daddr,
/* NOTE(review): presumably substituted when the computed checksum is 0 - confirm */
270 udph->check = CSUM_MANGLED_0;
273 skb->ip_summed = CHECKSUM_NONE;
/*
 * Recompute the UDP or UDP-Lite checksum of an IPv6 packet.
 * @udplite: callers pass 0 for IPPROTO_UDP and 1 for IPPROTO_UDPLITE; it also
 * selects the protocol number fed to csum_ipv6_magic().
 * ul is the host-order value of udph->len. Depending on the branch the sum
 * covers ipl - ihl bytes or ul bytes; ignore_obscure_skb is the exit for
 * lengths the function does not handle.
 */
279 static int tcf_csum_ipv6_udp(struct sk_buff *skb, struct ipv6hdr *ip6h,
280 unsigned int ihl, unsigned int ipl, int udplite)
286 * Support both UDP and UDPLITE checksum algorithms, Don't use
287 * udph->len to get the real length without any protocol check,
288 * UDPLITE uses udph->len for another thing,
289 * Use ip6h->payload_len + sizeof(*ip6h) ... , or just ipl.
292 udph = tcf_csum_skb_nextlayer(skb, ihl, ipl, sizeof(*udph));
296 ul = ntohs(udph->len);
302 skb->csum = csum_partial(udph, ipl - ihl, 0);
/* a partial-coverage length must fit between the header size and the payload */
304 else if ((ul >= sizeof(*udph)) && (ul <= ipl - ihl))
305 skb->csum = csum_partial(udph, ul, 0);
308 goto ignore_obscure_skb;
311 goto ignore_obscure_skb;
313 skb->csum = csum_partial(udph, ul, 0);
316 udph->check = csum_ipv6_magic(&ip6h->saddr, &ip6h->daddr, ul,
317 udplite ? IPPROTO_UDPLITE : IPPROTO_UDP,
/* NOTE(review): presumably substituted when the computed checksum is 0 - confirm */
321 udph->check = CSUM_MANGLED_0;
323 skb->ip_summed = CHECKSUM_NONE;
/*
 * IPv4 entry point: dispatch on the layer-4 protocol and update the checksums
 * selected by @update_flags (TCA_CSUM_UPDATE_FLAG_* bits).
 * Each helper receives the header length iph->ihl * 4 and the total length
 * ntohs(iph->tot_len).
 */
329 static int tcf_csum_ipv4(struct sk_buff *skb, u32 update_flags)
334 ntkoff = skb_network_offset(skb);
336 if (!pskb_may_pull(skb, sizeof(*iph) + ntkoff))
/* fragments with a non-zero offset switch on 0 instead of their protocol */
341 switch (iph->frag_off & htons(IP_OFFSET) ? 0 : iph->protocol) {
343 if (update_flags & TCA_CSUM_UPDATE_FLAG_ICMP)
344 if (!tcf_csum_ipv4_icmp(skb, iph->ihl * 4,
345 ntohs(iph->tot_len)))
349 if (update_flags & TCA_CSUM_UPDATE_FLAG_IGMP)
350 if (!tcf_csum_ipv4_igmp(skb, iph->ihl * 4,
351 ntohs(iph->tot_len)))
355 if (update_flags & TCA_CSUM_UPDATE_FLAG_TCP)
356 if (!tcf_csum_ipv4_tcp(skb, iph, iph->ihl * 4,
357 ntohs(iph->tot_len)))
361 if (update_flags & TCA_CSUM_UPDATE_FLAG_UDP)
362 if (!tcf_csum_ipv4_udp(skb, iph, iph->ihl * 4,
363 ntohs(iph->tot_len), 0))
366 case IPPROTO_UDPLITE:
367 if (update_flags & TCA_CSUM_UPDATE_FLAG_UDPLITE)
368 if (!tcf_csum_ipv4_udp(skb, iph, iph->ihl * 4,
369 ntohs(iph->tot_len), 1))
/* IPv4 header checksum: the header must be writable before it is touched */
374 if (update_flags & TCA_CSUM_UPDATE_FLAG_IPV4HDR) {
375 if (skb_cloned(skb) &&
376 !skb_clone_writable(skb, sizeof(*iph) + ntkoff) &&
377 pskb_expand_head(skb, 0, 0, GFP_ATOMIC))
/*
 * Scan an IPv6 hop-by-hop options header.
 * @ip6xh: the extension header, accessed byte-wise through xh.
 * @ixhl: length of the extension header as computed by the caller.
 * @pl: payload length; overwritten with the 32-bit big-endian value found in
 *      a well-formed jumbo option.
 */
389 static int tcf_csum_ipv6_hopopts(struct ipv6_opt_hdr *ip6xh,
390 unsigned int ixhl, unsigned int *pl)
392 int off, len, optlen;
393 unsigned char *xh = (void *)ip6xh;
/* options start right after the fixed part of the extension header */
395 off = sizeof(*ip6xh);
/* option size = its length byte plus 2 (presumably the type and length bytes) */
404 optlen = xh[off + 1] + 2;
405 if (optlen != 6 || len < 6 || (off & 3) != 2)
406 /* wrong jumbo option length/alignment */
/* jumbo payload length is stored 2 bytes into the option */
408 *pl = ntohl(*(__be32 *)(xh + off + 2));
411 optlen = xh[off + 1] + 2;
413 /* ignore obscure options */
/*
 * IPv6 entry point: step over extension headers until a layer-4 protocol is
 * found, then update the checksum selected by @update_flags.
 * hl is the offset (from the network header) of the header being examined;
 * pl starts as the header's payload_len and may be replaced by
 * tcf_csum_ipv6_hopopts(). Helpers receive pl + sizeof(*ip6h) as the packet
 * length.
 */
425 static int tcf_csum_ipv6(struct sk_buff *skb, u32 update_flags)
427 struct ipv6hdr *ip6h;
428 struct ipv6_opt_hdr *ip6xh;
429 unsigned int hl, ixhl;
434 ntkoff = skb_network_offset(skb);
438 if (!pskb_may_pull(skb, hl + ntkoff))
441 ip6h = ipv6_hdr(skb);
443 pl = ntohs(ip6h->payload_len);
444 nexthdr = ip6h->nexthdr;
448 case NEXTHDR_FRAGMENT:
450 case NEXTHDR_ROUTING:
/* pull the generic option header first, then the full extension header */
453 if (!pskb_may_pull(skb, hl + sizeof(*ip6xh) + ntkoff))
455 ip6xh = (void *)(skb_network_header(skb) + hl);
456 ixhl = ipv6_optlen(ip6xh);
457 if (!pskb_may_pull(skb, hl + ixhl + ntkoff))
/* only hop-by-hop headers are scanned for options */
459 if ((nexthdr == NEXTHDR_HOP) &&
460 !(tcf_csum_ipv6_hopopts(ip6xh, ixhl, &pl)))
462 nexthdr = ip6xh->nexthdr;
466 if (update_flags & TCA_CSUM_UPDATE_FLAG_ICMP)
467 if (!tcf_csum_ipv6_icmp(skb, ip6h,
468 hl, pl + sizeof(*ip6h)))
472 if (update_flags & TCA_CSUM_UPDATE_FLAG_TCP)
473 if (!tcf_csum_ipv6_tcp(skb, ip6h,
474 hl, pl + sizeof(*ip6h)))
478 if (update_flags & TCA_CSUM_UPDATE_FLAG_UDP)
479 if (!tcf_csum_ipv6_udp(skb, ip6h, hl,
480 pl + sizeof(*ip6h), 0))
483 case IPPROTO_UDPLITE:
484 if (update_flags & TCA_CSUM_UPDATE_FLAG_UDPLITE)
485 if (!tcf_csum_ipv6_udp(skb, ip6h, hl,
486 pl + sizeof(*ip6h), 1))
/* keep walking while at least one more byte past hl can be pulled */
492 } while (pskb_may_pull(skb, hl + 1 + ntkoff));
/*
 * Per-packet handler of the csum action.
 * Updates the usage timestamp and byte/packet statistics, snapshots the
 * configured action and update_flags under tcf_lock, then dispatches on
 * skb->protocol to the IPv4 or IPv6 checksum routine. The drop counter is
 * incremented under the same lock.
 */
502 static int tcf_csum(struct sk_buff *skb,
503 const struct tc_action *a, struct tcf_result *res)
505 struct tcf_csum *p = a->priv;
/* copy the parameters out so the checksum work runs without the lock held */
509 spin_lock(&p->tcf_lock);
510 p->tcf_tm.lastuse = jiffies;
511 bstats_update(&p->tcf_bstats, skb);
512 action = p->tcf_action;
513 update_flags = p->update_flags;
514 spin_unlock(&p->tcf_lock);
516 if (unlikely(action == TC_ACT_SHOT))
519 switch (skb->protocol) {
520 case cpu_to_be16(ETH_P_IP):
521 if (!tcf_csum_ipv4(skb, update_flags))
524 case cpu_to_be16(ETH_P_IPV6):
525 if (!tcf_csum_ipv6(skb, update_flags))
533 spin_lock(&p->tcf_lock);
534 p->tcf_qstats.drops++;
535 spin_unlock(&p->tcf_lock);
/*
 * Dump handler (act_csum_ops.dump): writes the action's parameters as
 * TCA_CSUM_PARMS and its timing information as TCA_CSUM_TM into @skb.
 * @bind and @ref are subtracted from the reported bind and reference counts.
 * Either nla_put() failing jumps to nla_put_failure.
 */
539 static int tcf_csum_dump(struct sk_buff *skb,
540 struct tc_action *a, int bind, int ref)
/* NOTE(review): b presumably marks the tail for trimming on failure - confirm */
542 unsigned char *b = skb_tail_pointer(skb);
543 struct tcf_csum *p = a->priv;
544 struct tc_csum opt = {
545 .update_flags = p->update_flags,
546 .index = p->tcf_index,
547 .action = p->tcf_action,
548 .refcnt = p->tcf_refcnt - ref,
549 .bindcnt = p->tcf_bindcnt - bind,
553 if (nla_put(skb, TCA_CSUM_PARMS, sizeof(opt), &opt))
554 goto nla_put_failure;
/* install and lastuse are reported as ages relative to the current jiffies */
555 t.install = jiffies_to_clock_t(jiffies - p->tcf_tm.install);
556 t.lastuse = jiffies_to_clock_t(jiffies - p->tcf_tm.lastuse);
557 t.expires = jiffies_to_clock_t(p->tcf_tm.expires);
558 if (nla_put(skb, TCA_CSUM_TM, sizeof(t), &t))
559 goto nla_put_failure;
/*
 * Operations table registered for the csum action: type TCA_ACT_CSUM, the
 * csum hash table, this file's dump/cleanup/init handlers, and
 * tcf_hash_search / tcf_generic_walker for lookup and walk.
 */
568 static struct tc_action_ops act_csum_ops = {
570 .hinfo = &csum_hash_info,
571 .type = TCA_ACT_CSUM,
572 .capab = TCA_CAP_NONE,
573 .owner = THIS_MODULE,
575 .dump = tcf_csum_dump,
576 .cleanup = tcf_csum_cleanup,
577 .lookup = tcf_hash_search,
578 .init = tcf_csum_init,
579 .walk = tcf_generic_walker
582 MODULE_DESCRIPTION("Checksum updating actions");
583 MODULE_LICENSE("GPL");
/* Module entry point: registers act_csum_ops and returns the registration result. */
585 static int __init csum_init_module(void)
587 return tcf_register_action(&act_csum_ops);
/* Module exit point: unregisters act_csum_ops. */
590 static void __exit csum_cleanup_module(void)
592 tcf_unregister_action(&act_csum_ops);
/* Hook the functions above into module load and unload. */
595 module_init(csum_init_module);
596 module_exit(csum_cleanup_module);