Merge branch 'linus' into locking/urgent, to pick up fixes
[cascardo/linux.git] / net / sched / cls_flower.c
1 /*
2  * net/sched/cls_flower.c               Flower classifier
3  *
4  * Copyright (c) 2015 Jiri Pirko <jiri@resnulli.us>
5  *
6  * This program is free software; you can redistribute it and/or modify
7  * it under the terms of the GNU General Public License as published by
8  * the Free Software Foundation; either version 2 of the License, or
9  * (at your option) any later version.
10  */
11
12 #include <linux/kernel.h>
13 #include <linux/init.h>
14 #include <linux/module.h>
15 #include <linux/rhashtable.h>
16
17 #include <linux/if_ether.h>
18 #include <linux/in6.h>
19 #include <linux/ip.h>
20
21 #include <net/sch_generic.h>
22 #include <net/pkt_cls.h>
23 #include <net/ip.h>
24 #include <net/flow_dissector.h>
25
26 struct fl_flow_key {
27         int     indev_ifindex;
28         struct flow_dissector_key_control control;
29         struct flow_dissector_key_basic basic;
30         struct flow_dissector_key_eth_addrs eth;
31         struct flow_dissector_key_addrs ipaddrs;
32         union {
33                 struct flow_dissector_key_ipv4_addrs ipv4;
34                 struct flow_dissector_key_ipv6_addrs ipv6;
35         };
36         struct flow_dissector_key_ports tp;
37 } __aligned(BITS_PER_LONG / 8); /* Ensure that we can do comparisons as longs. */
38
39 struct fl_flow_mask_range {
40         unsigned short int start;
41         unsigned short int end;
42 };
43
44 struct fl_flow_mask {
45         struct fl_flow_key key;
46         struct fl_flow_mask_range range;
47         struct rcu_head rcu;
48 };
49
50 struct cls_fl_head {
51         struct rhashtable ht;
52         struct fl_flow_mask mask;
53         struct flow_dissector dissector;
54         u32 hgen;
55         bool mask_assigned;
56         struct list_head filters;
57         struct rhashtable_params ht_params;
58         struct rcu_head rcu;
59 };
60
61 struct cls_fl_filter {
62         struct rhash_head ht_node;
63         struct fl_flow_key mkey;
64         struct tcf_exts exts;
65         struct tcf_result res;
66         struct fl_flow_key key;
67         struct list_head list;
68         u32 handle;
69         u32 flags;
70         struct rcu_head rcu;
71 };
72
73 static unsigned short int fl_mask_range(const struct fl_flow_mask *mask)
74 {
75         return mask->range.end - mask->range.start;
76 }
77
78 static void fl_mask_update_range(struct fl_flow_mask *mask)
79 {
80         const u8 *bytes = (const u8 *) &mask->key;
81         size_t size = sizeof(mask->key);
82         size_t i, first = 0, last = size - 1;
83
84         for (i = 0; i < sizeof(mask->key); i++) {
85                 if (bytes[i]) {
86                         if (!first && i)
87                                 first = i;
88                         last = i;
89                 }
90         }
91         mask->range.start = rounddown(first, sizeof(long));
92         mask->range.end = roundup(last + 1, sizeof(long));
93 }
94
95 static void *fl_key_get_start(struct fl_flow_key *key,
96                               const struct fl_flow_mask *mask)
97 {
98         return (u8 *) key + mask->range.start;
99 }
100
101 static void fl_set_masked_key(struct fl_flow_key *mkey, struct fl_flow_key *key,
102                               struct fl_flow_mask *mask)
103 {
104         const long *lkey = fl_key_get_start(key, mask);
105         const long *lmask = fl_key_get_start(&mask->key, mask);
106         long *lmkey = fl_key_get_start(mkey, mask);
107         int i;
108
109         for (i = 0; i < fl_mask_range(mask); i += sizeof(long))
110                 *lmkey++ = *lkey++ & *lmask++;
111 }
112
113 static void fl_clear_masked_range(struct fl_flow_key *key,
114                                   struct fl_flow_mask *mask)
115 {
116         memset(fl_key_get_start(key, mask), 0, fl_mask_range(mask));
117 }
118
119 static int fl_classify(struct sk_buff *skb, const struct tcf_proto *tp,
120                        struct tcf_result *res)
121 {
122         struct cls_fl_head *head = rcu_dereference_bh(tp->root);
123         struct cls_fl_filter *f;
124         struct fl_flow_key skb_key;
125         struct fl_flow_key skb_mkey;
126
127         if (!atomic_read(&head->ht.nelems))
128                 return -1;
129
130         fl_clear_masked_range(&skb_key, &head->mask);
131         skb_key.indev_ifindex = skb->skb_iif;
132         /* skb_flow_dissect() does not set n_proto in case an unknown protocol,
133          * so do it rather here.
134          */
135         skb_key.basic.n_proto = skb->protocol;
136         skb_flow_dissect(skb, &head->dissector, &skb_key, 0);
137
138         fl_set_masked_key(&skb_mkey, &skb_key, &head->mask);
139
140         f = rhashtable_lookup_fast(&head->ht,
141                                    fl_key_get_start(&skb_mkey, &head->mask),
142                                    head->ht_params);
143         if (f && !tc_skip_sw(f->flags)) {
144                 *res = f->res;
145                 return tcf_exts_exec(skb, &f->exts, res);
146         }
147         return -1;
148 }
149
150 static int fl_init(struct tcf_proto *tp)
151 {
152         struct cls_fl_head *head;
153
154         head = kzalloc(sizeof(*head), GFP_KERNEL);
155         if (!head)
156                 return -ENOBUFS;
157
158         INIT_LIST_HEAD_RCU(&head->filters);
159         rcu_assign_pointer(tp->root, head);
160
161         return 0;
162 }
163
164 static void fl_destroy_filter(struct rcu_head *head)
165 {
166         struct cls_fl_filter *f = container_of(head, struct cls_fl_filter, rcu);
167
168         tcf_exts_destroy(&f->exts);
169         kfree(f);
170 }
171
172 static void fl_hw_destroy_filter(struct tcf_proto *tp, unsigned long cookie)
173 {
174         struct net_device *dev = tp->q->dev_queue->dev;
175         struct tc_cls_flower_offload offload = {0};
176         struct tc_to_netdev tc;
177
178         if (!tc_should_offload(dev, tp, 0))
179                 return;
180
181         offload.command = TC_CLSFLOWER_DESTROY;
182         offload.cookie = cookie;
183
184         tc.type = TC_SETUP_CLSFLOWER;
185         tc.cls_flower = &offload;
186
187         dev->netdev_ops->ndo_setup_tc(dev, tp->q->handle, tp->protocol, &tc);
188 }
189
190 static int fl_hw_replace_filter(struct tcf_proto *tp,
191                                 struct flow_dissector *dissector,
192                                 struct fl_flow_key *mask,
193                                 struct fl_flow_key *key,
194                                 struct tcf_exts *actions,
195                                 unsigned long cookie, u32 flags)
196 {
197         struct net_device *dev = tp->q->dev_queue->dev;
198         struct tc_cls_flower_offload offload = {0};
199         struct tc_to_netdev tc;
200         int err;
201
202         if (!tc_should_offload(dev, tp, flags))
203                 return tc_skip_sw(flags) ? -EINVAL : 0;
204
205         offload.command = TC_CLSFLOWER_REPLACE;
206         offload.cookie = cookie;
207         offload.dissector = dissector;
208         offload.mask = mask;
209         offload.key = key;
210         offload.exts = actions;
211
212         tc.type = TC_SETUP_CLSFLOWER;
213         tc.cls_flower = &offload;
214
215         err = dev->netdev_ops->ndo_setup_tc(dev, tp->q->handle, tp->protocol, &tc);
216
217         if (tc_skip_sw(flags))
218                 return err;
219
220         return 0;
221 }
222
223 static void fl_hw_update_stats(struct tcf_proto *tp, struct cls_fl_filter *f)
224 {
225         struct net_device *dev = tp->q->dev_queue->dev;
226         struct tc_cls_flower_offload offload = {0};
227         struct tc_to_netdev tc;
228
229         if (!tc_should_offload(dev, tp, 0))
230                 return;
231
232         offload.command = TC_CLSFLOWER_STATS;
233         offload.cookie = (unsigned long)f;
234         offload.exts = &f->exts;
235
236         tc.type = TC_SETUP_CLSFLOWER;
237         tc.cls_flower = &offload;
238
239         dev->netdev_ops->ndo_setup_tc(dev, tp->q->handle, tp->protocol, &tc);
240 }
241
242 static bool fl_destroy(struct tcf_proto *tp, bool force)
243 {
244         struct cls_fl_head *head = rtnl_dereference(tp->root);
245         struct cls_fl_filter *f, *next;
246
247         if (!force && !list_empty(&head->filters))
248                 return false;
249
250         list_for_each_entry_safe(f, next, &head->filters, list) {
251                 fl_hw_destroy_filter(tp, (unsigned long)f);
252                 list_del_rcu(&f->list);
253                 call_rcu(&f->rcu, fl_destroy_filter);
254         }
255         RCU_INIT_POINTER(tp->root, NULL);
256         if (head->mask_assigned)
257                 rhashtable_destroy(&head->ht);
258         kfree_rcu(head, rcu);
259         return true;
260 }
261
262 static unsigned long fl_get(struct tcf_proto *tp, u32 handle)
263 {
264         struct cls_fl_head *head = rtnl_dereference(tp->root);
265         struct cls_fl_filter *f;
266
267         list_for_each_entry(f, &head->filters, list)
268                 if (f->handle == handle)
269                         return (unsigned long) f;
270         return 0;
271 }
272
273 static const struct nla_policy fl_policy[TCA_FLOWER_MAX + 1] = {
274         [TCA_FLOWER_UNSPEC]             = { .type = NLA_UNSPEC },
275         [TCA_FLOWER_CLASSID]            = { .type = NLA_U32 },
276         [TCA_FLOWER_INDEV]              = { .type = NLA_STRING,
277                                             .len = IFNAMSIZ },
278         [TCA_FLOWER_KEY_ETH_DST]        = { .len = ETH_ALEN },
279         [TCA_FLOWER_KEY_ETH_DST_MASK]   = { .len = ETH_ALEN },
280         [TCA_FLOWER_KEY_ETH_SRC]        = { .len = ETH_ALEN },
281         [TCA_FLOWER_KEY_ETH_SRC_MASK]   = { .len = ETH_ALEN },
282         [TCA_FLOWER_KEY_ETH_TYPE]       = { .type = NLA_U16 },
283         [TCA_FLOWER_KEY_IP_PROTO]       = { .type = NLA_U8 },
284         [TCA_FLOWER_KEY_IPV4_SRC]       = { .type = NLA_U32 },
285         [TCA_FLOWER_KEY_IPV4_SRC_MASK]  = { .type = NLA_U32 },
286         [TCA_FLOWER_KEY_IPV4_DST]       = { .type = NLA_U32 },
287         [TCA_FLOWER_KEY_IPV4_DST_MASK]  = { .type = NLA_U32 },
288         [TCA_FLOWER_KEY_IPV6_SRC]       = { .len = sizeof(struct in6_addr) },
289         [TCA_FLOWER_KEY_IPV6_SRC_MASK]  = { .len = sizeof(struct in6_addr) },
290         [TCA_FLOWER_KEY_IPV6_DST]       = { .len = sizeof(struct in6_addr) },
291         [TCA_FLOWER_KEY_IPV6_DST_MASK]  = { .len = sizeof(struct in6_addr) },
292         [TCA_FLOWER_KEY_TCP_SRC]        = { .type = NLA_U16 },
293         [TCA_FLOWER_KEY_TCP_DST]        = { .type = NLA_U16 },
294         [TCA_FLOWER_KEY_UDP_SRC]        = { .type = NLA_U16 },
295         [TCA_FLOWER_KEY_UDP_DST]        = { .type = NLA_U16 },
296 };
297
298 static void fl_set_key_val(struct nlattr **tb,
299                            void *val, int val_type,
300                            void *mask, int mask_type, int len)
301 {
302         if (!tb[val_type])
303                 return;
304         memcpy(val, nla_data(tb[val_type]), len);
305         if (mask_type == TCA_FLOWER_UNSPEC || !tb[mask_type])
306                 memset(mask, 0xff, len);
307         else
308                 memcpy(mask, nla_data(tb[mask_type]), len);
309 }
310
311 static int fl_set_key(struct net *net, struct nlattr **tb,
312                       struct fl_flow_key *key, struct fl_flow_key *mask)
313 {
314 #ifdef CONFIG_NET_CLS_IND
315         if (tb[TCA_FLOWER_INDEV]) {
316                 int err = tcf_change_indev(net, tb[TCA_FLOWER_INDEV]);
317                 if (err < 0)
318                         return err;
319                 key->indev_ifindex = err;
320                 mask->indev_ifindex = 0xffffffff;
321         }
322 #endif
323
324         fl_set_key_val(tb, key->eth.dst, TCA_FLOWER_KEY_ETH_DST,
325                        mask->eth.dst, TCA_FLOWER_KEY_ETH_DST_MASK,
326                        sizeof(key->eth.dst));
327         fl_set_key_val(tb, key->eth.src, TCA_FLOWER_KEY_ETH_SRC,
328                        mask->eth.src, TCA_FLOWER_KEY_ETH_SRC_MASK,
329                        sizeof(key->eth.src));
330
331         fl_set_key_val(tb, &key->basic.n_proto, TCA_FLOWER_KEY_ETH_TYPE,
332                        &mask->basic.n_proto, TCA_FLOWER_UNSPEC,
333                        sizeof(key->basic.n_proto));
334
335         if (key->basic.n_proto == htons(ETH_P_IP) ||
336             key->basic.n_proto == htons(ETH_P_IPV6)) {
337                 fl_set_key_val(tb, &key->basic.ip_proto, TCA_FLOWER_KEY_IP_PROTO,
338                                &mask->basic.ip_proto, TCA_FLOWER_UNSPEC,
339                                sizeof(key->basic.ip_proto));
340         }
341
342         if (tb[TCA_FLOWER_KEY_IPV4_SRC] || tb[TCA_FLOWER_KEY_IPV4_DST]) {
343                 key->control.addr_type = FLOW_DISSECTOR_KEY_IPV4_ADDRS;
344                 fl_set_key_val(tb, &key->ipv4.src, TCA_FLOWER_KEY_IPV4_SRC,
345                                &mask->ipv4.src, TCA_FLOWER_KEY_IPV4_SRC_MASK,
346                                sizeof(key->ipv4.src));
347                 fl_set_key_val(tb, &key->ipv4.dst, TCA_FLOWER_KEY_IPV4_DST,
348                                &mask->ipv4.dst, TCA_FLOWER_KEY_IPV4_DST_MASK,
349                                sizeof(key->ipv4.dst));
350         } else if (tb[TCA_FLOWER_KEY_IPV6_SRC] || tb[TCA_FLOWER_KEY_IPV6_DST]) {
351                 key->control.addr_type = FLOW_DISSECTOR_KEY_IPV6_ADDRS;
352                 fl_set_key_val(tb, &key->ipv6.src, TCA_FLOWER_KEY_IPV6_SRC,
353                                &mask->ipv6.src, TCA_FLOWER_KEY_IPV6_SRC_MASK,
354                                sizeof(key->ipv6.src));
355                 fl_set_key_val(tb, &key->ipv6.dst, TCA_FLOWER_KEY_IPV6_DST,
356                                &mask->ipv6.dst, TCA_FLOWER_KEY_IPV6_DST_MASK,
357                                sizeof(key->ipv6.dst));
358         }
359
360         if (key->basic.ip_proto == IPPROTO_TCP) {
361                 fl_set_key_val(tb, &key->tp.src, TCA_FLOWER_KEY_TCP_SRC,
362                                &mask->tp.src, TCA_FLOWER_UNSPEC,
363                                sizeof(key->tp.src));
364                 fl_set_key_val(tb, &key->tp.dst, TCA_FLOWER_KEY_TCP_DST,
365                                &mask->tp.dst, TCA_FLOWER_UNSPEC,
366                                sizeof(key->tp.dst));
367         } else if (key->basic.ip_proto == IPPROTO_UDP) {
368                 fl_set_key_val(tb, &key->tp.src, TCA_FLOWER_KEY_UDP_SRC,
369                                &mask->tp.src, TCA_FLOWER_UNSPEC,
370                                sizeof(key->tp.src));
371                 fl_set_key_val(tb, &key->tp.dst, TCA_FLOWER_KEY_UDP_DST,
372                                &mask->tp.dst, TCA_FLOWER_UNSPEC,
373                                sizeof(key->tp.dst));
374         }
375
376         return 0;
377 }
378
379 static bool fl_mask_eq(struct fl_flow_mask *mask1,
380                        struct fl_flow_mask *mask2)
381 {
382         const long *lmask1 = fl_key_get_start(&mask1->key, mask1);
383         const long *lmask2 = fl_key_get_start(&mask2->key, mask2);
384
385         return !memcmp(&mask1->range, &mask2->range, sizeof(mask1->range)) &&
386                !memcmp(lmask1, lmask2, fl_mask_range(mask1));
387 }
388
389 static const struct rhashtable_params fl_ht_params = {
390         .key_offset = offsetof(struct cls_fl_filter, mkey), /* base offset */
391         .head_offset = offsetof(struct cls_fl_filter, ht_node),
392         .automatic_shrinking = true,
393 };
394
395 static int fl_init_hashtable(struct cls_fl_head *head,
396                              struct fl_flow_mask *mask)
397 {
398         head->ht_params = fl_ht_params;
399         head->ht_params.key_len = fl_mask_range(mask);
400         head->ht_params.key_offset += mask->range.start;
401
402         return rhashtable_init(&head->ht, &head->ht_params);
403 }
404
405 #define FL_KEY_MEMBER_OFFSET(member) offsetof(struct fl_flow_key, member)
406 #define FL_KEY_MEMBER_SIZE(member) (sizeof(((struct fl_flow_key *) 0)->member))
407 #define FL_KEY_MEMBER_END_OFFSET(member)                                        \
408         (FL_KEY_MEMBER_OFFSET(member) + FL_KEY_MEMBER_SIZE(member))
409
410 #define FL_KEY_IN_RANGE(mask, member)                                           \
411         (FL_KEY_MEMBER_OFFSET(member) <= (mask)->range.end &&                   \
412          FL_KEY_MEMBER_END_OFFSET(member) >= (mask)->range.start)
413
414 #define FL_KEY_SET(keys, cnt, id, member)                                       \
415         do {                                                                    \
416                 keys[cnt].key_id = id;                                          \
417                 keys[cnt].offset = FL_KEY_MEMBER_OFFSET(member);                \
418                 cnt++;                                                          \
419         } while(0);
420
421 #define FL_KEY_SET_IF_IN_RANGE(mask, keys, cnt, id, member)                     \
422         do {                                                                    \
423                 if (FL_KEY_IN_RANGE(mask, member))                              \
424                         FL_KEY_SET(keys, cnt, id, member);                      \
425         } while(0);
426
427 static void fl_init_dissector(struct cls_fl_head *head,
428                               struct fl_flow_mask *mask)
429 {
430         struct flow_dissector_key keys[FLOW_DISSECTOR_KEY_MAX];
431         size_t cnt = 0;
432
433         FL_KEY_SET(keys, cnt, FLOW_DISSECTOR_KEY_CONTROL, control);
434         FL_KEY_SET(keys, cnt, FLOW_DISSECTOR_KEY_BASIC, basic);
435         FL_KEY_SET_IF_IN_RANGE(mask, keys, cnt,
436                                FLOW_DISSECTOR_KEY_ETH_ADDRS, eth);
437         FL_KEY_SET_IF_IN_RANGE(mask, keys, cnt,
438                                FLOW_DISSECTOR_KEY_IPV4_ADDRS, ipv4);
439         FL_KEY_SET_IF_IN_RANGE(mask, keys, cnt,
440                                FLOW_DISSECTOR_KEY_IPV6_ADDRS, ipv6);
441         FL_KEY_SET_IF_IN_RANGE(mask, keys, cnt,
442                                FLOW_DISSECTOR_KEY_PORTS, tp);
443
444         skb_flow_dissector_init(&head->dissector, keys, cnt);
445 }
446
447 static int fl_check_assign_mask(struct cls_fl_head *head,
448                                 struct fl_flow_mask *mask)
449 {
450         int err;
451
452         if (head->mask_assigned) {
453                 if (!fl_mask_eq(&head->mask, mask))
454                         return -EINVAL;
455                 else
456                         return 0;
457         }
458
459         /* Mask is not assigned yet. So assign it and init hashtable
460          * according to that.
461          */
462         err = fl_init_hashtable(head, mask);
463         if (err)
464                 return err;
465         memcpy(&head->mask, mask, sizeof(head->mask));
466         head->mask_assigned = true;
467
468         fl_init_dissector(head, mask);
469
470         return 0;
471 }
472
473 static int fl_set_parms(struct net *net, struct tcf_proto *tp,
474                         struct cls_fl_filter *f, struct fl_flow_mask *mask,
475                         unsigned long base, struct nlattr **tb,
476                         struct nlattr *est, bool ovr)
477 {
478         struct tcf_exts e;
479         int err;
480
481         tcf_exts_init(&e, TCA_FLOWER_ACT, 0);
482         err = tcf_exts_validate(net, tp, tb, est, &e, ovr);
483         if (err < 0)
484                 return err;
485
486         if (tb[TCA_FLOWER_CLASSID]) {
487                 f->res.classid = nla_get_u32(tb[TCA_FLOWER_CLASSID]);
488                 tcf_bind_filter(tp, &f->res, base);
489         }
490
491         err = fl_set_key(net, tb, &f->key, &mask->key);
492         if (err)
493                 goto errout;
494
495         fl_mask_update_range(mask);
496         fl_set_masked_key(&f->mkey, &f->key, mask);
497
498         tcf_exts_change(tp, &f->exts, &e);
499
500         return 0;
501 errout:
502         tcf_exts_destroy(&e);
503         return err;
504 }
505
506 static u32 fl_grab_new_handle(struct tcf_proto *tp,
507                               struct cls_fl_head *head)
508 {
509         unsigned int i = 0x80000000;
510         u32 handle;
511
512         do {
513                 if (++head->hgen == 0x7FFFFFFF)
514                         head->hgen = 1;
515         } while (--i > 0 && fl_get(tp, head->hgen));
516
517         if (unlikely(i == 0)) {
518                 pr_err("Insufficient number of handles\n");
519                 handle = 0;
520         } else {
521                 handle = head->hgen;
522         }
523
524         return handle;
525 }
526
527 static int fl_change(struct net *net, struct sk_buff *in_skb,
528                      struct tcf_proto *tp, unsigned long base,
529                      u32 handle, struct nlattr **tca,
530                      unsigned long *arg, bool ovr)
531 {
532         struct cls_fl_head *head = rtnl_dereference(tp->root);
533         struct cls_fl_filter *fold = (struct cls_fl_filter *) *arg;
534         struct cls_fl_filter *fnew;
535         struct nlattr *tb[TCA_FLOWER_MAX + 1];
536         struct fl_flow_mask mask = {};
537         int err;
538
539         if (!tca[TCA_OPTIONS])
540                 return -EINVAL;
541
542         err = nla_parse_nested(tb, TCA_FLOWER_MAX, tca[TCA_OPTIONS], fl_policy);
543         if (err < 0)
544                 return err;
545
546         if (fold && handle && fold->handle != handle)
547                 return -EINVAL;
548
549         fnew = kzalloc(sizeof(*fnew), GFP_KERNEL);
550         if (!fnew)
551                 return -ENOBUFS;
552
553         tcf_exts_init(&fnew->exts, TCA_FLOWER_ACT, 0);
554
555         if (!handle) {
556                 handle = fl_grab_new_handle(tp, head);
557                 if (!handle) {
558                         err = -EINVAL;
559                         goto errout;
560                 }
561         }
562         fnew->handle = handle;
563
564         if (tb[TCA_FLOWER_FLAGS]) {
565                 fnew->flags = nla_get_u32(tb[TCA_FLOWER_FLAGS]);
566
567                 if (!tc_flags_valid(fnew->flags)) {
568                         err = -EINVAL;
569                         goto errout;
570                 }
571         }
572
573         err = fl_set_parms(net, tp, fnew, &mask, base, tb, tca[TCA_RATE], ovr);
574         if (err)
575                 goto errout;
576
577         err = fl_check_assign_mask(head, &mask);
578         if (err)
579                 goto errout;
580
581         if (!tc_skip_sw(fnew->flags)) {
582                 err = rhashtable_insert_fast(&head->ht, &fnew->ht_node,
583                                              head->ht_params);
584                 if (err)
585                         goto errout;
586         }
587
588         err = fl_hw_replace_filter(tp,
589                                    &head->dissector,
590                                    &mask.key,
591                                    &fnew->key,
592                                    &fnew->exts,
593                                    (unsigned long)fnew,
594                                    fnew->flags);
595         if (err)
596                 goto errout;
597
598         if (fold) {
599                 rhashtable_remove_fast(&head->ht, &fold->ht_node,
600                                        head->ht_params);
601                 fl_hw_destroy_filter(tp, (unsigned long)fold);
602         }
603
604         *arg = (unsigned long) fnew;
605
606         if (fold) {
607                 list_replace_rcu(&fold->list, &fnew->list);
608                 tcf_unbind_filter(tp, &fold->res);
609                 call_rcu(&fold->rcu, fl_destroy_filter);
610         } else {
611                 list_add_tail_rcu(&fnew->list, &head->filters);
612         }
613
614         return 0;
615
616 errout:
617         kfree(fnew);
618         return err;
619 }
620
621 static int fl_delete(struct tcf_proto *tp, unsigned long arg)
622 {
623         struct cls_fl_head *head = rtnl_dereference(tp->root);
624         struct cls_fl_filter *f = (struct cls_fl_filter *) arg;
625
626         rhashtable_remove_fast(&head->ht, &f->ht_node,
627                                head->ht_params);
628         list_del_rcu(&f->list);
629         fl_hw_destroy_filter(tp, (unsigned long)f);
630         tcf_unbind_filter(tp, &f->res);
631         call_rcu(&f->rcu, fl_destroy_filter);
632         return 0;
633 }
634
635 static void fl_walk(struct tcf_proto *tp, struct tcf_walker *arg)
636 {
637         struct cls_fl_head *head = rtnl_dereference(tp->root);
638         struct cls_fl_filter *f;
639
640         list_for_each_entry_rcu(f, &head->filters, list) {
641                 if (arg->count < arg->skip)
642                         goto skip;
643                 if (arg->fn(tp, (unsigned long) f, arg) < 0) {
644                         arg->stop = 1;
645                         break;
646                 }
647 skip:
648                 arg->count++;
649         }
650 }
651
652 static int fl_dump_key_val(struct sk_buff *skb,
653                            void *val, int val_type,
654                            void *mask, int mask_type, int len)
655 {
656         int err;
657
658         if (!memchr_inv(mask, 0, len))
659                 return 0;
660         err = nla_put(skb, val_type, len, val);
661         if (err)
662                 return err;
663         if (mask_type != TCA_FLOWER_UNSPEC) {
664                 err = nla_put(skb, mask_type, len, mask);
665                 if (err)
666                         return err;
667         }
668         return 0;
669 }
670
671 static int fl_dump(struct net *net, struct tcf_proto *tp, unsigned long fh,
672                    struct sk_buff *skb, struct tcmsg *t)
673 {
674         struct cls_fl_head *head = rtnl_dereference(tp->root);
675         struct cls_fl_filter *f = (struct cls_fl_filter *) fh;
676         struct nlattr *nest;
677         struct fl_flow_key *key, *mask;
678
679         if (!f)
680                 return skb->len;
681
682         t->tcm_handle = f->handle;
683
684         nest = nla_nest_start(skb, TCA_OPTIONS);
685         if (!nest)
686                 goto nla_put_failure;
687
688         if (f->res.classid &&
689             nla_put_u32(skb, TCA_FLOWER_CLASSID, f->res.classid))
690                 goto nla_put_failure;
691
692         key = &f->key;
693         mask = &head->mask.key;
694
695         if (mask->indev_ifindex) {
696                 struct net_device *dev;
697
698                 dev = __dev_get_by_index(net, key->indev_ifindex);
699                 if (dev && nla_put_string(skb, TCA_FLOWER_INDEV, dev->name))
700                         goto nla_put_failure;
701         }
702
703         fl_hw_update_stats(tp, f);
704
705         if (fl_dump_key_val(skb, key->eth.dst, TCA_FLOWER_KEY_ETH_DST,
706                             mask->eth.dst, TCA_FLOWER_KEY_ETH_DST_MASK,
707                             sizeof(key->eth.dst)) ||
708             fl_dump_key_val(skb, key->eth.src, TCA_FLOWER_KEY_ETH_SRC,
709                             mask->eth.src, TCA_FLOWER_KEY_ETH_SRC_MASK,
710                             sizeof(key->eth.src)) ||
711             fl_dump_key_val(skb, &key->basic.n_proto, TCA_FLOWER_KEY_ETH_TYPE,
712                             &mask->basic.n_proto, TCA_FLOWER_UNSPEC,
713                             sizeof(key->basic.n_proto)))
714                 goto nla_put_failure;
715         if ((key->basic.n_proto == htons(ETH_P_IP) ||
716              key->basic.n_proto == htons(ETH_P_IPV6)) &&
717             fl_dump_key_val(skb, &key->basic.ip_proto, TCA_FLOWER_KEY_IP_PROTO,
718                             &mask->basic.ip_proto, TCA_FLOWER_UNSPEC,
719                             sizeof(key->basic.ip_proto)))
720                 goto nla_put_failure;
721
722         if (key->control.addr_type == FLOW_DISSECTOR_KEY_IPV4_ADDRS &&
723             (fl_dump_key_val(skb, &key->ipv4.src, TCA_FLOWER_KEY_IPV4_SRC,
724                              &mask->ipv4.src, TCA_FLOWER_KEY_IPV4_SRC_MASK,
725                              sizeof(key->ipv4.src)) ||
726              fl_dump_key_val(skb, &key->ipv4.dst, TCA_FLOWER_KEY_IPV4_DST,
727                              &mask->ipv4.dst, TCA_FLOWER_KEY_IPV4_DST_MASK,
728                              sizeof(key->ipv4.dst))))
729                 goto nla_put_failure;
730         else if (key->control.addr_type == FLOW_DISSECTOR_KEY_IPV6_ADDRS &&
731                  (fl_dump_key_val(skb, &key->ipv6.src, TCA_FLOWER_KEY_IPV6_SRC,
732                                   &mask->ipv6.src, TCA_FLOWER_KEY_IPV6_SRC_MASK,
733                                   sizeof(key->ipv6.src)) ||
734                   fl_dump_key_val(skb, &key->ipv6.dst, TCA_FLOWER_KEY_IPV6_DST,
735                                   &mask->ipv6.dst, TCA_FLOWER_KEY_IPV6_DST_MASK,
736                                   sizeof(key->ipv6.dst))))
737                 goto nla_put_failure;
738
739         if (key->basic.ip_proto == IPPROTO_TCP &&
740             (fl_dump_key_val(skb, &key->tp.src, TCA_FLOWER_KEY_TCP_SRC,
741                              &mask->tp.src, TCA_FLOWER_UNSPEC,
742                              sizeof(key->tp.src)) ||
743              fl_dump_key_val(skb, &key->tp.dst, TCA_FLOWER_KEY_TCP_DST,
744                              &mask->tp.dst, TCA_FLOWER_UNSPEC,
745                              sizeof(key->tp.dst))))
746                 goto nla_put_failure;
747         else if (key->basic.ip_proto == IPPROTO_UDP &&
748                  (fl_dump_key_val(skb, &key->tp.src, TCA_FLOWER_KEY_UDP_SRC,
749                                   &mask->tp.src, TCA_FLOWER_UNSPEC,
750                                   sizeof(key->tp.src)) ||
751                   fl_dump_key_val(skb, &key->tp.dst, TCA_FLOWER_KEY_UDP_DST,
752                                   &mask->tp.dst, TCA_FLOWER_UNSPEC,
753                                   sizeof(key->tp.dst))))
754                 goto nla_put_failure;
755
756         nla_put_u32(skb, TCA_FLOWER_FLAGS, f->flags);
757
758         if (tcf_exts_dump(skb, &f->exts))
759                 goto nla_put_failure;
760
761         nla_nest_end(skb, nest);
762
763         if (tcf_exts_dump_stats(skb, &f->exts) < 0)
764                 goto nla_put_failure;
765
766         return skb->len;
767
768 nla_put_failure:
769         nla_nest_cancel(skb, nest);
770         return -1;
771 }
772
773 static struct tcf_proto_ops cls_fl_ops __read_mostly = {
774         .kind           = "flower",
775         .classify       = fl_classify,
776         .init           = fl_init,
777         .destroy        = fl_destroy,
778         .get            = fl_get,
779         .change         = fl_change,
780         .delete         = fl_delete,
781         .walk           = fl_walk,
782         .dump           = fl_dump,
783         .owner          = THIS_MODULE,
784 };
785
786 static int __init cls_fl_init(void)
787 {
788         return register_tcf_proto_ops(&cls_fl_ops);
789 }
790
791 static void __exit cls_fl_exit(void)
792 {
793         unregister_tcf_proto_ops(&cls_fl_ops);
794 }
795
796 module_init(cls_fl_init);
797 module_exit(cls_fl_exit);
798
799 MODULE_AUTHOR("Jiri Pirko <jiri@resnulli.us>");
800 MODULE_DESCRIPTION("Flower classifier");
801 MODULE_LICENSE("GPL v2");