Merge remote-tracking branch 'net-next/master'
[deliverable/linux.git] / net / sched / cls_flower.c
CommitLineData
77b9900e
JP
1/*
2 * net/sched/cls_flower.c Flower classifier
3 *
4 * Copyright (c) 2015 Jiri Pirko <jiri@resnulli.us>
5 *
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License as published by
8 * the Free Software Foundation; either version 2 of the License, or
9 * (at your option) any later version.
10 */
11
12#include <linux/kernel.h>
13#include <linux/init.h>
14#include <linux/module.h>
15#include <linux/rhashtable.h>
16
17#include <linux/if_ether.h>
18#include <linux/in6.h>
19#include <linux/ip.h>
20
21#include <net/sch_generic.h>
22#include <net/pkt_cls.h>
23#include <net/ip.h>
24#include <net/flow_dissector.h>
25
bc3103f1
AV
26#include <net/dst.h>
27#include <net/dst_metadata.h>
28
77b9900e
JP
29struct fl_flow_key {
30 int indev_ifindex;
42aecaa9 31 struct flow_dissector_key_control control;
bc3103f1 32 struct flow_dissector_key_control enc_control;
77b9900e
JP
33 struct flow_dissector_key_basic basic;
34 struct flow_dissector_key_eth_addrs eth;
9399ae9a 35 struct flow_dissector_key_vlan vlan;
c3f83241 36 struct flow_dissector_key_addrs ipaddrs;
77b9900e 37 union {
c3f83241 38 struct flow_dissector_key_ipv4_addrs ipv4;
77b9900e
JP
39 struct flow_dissector_key_ipv6_addrs ipv6;
40 };
41 struct flow_dissector_key_ports tp;
bc3103f1
AV
42 struct flow_dissector_key_keyid enc_key_id;
43 union {
44 struct flow_dissector_key_ipv4_addrs enc_ipv4;
45 struct flow_dissector_key_ipv6_addrs enc_ipv6;
46 };
77b9900e
JP
47} __aligned(BITS_PER_LONG / 8); /* Ensure that we can do comparisons as longs. */
48
49struct fl_flow_mask_range {
50 unsigned short int start;
51 unsigned short int end;
52};
53
54struct fl_flow_mask {
55 struct fl_flow_key key;
56 struct fl_flow_mask_range range;
57 struct rcu_head rcu;
58};
59
60struct cls_fl_head {
61 struct rhashtable ht;
62 struct fl_flow_mask mask;
63 struct flow_dissector dissector;
64 u32 hgen;
65 bool mask_assigned;
66 struct list_head filters;
67 struct rhashtable_params ht_params;
68 struct rcu_head rcu;
69};
70
71struct cls_fl_filter {
72 struct rhash_head ht_node;
73 struct fl_flow_key mkey;
74 struct tcf_exts exts;
75 struct tcf_result res;
76 struct fl_flow_key key;
77 struct list_head list;
78 u32 handle;
e69985c6 79 u32 flags;
77b9900e
JP
80 struct rcu_head rcu;
81};
82
83static unsigned short int fl_mask_range(const struct fl_flow_mask *mask)
84{
85 return mask->range.end - mask->range.start;
86}
87
88static void fl_mask_update_range(struct fl_flow_mask *mask)
89{
90 const u8 *bytes = (const u8 *) &mask->key;
91 size_t size = sizeof(mask->key);
92 size_t i, first = 0, last = size - 1;
93
94 for (i = 0; i < sizeof(mask->key); i++) {
95 if (bytes[i]) {
96 if (!first && i)
97 first = i;
98 last = i;
99 }
100 }
101 mask->range.start = rounddown(first, sizeof(long));
102 mask->range.end = roundup(last + 1, sizeof(long));
103}
104
105static void *fl_key_get_start(struct fl_flow_key *key,
106 const struct fl_flow_mask *mask)
107{
108 return (u8 *) key + mask->range.start;
109}
110
111static void fl_set_masked_key(struct fl_flow_key *mkey, struct fl_flow_key *key,
112 struct fl_flow_mask *mask)
113{
114 const long *lkey = fl_key_get_start(key, mask);
115 const long *lmask = fl_key_get_start(&mask->key, mask);
116 long *lmkey = fl_key_get_start(mkey, mask);
117 int i;
118
119 for (i = 0; i < fl_mask_range(mask); i += sizeof(long))
120 *lmkey++ = *lkey++ & *lmask++;
121}
122
123static void fl_clear_masked_range(struct fl_flow_key *key,
124 struct fl_flow_mask *mask)
125{
126 memset(fl_key_get_start(key, mask), 0, fl_mask_range(mask));
127}
128
129static int fl_classify(struct sk_buff *skb, const struct tcf_proto *tp,
130 struct tcf_result *res)
131{
132 struct cls_fl_head *head = rcu_dereference_bh(tp->root);
133 struct cls_fl_filter *f;
134 struct fl_flow_key skb_key;
135 struct fl_flow_key skb_mkey;
bc3103f1 136 struct ip_tunnel_info *info;
77b9900e 137
e69985c6
AV
138 if (!atomic_read(&head->ht.nelems))
139 return -1;
140
77b9900e 141 fl_clear_masked_range(&skb_key, &head->mask);
bc3103f1
AV
142
143 info = skb_tunnel_info(skb);
144 if (info) {
145 struct ip_tunnel_key *key = &info->key;
146
147 switch (ip_tunnel_info_af(info)) {
148 case AF_INET:
149 skb_key.enc_ipv4.src = key->u.ipv4.src;
150 skb_key.enc_ipv4.dst = key->u.ipv4.dst;
151 break;
152 case AF_INET6:
153 skb_key.enc_ipv6.src = key->u.ipv6.src;
154 skb_key.enc_ipv6.dst = key->u.ipv6.dst;
155 break;
156 }
157
158 skb_key.enc_key_id.keyid = tunnel_id_to_key32(key->tun_id);
159 }
160
77b9900e
JP
161 skb_key.indev_ifindex = skb->skb_iif;
162 /* skb_flow_dissect() does not set n_proto in case an unknown protocol,
163 * so do it rather here.
164 */
165 skb_key.basic.n_proto = skb->protocol;
cd79a238 166 skb_flow_dissect(skb, &head->dissector, &skb_key, 0);
77b9900e
JP
167
168 fl_set_masked_key(&skb_mkey, &skb_key, &head->mask);
169
170 f = rhashtable_lookup_fast(&head->ht,
171 fl_key_get_start(&skb_mkey, &head->mask),
172 head->ht_params);
e8eb36cd 173 if (f && !tc_skip_sw(f->flags)) {
77b9900e
JP
174 *res = f->res;
175 return tcf_exts_exec(skb, &f->exts, res);
176 }
177 return -1;
178}
179
180static int fl_init(struct tcf_proto *tp)
181{
182 struct cls_fl_head *head;
183
184 head = kzalloc(sizeof(*head), GFP_KERNEL);
185 if (!head)
186 return -ENOBUFS;
187
188 INIT_LIST_HEAD_RCU(&head->filters);
189 rcu_assign_pointer(tp->root, head);
190
191 return 0;
192}
193
194static void fl_destroy_filter(struct rcu_head *head)
195{
196 struct cls_fl_filter *f = container_of(head, struct cls_fl_filter, rcu);
197
198 tcf_exts_destroy(&f->exts);
199 kfree(f);
200}
201
8208d21b 202static void fl_hw_destroy_filter(struct tcf_proto *tp, unsigned long cookie)
5b33f488
AV
203{
204 struct net_device *dev = tp->q->dev_queue->dev;
205 struct tc_cls_flower_offload offload = {0};
206 struct tc_to_netdev tc;
207
92c075db 208 if (!tc_should_offload(dev, tp, 0))
5b33f488
AV
209 return;
210
211 offload.command = TC_CLSFLOWER_DESTROY;
212 offload.cookie = cookie;
213
214 tc.type = TC_SETUP_CLSFLOWER;
215 tc.cls_flower = &offload;
216
217 dev->netdev_ops->ndo_setup_tc(dev, tp->q->handle, tp->protocol, &tc);
218}
219
e8eb36cd
AV
220static int fl_hw_replace_filter(struct tcf_proto *tp,
221 struct flow_dissector *dissector,
222 struct fl_flow_key *mask,
223 struct fl_flow_key *key,
224 struct tcf_exts *actions,
225 unsigned long cookie, u32 flags)
5b33f488
AV
226{
227 struct net_device *dev = tp->q->dev_queue->dev;
228 struct tc_cls_flower_offload offload = {0};
229 struct tc_to_netdev tc;
e8eb36cd 230 int err;
5b33f488 231
92c075db 232 if (!tc_should_offload(dev, tp, flags))
e8eb36cd 233 return tc_skip_sw(flags) ? -EINVAL : 0;
5b33f488
AV
234
235 offload.command = TC_CLSFLOWER_REPLACE;
236 offload.cookie = cookie;
237 offload.dissector = dissector;
238 offload.mask = mask;
239 offload.key = key;
240 offload.exts = actions;
241
242 tc.type = TC_SETUP_CLSFLOWER;
243 tc.cls_flower = &offload;
244
e8eb36cd
AV
245 err = dev->netdev_ops->ndo_setup_tc(dev, tp->q->handle, tp->protocol, &tc);
246
247 if (tc_skip_sw(flags))
248 return err;
249
250 return 0;
5b33f488
AV
251}
252
10cbc684
AV
253static void fl_hw_update_stats(struct tcf_proto *tp, struct cls_fl_filter *f)
254{
255 struct net_device *dev = tp->q->dev_queue->dev;
256 struct tc_cls_flower_offload offload = {0};
257 struct tc_to_netdev tc;
258
92c075db 259 if (!tc_should_offload(dev, tp, 0))
10cbc684
AV
260 return;
261
262 offload.command = TC_CLSFLOWER_STATS;
263 offload.cookie = (unsigned long)f;
264 offload.exts = &f->exts;
265
266 tc.type = TC_SETUP_CLSFLOWER;
267 tc.cls_flower = &offload;
268
269 dev->netdev_ops->ndo_setup_tc(dev, tp->q->handle, tp->protocol, &tc);
270}
271
77b9900e
JP
272static bool fl_destroy(struct tcf_proto *tp, bool force)
273{
274 struct cls_fl_head *head = rtnl_dereference(tp->root);
275 struct cls_fl_filter *f, *next;
276
277 if (!force && !list_empty(&head->filters))
278 return false;
279
280 list_for_each_entry_safe(f, next, &head->filters, list) {
8208d21b 281 fl_hw_destroy_filter(tp, (unsigned long)f);
77b9900e
JP
282 list_del_rcu(&f->list);
283 call_rcu(&f->rcu, fl_destroy_filter);
284 }
285 RCU_INIT_POINTER(tp->root, NULL);
286 if (head->mask_assigned)
287 rhashtable_destroy(&head->ht);
288 kfree_rcu(head, rcu);
289 return true;
290}
291
292static unsigned long fl_get(struct tcf_proto *tp, u32 handle)
293{
294 struct cls_fl_head *head = rtnl_dereference(tp->root);
295 struct cls_fl_filter *f;
296
297 list_for_each_entry(f, &head->filters, list)
298 if (f->handle == handle)
299 return (unsigned long) f;
300 return 0;
301}
302
303static const struct nla_policy fl_policy[TCA_FLOWER_MAX + 1] = {
304 [TCA_FLOWER_UNSPEC] = { .type = NLA_UNSPEC },
305 [TCA_FLOWER_CLASSID] = { .type = NLA_U32 },
306 [TCA_FLOWER_INDEV] = { .type = NLA_STRING,
307 .len = IFNAMSIZ },
308 [TCA_FLOWER_KEY_ETH_DST] = { .len = ETH_ALEN },
309 [TCA_FLOWER_KEY_ETH_DST_MASK] = { .len = ETH_ALEN },
310 [TCA_FLOWER_KEY_ETH_SRC] = { .len = ETH_ALEN },
311 [TCA_FLOWER_KEY_ETH_SRC_MASK] = { .len = ETH_ALEN },
312 [TCA_FLOWER_KEY_ETH_TYPE] = { .type = NLA_U16 },
313 [TCA_FLOWER_KEY_IP_PROTO] = { .type = NLA_U8 },
314 [TCA_FLOWER_KEY_IPV4_SRC] = { .type = NLA_U32 },
315 [TCA_FLOWER_KEY_IPV4_SRC_MASK] = { .type = NLA_U32 },
316 [TCA_FLOWER_KEY_IPV4_DST] = { .type = NLA_U32 },
317 [TCA_FLOWER_KEY_IPV4_DST_MASK] = { .type = NLA_U32 },
318 [TCA_FLOWER_KEY_IPV6_SRC] = { .len = sizeof(struct in6_addr) },
319 [TCA_FLOWER_KEY_IPV6_SRC_MASK] = { .len = sizeof(struct in6_addr) },
320 [TCA_FLOWER_KEY_IPV6_DST] = { .len = sizeof(struct in6_addr) },
321 [TCA_FLOWER_KEY_IPV6_DST_MASK] = { .len = sizeof(struct in6_addr) },
322 [TCA_FLOWER_KEY_TCP_SRC] = { .type = NLA_U16 },
323 [TCA_FLOWER_KEY_TCP_DST] = { .type = NLA_U16 },
b175c3a4
JHS
324 [TCA_FLOWER_KEY_UDP_SRC] = { .type = NLA_U16 },
325 [TCA_FLOWER_KEY_UDP_DST] = { .type = NLA_U16 },
9399ae9a
HHZ
326 [TCA_FLOWER_KEY_VLAN_ID] = { .type = NLA_U16 },
327 [TCA_FLOWER_KEY_VLAN_PRIO] = { .type = NLA_U8 },
328 [TCA_FLOWER_KEY_VLAN_ETH_TYPE] = { .type = NLA_U16 },
bc3103f1
AV
329 [TCA_FLOWER_KEY_ENC_KEY_ID] = { .type = NLA_U32 },
330 [TCA_FLOWER_KEY_ENC_IPV4_SRC] = { .type = NLA_U32 },
331 [TCA_FLOWER_KEY_ENC_IPV4_SRC_MASK] = { .type = NLA_U32 },
332 [TCA_FLOWER_KEY_ENC_IPV4_DST] = { .type = NLA_U32 },
333 [TCA_FLOWER_KEY_ENC_IPV4_DST_MASK] = { .type = NLA_U32 },
334 [TCA_FLOWER_KEY_ENC_IPV6_SRC] = { .len = sizeof(struct in6_addr) },
335 [TCA_FLOWER_KEY_ENC_IPV6_SRC_MASK] = { .len = sizeof(struct in6_addr) },
336 [TCA_FLOWER_KEY_ENC_IPV6_DST] = { .len = sizeof(struct in6_addr) },
337 [TCA_FLOWER_KEY_ENC_IPV6_DST_MASK] = { .len = sizeof(struct in6_addr) },
77b9900e
JP
338};
339
340static void fl_set_key_val(struct nlattr **tb,
341 void *val, int val_type,
342 void *mask, int mask_type, int len)
343{
344 if (!tb[val_type])
345 return;
346 memcpy(val, nla_data(tb[val_type]), len);
347 if (mask_type == TCA_FLOWER_UNSPEC || !tb[mask_type])
348 memset(mask, 0xff, len);
349 else
350 memcpy(mask, nla_data(tb[mask_type]), len);
351}
352
9399ae9a
HHZ
353static void fl_set_key_vlan(struct nlattr **tb,
354 struct flow_dissector_key_vlan *key_val,
355 struct flow_dissector_key_vlan *key_mask)
356{
357#define VLAN_PRIORITY_MASK 0x7
358
359 if (tb[TCA_FLOWER_KEY_VLAN_ID]) {
360 key_val->vlan_id =
361 nla_get_u16(tb[TCA_FLOWER_KEY_VLAN_ID]) & VLAN_VID_MASK;
362 key_mask->vlan_id = VLAN_VID_MASK;
363 }
364 if (tb[TCA_FLOWER_KEY_VLAN_PRIO]) {
365 key_val->vlan_priority =
366 nla_get_u8(tb[TCA_FLOWER_KEY_VLAN_PRIO]) &
367 VLAN_PRIORITY_MASK;
368 key_mask->vlan_priority = VLAN_PRIORITY_MASK;
369 }
370}
371
77b9900e
JP
372static int fl_set_key(struct net *net, struct nlattr **tb,
373 struct fl_flow_key *key, struct fl_flow_key *mask)
374{
9399ae9a 375 __be16 ethertype;
dd3aa3b5 376#ifdef CONFIG_NET_CLS_IND
77b9900e 377 if (tb[TCA_FLOWER_INDEV]) {
dd3aa3b5 378 int err = tcf_change_indev(net, tb[TCA_FLOWER_INDEV]);
77b9900e
JP
379 if (err < 0)
380 return err;
381 key->indev_ifindex = err;
382 mask->indev_ifindex = 0xffffffff;
383 }
dd3aa3b5 384#endif
77b9900e
JP
385
386 fl_set_key_val(tb, key->eth.dst, TCA_FLOWER_KEY_ETH_DST,
387 mask->eth.dst, TCA_FLOWER_KEY_ETH_DST_MASK,
388 sizeof(key->eth.dst));
389 fl_set_key_val(tb, key->eth.src, TCA_FLOWER_KEY_ETH_SRC,
390 mask->eth.src, TCA_FLOWER_KEY_ETH_SRC_MASK,
391 sizeof(key->eth.src));
66530bdf 392
0b498a52 393 if (tb[TCA_FLOWER_KEY_ETH_TYPE]) {
9399ae9a
HHZ
394 ethertype = nla_get_be16(tb[TCA_FLOWER_KEY_ETH_TYPE]);
395
0b498a52
AB
396 if (ethertype == htons(ETH_P_8021Q)) {
397 fl_set_key_vlan(tb, &key->vlan, &mask->vlan);
398 fl_set_key_val(tb, &key->basic.n_proto,
399 TCA_FLOWER_KEY_VLAN_ETH_TYPE,
400 &mask->basic.n_proto, TCA_FLOWER_UNSPEC,
401 sizeof(key->basic.n_proto));
402 } else {
403 key->basic.n_proto = ethertype;
404 mask->basic.n_proto = cpu_to_be16(~0);
405 }
9399ae9a 406 }
66530bdf 407
77b9900e
JP
408 if (key->basic.n_proto == htons(ETH_P_IP) ||
409 key->basic.n_proto == htons(ETH_P_IPV6)) {
410 fl_set_key_val(tb, &key->basic.ip_proto, TCA_FLOWER_KEY_IP_PROTO,
411 &mask->basic.ip_proto, TCA_FLOWER_UNSPEC,
412 sizeof(key->basic.ip_proto));
413 }
66530bdf
JHS
414
415 if (tb[TCA_FLOWER_KEY_IPV4_SRC] || tb[TCA_FLOWER_KEY_IPV4_DST]) {
416 key->control.addr_type = FLOW_DISSECTOR_KEY_IPV4_ADDRS;
77b9900e
JP
417 fl_set_key_val(tb, &key->ipv4.src, TCA_FLOWER_KEY_IPV4_SRC,
418 &mask->ipv4.src, TCA_FLOWER_KEY_IPV4_SRC_MASK,
419 sizeof(key->ipv4.src));
420 fl_set_key_val(tb, &key->ipv4.dst, TCA_FLOWER_KEY_IPV4_DST,
421 &mask->ipv4.dst, TCA_FLOWER_KEY_IPV4_DST_MASK,
422 sizeof(key->ipv4.dst));
66530bdf
JHS
423 } else if (tb[TCA_FLOWER_KEY_IPV6_SRC] || tb[TCA_FLOWER_KEY_IPV6_DST]) {
424 key->control.addr_type = FLOW_DISSECTOR_KEY_IPV6_ADDRS;
77b9900e
JP
425 fl_set_key_val(tb, &key->ipv6.src, TCA_FLOWER_KEY_IPV6_SRC,
426 &mask->ipv6.src, TCA_FLOWER_KEY_IPV6_SRC_MASK,
427 sizeof(key->ipv6.src));
428 fl_set_key_val(tb, &key->ipv6.dst, TCA_FLOWER_KEY_IPV6_DST,
429 &mask->ipv6.dst, TCA_FLOWER_KEY_IPV6_DST_MASK,
430 sizeof(key->ipv6.dst));
431 }
66530bdf 432
77b9900e
JP
433 if (key->basic.ip_proto == IPPROTO_TCP) {
434 fl_set_key_val(tb, &key->tp.src, TCA_FLOWER_KEY_TCP_SRC,
435 &mask->tp.src, TCA_FLOWER_UNSPEC,
436 sizeof(key->tp.src));
437 fl_set_key_val(tb, &key->tp.dst, TCA_FLOWER_KEY_TCP_DST,
438 &mask->tp.dst, TCA_FLOWER_UNSPEC,
439 sizeof(key->tp.dst));
440 } else if (key->basic.ip_proto == IPPROTO_UDP) {
441 fl_set_key_val(tb, &key->tp.src, TCA_FLOWER_KEY_UDP_SRC,
442 &mask->tp.src, TCA_FLOWER_UNSPEC,
443 sizeof(key->tp.src));
444 fl_set_key_val(tb, &key->tp.dst, TCA_FLOWER_KEY_UDP_DST,
445 &mask->tp.dst, TCA_FLOWER_UNSPEC,
446 sizeof(key->tp.dst));
447 }
448
bc3103f1
AV
449 if (tb[TCA_FLOWER_KEY_ENC_IPV4_SRC] ||
450 tb[TCA_FLOWER_KEY_ENC_IPV4_DST]) {
451 key->enc_control.addr_type = FLOW_DISSECTOR_KEY_IPV4_ADDRS;
452 fl_set_key_val(tb, &key->enc_ipv4.src,
453 TCA_FLOWER_KEY_ENC_IPV4_SRC,
454 &mask->enc_ipv4.src,
455 TCA_FLOWER_KEY_ENC_IPV4_SRC_MASK,
456 sizeof(key->enc_ipv4.src));
457 fl_set_key_val(tb, &key->enc_ipv4.dst,
458 TCA_FLOWER_KEY_ENC_IPV4_DST,
459 &mask->enc_ipv4.dst,
460 TCA_FLOWER_KEY_ENC_IPV4_DST_MASK,
461 sizeof(key->enc_ipv4.dst));
462 }
463
464 if (tb[TCA_FLOWER_KEY_ENC_IPV6_SRC] ||
465 tb[TCA_FLOWER_KEY_ENC_IPV6_DST]) {
466 key->enc_control.addr_type = FLOW_DISSECTOR_KEY_IPV6_ADDRS;
467 fl_set_key_val(tb, &key->enc_ipv6.src,
468 TCA_FLOWER_KEY_ENC_IPV6_SRC,
469 &mask->enc_ipv6.src,
470 TCA_FLOWER_KEY_ENC_IPV6_SRC_MASK,
471 sizeof(key->enc_ipv6.src));
472 fl_set_key_val(tb, &key->enc_ipv6.dst,
473 TCA_FLOWER_KEY_ENC_IPV6_DST,
474 &mask->enc_ipv6.dst,
475 TCA_FLOWER_KEY_ENC_IPV6_DST_MASK,
476 sizeof(key->enc_ipv6.dst));
477 }
478
479 fl_set_key_val(tb, &key->enc_key_id.keyid, TCA_FLOWER_KEY_ENC_KEY_ID,
480 &mask->enc_key_id.keyid, TCA_FLOWER_KEY_ENC_KEY_ID,
481 sizeof(key->enc_key_id.keyid));
482
77b9900e
JP
483 return 0;
484}
485
486static bool fl_mask_eq(struct fl_flow_mask *mask1,
487 struct fl_flow_mask *mask2)
488{
489 const long *lmask1 = fl_key_get_start(&mask1->key, mask1);
490 const long *lmask2 = fl_key_get_start(&mask2->key, mask2);
491
492 return !memcmp(&mask1->range, &mask2->range, sizeof(mask1->range)) &&
493 !memcmp(lmask1, lmask2, fl_mask_range(mask1));
494}
495
496static const struct rhashtable_params fl_ht_params = {
497 .key_offset = offsetof(struct cls_fl_filter, mkey), /* base offset */
498 .head_offset = offsetof(struct cls_fl_filter, ht_node),
499 .automatic_shrinking = true,
500};
501
502static int fl_init_hashtable(struct cls_fl_head *head,
503 struct fl_flow_mask *mask)
504{
505 head->ht_params = fl_ht_params;
506 head->ht_params.key_len = fl_mask_range(mask);
507 head->ht_params.key_offset += mask->range.start;
508
509 return rhashtable_init(&head->ht, &head->ht_params);
510}
511
512#define FL_KEY_MEMBER_OFFSET(member) offsetof(struct fl_flow_key, member)
513#define FL_KEY_MEMBER_SIZE(member) (sizeof(((struct fl_flow_key *) 0)->member))
77b9900e 514
339ba878
HHZ
515#define FL_KEY_IS_MASKED(mask, member) \
516 memchr_inv(((char *)mask) + FL_KEY_MEMBER_OFFSET(member), \
517 0, FL_KEY_MEMBER_SIZE(member)) \
77b9900e
JP
518
519#define FL_KEY_SET(keys, cnt, id, member) \
520 do { \
521 keys[cnt].key_id = id; \
522 keys[cnt].offset = FL_KEY_MEMBER_OFFSET(member); \
523 cnt++; \
524 } while(0);
525
339ba878 526#define FL_KEY_SET_IF_MASKED(mask, keys, cnt, id, member) \
77b9900e 527 do { \
339ba878 528 if (FL_KEY_IS_MASKED(mask, member)) \
77b9900e
JP
529 FL_KEY_SET(keys, cnt, id, member); \
530 } while(0);
531
532static void fl_init_dissector(struct cls_fl_head *head,
533 struct fl_flow_mask *mask)
534{
535 struct flow_dissector_key keys[FLOW_DISSECTOR_KEY_MAX];
536 size_t cnt = 0;
537
42aecaa9 538 FL_KEY_SET(keys, cnt, FLOW_DISSECTOR_KEY_CONTROL, control);
77b9900e 539 FL_KEY_SET(keys, cnt, FLOW_DISSECTOR_KEY_BASIC, basic);
339ba878
HHZ
540 FL_KEY_SET_IF_MASKED(&mask->key, keys, cnt,
541 FLOW_DISSECTOR_KEY_ETH_ADDRS, eth);
542 FL_KEY_SET_IF_MASKED(&mask->key, keys, cnt,
543 FLOW_DISSECTOR_KEY_IPV4_ADDRS, ipv4);
544 FL_KEY_SET_IF_MASKED(&mask->key, keys, cnt,
545 FLOW_DISSECTOR_KEY_IPV6_ADDRS, ipv6);
546 FL_KEY_SET_IF_MASKED(&mask->key, keys, cnt,
547 FLOW_DISSECTOR_KEY_PORTS, tp);
9399ae9a
HHZ
548 FL_KEY_SET_IF_MASKED(&mask->key, keys, cnt,
549 FLOW_DISSECTOR_KEY_VLAN, vlan);
77b9900e
JP
550
551 skb_flow_dissector_init(&head->dissector, keys, cnt);
552}
553
554static int fl_check_assign_mask(struct cls_fl_head *head,
555 struct fl_flow_mask *mask)
556{
557 int err;
558
559 if (head->mask_assigned) {
560 if (!fl_mask_eq(&head->mask, mask))
561 return -EINVAL;
562 else
563 return 0;
564 }
565
566 /* Mask is not assigned yet. So assign it and init hashtable
567 * according to that.
568 */
569 err = fl_init_hashtable(head, mask);
570 if (err)
571 return err;
572 memcpy(&head->mask, mask, sizeof(head->mask));
573 head->mask_assigned = true;
574
575 fl_init_dissector(head, mask);
576
577 return 0;
578}
579
580static int fl_set_parms(struct net *net, struct tcf_proto *tp,
581 struct cls_fl_filter *f, struct fl_flow_mask *mask,
582 unsigned long base, struct nlattr **tb,
583 struct nlattr *est, bool ovr)
584{
585 struct tcf_exts e;
586 int err;
587
b9a24bb7 588 err = tcf_exts_init(&e, TCA_FLOWER_ACT, 0);
77b9900e
JP
589 if (err < 0)
590 return err;
b9a24bb7
WC
591 err = tcf_exts_validate(net, tp, tb, est, &e, ovr);
592 if (err < 0)
593 goto errout;
77b9900e
JP
594
595 if (tb[TCA_FLOWER_CLASSID]) {
596 f->res.classid = nla_get_u32(tb[TCA_FLOWER_CLASSID]);
597 tcf_bind_filter(tp, &f->res, base);
598 }
599
600 err = fl_set_key(net, tb, &f->key, &mask->key);
601 if (err)
602 goto errout;
603
604 fl_mask_update_range(mask);
605 fl_set_masked_key(&f->mkey, &f->key, mask);
606
607 tcf_exts_change(tp, &f->exts, &e);
608
609 return 0;
610errout:
611 tcf_exts_destroy(&e);
612 return err;
613}
614
615static u32 fl_grab_new_handle(struct tcf_proto *tp,
616 struct cls_fl_head *head)
617{
618 unsigned int i = 0x80000000;
619 u32 handle;
620
621 do {
622 if (++head->hgen == 0x7FFFFFFF)
623 head->hgen = 1;
624 } while (--i > 0 && fl_get(tp, head->hgen));
625
626 if (unlikely(i == 0)) {
627 pr_err("Insufficient number of handles\n");
628 handle = 0;
629 } else {
630 handle = head->hgen;
631 }
632
633 return handle;
634}
635
636static int fl_change(struct net *net, struct sk_buff *in_skb,
637 struct tcf_proto *tp, unsigned long base,
638 u32 handle, struct nlattr **tca,
639 unsigned long *arg, bool ovr)
640{
641 struct cls_fl_head *head = rtnl_dereference(tp->root);
642 struct cls_fl_filter *fold = (struct cls_fl_filter *) *arg;
643 struct cls_fl_filter *fnew;
644 struct nlattr *tb[TCA_FLOWER_MAX + 1];
645 struct fl_flow_mask mask = {};
646 int err;
647
648 if (!tca[TCA_OPTIONS])
649 return -EINVAL;
650
651 err = nla_parse_nested(tb, TCA_FLOWER_MAX, tca[TCA_OPTIONS], fl_policy);
652 if (err < 0)
653 return err;
654
655 if (fold && handle && fold->handle != handle)
656 return -EINVAL;
657
658 fnew = kzalloc(sizeof(*fnew), GFP_KERNEL);
659 if (!fnew)
660 return -ENOBUFS;
661
b9a24bb7
WC
662 err = tcf_exts_init(&fnew->exts, TCA_FLOWER_ACT, 0);
663 if (err < 0)
664 goto errout;
77b9900e
JP
665
666 if (!handle) {
667 handle = fl_grab_new_handle(tp, head);
668 if (!handle) {
669 err = -EINVAL;
670 goto errout;
671 }
672 }
673 fnew->handle = handle;
674
e69985c6
AV
675 if (tb[TCA_FLOWER_FLAGS]) {
676 fnew->flags = nla_get_u32(tb[TCA_FLOWER_FLAGS]);
677
678 if (!tc_flags_valid(fnew->flags)) {
679 err = -EINVAL;
680 goto errout;
681 }
682 }
5b33f488 683
77b9900e
JP
684 err = fl_set_parms(net, tp, fnew, &mask, base, tb, tca[TCA_RATE], ovr);
685 if (err)
686 goto errout;
687
688 err = fl_check_assign_mask(head, &mask);
689 if (err)
690 goto errout;
691
e8eb36cd 692 if (!tc_skip_sw(fnew->flags)) {
e69985c6
AV
693 err = rhashtable_insert_fast(&head->ht, &fnew->ht_node,
694 head->ht_params);
695 if (err)
696 goto errout;
697 }
5b33f488 698
e8eb36cd
AV
699 err = fl_hw_replace_filter(tp,
700 &head->dissector,
701 &mask.key,
702 &fnew->key,
703 &fnew->exts,
704 (unsigned long)fnew,
705 fnew->flags);
706 if (err)
707 goto errout;
5b33f488
AV
708
709 if (fold) {
77b9900e
JP
710 rhashtable_remove_fast(&head->ht, &fold->ht_node,
711 head->ht_params);
8208d21b 712 fl_hw_destroy_filter(tp, (unsigned long)fold);
5b33f488 713 }
77b9900e
JP
714
715 *arg = (unsigned long) fnew;
716
717 if (fold) {
ff3532f2 718 list_replace_rcu(&fold->list, &fnew->list);
77b9900e
JP
719 tcf_unbind_filter(tp, &fold->res);
720 call_rcu(&fold->rcu, fl_destroy_filter);
721 } else {
722 list_add_tail_rcu(&fnew->list, &head->filters);
723 }
724
725 return 0;
726
727errout:
b9a24bb7 728 tcf_exts_destroy(&fnew->exts);
77b9900e
JP
729 kfree(fnew);
730 return err;
731}
732
733static int fl_delete(struct tcf_proto *tp, unsigned long arg)
734{
735 struct cls_fl_head *head = rtnl_dereference(tp->root);
736 struct cls_fl_filter *f = (struct cls_fl_filter *) arg;
737
738 rhashtable_remove_fast(&head->ht, &f->ht_node,
739 head->ht_params);
740 list_del_rcu(&f->list);
8208d21b 741 fl_hw_destroy_filter(tp, (unsigned long)f);
77b9900e
JP
742 tcf_unbind_filter(tp, &f->res);
743 call_rcu(&f->rcu, fl_destroy_filter);
744 return 0;
745}
746
747static void fl_walk(struct tcf_proto *tp, struct tcf_walker *arg)
748{
749 struct cls_fl_head *head = rtnl_dereference(tp->root);
750 struct cls_fl_filter *f;
751
752 list_for_each_entry_rcu(f, &head->filters, list) {
753 if (arg->count < arg->skip)
754 goto skip;
755 if (arg->fn(tp, (unsigned long) f, arg) < 0) {
756 arg->stop = 1;
757 break;
758 }
759skip:
760 arg->count++;
761 }
762}
763
764static int fl_dump_key_val(struct sk_buff *skb,
765 void *val, int val_type,
766 void *mask, int mask_type, int len)
767{
768 int err;
769
770 if (!memchr_inv(mask, 0, len))
771 return 0;
772 err = nla_put(skb, val_type, len, val);
773 if (err)
774 return err;
775 if (mask_type != TCA_FLOWER_UNSPEC) {
776 err = nla_put(skb, mask_type, len, mask);
777 if (err)
778 return err;
779 }
780 return 0;
781}
782
9399ae9a
HHZ
783static int fl_dump_key_vlan(struct sk_buff *skb,
784 struct flow_dissector_key_vlan *vlan_key,
785 struct flow_dissector_key_vlan *vlan_mask)
786{
787 int err;
788
789 if (!memchr_inv(vlan_mask, 0, sizeof(*vlan_mask)))
790 return 0;
791 if (vlan_mask->vlan_id) {
792 err = nla_put_u16(skb, TCA_FLOWER_KEY_VLAN_ID,
793 vlan_key->vlan_id);
794 if (err)
795 return err;
796 }
797 if (vlan_mask->vlan_priority) {
798 err = nla_put_u8(skb, TCA_FLOWER_KEY_VLAN_PRIO,
799 vlan_key->vlan_priority);
800 if (err)
801 return err;
802 }
803 return 0;
804}
805
77b9900e
JP
806static int fl_dump(struct net *net, struct tcf_proto *tp, unsigned long fh,
807 struct sk_buff *skb, struct tcmsg *t)
808{
809 struct cls_fl_head *head = rtnl_dereference(tp->root);
810 struct cls_fl_filter *f = (struct cls_fl_filter *) fh;
811 struct nlattr *nest;
812 struct fl_flow_key *key, *mask;
813
814 if (!f)
815 return skb->len;
816
817 t->tcm_handle = f->handle;
818
819 nest = nla_nest_start(skb, TCA_OPTIONS);
820 if (!nest)
821 goto nla_put_failure;
822
823 if (f->res.classid &&
824 nla_put_u32(skb, TCA_FLOWER_CLASSID, f->res.classid))
825 goto nla_put_failure;
826
827 key = &f->key;
828 mask = &head->mask.key;
829
830 if (mask->indev_ifindex) {
831 struct net_device *dev;
832
833 dev = __dev_get_by_index(net, key->indev_ifindex);
834 if (dev && nla_put_string(skb, TCA_FLOWER_INDEV, dev->name))
835 goto nla_put_failure;
836 }
837
10cbc684
AV
838 fl_hw_update_stats(tp, f);
839
77b9900e
JP
840 if (fl_dump_key_val(skb, key->eth.dst, TCA_FLOWER_KEY_ETH_DST,
841 mask->eth.dst, TCA_FLOWER_KEY_ETH_DST_MASK,
842 sizeof(key->eth.dst)) ||
843 fl_dump_key_val(skb, key->eth.src, TCA_FLOWER_KEY_ETH_SRC,
844 mask->eth.src, TCA_FLOWER_KEY_ETH_SRC_MASK,
845 sizeof(key->eth.src)) ||
846 fl_dump_key_val(skb, &key->basic.n_proto, TCA_FLOWER_KEY_ETH_TYPE,
847 &mask->basic.n_proto, TCA_FLOWER_UNSPEC,
848 sizeof(key->basic.n_proto)))
849 goto nla_put_failure;
9399ae9a
HHZ
850
851 if (fl_dump_key_vlan(skb, &key->vlan, &mask->vlan))
852 goto nla_put_failure;
853
77b9900e
JP
854 if ((key->basic.n_proto == htons(ETH_P_IP) ||
855 key->basic.n_proto == htons(ETH_P_IPV6)) &&
856 fl_dump_key_val(skb, &key->basic.ip_proto, TCA_FLOWER_KEY_IP_PROTO,
857 &mask->basic.ip_proto, TCA_FLOWER_UNSPEC,
858 sizeof(key->basic.ip_proto)))
859 goto nla_put_failure;
860
c3f83241 861 if (key->control.addr_type == FLOW_DISSECTOR_KEY_IPV4_ADDRS &&
77b9900e
JP
862 (fl_dump_key_val(skb, &key->ipv4.src, TCA_FLOWER_KEY_IPV4_SRC,
863 &mask->ipv4.src, TCA_FLOWER_KEY_IPV4_SRC_MASK,
864 sizeof(key->ipv4.src)) ||
865 fl_dump_key_val(skb, &key->ipv4.dst, TCA_FLOWER_KEY_IPV4_DST,
866 &mask->ipv4.dst, TCA_FLOWER_KEY_IPV4_DST_MASK,
867 sizeof(key->ipv4.dst))))
868 goto nla_put_failure;
c3f83241 869 else if (key->control.addr_type == FLOW_DISSECTOR_KEY_IPV6_ADDRS &&
77b9900e
JP
870 (fl_dump_key_val(skb, &key->ipv6.src, TCA_FLOWER_KEY_IPV6_SRC,
871 &mask->ipv6.src, TCA_FLOWER_KEY_IPV6_SRC_MASK,
872 sizeof(key->ipv6.src)) ||
873 fl_dump_key_val(skb, &key->ipv6.dst, TCA_FLOWER_KEY_IPV6_DST,
874 &mask->ipv6.dst, TCA_FLOWER_KEY_IPV6_DST_MASK,
875 sizeof(key->ipv6.dst))))
876 goto nla_put_failure;
877
878 if (key->basic.ip_proto == IPPROTO_TCP &&
879 (fl_dump_key_val(skb, &key->tp.src, TCA_FLOWER_KEY_TCP_SRC,
880 &mask->tp.src, TCA_FLOWER_UNSPEC,
881 sizeof(key->tp.src)) ||
882 fl_dump_key_val(skb, &key->tp.dst, TCA_FLOWER_KEY_TCP_DST,
883 &mask->tp.dst, TCA_FLOWER_UNSPEC,
884 sizeof(key->tp.dst))))
885 goto nla_put_failure;
886 else if (key->basic.ip_proto == IPPROTO_UDP &&
887 (fl_dump_key_val(skb, &key->tp.src, TCA_FLOWER_KEY_UDP_SRC,
888 &mask->tp.src, TCA_FLOWER_UNSPEC,
889 sizeof(key->tp.src)) ||
890 fl_dump_key_val(skb, &key->tp.dst, TCA_FLOWER_KEY_UDP_DST,
891 &mask->tp.dst, TCA_FLOWER_UNSPEC,
892 sizeof(key->tp.dst))))
893 goto nla_put_failure;
894
bc3103f1
AV
895 if (key->enc_control.addr_type == FLOW_DISSECTOR_KEY_IPV4_ADDRS &&
896 (fl_dump_key_val(skb, &key->enc_ipv4.src,
897 TCA_FLOWER_KEY_ENC_IPV4_SRC, &mask->enc_ipv4.src,
898 TCA_FLOWER_KEY_ENC_IPV4_SRC_MASK,
899 sizeof(key->enc_ipv4.src)) ||
900 fl_dump_key_val(skb, &key->enc_ipv4.dst,
901 TCA_FLOWER_KEY_ENC_IPV4_DST, &mask->enc_ipv4.dst,
902 TCA_FLOWER_KEY_ENC_IPV4_DST_MASK,
903 sizeof(key->enc_ipv4.dst))))
904 goto nla_put_failure;
905 else if (key->enc_control.addr_type == FLOW_DISSECTOR_KEY_IPV6_ADDRS &&
906 (fl_dump_key_val(skb, &key->enc_ipv6.src,
907 TCA_FLOWER_KEY_ENC_IPV6_SRC, &mask->enc_ipv6.src,
908 TCA_FLOWER_KEY_ENC_IPV6_SRC_MASK,
909 sizeof(key->enc_ipv6.src)) ||
910 fl_dump_key_val(skb, &key->enc_ipv6.dst,
911 TCA_FLOWER_KEY_ENC_IPV6_DST,
912 &mask->enc_ipv6.dst,
913 TCA_FLOWER_KEY_ENC_IPV6_DST_MASK,
914 sizeof(key->enc_ipv6.dst))))
915 goto nla_put_failure;
916
917 if (fl_dump_key_val(skb, &key->enc_key_id, TCA_FLOWER_KEY_ENC_KEY_ID,
918 &mask->enc_key_id, TCA_FLOWER_KEY_ENC_KEY_ID,
919 sizeof(key->enc_key_id)))
920 goto nla_put_failure;
921
e69985c6
AV
922 nla_put_u32(skb, TCA_FLOWER_FLAGS, f->flags);
923
77b9900e
JP
924 if (tcf_exts_dump(skb, &f->exts))
925 goto nla_put_failure;
926
927 nla_nest_end(skb, nest);
928
929 if (tcf_exts_dump_stats(skb, &f->exts) < 0)
930 goto nla_put_failure;
931
932 return skb->len;
933
934nla_put_failure:
935 nla_nest_cancel(skb, nest);
936 return -1;
937}
938
939static struct tcf_proto_ops cls_fl_ops __read_mostly = {
940 .kind = "flower",
941 .classify = fl_classify,
942 .init = fl_init,
943 .destroy = fl_destroy,
944 .get = fl_get,
945 .change = fl_change,
946 .delete = fl_delete,
947 .walk = fl_walk,
948 .dump = fl_dump,
949 .owner = THIS_MODULE,
950};
951
952static int __init cls_fl_init(void)
953{
954 return register_tcf_proto_ops(&cls_fl_ops);
955}
956
957static void __exit cls_fl_exit(void)
958{
959 unregister_tcf_proto_ops(&cls_fl_ops);
960}
961
962module_init(cls_fl_init);
963module_exit(cls_fl_exit);
964
965MODULE_AUTHOR("Jiri Pirko <jiri@resnulli.us>");
966MODULE_DESCRIPTION("Flower classifier");
967MODULE_LICENSE("GPL v2");
This page took 0.14522 seconds and 5 git commands to generate.