blob: 09b359784629e46b1ce5f60c42e193196f312549 [file] [log] [blame]
xjb04a4022021-11-25 15:01:52 +08001/*
2 * net/sched/cls_flower.c Flower classifier
3 *
4 * Copyright (c) 2015 Jiri Pirko <jiri@resnulli.us>
5 *
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License as published by
8 * the Free Software Foundation; either version 2 of the License, or
9 * (at your option) any later version.
10 */
11
12#include <linux/kernel.h>
13#include <linux/init.h>
14#include <linux/module.h>
15#include <linux/rhashtable.h>
16#include <linux/workqueue.h>
17
18#include <linux/if_ether.h>
19#include <linux/in6.h>
20#include <linux/ip.h>
21#include <linux/mpls.h>
22
23#include <net/sch_generic.h>
24#include <net/pkt_cls.h>
25#include <net/ip.h>
26#include <net/flow_dissector.h>
27#include <net/geneve.h>
28
29#include <net/dst.h>
30#include <net/dst_metadata.h>
31
/*
 * Flat match key used by the flower classifier.
 *
 * The same layout is used for values extracted from a packet, for the
 * values configured on a filter and for the per-bit mask of a
 * struct fl_flow_mask. The masking and template helpers in this file walk
 * the structure one long at a time, so member order and the alignment
 * attribute below are part of the behaviour and must not change.
 */
struct fl_flow_key {
	int indev_ifindex;	/* ingress ifindex (skb->skb_iif / TCA_FLOWER_INDEV) */
	struct flow_dissector_key_control control;
	struct flow_dissector_key_control enc_control;	/* outer (tunnel) header */
	struct flow_dissector_key_basic basic;		/* n_proto / ip_proto */
	struct flow_dissector_key_eth_addrs eth;
	struct flow_dissector_key_vlan vlan;
	struct flow_dissector_key_vlan cvlan;
	/* Which member is meaningful is recorded in control.addr_type. */
	union {
		struct flow_dissector_key_ipv4_addrs ipv4;
		struct flow_dissector_key_ipv6_addrs ipv6;
	};
	struct flow_dissector_key_ports tp;
	struct flow_dissector_key_icmp icmp;
	struct flow_dissector_key_arp arp;
	struct flow_dissector_key_keyid enc_key_id;
	/* Which member is meaningful is recorded in enc_control.addr_type. */
	union {
		struct flow_dissector_key_ipv4_addrs enc_ipv4;
		struct flow_dissector_key_ipv6_addrs enc_ipv6;
	};
	struct flow_dissector_key_ports enc_tp;
	struct flow_dissector_key_mpls mpls;
	struct flow_dissector_key_tcp tcp;
	struct flow_dissector_key_ip ip;
	struct flow_dissector_key_ip enc_ip;
	struct flow_dissector_key_enc_opts enc_opts;
} __aligned(BITS_PER_LONG / 8); /* Ensure that we can do comparisons as longs. */
59
/*
 * Byte window of struct fl_flow_key that a mask actually covers.
 * fl_mask_update_range() computes both bounds and rounds them to
 * sizeof(long) so the window can be processed long by long.
 */
struct fl_flow_mask_range {
	unsigned short int start;	/* offset of the first covered byte */
	unsigned short int end;		/* offset one past the last covered byte */
};
64
/*
 * One distinct mask together with the filters that use it.
 * Masks are hashed by @key in cls_fl_head.ht (see mask_ht_params) and also
 * chained on cls_fl_head.masks, which is the list fl_classify() walks.
 */
struct fl_flow_mask {
	struct fl_flow_key key;			/* the mask bits themselves */
	struct fl_flow_mask_range range;	/* significant byte window of @key */
	struct rhash_head ht_node;		/* linkage in cls_fl_head.ht */
	struct rhashtable ht;			/* filters using this mask, keyed by masked key */
	struct rhashtable_params filter_ht_params; /* fl_ht_params adjusted to @range */
	struct flow_dissector dissector;	/* handed to skb_flow_dissect() */
	struct list_head filters;		/* cls_fl_filter.list entries */
	struct rcu_work rwork;			/* deferred free, see fl_mask_put() */
	struct list_head list;			/* linkage in cls_fl_head.masks */
};
76
/*
 * Filter template. In the code visible here only @mask is consumed:
 * fl_mask_fits_tmplt() rejects a filter mask that sets bits which are
 * clear in it.
 */
struct fl_flow_tmplt {
	struct fl_flow_key dummy_key;
	struct fl_flow_key mask;	/* upper bound for masks of filters on the chain */
	struct flow_dissector dissector;
	struct tcf_chain *chain;
};
83
/* Per-tcf_proto classifier state, published through tp->root by fl_init(). */
struct cls_fl_head {
	struct rhashtable ht;		/* fl_flow_mask objects keyed by mask (mask_ht_params) */
	struct list_head masks;		/* fl_flow_mask.list entries, walked by fl_classify() */
	struct rcu_work rwork;		/* deferred teardown, see fl_destroy_sleepable() */
	struct idr handle_idr;		/* filter handle lookup used by fl_get() */
};
90
/* A single flower filter instance. */
struct cls_fl_filter {
	struct fl_flow_mask *mask;	/* mask object this filter is attached to */
	struct rhash_head ht_node;	/* linkage in mask->ht (fl_ht_params.head_offset) */
	struct fl_flow_key mkey;	/* hash key in mask->ht; also the key passed to hardware */
	struct tcf_exts exts;		/* actions executed on match */
	struct tcf_result res;		/* copied to the caller's result on match */
	struct fl_flow_key key;
	struct list_head list;		/* linkage in mask->filters */
	u32 handle;			/* id registered in cls_fl_head.handle_idr */
	u32 flags;			/* TCA_CLS_FLAGS_* (skip_sw / skip_hw / in_hw) */
	unsigned int in_hw_count;	/* positive return of the last REPLACE offload call */
	struct rcu_work rwork;		/* deferred free, see fl_destroy_filter_work() */
	struct net_device *hw_dev;
};
105
/*
 * Parameters of cls_fl_head.ht: fl_flow_mask objects are hashed over the
 * whole of their embedded fl_flow_key.
 */
static const struct rhashtable_params mask_ht_params = {
	.key_offset = offsetof(struct fl_flow_mask, key),
	.key_len = sizeof(struct fl_flow_key),
	.head_offset = offsetof(struct fl_flow_mask, ht_node),
	.automatic_shrinking = true,
};
112
113static unsigned short int fl_mask_range(const struct fl_flow_mask *mask)
114{
115 return mask->range.end - mask->range.start;
116}
117
118static void fl_mask_update_range(struct fl_flow_mask *mask)
119{
120 const u8 *bytes = (const u8 *) &mask->key;
121 size_t size = sizeof(mask->key);
122 size_t i, first = 0, last;
123
124 for (i = 0; i < size; i++) {
125 if (bytes[i]) {
126 first = i;
127 break;
128 }
129 }
130 last = first;
131 for (i = size - 1; i != first; i--) {
132 if (bytes[i]) {
133 last = i;
134 break;
135 }
136 }
137 mask->range.start = rounddown(first, sizeof(long));
138 mask->range.end = roundup(last + 1, sizeof(long));
139}
140
141static void *fl_key_get_start(struct fl_flow_key *key,
142 const struct fl_flow_mask *mask)
143{
144 return (u8 *) key + mask->range.start;
145}
146
147static void fl_set_masked_key(struct fl_flow_key *mkey, struct fl_flow_key *key,
148 struct fl_flow_mask *mask)
149{
150 const long *lkey = fl_key_get_start(key, mask);
151 const long *lmask = fl_key_get_start(&mask->key, mask);
152 long *lmkey = fl_key_get_start(mkey, mask);
153 int i;
154
155 for (i = 0; i < fl_mask_range(mask); i += sizeof(long))
156 *lmkey++ = *lkey++ & *lmask++;
157}
158
159static bool fl_mask_fits_tmplt(struct fl_flow_tmplt *tmplt,
160 struct fl_flow_mask *mask)
161{
162 const long *lmask = fl_key_get_start(&mask->key, mask);
163 const long *ltmplt;
164 int i;
165
166 if (!tmplt)
167 return true;
168 ltmplt = fl_key_get_start(&tmplt->mask, mask);
169 for (i = 0; i < fl_mask_range(mask); i += sizeof(long)) {
170 if (~*ltmplt++ & *lmask++)
171 return false;
172 }
173 return true;
174}
175
/* Zero the part of @key that lies inside the window covered by @mask. */
static void fl_clear_masked_range(struct fl_flow_key *key,
				  struct fl_flow_mask *mask)
{
	void *window = fl_key_get_start(key, mask);

	memset(window, 0, fl_mask_range(mask));
}
181
182static struct cls_fl_filter *fl_lookup(struct fl_flow_mask *mask,
183 struct fl_flow_key *mkey)
184{
185 return rhashtable_lookup_fast(&mask->ht, fl_key_get_start(mkey, mask),
186 mask->filter_ht_params);
187}
188
189static int fl_classify(struct sk_buff *skb, const struct tcf_proto *tp,
190 struct tcf_result *res)
191{
192 struct cls_fl_head *head = rcu_dereference_bh(tp->root);
193 struct cls_fl_filter *f;
194 struct fl_flow_mask *mask;
195 struct fl_flow_key skb_key;
196 struct fl_flow_key skb_mkey;
197
198 list_for_each_entry_rcu(mask, &head->masks, list) {
199 fl_clear_masked_range(&skb_key, mask);
200
201 skb_key.indev_ifindex = skb->skb_iif;
202 /* skb_flow_dissect() does not set n_proto in case an unknown
203 * protocol, so do it rather here.
204 */
205 skb_key.basic.n_proto = skb->protocol;
206 skb_flow_dissect_tunnel_info(skb, &mask->dissector, &skb_key);
207 skb_flow_dissect(skb, &mask->dissector, &skb_key, 0);
208
209 fl_set_masked_key(&skb_mkey, &skb_key, mask);
210
211 f = fl_lookup(mask, &skb_mkey);
212 if (f && !tc_skip_sw(f->flags)) {
213 *res = f->res;
214 return tcf_exts_exec(skb, &f->exts, res);
215 }
216 }
217 return -1;
218}
219
220static int fl_init(struct tcf_proto *tp)
221{
222 struct cls_fl_head *head;
223
224 head = kzalloc(sizeof(*head), GFP_KERNEL);
225 if (!head)
226 return -ENOBUFS;
227
228 INIT_LIST_HEAD_RCU(&head->masks);
229 rcu_assign_pointer(tp->root, head);
230 idr_init(&head->handle_idr);
231
232 return rhashtable_init(&head->ht, &mask_ht_params);
233}
234
235static void fl_mask_free(struct fl_flow_mask *mask)
236{
237 rhashtable_destroy(&mask->ht);
238 kfree(mask);
239}
240
241static void fl_mask_free_work(struct work_struct *work)
242{
243 struct fl_flow_mask *mask = container_of(to_rcu_work(work),
244 struct fl_flow_mask, rwork);
245
246 fl_mask_free(mask);
247}
248
249static bool fl_mask_put(struct cls_fl_head *head, struct fl_flow_mask *mask,
250 bool async)
251{
252 if (!list_empty(&mask->filters))
253 return false;
254
255 rhashtable_remove_fast(&head->ht, &mask->ht_node, mask_ht_params);
256 list_del_rcu(&mask->list);
257 if (async)
258 tcf_queue_work(&mask->rwork, fl_mask_free_work);
259 else
260 fl_mask_free(mask);
261
262 return true;
263}
264
265static void __fl_destroy_filter(struct cls_fl_filter *f)
266{
267 tcf_exts_destroy(&f->exts);
268 tcf_exts_put_net(&f->exts);
269 kfree(f);
270}
271
272static void fl_destroy_filter_work(struct work_struct *work)
273{
274 struct cls_fl_filter *f = container_of(to_rcu_work(work),
275 struct cls_fl_filter, rwork);
276
277 rtnl_lock();
278 __fl_destroy_filter(f);
279 rtnl_unlock();
280}
281
282static void fl_hw_destroy_filter(struct tcf_proto *tp, struct cls_fl_filter *f,
283 struct netlink_ext_ack *extack)
284{
285 struct tc_cls_flower_offload cls_flower = {};
286 struct tcf_block *block = tp->chain->block;
287
288 tc_cls_common_offload_init(&cls_flower.common, tp, f->flags, extack);
289 cls_flower.command = TC_CLSFLOWER_DESTROY;
290 cls_flower.cookie = (unsigned long) f;
291
292 tc_setup_cb_call(block, &f->exts, TC_SETUP_CLSFLOWER,
293 &cls_flower, false);
294 tcf_block_offload_dec(block, &f->flags);
295}
296
297static int fl_hw_replace_filter(struct tcf_proto *tp,
298 struct cls_fl_filter *f,
299 struct netlink_ext_ack *extack)
300{
301 struct tc_cls_flower_offload cls_flower = {};
302 struct tcf_block *block = tp->chain->block;
303 bool skip_sw = tc_skip_sw(f->flags);
304 int err;
305
306 tc_cls_common_offload_init(&cls_flower.common, tp, f->flags, extack);
307 cls_flower.command = TC_CLSFLOWER_REPLACE;
308 cls_flower.cookie = (unsigned long) f;
309 cls_flower.dissector = &f->mask->dissector;
310 cls_flower.mask = &f->mask->key;
311 cls_flower.key = &f->mkey;
312 cls_flower.exts = &f->exts;
313 cls_flower.classid = f->res.classid;
314
315 err = tc_setup_cb_call(block, &f->exts, TC_SETUP_CLSFLOWER,
316 &cls_flower, skip_sw);
317 if (err < 0) {
318 fl_hw_destroy_filter(tp, f, NULL);
319 return err;
320 } else if (err > 0) {
321 f->in_hw_count = err;
322 tcf_block_offload_inc(block, &f->flags);
323 }
324
325 if (skip_sw && !(f->flags & TCA_CLS_FLAGS_IN_HW))
326 return -EINVAL;
327
328 return 0;
329}
330
331static void fl_hw_update_stats(struct tcf_proto *tp, struct cls_fl_filter *f)
332{
333 struct tc_cls_flower_offload cls_flower = {};
334 struct tcf_block *block = tp->chain->block;
335
336 tc_cls_common_offload_init(&cls_flower.common, tp, f->flags, NULL);
337 cls_flower.command = TC_CLSFLOWER_STATS;
338 cls_flower.cookie = (unsigned long) f;
339 cls_flower.exts = &f->exts;
340 cls_flower.classid = f->res.classid;
341
342 tc_setup_cb_call(block, &f->exts, TC_SETUP_CLSFLOWER,
343 &cls_flower, false);
344}
345
346static bool __fl_delete(struct tcf_proto *tp, struct cls_fl_filter *f,
347 struct netlink_ext_ack *extack)
348{
349 struct cls_fl_head *head = rtnl_dereference(tp->root);
350 bool async = tcf_exts_get_net(&f->exts);
351 bool last;
352
353 idr_remove(&head->handle_idr, f->handle);
354 list_del_rcu(&f->list);
355 last = fl_mask_put(head, f->mask, async);
356 if (!tc_skip_hw(f->flags))
357 fl_hw_destroy_filter(tp, f, extack);
358 tcf_unbind_filter(tp, &f->res);
359 if (async)
360 tcf_queue_work(&f->rwork, fl_destroy_filter_work);
361 else
362 __fl_destroy_filter(f);
363
364 return last;
365}
366
367static void fl_destroy_sleepable(struct work_struct *work)
368{
369 struct cls_fl_head *head = container_of(to_rcu_work(work),
370 struct cls_fl_head,
371 rwork);
372
373 rhashtable_destroy(&head->ht);
374 kfree(head);
375 module_put(THIS_MODULE);
376}
377
378static void fl_destroy(struct tcf_proto *tp, struct netlink_ext_ack *extack)
379{
380 struct cls_fl_head *head = rtnl_dereference(tp->root);
381 struct fl_flow_mask *mask, *next_mask;
382 struct cls_fl_filter *f, *next;
383
384 list_for_each_entry_safe(mask, next_mask, &head->masks, list) {
385 list_for_each_entry_safe(f, next, &mask->filters, list) {
386 if (__fl_delete(tp, f, extack))
387 break;
388 }
389 }
390 idr_destroy(&head->handle_idr);
391
392 __module_get(THIS_MODULE);
393 tcf_queue_work(&head->rwork, fl_destroy_sleepable);
394}
395
396static void *fl_get(struct tcf_proto *tp, u32 handle)
397{
398 struct cls_fl_head *head = rtnl_dereference(tp->root);
399
400 return idr_find(&head->handle_idr, handle);
401}
402
403static const struct nla_policy fl_policy[TCA_FLOWER_MAX + 1] = {
404 [TCA_FLOWER_UNSPEC] = { .type = NLA_UNSPEC },
405 [TCA_FLOWER_CLASSID] = { .type = NLA_U32 },
406 [TCA_FLOWER_INDEV] = { .type = NLA_STRING,
407 .len = IFNAMSIZ },
408 [TCA_FLOWER_KEY_ETH_DST] = { .len = ETH_ALEN },
409 [TCA_FLOWER_KEY_ETH_DST_MASK] = { .len = ETH_ALEN },
410 [TCA_FLOWER_KEY_ETH_SRC] = { .len = ETH_ALEN },
411 [TCA_FLOWER_KEY_ETH_SRC_MASK] = { .len = ETH_ALEN },
412 [TCA_FLOWER_KEY_ETH_TYPE] = { .type = NLA_U16 },
413 [TCA_FLOWER_KEY_IP_PROTO] = { .type = NLA_U8 },
414 [TCA_FLOWER_KEY_IPV4_SRC] = { .type = NLA_U32 },
415 [TCA_FLOWER_KEY_IPV4_SRC_MASK] = { .type = NLA_U32 },
416 [TCA_FLOWER_KEY_IPV4_DST] = { .type = NLA_U32 },
417 [TCA_FLOWER_KEY_IPV4_DST_MASK] = { .type = NLA_U32 },
418 [TCA_FLOWER_KEY_IPV6_SRC] = { .len = sizeof(struct in6_addr) },
419 [TCA_FLOWER_KEY_IPV6_SRC_MASK] = { .len = sizeof(struct in6_addr) },
420 [TCA_FLOWER_KEY_IPV6_DST] = { .len = sizeof(struct in6_addr) },
421 [TCA_FLOWER_KEY_IPV6_DST_MASK] = { .len = sizeof(struct in6_addr) },
422 [TCA_FLOWER_KEY_TCP_SRC] = { .type = NLA_U16 },
423 [TCA_FLOWER_KEY_TCP_DST] = { .type = NLA_U16 },
424 [TCA_FLOWER_KEY_UDP_SRC] = { .type = NLA_U16 },
425 [TCA_FLOWER_KEY_UDP_DST] = { .type = NLA_U16 },
426 [TCA_FLOWER_KEY_VLAN_ID] = { .type = NLA_U16 },
427 [TCA_FLOWER_KEY_VLAN_PRIO] = { .type = NLA_U8 },
428 [TCA_FLOWER_KEY_VLAN_ETH_TYPE] = { .type = NLA_U16 },
429 [TCA_FLOWER_KEY_ENC_KEY_ID] = { .type = NLA_U32 },
430 [TCA_FLOWER_KEY_ENC_IPV4_SRC] = { .type = NLA_U32 },
431 [TCA_FLOWER_KEY_ENC_IPV4_SRC_MASK] = { .type = NLA_U32 },
432 [TCA_FLOWER_KEY_ENC_IPV4_DST] = { .type = NLA_U32 },
433 [TCA_FLOWER_KEY_ENC_IPV4_DST_MASK] = { .type = NLA_U32 },
434 [TCA_FLOWER_KEY_ENC_IPV6_SRC] = { .len = sizeof(struct in6_addr) },
435 [TCA_FLOWER_KEY_ENC_IPV6_SRC_MASK] = { .len = sizeof(struct in6_addr) },
436 [TCA_FLOWER_KEY_ENC_IPV6_DST] = { .len = sizeof(struct in6_addr) },
437 [TCA_FLOWER_KEY_ENC_IPV6_DST_MASK] = { .len = sizeof(struct in6_addr) },
438 [TCA_FLOWER_KEY_TCP_SRC_MASK] = { .type = NLA_U16 },
439 [TCA_FLOWER_KEY_TCP_DST_MASK] = { .type = NLA_U16 },
440 [TCA_FLOWER_KEY_UDP_SRC_MASK] = { .type = NLA_U16 },
441 [TCA_FLOWER_KEY_UDP_DST_MASK] = { .type = NLA_U16 },
442 [TCA_FLOWER_KEY_SCTP_SRC_MASK] = { .type = NLA_U16 },
443 [TCA_FLOWER_KEY_SCTP_DST_MASK] = { .type = NLA_U16 },
444 [TCA_FLOWER_KEY_SCTP_SRC] = { .type = NLA_U16 },
445 [TCA_FLOWER_KEY_SCTP_DST] = { .type = NLA_U16 },
446 [TCA_FLOWER_KEY_ENC_UDP_SRC_PORT] = { .type = NLA_U16 },
447 [TCA_FLOWER_KEY_ENC_UDP_SRC_PORT_MASK] = { .type = NLA_U16 },
448 [TCA_FLOWER_KEY_ENC_UDP_DST_PORT] = { .type = NLA_U16 },
449 [TCA_FLOWER_KEY_ENC_UDP_DST_PORT_MASK] = { .type = NLA_U16 },
450 [TCA_FLOWER_KEY_FLAGS] = { .type = NLA_U32 },
451 [TCA_FLOWER_KEY_FLAGS_MASK] = { .type = NLA_U32 },
452 [TCA_FLOWER_KEY_ICMPV4_TYPE] = { .type = NLA_U8 },
453 [TCA_FLOWER_KEY_ICMPV4_TYPE_MASK] = { .type = NLA_U8 },
454 [TCA_FLOWER_KEY_ICMPV4_CODE] = { .type = NLA_U8 },
455 [TCA_FLOWER_KEY_ICMPV4_CODE_MASK] = { .type = NLA_U8 },
456 [TCA_FLOWER_KEY_ICMPV6_TYPE] = { .type = NLA_U8 },
457 [TCA_FLOWER_KEY_ICMPV6_TYPE_MASK] = { .type = NLA_U8 },
458 [TCA_FLOWER_KEY_ICMPV6_CODE] = { .type = NLA_U8 },
459 [TCA_FLOWER_KEY_ICMPV6_CODE_MASK] = { .type = NLA_U8 },
460 [TCA_FLOWER_KEY_ARP_SIP] = { .type = NLA_U32 },
461 [TCA_FLOWER_KEY_ARP_SIP_MASK] = { .type = NLA_U32 },
462 [TCA_FLOWER_KEY_ARP_TIP] = { .type = NLA_U32 },
463 [TCA_FLOWER_KEY_ARP_TIP_MASK] = { .type = NLA_U32 },
464 [TCA_FLOWER_KEY_ARP_OP] = { .type = NLA_U8 },
465 [TCA_FLOWER_KEY_ARP_OP_MASK] = { .type = NLA_U8 },
466 [TCA_FLOWER_KEY_ARP_SHA] = { .len = ETH_ALEN },
467 [TCA_FLOWER_KEY_ARP_SHA_MASK] = { .len = ETH_ALEN },
468 [TCA_FLOWER_KEY_ARP_THA] = { .len = ETH_ALEN },
469 [TCA_FLOWER_KEY_ARP_THA_MASK] = { .len = ETH_ALEN },
470 [TCA_FLOWER_KEY_MPLS_TTL] = { .type = NLA_U8 },
471 [TCA_FLOWER_KEY_MPLS_BOS] = { .type = NLA_U8 },
472 [TCA_FLOWER_KEY_MPLS_TC] = { .type = NLA_U8 },
473 [TCA_FLOWER_KEY_MPLS_LABEL] = { .type = NLA_U32 },
474 [TCA_FLOWER_KEY_TCP_FLAGS] = { .type = NLA_U16 },
475 [TCA_FLOWER_KEY_TCP_FLAGS_MASK] = { .type = NLA_U16 },
476 [TCA_FLOWER_KEY_IP_TOS] = { .type = NLA_U8 },
477 [TCA_FLOWER_KEY_IP_TOS_MASK] = { .type = NLA_U8 },
478 [TCA_FLOWER_KEY_IP_TTL] = { .type = NLA_U8 },
479 [TCA_FLOWER_KEY_IP_TTL_MASK] = { .type = NLA_U8 },
480 [TCA_FLOWER_KEY_CVLAN_ID] = { .type = NLA_U16 },
481 [TCA_FLOWER_KEY_CVLAN_PRIO] = { .type = NLA_U8 },
482 [TCA_FLOWER_KEY_CVLAN_ETH_TYPE] = { .type = NLA_U16 },
483 [TCA_FLOWER_KEY_ENC_IP_TOS] = { .type = NLA_U8 },
484 [TCA_FLOWER_KEY_ENC_IP_TOS_MASK] = { .type = NLA_U8 },
485 [TCA_FLOWER_KEY_ENC_IP_TTL] = { .type = NLA_U8 },
486 [TCA_FLOWER_KEY_ENC_IP_TTL_MASK] = { .type = NLA_U8 },
487 [TCA_FLOWER_KEY_ENC_OPTS] = { .type = NLA_NESTED },
488 [TCA_FLOWER_KEY_ENC_OPTS_MASK] = { .type = NLA_NESTED },
489};
490
/*
 * Policy for the children of TCA_FLOWER_KEY_ENC_OPTS and
 * TCA_FLOWER_KEY_ENC_OPTS_MASK (validated in fl_set_enc_opt()).
 */
static const struct nla_policy
enc_opts_policy[TCA_FLOWER_KEY_ENC_OPTS_MAX + 1] = {
	[TCA_FLOWER_KEY_ENC_OPTS_GENEVE] = { .type = NLA_NESTED },
};
495
/*
 * Policy for the fields of one TCA_FLOWER_KEY_ENC_OPTS_GENEVE option
 * (parsed in fl_set_geneve_opt()). Option data is capped at 128 bytes here.
 */
static const struct nla_policy
geneve_opt_policy[TCA_FLOWER_KEY_ENC_OPT_GENEVE_MAX + 1] = {
	[TCA_FLOWER_KEY_ENC_OPT_GENEVE_CLASS] = { .type = NLA_U16 },
	[TCA_FLOWER_KEY_ENC_OPT_GENEVE_TYPE] = { .type = NLA_U8 },
	[TCA_FLOWER_KEY_ENC_OPT_GENEVE_DATA] = { .type = NLA_BINARY,
						 .len = 128 },
};
503
504static void fl_set_key_val(struct nlattr **tb,
505 void *val, int val_type,
506 void *mask, int mask_type, int len)
507{
508 if (!tb[val_type])
509 return;
510 memcpy(val, nla_data(tb[val_type]), len);
511 if (mask_type == TCA_FLOWER_UNSPEC || !tb[mask_type])
512 memset(mask, 0xff, len);
513 else
514 memcpy(mask, nla_data(tb[mask_type]), len);
515}
516
517static int fl_set_key_mpls(struct nlattr **tb,
518 struct flow_dissector_key_mpls *key_val,
519 struct flow_dissector_key_mpls *key_mask)
520{
521 if (tb[TCA_FLOWER_KEY_MPLS_TTL]) {
522 key_val->mpls_ttl = nla_get_u8(tb[TCA_FLOWER_KEY_MPLS_TTL]);
523 key_mask->mpls_ttl = MPLS_TTL_MASK;
524 }
525 if (tb[TCA_FLOWER_KEY_MPLS_BOS]) {
526 u8 bos = nla_get_u8(tb[TCA_FLOWER_KEY_MPLS_BOS]);
527
528 if (bos & ~MPLS_BOS_MASK)
529 return -EINVAL;
530 key_val->mpls_bos = bos;
531 key_mask->mpls_bos = MPLS_BOS_MASK;
532 }
533 if (tb[TCA_FLOWER_KEY_MPLS_TC]) {
534 u8 tc = nla_get_u8(tb[TCA_FLOWER_KEY_MPLS_TC]);
535
536 if (tc & ~MPLS_TC_MASK)
537 return -EINVAL;
538 key_val->mpls_tc = tc;
539 key_mask->mpls_tc = MPLS_TC_MASK;
540 }
541 if (tb[TCA_FLOWER_KEY_MPLS_LABEL]) {
542 u32 label = nla_get_u32(tb[TCA_FLOWER_KEY_MPLS_LABEL]);
543
544 if (label & ~MPLS_LABEL_MASK)
545 return -EINVAL;
546 key_val->mpls_label = label;
547 key_mask->mpls_label = MPLS_LABEL_MASK;
548 }
549 return 0;
550}
551
552static void fl_set_key_vlan(struct nlattr **tb,
553 __be16 ethertype,
554 int vlan_id_key, int vlan_prio_key,
555 struct flow_dissector_key_vlan *key_val,
556 struct flow_dissector_key_vlan *key_mask)
557{
558#define VLAN_PRIORITY_MASK 0x7
559
560 if (tb[vlan_id_key]) {
561 key_val->vlan_id =
562 nla_get_u16(tb[vlan_id_key]) & VLAN_VID_MASK;
563 key_mask->vlan_id = VLAN_VID_MASK;
564 }
565 if (tb[vlan_prio_key]) {
566 key_val->vlan_priority =
567 nla_get_u8(tb[vlan_prio_key]) &
568 VLAN_PRIORITY_MASK;
569 key_mask->vlan_priority = VLAN_PRIORITY_MASK;
570 }
571 key_val->vlan_tpid = ethertype;
572 key_mask->vlan_tpid = cpu_to_be16(~0);
573}
574
575static void fl_set_key_flag(u32 flower_key, u32 flower_mask,
576 u32 *dissector_key, u32 *dissector_mask,
577 u32 flower_flag_bit, u32 dissector_flag_bit)
578{
579 if (flower_mask & flower_flag_bit) {
580 *dissector_mask |= dissector_flag_bit;
581 if (flower_key & flower_flag_bit)
582 *dissector_key |= dissector_flag_bit;
583 }
584}
585
586static int fl_set_key_flags(struct nlattr **tb,
587 u32 *flags_key, u32 *flags_mask)
588{
589 u32 key, mask;
590
591 /* mask is mandatory for flags */
592 if (!tb[TCA_FLOWER_KEY_FLAGS_MASK])
593 return -EINVAL;
594
595 key = be32_to_cpu(nla_get_u32(tb[TCA_FLOWER_KEY_FLAGS]));
596 mask = be32_to_cpu(nla_get_u32(tb[TCA_FLOWER_KEY_FLAGS_MASK]));
597
598 *flags_key = 0;
599 *flags_mask = 0;
600
601 fl_set_key_flag(key, mask, flags_key, flags_mask,
602 TCA_FLOWER_KEY_FLAGS_IS_FRAGMENT, FLOW_DIS_IS_FRAGMENT);
603 fl_set_key_flag(key, mask, flags_key, flags_mask,
604 TCA_FLOWER_KEY_FLAGS_FRAG_IS_FIRST,
605 FLOW_DIS_FIRST_FRAG);
606
607 return 0;
608}
609
610static void fl_set_key_ip(struct nlattr **tb, bool encap,
611 struct flow_dissector_key_ip *key,
612 struct flow_dissector_key_ip *mask)
613{
614 int tos_key = encap ? TCA_FLOWER_KEY_ENC_IP_TOS : TCA_FLOWER_KEY_IP_TOS;
615 int ttl_key = encap ? TCA_FLOWER_KEY_ENC_IP_TTL : TCA_FLOWER_KEY_IP_TTL;
616 int tos_mask = encap ? TCA_FLOWER_KEY_ENC_IP_TOS_MASK : TCA_FLOWER_KEY_IP_TOS_MASK;
617 int ttl_mask = encap ? TCA_FLOWER_KEY_ENC_IP_TTL_MASK : TCA_FLOWER_KEY_IP_TTL_MASK;
618
619 fl_set_key_val(tb, &key->tos, tos_key, &mask->tos, tos_mask, sizeof(key->tos));
620 fl_set_key_val(tb, &key->ttl, ttl_key, &mask->ttl, ttl_mask, sizeof(key->ttl));
621}
622
623static int fl_set_geneve_opt(const struct nlattr *nla, struct fl_flow_key *key,
624 int depth, int option_len,
625 struct netlink_ext_ack *extack)
626{
627 struct nlattr *tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_MAX + 1];
628 struct nlattr *class = NULL, *type = NULL, *data = NULL;
629 struct geneve_opt *opt;
630 int err, data_len = 0;
631
632 if (option_len > sizeof(struct geneve_opt))
633 data_len = option_len - sizeof(struct geneve_opt);
634
635 opt = (struct geneve_opt *)&key->enc_opts.data[key->enc_opts.len];
636 memset(opt, 0xff, option_len);
637 opt->length = data_len / 4;
638 opt->r1 = 0;
639 opt->r2 = 0;
640 opt->r3 = 0;
641
642 /* If no mask has been prodived we assume an exact match. */
643 if (!depth)
644 return sizeof(struct geneve_opt) + data_len;
645
646 if (nla_type(nla) != TCA_FLOWER_KEY_ENC_OPTS_GENEVE) {
647 NL_SET_ERR_MSG(extack, "Non-geneve option type for mask");
648 return -EINVAL;
649 }
650
651 err = nla_parse_nested(tb, TCA_FLOWER_KEY_ENC_OPT_GENEVE_MAX,
652 nla, geneve_opt_policy, extack);
653 if (err < 0)
654 return err;
655
656 /* We are not allowed to omit any of CLASS, TYPE or DATA
657 * fields from the key.
658 */
659 if (!option_len &&
660 (!tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_CLASS] ||
661 !tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_TYPE] ||
662 !tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_DATA])) {
663 NL_SET_ERR_MSG(extack, "Missing tunnel key geneve option class, type or data");
664 return -EINVAL;
665 }
666
667 /* Omitting any of CLASS, TYPE or DATA fields is allowed
668 * for the mask.
669 */
670 if (tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_DATA]) {
671 int new_len = key->enc_opts.len;
672
673 data = tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_DATA];
674 data_len = nla_len(data);
675 if (data_len < 4) {
676 NL_SET_ERR_MSG(extack, "Tunnel key geneve option data is less than 4 bytes long");
677 return -ERANGE;
678 }
679 if (data_len % 4) {
680 NL_SET_ERR_MSG(extack, "Tunnel key geneve option data is not a multiple of 4 bytes long");
681 return -ERANGE;
682 }
683
684 new_len += sizeof(struct geneve_opt) + data_len;
685 BUILD_BUG_ON(FLOW_DIS_TUN_OPTS_MAX != IP_TUNNEL_OPTS_MAX);
686 if (new_len > FLOW_DIS_TUN_OPTS_MAX) {
687 NL_SET_ERR_MSG(extack, "Tunnel options exceeds max size");
688 return -ERANGE;
689 }
690 opt->length = data_len / 4;
691 memcpy(opt->opt_data, nla_data(data), data_len);
692 }
693
694 if (tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_CLASS]) {
695 class = tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_CLASS];
696 opt->opt_class = nla_get_be16(class);
697 }
698
699 if (tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_TYPE]) {
700 type = tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_TYPE];
701 opt->type = nla_get_u8(type);
702 }
703
704 return sizeof(struct geneve_opt) + data_len;
705}
706
707static int fl_set_enc_opt(struct nlattr **tb, struct fl_flow_key *key,
708 struct fl_flow_key *mask,
709 struct netlink_ext_ack *extack)
710{
711 const struct nlattr *nla_enc_key, *nla_opt_key, *nla_opt_msk = NULL;
712 int err, option_len, key_depth, msk_depth = 0;
713
714 err = nla_validate_nested(tb[TCA_FLOWER_KEY_ENC_OPTS],
715 TCA_FLOWER_KEY_ENC_OPTS_MAX,
716 enc_opts_policy, extack);
717 if (err)
718 return err;
719
720 nla_enc_key = nla_data(tb[TCA_FLOWER_KEY_ENC_OPTS]);
721
722 if (tb[TCA_FLOWER_KEY_ENC_OPTS_MASK]) {
723 err = nla_validate_nested(tb[TCA_FLOWER_KEY_ENC_OPTS_MASK],
724 TCA_FLOWER_KEY_ENC_OPTS_MAX,
725 enc_opts_policy, extack);
726 if (err)
727 return err;
728
729 nla_opt_msk = nla_data(tb[TCA_FLOWER_KEY_ENC_OPTS_MASK]);
730 msk_depth = nla_len(tb[TCA_FLOWER_KEY_ENC_OPTS_MASK]);
731 }
732
733 nla_for_each_attr(nla_opt_key, nla_enc_key,
734 nla_len(tb[TCA_FLOWER_KEY_ENC_OPTS]), key_depth) {
735 switch (nla_type(nla_opt_key)) {
736 case TCA_FLOWER_KEY_ENC_OPTS_GENEVE:
737 option_len = 0;
738 key->enc_opts.dst_opt_type = TUNNEL_GENEVE_OPT;
739 option_len = fl_set_geneve_opt(nla_opt_key, key,
740 key_depth, option_len,
741 extack);
742 if (option_len < 0)
743 return option_len;
744
745 key->enc_opts.len += option_len;
746 /* At the same time we need to parse through the mask
747 * in order to verify exact and mask attribute lengths.
748 */
749 mask->enc_opts.dst_opt_type = TUNNEL_GENEVE_OPT;
750 option_len = fl_set_geneve_opt(nla_opt_msk, mask,
751 msk_depth, option_len,
752 extack);
753 if (option_len < 0)
754 return option_len;
755
756 mask->enc_opts.len += option_len;
757 if (key->enc_opts.len != mask->enc_opts.len) {
758 NL_SET_ERR_MSG(extack, "Key and mask miss aligned");
759 return -EINVAL;
760 }
761
762 if (msk_depth)
763 nla_opt_msk = nla_next(nla_opt_msk, &msk_depth);
764 break;
765 default:
766 NL_SET_ERR_MSG(extack, "Unknown tunnel option type");
767 return -EINVAL;
768 }
769 }
770
771 return 0;
772}
773
/*
 * Translate the parsed TCA_FLOWER_* attribute table @tb into a match @key
 * and the corresponding @mask.
 *
 * Statement order matters: the protocol-specific sections further down are
 * selected by key->basic.n_proto and key->basic.ip_proto, which are written
 * by the earlier sections.
 *
 * Returns 0 on success or a negative errno propagated from
 * tcf_change_indev(), fl_set_key_mpls(), fl_set_enc_opt() or
 * fl_set_key_flags().
 */
static int fl_set_key(struct net *net, struct nlattr **tb,
		      struct fl_flow_key *key, struct fl_flow_key *mask,
		      struct netlink_ext_ack *extack)
{
	__be16 ethertype;
	int ret = 0;
#ifdef CONFIG_NET_CLS_IND
	/* Ingress device: a non-negative result is stored as the ifindex and
	 * matched exactly.
	 */
	if (tb[TCA_FLOWER_INDEV]) {
		int err = tcf_change_indev(net, tb[TCA_FLOWER_INDEV], extack);
		if (err < 0)
			return err;
		key->indev_ifindex = err;
		mask->indev_ifindex = 0xffffffff;
	}
#endif

	fl_set_key_val(tb, key->eth.dst, TCA_FLOWER_KEY_ETH_DST,
		       mask->eth.dst, TCA_FLOWER_KEY_ETH_DST_MASK,
		       sizeof(key->eth.dst));
	fl_set_key_val(tb, key->eth.src, TCA_FLOWER_KEY_ETH_SRC,
		       mask->eth.src, TCA_FLOWER_KEY_ETH_SRC_MASK,
		       sizeof(key->eth.src));

	/* Ethertype, with up to two VLAN tags in front of the payload
	 * protocol. basic.n_proto ends up holding the innermost non-VLAN
	 * ethertype that was supplied.
	 */
	if (tb[TCA_FLOWER_KEY_ETH_TYPE]) {
		ethertype = nla_get_be16(tb[TCA_FLOWER_KEY_ETH_TYPE]);

		if (eth_type_vlan(ethertype)) {
			fl_set_key_vlan(tb, ethertype, TCA_FLOWER_KEY_VLAN_ID,
					TCA_FLOWER_KEY_VLAN_PRIO, &key->vlan,
					&mask->vlan);

			if (tb[TCA_FLOWER_KEY_VLAN_ETH_TYPE]) {
				ethertype = nla_get_be16(tb[TCA_FLOWER_KEY_VLAN_ETH_TYPE]);
				if (eth_type_vlan(ethertype)) {
					/* Second (customer) VLAN tag. */
					fl_set_key_vlan(tb, ethertype,
							TCA_FLOWER_KEY_CVLAN_ID,
							TCA_FLOWER_KEY_CVLAN_PRIO,
							&key->cvlan, &mask->cvlan);
					fl_set_key_val(tb, &key->basic.n_proto,
						       TCA_FLOWER_KEY_CVLAN_ETH_TYPE,
						       &mask->basic.n_proto,
						       TCA_FLOWER_UNSPEC,
						       sizeof(key->basic.n_proto));
				} else {
					key->basic.n_proto = ethertype;
					mask->basic.n_proto = cpu_to_be16(~0);
				}
			}
		} else {
			key->basic.n_proto = ethertype;
			mask->basic.n_proto = cpu_to_be16(~0);
		}
	}

	/* IP protocol, TOS and TTL are only read for IPv4/IPv6 filters. */
	if (key->basic.n_proto == htons(ETH_P_IP) ||
	    key->basic.n_proto == htons(ETH_P_IPV6)) {
		fl_set_key_val(tb, &key->basic.ip_proto, TCA_FLOWER_KEY_IP_PROTO,
			       &mask->basic.ip_proto, TCA_FLOWER_UNSPEC,
			       sizeof(key->basic.ip_proto));
		fl_set_key_ip(tb, false, &key->ip, &mask->ip);
	}

	/* Addresses: IPv4 attributes take precedence over IPv6 ones. */
	if (tb[TCA_FLOWER_KEY_IPV4_SRC] || tb[TCA_FLOWER_KEY_IPV4_DST]) {
		key->control.addr_type = FLOW_DISSECTOR_KEY_IPV4_ADDRS;
		mask->control.addr_type = ~0;
		fl_set_key_val(tb, &key->ipv4.src, TCA_FLOWER_KEY_IPV4_SRC,
			       &mask->ipv4.src, TCA_FLOWER_KEY_IPV4_SRC_MASK,
			       sizeof(key->ipv4.src));
		fl_set_key_val(tb, &key->ipv4.dst, TCA_FLOWER_KEY_IPV4_DST,
			       &mask->ipv4.dst, TCA_FLOWER_KEY_IPV4_DST_MASK,
			       sizeof(key->ipv4.dst));
	} else if (tb[TCA_FLOWER_KEY_IPV6_SRC] || tb[TCA_FLOWER_KEY_IPV6_DST]) {
		key->control.addr_type = FLOW_DISSECTOR_KEY_IPV6_ADDRS;
		mask->control.addr_type = ~0;
		fl_set_key_val(tb, &key->ipv6.src, TCA_FLOWER_KEY_IPV6_SRC,
			       &mask->ipv6.src, TCA_FLOWER_KEY_IPV6_SRC_MASK,
			       sizeof(key->ipv6.src));
		fl_set_key_val(tb, &key->ipv6.dst, TCA_FLOWER_KEY_IPV6_DST,
			       &mask->ipv6.dst, TCA_FLOWER_KEY_IPV6_DST_MASK,
			       sizeof(key->ipv6.dst));
	}

	/* Protocol-specific fields; exactly one branch (or none) applies. */
	if (key->basic.ip_proto == IPPROTO_TCP) {
		fl_set_key_val(tb, &key->tp.src, TCA_FLOWER_KEY_TCP_SRC,
			       &mask->tp.src, TCA_FLOWER_KEY_TCP_SRC_MASK,
			       sizeof(key->tp.src));
		fl_set_key_val(tb, &key->tp.dst, TCA_FLOWER_KEY_TCP_DST,
			       &mask->tp.dst, TCA_FLOWER_KEY_TCP_DST_MASK,
			       sizeof(key->tp.dst));
		fl_set_key_val(tb, &key->tcp.flags, TCA_FLOWER_KEY_TCP_FLAGS,
			       &mask->tcp.flags, TCA_FLOWER_KEY_TCP_FLAGS_MASK,
			       sizeof(key->tcp.flags));
	} else if (key->basic.ip_proto == IPPROTO_UDP) {
		fl_set_key_val(tb, &key->tp.src, TCA_FLOWER_KEY_UDP_SRC,
			       &mask->tp.src, TCA_FLOWER_KEY_UDP_SRC_MASK,
			       sizeof(key->tp.src));
		fl_set_key_val(tb, &key->tp.dst, TCA_FLOWER_KEY_UDP_DST,
			       &mask->tp.dst, TCA_FLOWER_KEY_UDP_DST_MASK,
			       sizeof(key->tp.dst));
	} else if (key->basic.ip_proto == IPPROTO_SCTP) {
		fl_set_key_val(tb, &key->tp.src, TCA_FLOWER_KEY_SCTP_SRC,
			       &mask->tp.src, TCA_FLOWER_KEY_SCTP_SRC_MASK,
			       sizeof(key->tp.src));
		fl_set_key_val(tb, &key->tp.dst, TCA_FLOWER_KEY_SCTP_DST,
			       &mask->tp.dst, TCA_FLOWER_KEY_SCTP_DST_MASK,
			       sizeof(key->tp.dst));
	} else if (key->basic.n_proto == htons(ETH_P_IP) &&
		   key->basic.ip_proto == IPPROTO_ICMP) {
		fl_set_key_val(tb, &key->icmp.type, TCA_FLOWER_KEY_ICMPV4_TYPE,
			       &mask->icmp.type,
			       TCA_FLOWER_KEY_ICMPV4_TYPE_MASK,
			       sizeof(key->icmp.type));
		fl_set_key_val(tb, &key->icmp.code, TCA_FLOWER_KEY_ICMPV4_CODE,
			       &mask->icmp.code,
			       TCA_FLOWER_KEY_ICMPV4_CODE_MASK,
			       sizeof(key->icmp.code));
	} else if (key->basic.n_proto == htons(ETH_P_IPV6) &&
		   key->basic.ip_proto == IPPROTO_ICMPV6) {
		fl_set_key_val(tb, &key->icmp.type, TCA_FLOWER_KEY_ICMPV6_TYPE,
			       &mask->icmp.type,
			       TCA_FLOWER_KEY_ICMPV6_TYPE_MASK,
			       sizeof(key->icmp.type));
		fl_set_key_val(tb, &key->icmp.code, TCA_FLOWER_KEY_ICMPV6_CODE,
			       &mask->icmp.code,
			       TCA_FLOWER_KEY_ICMPV6_CODE_MASK,
			       sizeof(key->icmp.code));
	} else if (key->basic.n_proto == htons(ETH_P_MPLS_UC) ||
		   key->basic.n_proto == htons(ETH_P_MPLS_MC)) {
		ret = fl_set_key_mpls(tb, &key->mpls, &mask->mpls);
		if (ret)
			return ret;
	} else if (key->basic.n_proto == htons(ETH_P_ARP) ||
		   key->basic.n_proto == htons(ETH_P_RARP)) {
		fl_set_key_val(tb, &key->arp.sip, TCA_FLOWER_KEY_ARP_SIP,
			       &mask->arp.sip, TCA_FLOWER_KEY_ARP_SIP_MASK,
			       sizeof(key->arp.sip));
		fl_set_key_val(tb, &key->arp.tip, TCA_FLOWER_KEY_ARP_TIP,
			       &mask->arp.tip, TCA_FLOWER_KEY_ARP_TIP_MASK,
			       sizeof(key->arp.tip));
		fl_set_key_val(tb, &key->arp.op, TCA_FLOWER_KEY_ARP_OP,
			       &mask->arp.op, TCA_FLOWER_KEY_ARP_OP_MASK,
			       sizeof(key->arp.op));
		fl_set_key_val(tb, key->arp.sha, TCA_FLOWER_KEY_ARP_SHA,
			       mask->arp.sha, TCA_FLOWER_KEY_ARP_SHA_MASK,
			       sizeof(key->arp.sha));
		fl_set_key_val(tb, key->arp.tha, TCA_FLOWER_KEY_ARP_THA,
			       mask->arp.tha, TCA_FLOWER_KEY_ARP_THA_MASK,
			       sizeof(key->arp.tha));
	}

	/* Outer (tunnel) addresses. The two blocks are independent; if both
	 * IPv4 and IPv6 attributes are present the IPv6 block runs last and
	 * its addr_type wins.
	 */
	if (tb[TCA_FLOWER_KEY_ENC_IPV4_SRC] ||
	    tb[TCA_FLOWER_KEY_ENC_IPV4_DST]) {
		key->enc_control.addr_type = FLOW_DISSECTOR_KEY_IPV4_ADDRS;
		mask->enc_control.addr_type = ~0;
		fl_set_key_val(tb, &key->enc_ipv4.src,
			       TCA_FLOWER_KEY_ENC_IPV4_SRC,
			       &mask->enc_ipv4.src,
			       TCA_FLOWER_KEY_ENC_IPV4_SRC_MASK,
			       sizeof(key->enc_ipv4.src));
		fl_set_key_val(tb, &key->enc_ipv4.dst,
			       TCA_FLOWER_KEY_ENC_IPV4_DST,
			       &mask->enc_ipv4.dst,
			       TCA_FLOWER_KEY_ENC_IPV4_DST_MASK,
			       sizeof(key->enc_ipv4.dst));
	}

	if (tb[TCA_FLOWER_KEY_ENC_IPV6_SRC] ||
	    tb[TCA_FLOWER_KEY_ENC_IPV6_DST]) {
		key->enc_control.addr_type = FLOW_DISSECTOR_KEY_IPV6_ADDRS;
		mask->enc_control.addr_type = ~0;
		fl_set_key_val(tb, &key->enc_ipv6.src,
			       TCA_FLOWER_KEY_ENC_IPV6_SRC,
			       &mask->enc_ipv6.src,
			       TCA_FLOWER_KEY_ENC_IPV6_SRC_MASK,
			       sizeof(key->enc_ipv6.src));
		fl_set_key_val(tb, &key->enc_ipv6.dst,
			       TCA_FLOWER_KEY_ENC_IPV6_DST,
			       &mask->enc_ipv6.dst,
			       TCA_FLOWER_KEY_ENC_IPV6_DST_MASK,
			       sizeof(key->enc_ipv6.dst));
	}

	/* Tunnel key id is always matched exactly (no mask attribute). */
	fl_set_key_val(tb, &key->enc_key_id.keyid, TCA_FLOWER_KEY_ENC_KEY_ID,
		       &mask->enc_key_id.keyid, TCA_FLOWER_UNSPEC,
		       sizeof(key->enc_key_id.keyid));

	fl_set_key_val(tb, &key->enc_tp.src, TCA_FLOWER_KEY_ENC_UDP_SRC_PORT,
		       &mask->enc_tp.src, TCA_FLOWER_KEY_ENC_UDP_SRC_PORT_MASK,
		       sizeof(key->enc_tp.src));

	fl_set_key_val(tb, &key->enc_tp.dst, TCA_FLOWER_KEY_ENC_UDP_DST_PORT,
		       &mask->enc_tp.dst, TCA_FLOWER_KEY_ENC_UDP_DST_PORT_MASK,
		       sizeof(key->enc_tp.dst));

	fl_set_key_ip(tb, true, &key->enc_ip, &mask->enc_ip);

	if (tb[TCA_FLOWER_KEY_ENC_OPTS]) {
		ret = fl_set_enc_opt(tb, key, mask, extack);
		if (ret)
			return ret;
	}

	if (tb[TCA_FLOWER_KEY_FLAGS])
		ret = fl_set_key_flags(tb, &key->control.flags, &mask->control.flags);

	return ret;
}
981
982static void fl_mask_copy(struct fl_flow_mask *dst,
983 struct fl_flow_mask *src)
984{
985 const void *psrc = fl_key_get_start(&src->key, src);
986 void *pdst = fl_key_get_start(&dst->key, src);
987
988 memcpy(pdst, psrc, fl_mask_range(src));
989 dst->range = src->range;
990}
991
992static const struct rhashtable_params fl_ht_params = {
993 .key_offset = offsetof(struct cls_fl_filter, mkey), /* base offset */
994 .head_offset = offsetof(struct cls_fl_filter, ht_node),
995 .automatic_shrinking = true,
996};
997
998static int fl_init_mask_hashtable(struct fl_flow_mask *mask)
999{
1000 mask->filter_ht_params = fl_ht_params;
1001 mask->filter_ht_params.key_len = fl_mask_range(mask);
1002 mask->filter_ht_params.key_offset += mask->range.start;
1003
1004 return rhashtable_init(&mask->ht, &mask->filter_ht_params);
1005}
1006
/* Byte offset and size of @member inside struct fl_flow_key. */
#define FL_KEY_MEMBER_OFFSET(member) offsetof(struct fl_flow_key, member)
#define FL_KEY_MEMBER_SIZE(member) (sizeof(((struct fl_flow_key *) 0)->member))

/*
 * Non-NULL when at least one byte of @member within @mask is non-zero
 * (memchr_inv() is asked to find a byte that differs from 0).
 */
#define FL_KEY_IS_MASKED(mask, member)					\
	memchr_inv(((char *)(mask)) + FL_KEY_MEMBER_OFFSET(member),	\
		   0, FL_KEY_MEMBER_SIZE(member))

/*
 * Append a dissector key entry for @member to @keys and advance @cnt.
 *
 * No trailing semicolon after while (0): the caller supplies it, so the
 * macro behaves as a single statement and is safe in if/else bodies.
 */
#define FL_KEY_SET(keys, cnt, id, member)				\
	do {								\
		(keys)[cnt].key_id = (id);				\
		(keys)[cnt].offset = FL_KEY_MEMBER_OFFSET(member);	\
		(cnt)++;						\
	} while (0)

/* Same as FL_KEY_SET(), but only when @member is masked in @mask. */
#define FL_KEY_SET_IF_MASKED(mask, keys, cnt, id, member)		\
	do {								\
		if (FL_KEY_IS_MASKED(mask, member))			\
			FL_KEY_SET(keys, cnt, id, member);		\
	} while (0)
1026
1027static void fl_init_dissector(struct flow_dissector *dissector,
1028 struct fl_flow_key *mask)
1029{
1030 struct flow_dissector_key keys[FLOW_DISSECTOR_KEY_MAX];
1031 size_t cnt = 0;
1032
1033 FL_KEY_SET(keys, cnt, FLOW_DISSECTOR_KEY_CONTROL, control);
1034 FL_KEY_SET(keys, cnt, FLOW_DISSECTOR_KEY_BASIC, basic);
1035 FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1036 FLOW_DISSECTOR_KEY_ETH_ADDRS, eth);
1037 FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1038 FLOW_DISSECTOR_KEY_IPV4_ADDRS, ipv4);
1039 FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1040 FLOW_DISSECTOR_KEY_IPV6_ADDRS, ipv6);
1041 FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1042 FLOW_DISSECTOR_KEY_PORTS, tp);
1043 FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1044 FLOW_DISSECTOR_KEY_IP, ip);
1045 FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1046 FLOW_DISSECTOR_KEY_TCP, tcp);
1047 FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1048 FLOW_DISSECTOR_KEY_ICMP, icmp);
1049 FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1050 FLOW_DISSECTOR_KEY_ARP, arp);
1051 FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1052 FLOW_DISSECTOR_KEY_MPLS, mpls);
1053 FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1054 FLOW_DISSECTOR_KEY_VLAN, vlan);
1055 FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1056 FLOW_DISSECTOR_KEY_CVLAN, cvlan);
1057 FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1058 FLOW_DISSECTOR_KEY_ENC_KEYID, enc_key_id);
1059 FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1060 FLOW_DISSECTOR_KEY_ENC_IPV4_ADDRS, enc_ipv4);
1061 FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1062 FLOW_DISSECTOR_KEY_ENC_IPV6_ADDRS, enc_ipv6);
1063 if (FL_KEY_IS_MASKED(mask, enc_ipv4) ||
1064 FL_KEY_IS_MASKED(mask, enc_ipv6))
1065 FL_KEY_SET(keys, cnt, FLOW_DISSECTOR_KEY_ENC_CONTROL,
1066 enc_control);
1067 FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1068 FLOW_DISSECTOR_KEY_ENC_PORTS, enc_tp);
1069 FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1070 FLOW_DISSECTOR_KEY_ENC_IP, enc_ip);
1071 FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1072 FLOW_DISSECTOR_KEY_ENC_OPTS, enc_opts);
1073
1074 skb_flow_dissector_init(dissector, keys, cnt);
1075}
1076
1077static struct fl_flow_mask *fl_create_new_mask(struct cls_fl_head *head,
1078 struct fl_flow_mask *mask)
1079{
1080 struct fl_flow_mask *newmask;
1081 int err;
1082
1083 newmask = kzalloc(sizeof(*newmask), GFP_KERNEL);
1084 if (!newmask)
1085 return ERR_PTR(-ENOMEM);
1086
1087 fl_mask_copy(newmask, mask);
1088
1089 err = fl_init_mask_hashtable(newmask);
1090 if (err)
1091 goto errout_free;
1092
1093 fl_init_dissector(&newmask->dissector, &newmask->key);
1094
1095 INIT_LIST_HEAD_RCU(&newmask->filters);
1096
1097 err = rhashtable_insert_fast(&head->ht, &newmask->ht_node,
1098 mask_ht_params);
1099 if (err)
1100 goto errout_destroy;
1101
1102 list_add_tail_rcu(&newmask->list, &head->masks);
1103
1104 return newmask;
1105
1106errout_destroy:
1107 rhashtable_destroy(&newmask->ht);
1108errout_free:
1109 kfree(newmask);
1110
1111 return ERR_PTR(err);
1112}
1113
1114static int fl_check_assign_mask(struct cls_fl_head *head,
1115 struct cls_fl_filter *fnew,
1116 struct cls_fl_filter *fold,
1117 struct fl_flow_mask *mask)
1118{
1119 struct fl_flow_mask *newmask;
1120
1121 fnew->mask = rhashtable_lookup_fast(&head->ht, mask, mask_ht_params);
1122 if (!fnew->mask) {
1123 if (fold)
1124 return -EINVAL;
1125
1126 newmask = fl_create_new_mask(head, mask);
1127 if (IS_ERR(newmask))
1128 return PTR_ERR(newmask);
1129
1130 fnew->mask = newmask;
1131 } else if (fold && fold->mask != fnew->mask) {
1132 return -EINVAL;
1133 }
1134
1135 return 0;
1136}
1137
1138static int fl_set_parms(struct net *net, struct tcf_proto *tp,
1139 struct cls_fl_filter *f, struct fl_flow_mask *mask,
1140 unsigned long base, struct nlattr **tb,
1141 struct nlattr *est, bool ovr,
1142 struct fl_flow_tmplt *tmplt,
1143 struct netlink_ext_ack *extack)
1144{
1145 int err;
1146
1147 err = tcf_exts_validate(net, tp, tb, est, &f->exts, ovr, extack);
1148 if (err < 0)
1149 return err;
1150
1151 if (tb[TCA_FLOWER_CLASSID]) {
1152 f->res.classid = nla_get_u32(tb[TCA_FLOWER_CLASSID]);
1153 tcf_bind_filter(tp, &f->res, base);
1154 }
1155
1156 err = fl_set_key(net, tb, &f->key, &mask->key, extack);
1157 if (err)
1158 return err;
1159
1160 fl_mask_update_range(mask);
1161 fl_set_masked_key(&f->mkey, &f->key, mask);
1162
1163 if (!fl_mask_fits_tmplt(tmplt, mask)) {
1164 NL_SET_ERR_MSG_MOD(extack, "Mask does not fit the template");
1165 return -EINVAL;
1166 }
1167
1168 return 0;
1169}
1170
1171static int fl_change(struct net *net, struct sk_buff *in_skb,
1172 struct tcf_proto *tp, unsigned long base,
1173 u32 handle, struct nlattr **tca,
1174 void **arg, bool ovr, struct netlink_ext_ack *extack)
1175{
1176 struct cls_fl_head *head = rtnl_dereference(tp->root);
1177 struct cls_fl_filter *fold = *arg;
1178 struct cls_fl_filter *fnew;
1179 struct fl_flow_mask *mask;
1180 struct nlattr **tb;
1181 int err;
1182
1183 if (!tca[TCA_OPTIONS])
1184 return -EINVAL;
1185
1186 mask = kzalloc(sizeof(struct fl_flow_mask), GFP_KERNEL);
1187 if (!mask)
1188 return -ENOBUFS;
1189
1190 tb = kcalloc(TCA_FLOWER_MAX + 1, sizeof(struct nlattr *), GFP_KERNEL);
1191 if (!tb) {
1192 err = -ENOBUFS;
1193 goto errout_mask_alloc;
1194 }
1195
1196 err = nla_parse_nested(tb, TCA_FLOWER_MAX, tca[TCA_OPTIONS],
1197 fl_policy, NULL);
1198 if (err < 0)
1199 goto errout_tb;
1200
1201 if (fold && handle && fold->handle != handle) {
1202 err = -EINVAL;
1203 goto errout_tb;
1204 }
1205
1206 fnew = kzalloc(sizeof(*fnew), GFP_KERNEL);
1207 if (!fnew) {
1208 err = -ENOBUFS;
1209 goto errout_tb;
1210 }
1211
1212 err = tcf_exts_init(&fnew->exts, TCA_FLOWER_ACT, 0);
1213 if (err < 0)
1214 goto errout;
1215
1216 if (tb[TCA_FLOWER_FLAGS]) {
1217 fnew->flags = nla_get_u32(tb[TCA_FLOWER_FLAGS]);
1218
1219 if (!tc_flags_valid(fnew->flags)) {
1220 err = -EINVAL;
1221 goto errout;
1222 }
1223 }
1224
1225 err = fl_set_parms(net, tp, fnew, mask, base, tb, tca[TCA_RATE], ovr,
1226 tp->chain->tmplt_priv, extack);
1227 if (err)
1228 goto errout;
1229
1230 err = fl_check_assign_mask(head, fnew, fold, mask);
1231 if (err)
1232 goto errout;
1233
1234 if (!handle) {
1235 handle = 1;
1236 err = idr_alloc_u32(&head->handle_idr, fnew, &handle,
1237 INT_MAX, GFP_KERNEL);
1238 } else if (!fold) {
1239 /* user specifies a handle and it doesn't exist */
1240 err = idr_alloc_u32(&head->handle_idr, fnew, &handle,
1241 handle, GFP_KERNEL);
1242 }
1243 if (err)
1244 goto errout_mask;
1245 fnew->handle = handle;
1246
1247 if (!tc_skip_sw(fnew->flags)) {
1248 if (!fold && fl_lookup(fnew->mask, &fnew->mkey)) {
1249 err = -EEXIST;
1250 goto errout_idr;
1251 }
1252
1253 err = rhashtable_insert_fast(&fnew->mask->ht, &fnew->ht_node,
1254 fnew->mask->filter_ht_params);
1255 if (err)
1256 goto errout_idr;
1257 }
1258
1259 if (!tc_skip_hw(fnew->flags)) {
1260 err = fl_hw_replace_filter(tp, fnew, extack);
1261 if (err)
1262 goto errout_mask;
1263 }
1264
1265 if (!tc_in_hw(fnew->flags))
1266 fnew->flags |= TCA_CLS_FLAGS_NOT_IN_HW;
1267
1268 if (fold) {
1269 if (!tc_skip_sw(fold->flags))
1270 rhashtable_remove_fast(&fold->mask->ht,
1271 &fold->ht_node,
1272 fold->mask->filter_ht_params);
1273 if (!tc_skip_hw(fold->flags))
1274 fl_hw_destroy_filter(tp, fold, NULL);
1275 }
1276
1277 *arg = fnew;
1278
1279 if (fold) {
1280 idr_replace(&head->handle_idr, fnew, fnew->handle);
1281 list_replace_rcu(&fold->list, &fnew->list);
1282 tcf_unbind_filter(tp, &fold->res);
1283 tcf_exts_get_net(&fold->exts);
1284 tcf_queue_work(&fold->rwork, fl_destroy_filter_work);
1285 } else {
1286 list_add_tail_rcu(&fnew->list, &fnew->mask->filters);
1287 }
1288
1289 kfree(tb);
1290 kfree(mask);
1291 return 0;
1292
1293errout_idr:
1294 if (!fold)
1295 idr_remove(&head->handle_idr, fnew->handle);
1296
1297errout_mask:
1298 fl_mask_put(head, fnew->mask, false);
1299
1300errout:
1301 tcf_exts_destroy(&fnew->exts);
1302 kfree(fnew);
1303errout_tb:
1304 kfree(tb);
1305errout_mask_alloc:
1306 kfree(mask);
1307 return err;
1308}
1309
1310static int fl_delete(struct tcf_proto *tp, void *arg, bool *last,
1311 struct netlink_ext_ack *extack)
1312{
1313 struct cls_fl_head *head = rtnl_dereference(tp->root);
1314 struct cls_fl_filter *f = arg;
1315
1316 if (!tc_skip_sw(f->flags))
1317 rhashtable_remove_fast(&f->mask->ht, &f->ht_node,
1318 f->mask->filter_ht_params);
1319 __fl_delete(tp, f, extack);
1320 *last = list_empty(&head->masks);
1321 return 0;
1322}
1323
1324static void fl_walk(struct tcf_proto *tp, struct tcf_walker *arg)
1325{
1326 struct cls_fl_head *head = rtnl_dereference(tp->root);
1327 struct cls_fl_filter *f;
1328
1329 arg->count = arg->skip;
1330
1331 while ((f = idr_get_next_ul(&head->handle_idr,
1332 &arg->cookie)) != NULL) {
1333 if (arg->fn(tp, f, arg) < 0) {
1334 arg->stop = 1;
1335 break;
1336 }
1337 arg->cookie = f->handle + 1;
1338 arg->count++;
1339 }
1340}
1341
1342static int fl_reoffload(struct tcf_proto *tp, bool add, tc_setup_cb_t *cb,
1343 void *cb_priv, struct netlink_ext_ack *extack)
1344{
1345 struct cls_fl_head *head = rtnl_dereference(tp->root);
1346 struct tc_cls_flower_offload cls_flower = {};
1347 struct tcf_block *block = tp->chain->block;
1348 struct fl_flow_mask *mask;
1349 struct cls_fl_filter *f;
1350 int err;
1351
1352 list_for_each_entry(mask, &head->masks, list) {
1353 list_for_each_entry(f, &mask->filters, list) {
1354 if (tc_skip_hw(f->flags))
1355 continue;
1356
1357 tc_cls_common_offload_init(&cls_flower.common, tp,
1358 f->flags, extack);
1359 cls_flower.command = add ?
1360 TC_CLSFLOWER_REPLACE : TC_CLSFLOWER_DESTROY;
1361 cls_flower.cookie = (unsigned long)f;
1362 cls_flower.dissector = &mask->dissector;
1363 cls_flower.mask = &mask->key;
1364 cls_flower.key = &f->mkey;
1365 cls_flower.exts = &f->exts;
1366 cls_flower.classid = f->res.classid;
1367
1368 err = cb(TC_SETUP_CLSFLOWER, &cls_flower, cb_priv);
1369 if (err) {
1370 if (add && tc_skip_sw(f->flags))
1371 return err;
1372 continue;
1373 }
1374
1375 tc_cls_offload_cnt_update(block, &f->in_hw_count,
1376 &f->flags, add);
1377 }
1378 }
1379
1380 return 0;
1381}
1382
1383static void fl_hw_create_tmplt(struct tcf_chain *chain,
1384 struct fl_flow_tmplt *tmplt)
1385{
1386 struct tc_cls_flower_offload cls_flower = {};
1387 struct tcf_block *block = chain->block;
1388 struct tcf_exts dummy_exts = { 0, };
1389
1390 cls_flower.common.chain_index = chain->index;
1391 cls_flower.command = TC_CLSFLOWER_TMPLT_CREATE;
1392 cls_flower.cookie = (unsigned long) tmplt;
1393 cls_flower.dissector = &tmplt->dissector;
1394 cls_flower.mask = &tmplt->mask;
1395 cls_flower.key = &tmplt->dummy_key;
1396 cls_flower.exts = &dummy_exts;
1397
1398 /* We don't care if driver (any of them) fails to handle this
1399 * call. It serves just as a hint for it.
1400 */
1401 tc_setup_cb_call(block, NULL, TC_SETUP_CLSFLOWER,
1402 &cls_flower, false);
1403}
1404
1405static void fl_hw_destroy_tmplt(struct tcf_chain *chain,
1406 struct fl_flow_tmplt *tmplt)
1407{
1408 struct tc_cls_flower_offload cls_flower = {};
1409 struct tcf_block *block = chain->block;
1410
1411 cls_flower.common.chain_index = chain->index;
1412 cls_flower.command = TC_CLSFLOWER_TMPLT_DESTROY;
1413 cls_flower.cookie = (unsigned long) tmplt;
1414
1415 tc_setup_cb_call(block, NULL, TC_SETUP_CLSFLOWER,
1416 &cls_flower, false);
1417}
1418
1419static void *fl_tmplt_create(struct net *net, struct tcf_chain *chain,
1420 struct nlattr **tca,
1421 struct netlink_ext_ack *extack)
1422{
1423 struct fl_flow_tmplt *tmplt;
1424 struct nlattr **tb;
1425 int err;
1426
1427 if (!tca[TCA_OPTIONS])
1428 return ERR_PTR(-EINVAL);
1429
1430 tb = kcalloc(TCA_FLOWER_MAX + 1, sizeof(struct nlattr *), GFP_KERNEL);
1431 if (!tb)
1432 return ERR_PTR(-ENOBUFS);
1433 err = nla_parse_nested(tb, TCA_FLOWER_MAX, tca[TCA_OPTIONS],
1434 fl_policy, NULL);
1435 if (err)
1436 goto errout_tb;
1437
1438 tmplt = kzalloc(sizeof(*tmplt), GFP_KERNEL);
1439 if (!tmplt) {
1440 err = -ENOMEM;
1441 goto errout_tb;
1442 }
1443 tmplt->chain = chain;
1444 err = fl_set_key(net, tb, &tmplt->dummy_key, &tmplt->mask, extack);
1445 if (err)
1446 goto errout_tmplt;
1447 kfree(tb);
1448
1449 fl_init_dissector(&tmplt->dissector, &tmplt->mask);
1450
1451 fl_hw_create_tmplt(chain, tmplt);
1452
1453 return tmplt;
1454
1455errout_tmplt:
1456 kfree(tmplt);
1457errout_tb:
1458 kfree(tb);
1459 return ERR_PTR(err);
1460}
1461
1462static void fl_tmplt_destroy(void *tmplt_priv)
1463{
1464 struct fl_flow_tmplt *tmplt = tmplt_priv;
1465
1466 fl_hw_destroy_tmplt(tmplt->chain, tmplt);
1467 kfree(tmplt);
1468}
1469
1470static int fl_dump_key_val(struct sk_buff *skb,
1471 void *val, int val_type,
1472 void *mask, int mask_type, int len)
1473{
1474 int err;
1475
1476 if (!memchr_inv(mask, 0, len))
1477 return 0;
1478 err = nla_put(skb, val_type, len, val);
1479 if (err)
1480 return err;
1481 if (mask_type != TCA_FLOWER_UNSPEC) {
1482 err = nla_put(skb, mask_type, len, mask);
1483 if (err)
1484 return err;
1485 }
1486 return 0;
1487}
1488
1489static int fl_dump_key_mpls(struct sk_buff *skb,
1490 struct flow_dissector_key_mpls *mpls_key,
1491 struct flow_dissector_key_mpls *mpls_mask)
1492{
1493 int err;
1494
1495 if (!memchr_inv(mpls_mask, 0, sizeof(*mpls_mask)))
1496 return 0;
1497 if (mpls_mask->mpls_ttl) {
1498 err = nla_put_u8(skb, TCA_FLOWER_KEY_MPLS_TTL,
1499 mpls_key->mpls_ttl);
1500 if (err)
1501 return err;
1502 }
1503 if (mpls_mask->mpls_tc) {
1504 err = nla_put_u8(skb, TCA_FLOWER_KEY_MPLS_TC,
1505 mpls_key->mpls_tc);
1506 if (err)
1507 return err;
1508 }
1509 if (mpls_mask->mpls_label) {
1510 err = nla_put_u32(skb, TCA_FLOWER_KEY_MPLS_LABEL,
1511 mpls_key->mpls_label);
1512 if (err)
1513 return err;
1514 }
1515 if (mpls_mask->mpls_bos) {
1516 err = nla_put_u8(skb, TCA_FLOWER_KEY_MPLS_BOS,
1517 mpls_key->mpls_bos);
1518 if (err)
1519 return err;
1520 }
1521 return 0;
1522}
1523
1524static int fl_dump_key_ip(struct sk_buff *skb, bool encap,
1525 struct flow_dissector_key_ip *key,
1526 struct flow_dissector_key_ip *mask)
1527{
1528 int tos_key = encap ? TCA_FLOWER_KEY_ENC_IP_TOS : TCA_FLOWER_KEY_IP_TOS;
1529 int ttl_key = encap ? TCA_FLOWER_KEY_ENC_IP_TTL : TCA_FLOWER_KEY_IP_TTL;
1530 int tos_mask = encap ? TCA_FLOWER_KEY_ENC_IP_TOS_MASK : TCA_FLOWER_KEY_IP_TOS_MASK;
1531 int ttl_mask = encap ? TCA_FLOWER_KEY_ENC_IP_TTL_MASK : TCA_FLOWER_KEY_IP_TTL_MASK;
1532
1533 if (fl_dump_key_val(skb, &key->tos, tos_key, &mask->tos, tos_mask, sizeof(key->tos)) ||
1534 fl_dump_key_val(skb, &key->ttl, ttl_key, &mask->ttl, ttl_mask, sizeof(key->ttl)))
1535 return -1;
1536
1537 return 0;
1538}
1539
1540static int fl_dump_key_vlan(struct sk_buff *skb,
1541 int vlan_id_key, int vlan_prio_key,
1542 struct flow_dissector_key_vlan *vlan_key,
1543 struct flow_dissector_key_vlan *vlan_mask)
1544{
1545 int err;
1546
1547 if (!memchr_inv(vlan_mask, 0, sizeof(*vlan_mask)))
1548 return 0;
1549 if (vlan_mask->vlan_id) {
1550 err = nla_put_u16(skb, vlan_id_key,
1551 vlan_key->vlan_id);
1552 if (err)
1553 return err;
1554 }
1555 if (vlan_mask->vlan_priority) {
1556 err = nla_put_u8(skb, vlan_prio_key,
1557 vlan_key->vlan_priority);
1558 if (err)
1559 return err;
1560 }
1561 return 0;
1562}
1563
1564static void fl_get_key_flag(u32 dissector_key, u32 dissector_mask,
1565 u32 *flower_key, u32 *flower_mask,
1566 u32 flower_flag_bit, u32 dissector_flag_bit)
1567{
1568 if (dissector_mask & dissector_flag_bit) {
1569 *flower_mask |= flower_flag_bit;
1570 if (dissector_key & dissector_flag_bit)
1571 *flower_key |= flower_flag_bit;
1572 }
1573}
1574
1575static int fl_dump_key_flags(struct sk_buff *skb, u32 flags_key, u32 flags_mask)
1576{
1577 u32 key, mask;
1578 __be32 _key, _mask;
1579 int err;
1580
1581 if (!memchr_inv(&flags_mask, 0, sizeof(flags_mask)))
1582 return 0;
1583
1584 key = 0;
1585 mask = 0;
1586
1587 fl_get_key_flag(flags_key, flags_mask, &key, &mask,
1588 TCA_FLOWER_KEY_FLAGS_IS_FRAGMENT, FLOW_DIS_IS_FRAGMENT);
1589 fl_get_key_flag(flags_key, flags_mask, &key, &mask,
1590 TCA_FLOWER_KEY_FLAGS_FRAG_IS_FIRST,
1591 FLOW_DIS_FIRST_FRAG);
1592
1593 _key = cpu_to_be32(key);
1594 _mask = cpu_to_be32(mask);
1595
1596 err = nla_put(skb, TCA_FLOWER_KEY_FLAGS, 4, &_key);
1597 if (err)
1598 return err;
1599
1600 return nla_put(skb, TCA_FLOWER_KEY_FLAGS_MASK, 4, &_mask);
1601}
1602
1603static int fl_dump_key_geneve_opt(struct sk_buff *skb,
1604 struct flow_dissector_key_enc_opts *enc_opts)
1605{
1606 struct geneve_opt *opt;
1607 struct nlattr *nest;
1608 int opt_off = 0;
1609
1610 nest = nla_nest_start(skb, TCA_FLOWER_KEY_ENC_OPTS_GENEVE);
1611 if (!nest)
1612 goto nla_put_failure;
1613
1614 while (enc_opts->len > opt_off) {
1615 opt = (struct geneve_opt *)&enc_opts->data[opt_off];
1616
1617 if (nla_put_be16(skb, TCA_FLOWER_KEY_ENC_OPT_GENEVE_CLASS,
1618 opt->opt_class))
1619 goto nla_put_failure;
1620 if (nla_put_u8(skb, TCA_FLOWER_KEY_ENC_OPT_GENEVE_TYPE,
1621 opt->type))
1622 goto nla_put_failure;
1623 if (nla_put(skb, TCA_FLOWER_KEY_ENC_OPT_GENEVE_DATA,
1624 opt->length * 4, opt->opt_data))
1625 goto nla_put_failure;
1626
1627 opt_off += sizeof(struct geneve_opt) + opt->length * 4;
1628 }
1629 nla_nest_end(skb, nest);
1630 return 0;
1631
1632nla_put_failure:
1633 nla_nest_cancel(skb, nest);
1634 return -EMSGSIZE;
1635}
1636
1637static int fl_dump_key_options(struct sk_buff *skb, int enc_opt_type,
1638 struct flow_dissector_key_enc_opts *enc_opts)
1639{
1640 struct nlattr *nest;
1641 int err;
1642
1643 if (!enc_opts->len)
1644 return 0;
1645
1646 nest = nla_nest_start(skb, enc_opt_type);
1647 if (!nest)
1648 goto nla_put_failure;
1649
1650 switch (enc_opts->dst_opt_type) {
1651 case TUNNEL_GENEVE_OPT:
1652 err = fl_dump_key_geneve_opt(skb, enc_opts);
1653 if (err)
1654 goto nla_put_failure;
1655 break;
1656 default:
1657 goto nla_put_failure;
1658 }
1659 nla_nest_end(skb, nest);
1660 return 0;
1661
1662nla_put_failure:
1663 nla_nest_cancel(skb, nest);
1664 return -EMSGSIZE;
1665}
1666
1667static int fl_dump_key_enc_opt(struct sk_buff *skb,
1668 struct flow_dissector_key_enc_opts *key_opts,
1669 struct flow_dissector_key_enc_opts *msk_opts)
1670{
1671 int err;
1672
1673 err = fl_dump_key_options(skb, TCA_FLOWER_KEY_ENC_OPTS, key_opts);
1674 if (err)
1675 return err;
1676
1677 return fl_dump_key_options(skb, TCA_FLOWER_KEY_ENC_OPTS_MASK, msk_opts);
1678}
1679
/*
 * Dump a flower @key / @mask pair into @skb as TCA_FLOWER_* attributes.
 *
 * Most fields go through fl_dump_key_val(), which emits nothing for a field
 * whose mask is all zero.  Which groups of fields are considered depends on
 * the values stored in @key (ethertype, IP protocol, address type).
 *
 * Returns 0 on success and -EMSGSIZE as soon as any attribute cannot be
 * added.  Attributes already written are not rolled back here.
 */
static int fl_dump_key(struct sk_buff *skb, struct net *net,
		       struct fl_flow_key *key, struct fl_flow_key *mask)
{
	/* Input device: reported by name; silently omitted if not found. */
	if (mask->indev_ifindex) {
		struct net_device *dev;

		dev = __dev_get_by_index(net, key->indev_ifindex);
		if (dev && nla_put_string(skb, TCA_FLOWER_INDEV, dev->name))
			goto nla_put_failure;
	}

	/* Ethernet addresses and ethertype (ethertype has no mask attribute). */
	if (fl_dump_key_val(skb, key->eth.dst, TCA_FLOWER_KEY_ETH_DST,
			    mask->eth.dst, TCA_FLOWER_KEY_ETH_DST_MASK,
			    sizeof(key->eth.dst)) ||
	    fl_dump_key_val(skb, key->eth.src, TCA_FLOWER_KEY_ETH_SRC,
			    mask->eth.src, TCA_FLOWER_KEY_ETH_SRC_MASK,
			    sizeof(key->eth.src)) ||
	    fl_dump_key_val(skb, &key->basic.n_proto, TCA_FLOWER_KEY_ETH_TYPE,
			    &mask->basic.n_proto, TCA_FLOWER_UNSPEC,
			    sizeof(key->basic.n_proto)))
		goto nla_put_failure;

	if (fl_dump_key_mpls(skb, &key->mpls, &mask->mpls))
		goto nla_put_failure;

	/* Outer VLAN tag. */
	if (fl_dump_key_vlan(skb, TCA_FLOWER_KEY_VLAN_ID,
			     TCA_FLOWER_KEY_VLAN_PRIO, &key->vlan, &mask->vlan))
		goto nla_put_failure;

	/*
	 * Inner (customer) VLAN tag.  When its TPID is masked, that TPID is
	 * reported as TCA_FLOWER_KEY_VLAN_ETH_TYPE.
	 */
	if (fl_dump_key_vlan(skb, TCA_FLOWER_KEY_CVLAN_ID,
			     TCA_FLOWER_KEY_CVLAN_PRIO,
			     &key->cvlan, &mask->cvlan) ||
	    (mask->cvlan.vlan_tpid &&
	     nla_put_be16(skb, TCA_FLOWER_KEY_VLAN_ETH_TYPE,
			  key->cvlan.vlan_tpid)))
		goto nla_put_failure;

	/*
	 * With VLAN matching, basic.n_proto is additionally reported under
	 * the innermost masked tag: CVLAN_ETH_TYPE if the inner TPID is
	 * masked, else VLAN_ETH_TYPE if the outer TPID is masked.
	 */
	if (mask->basic.n_proto) {
		if (mask->cvlan.vlan_tpid) {
			if (nla_put_be16(skb, TCA_FLOWER_KEY_CVLAN_ETH_TYPE,
					 key->basic.n_proto))
				goto nla_put_failure;
		} else if (mask->vlan.vlan_tpid) {
			if (nla_put_be16(skb, TCA_FLOWER_KEY_VLAN_ETH_TYPE,
					 key->basic.n_proto))
				goto nla_put_failure;
		}
	}

	/* IP protocol, TOS and TTL: only for IPv4/IPv6 ethertypes. */
	if ((key->basic.n_proto == htons(ETH_P_IP) ||
	     key->basic.n_proto == htons(ETH_P_IPV6)) &&
	    (fl_dump_key_val(skb, &key->basic.ip_proto, TCA_FLOWER_KEY_IP_PROTO,
			    &mask->basic.ip_proto, TCA_FLOWER_UNSPEC,
			    sizeof(key->basic.ip_proto)) ||
	    fl_dump_key_ip(skb, false, &key->ip, &mask->ip)))
		goto nla_put_failure;

	/* L3 addresses, selected by the control address type. */
	if (key->control.addr_type == FLOW_DISSECTOR_KEY_IPV4_ADDRS &&
	    (fl_dump_key_val(skb, &key->ipv4.src, TCA_FLOWER_KEY_IPV4_SRC,
			     &mask->ipv4.src, TCA_FLOWER_KEY_IPV4_SRC_MASK,
			     sizeof(key->ipv4.src)) ||
	     fl_dump_key_val(skb, &key->ipv4.dst, TCA_FLOWER_KEY_IPV4_DST,
			     &mask->ipv4.dst, TCA_FLOWER_KEY_IPV4_DST_MASK,
			     sizeof(key->ipv4.dst))))
		goto nla_put_failure;
	else if (key->control.addr_type == FLOW_DISSECTOR_KEY_IPV6_ADDRS &&
		 (fl_dump_key_val(skb, &key->ipv6.src, TCA_FLOWER_KEY_IPV6_SRC,
				  &mask->ipv6.src, TCA_FLOWER_KEY_IPV6_SRC_MASK,
				  sizeof(key->ipv6.src)) ||
		  fl_dump_key_val(skb, &key->ipv6.dst, TCA_FLOWER_KEY_IPV6_DST,
				  &mask->ipv6.dst, TCA_FLOWER_KEY_IPV6_DST_MASK,
				  sizeof(key->ipv6.dst))))
		goto nla_put_failure;

	/*
	 * L4 / ARP fields.  The chain below picks at most one protocol:
	 * TCP, UDP, SCTP, ICMPv4, ICMPv6, or ARP/RARP.
	 */
	if (key->basic.ip_proto == IPPROTO_TCP &&
	    (fl_dump_key_val(skb, &key->tp.src, TCA_FLOWER_KEY_TCP_SRC,
			     &mask->tp.src, TCA_FLOWER_KEY_TCP_SRC_MASK,
			     sizeof(key->tp.src)) ||
	     fl_dump_key_val(skb, &key->tp.dst, TCA_FLOWER_KEY_TCP_DST,
			     &mask->tp.dst, TCA_FLOWER_KEY_TCP_DST_MASK,
			     sizeof(key->tp.dst)) ||
	     fl_dump_key_val(skb, &key->tcp.flags, TCA_FLOWER_KEY_TCP_FLAGS,
			     &mask->tcp.flags, TCA_FLOWER_KEY_TCP_FLAGS_MASK,
			     sizeof(key->tcp.flags))))
		goto nla_put_failure;
	else if (key->basic.ip_proto == IPPROTO_UDP &&
		 (fl_dump_key_val(skb, &key->tp.src, TCA_FLOWER_KEY_UDP_SRC,
				  &mask->tp.src, TCA_FLOWER_KEY_UDP_SRC_MASK,
				  sizeof(key->tp.src)) ||
		  fl_dump_key_val(skb, &key->tp.dst, TCA_FLOWER_KEY_UDP_DST,
				  &mask->tp.dst, TCA_FLOWER_KEY_UDP_DST_MASK,
				  sizeof(key->tp.dst))))
		goto nla_put_failure;
	else if (key->basic.ip_proto == IPPROTO_SCTP &&
		 (fl_dump_key_val(skb, &key->tp.src, TCA_FLOWER_KEY_SCTP_SRC,
				  &mask->tp.src, TCA_FLOWER_KEY_SCTP_SRC_MASK,
				  sizeof(key->tp.src)) ||
		  fl_dump_key_val(skb, &key->tp.dst, TCA_FLOWER_KEY_SCTP_DST,
				  &mask->tp.dst, TCA_FLOWER_KEY_SCTP_DST_MASK,
				  sizeof(key->tp.dst))))
		goto nla_put_failure;
	else if (key->basic.n_proto == htons(ETH_P_IP) &&
		 key->basic.ip_proto == IPPROTO_ICMP &&
		 (fl_dump_key_val(skb, &key->icmp.type,
				  TCA_FLOWER_KEY_ICMPV4_TYPE, &mask->icmp.type,
				  TCA_FLOWER_KEY_ICMPV4_TYPE_MASK,
				  sizeof(key->icmp.type)) ||
		  fl_dump_key_val(skb, &key->icmp.code,
				  TCA_FLOWER_KEY_ICMPV4_CODE, &mask->icmp.code,
				  TCA_FLOWER_KEY_ICMPV4_CODE_MASK,
				  sizeof(key->icmp.code))))
		goto nla_put_failure;
	else if (key->basic.n_proto == htons(ETH_P_IPV6) &&
		 key->basic.ip_proto == IPPROTO_ICMPV6 &&
		 (fl_dump_key_val(skb, &key->icmp.type,
				  TCA_FLOWER_KEY_ICMPV6_TYPE, &mask->icmp.type,
				  TCA_FLOWER_KEY_ICMPV6_TYPE_MASK,
				  sizeof(key->icmp.type)) ||
		  fl_dump_key_val(skb, &key->icmp.code,
				  TCA_FLOWER_KEY_ICMPV6_CODE, &mask->icmp.code,
				  TCA_FLOWER_KEY_ICMPV6_CODE_MASK,
				  sizeof(key->icmp.code))))
		goto nla_put_failure;
	else if ((key->basic.n_proto == htons(ETH_P_ARP) ||
		  key->basic.n_proto == htons(ETH_P_RARP)) &&
		 (fl_dump_key_val(skb, &key->arp.sip,
				  TCA_FLOWER_KEY_ARP_SIP, &mask->arp.sip,
				  TCA_FLOWER_KEY_ARP_SIP_MASK,
				  sizeof(key->arp.sip)) ||
		  fl_dump_key_val(skb, &key->arp.tip,
				  TCA_FLOWER_KEY_ARP_TIP, &mask->arp.tip,
				  TCA_FLOWER_KEY_ARP_TIP_MASK,
				  sizeof(key->arp.tip)) ||
		  fl_dump_key_val(skb, &key->arp.op,
				  TCA_FLOWER_KEY_ARP_OP, &mask->arp.op,
				  TCA_FLOWER_KEY_ARP_OP_MASK,
				  sizeof(key->arp.op)) ||
		  fl_dump_key_val(skb, key->arp.sha, TCA_FLOWER_KEY_ARP_SHA,
				  mask->arp.sha, TCA_FLOWER_KEY_ARP_SHA_MASK,
				  sizeof(key->arp.sha)) ||
		  fl_dump_key_val(skb, key->arp.tha, TCA_FLOWER_KEY_ARP_THA,
				  mask->arp.tha, TCA_FLOWER_KEY_ARP_THA_MASK,
				  sizeof(key->arp.tha))))
		goto nla_put_failure;

	/* Tunnel addresses, selected by the tunnel control address type. */
	if (key->enc_control.addr_type == FLOW_DISSECTOR_KEY_IPV4_ADDRS &&
	    (fl_dump_key_val(skb, &key->enc_ipv4.src,
			    TCA_FLOWER_KEY_ENC_IPV4_SRC, &mask->enc_ipv4.src,
			    TCA_FLOWER_KEY_ENC_IPV4_SRC_MASK,
			    sizeof(key->enc_ipv4.src)) ||
	     fl_dump_key_val(skb, &key->enc_ipv4.dst,
			     TCA_FLOWER_KEY_ENC_IPV4_DST, &mask->enc_ipv4.dst,
			     TCA_FLOWER_KEY_ENC_IPV4_DST_MASK,
			     sizeof(key->enc_ipv4.dst))))
		goto nla_put_failure;
	else if (key->enc_control.addr_type == FLOW_DISSECTOR_KEY_IPV6_ADDRS &&
		 (fl_dump_key_val(skb, &key->enc_ipv6.src,
			    TCA_FLOWER_KEY_ENC_IPV6_SRC, &mask->enc_ipv6.src,
			    TCA_FLOWER_KEY_ENC_IPV6_SRC_MASK,
			    sizeof(key->enc_ipv6.src)) ||
		 fl_dump_key_val(skb, &key->enc_ipv6.dst,
				 TCA_FLOWER_KEY_ENC_IPV6_DST,
				 &mask->enc_ipv6.dst,
				 TCA_FLOWER_KEY_ENC_IPV6_DST_MASK,
			    sizeof(key->enc_ipv6.dst))))
		goto nla_put_failure;

	/* Remaining tunnel fields: key id, UDP ports, IP TOS/TTL, options. */
	if (fl_dump_key_val(skb, &key->enc_key_id, TCA_FLOWER_KEY_ENC_KEY_ID,
			    &mask->enc_key_id, TCA_FLOWER_UNSPEC,
			    sizeof(key->enc_key_id)) ||
	    fl_dump_key_val(skb, &key->enc_tp.src,
			    TCA_FLOWER_KEY_ENC_UDP_SRC_PORT,
			    &mask->enc_tp.src,
			    TCA_FLOWER_KEY_ENC_UDP_SRC_PORT_MASK,
			    sizeof(key->enc_tp.src)) ||
	    fl_dump_key_val(skb, &key->enc_tp.dst,
			    TCA_FLOWER_KEY_ENC_UDP_DST_PORT,
			    &mask->enc_tp.dst,
			    TCA_FLOWER_KEY_ENC_UDP_DST_PORT_MASK,
			    sizeof(key->enc_tp.dst)) ||
	    fl_dump_key_ip(skb, true, &key->enc_ip, &mask->enc_ip) ||
	    fl_dump_key_enc_opt(skb, &key->enc_opts, &mask->enc_opts))
		goto nla_put_failure;

	if (fl_dump_key_flags(skb, key->control.flags, mask->control.flags))
		goto nla_put_failure;

	return 0;

nla_put_failure:
	return -EMSGSIZE;
}
1872
1873static int fl_dump(struct net *net, struct tcf_proto *tp, void *fh,
1874 struct sk_buff *skb, struct tcmsg *t)
1875{
1876 struct cls_fl_filter *f = fh;
1877 struct nlattr *nest;
1878 struct fl_flow_key *key, *mask;
1879
1880 if (!f)
1881 return skb->len;
1882
1883 t->tcm_handle = f->handle;
1884
1885 nest = nla_nest_start(skb, TCA_OPTIONS);
1886 if (!nest)
1887 goto nla_put_failure;
1888
1889 if (f->res.classid &&
1890 nla_put_u32(skb, TCA_FLOWER_CLASSID, f->res.classid))
1891 goto nla_put_failure;
1892
1893 key = &f->key;
1894 mask = &f->mask->key;
1895
1896 if (fl_dump_key(skb, net, key, mask))
1897 goto nla_put_failure;
1898
1899 if (!tc_skip_hw(f->flags))
1900 fl_hw_update_stats(tp, f);
1901
1902 if (f->flags && nla_put_u32(skb, TCA_FLOWER_FLAGS, f->flags))
1903 goto nla_put_failure;
1904
1905 if (tcf_exts_dump(skb, &f->exts))
1906 goto nla_put_failure;
1907
1908 nla_nest_end(skb, nest);
1909
1910 if (tcf_exts_dump_stats(skb, &f->exts) < 0)
1911 goto nla_put_failure;
1912
1913 return skb->len;
1914
1915nla_put_failure:
1916 nla_nest_cancel(skb, nest);
1917 return -1;
1918}
1919
1920static int fl_tmplt_dump(struct sk_buff *skb, struct net *net, void *tmplt_priv)
1921{
1922 struct fl_flow_tmplt *tmplt = tmplt_priv;
1923 struct fl_flow_key *key, *mask;
1924 struct nlattr *nest;
1925
1926 nest = nla_nest_start(skb, TCA_OPTIONS);
1927 if (!nest)
1928 goto nla_put_failure;
1929
1930 key = &tmplt->dummy_key;
1931 mask = &tmplt->mask;
1932
1933 if (fl_dump_key(skb, net, key, mask))
1934 goto nla_put_failure;
1935
1936 nla_nest_end(skb, nest);
1937
1938 return skb->len;
1939
1940nla_put_failure:
1941 nla_nest_cancel(skb, nest);
1942 return -EMSGSIZE;
1943}
1944
1945static void fl_bind_class(void *fh, u32 classid, unsigned long cl)
1946{
1947 struct cls_fl_filter *f = fh;
1948
1949 if (f && f->res.classid == classid)
1950 f->res.class = cl;
1951}
1952
1953static struct tcf_proto_ops cls_fl_ops __read_mostly = {
1954 .kind = "flower",
1955 .classify = fl_classify,
1956 .init = fl_init,
1957 .destroy = fl_destroy,
1958 .get = fl_get,
1959 .change = fl_change,
1960 .delete = fl_delete,
1961 .walk = fl_walk,
1962 .reoffload = fl_reoffload,
1963 .dump = fl_dump,
1964 .bind_class = fl_bind_class,
1965 .tmplt_create = fl_tmplt_create,
1966 .tmplt_destroy = fl_tmplt_destroy,
1967 .tmplt_dump = fl_tmplt_dump,
1968 .owner = THIS_MODULE,
1969};
1970
/* Module entry point: register the flower classifier operations. */
static int __init cls_fl_init(void)
{
	return register_tcf_proto_ops(&cls_fl_ops);
}
1975
/* Module exit point: unregister the flower classifier operations. */
static void __exit cls_fl_exit(void)
{
	unregister_tcf_proto_ops(&cls_fl_ops);
}
1980
/* Hook the init/exit functions into module load and unload. */
module_init(cls_fl_init);
module_exit(cls_fl_exit);

/* Module metadata. */
MODULE_AUTHOR("Jiri Pirko <jiri@resnulli.us>");
MODULE_DESCRIPTION("Flower classifier");
MODULE_LICENSE("GPL v2");