Merge branch 'parisc-4.21-1' of git://git.kernel.org/pub/scm/linux/kernel/git/deller...
[linux-2.6-microblaze.git] / net / sched / cls_flower.c
1 /*
2  * net/sched/cls_flower.c               Flower classifier
3  *
4  * Copyright (c) 2015 Jiri Pirko <jiri@resnulli.us>
5  *
6  * This program is free software; you can redistribute it and/or modify
7  * it under the terms of the GNU General Public License as published by
8  * the Free Software Foundation; either version 2 of the License, or
9  * (at your option) any later version.
10  */
11
12 #include <linux/kernel.h>
13 #include <linux/init.h>
14 #include <linux/module.h>
15 #include <linux/rhashtable.h>
16 #include <linux/workqueue.h>
17
18 #include <linux/if_ether.h>
19 #include <linux/in6.h>
20 #include <linux/ip.h>
21 #include <linux/mpls.h>
22
23 #include <net/sch_generic.h>
24 #include <net/pkt_cls.h>
25 #include <net/ip.h>
26 #include <net/flow_dissector.h>
27 #include <net/geneve.h>
28
29 #include <net/dst.h>
30 #include <net/dst_metadata.h>
31
32 struct fl_flow_key {
33         int     indev_ifindex;
34         struct flow_dissector_key_control control;
35         struct flow_dissector_key_control enc_control;
36         struct flow_dissector_key_basic basic;
37         struct flow_dissector_key_eth_addrs eth;
38         struct flow_dissector_key_vlan vlan;
39         struct flow_dissector_key_vlan cvlan;
40         union {
41                 struct flow_dissector_key_ipv4_addrs ipv4;
42                 struct flow_dissector_key_ipv6_addrs ipv6;
43         };
44         struct flow_dissector_key_ports tp;
45         struct flow_dissector_key_icmp icmp;
46         struct flow_dissector_key_arp arp;
47         struct flow_dissector_key_keyid enc_key_id;
48         union {
49                 struct flow_dissector_key_ipv4_addrs enc_ipv4;
50                 struct flow_dissector_key_ipv6_addrs enc_ipv6;
51         };
52         struct flow_dissector_key_ports enc_tp;
53         struct flow_dissector_key_mpls mpls;
54         struct flow_dissector_key_tcp tcp;
55         struct flow_dissector_key_ip ip;
56         struct flow_dissector_key_ip enc_ip;
57         struct flow_dissector_key_enc_opts enc_opts;
58 } __aligned(BITS_PER_LONG / 8); /* Ensure that we can do comparisons as longs. */
59
/*
 * Byte offsets into struct fl_flow_key delimiting the part of the key a
 * mask actually touches; computed by fl_mask_update_range().
 */
struct fl_flow_mask_range {
	unsigned short start;	/* first byte, rounded down to a long boundary */
	unsigned short end;	/* one past last byte, rounded up to a long boundary */
};
64
65 struct fl_flow_mask {
66         struct fl_flow_key key;
67         struct fl_flow_mask_range range;
68         struct rhash_head ht_node;
69         struct rhashtable ht;
70         struct rhashtable_params filter_ht_params;
71         struct flow_dissector dissector;
72         struct list_head filters;
73         struct rcu_work rwork;
74         struct list_head list;
75 };
76
77 struct fl_flow_tmplt {
78         struct fl_flow_key dummy_key;
79         struct fl_flow_key mask;
80         struct flow_dissector dissector;
81         struct tcf_chain *chain;
82 };
83
84 struct cls_fl_head {
85         struct rhashtable ht;
86         struct list_head masks;
87         struct rcu_work rwork;
88         struct idr handle_idr;
89 };
90
91 struct cls_fl_filter {
92         struct fl_flow_mask *mask;
93         struct rhash_head ht_node;
94         struct fl_flow_key mkey;
95         struct tcf_exts exts;
96         struct tcf_result res;
97         struct fl_flow_key key;
98         struct list_head list;
99         u32 handle;
100         u32 flags;
101         u32 in_hw_count;
102         struct rcu_work rwork;
103         struct net_device *hw_dev;
104 };
105
106 static const struct rhashtable_params mask_ht_params = {
107         .key_offset = offsetof(struct fl_flow_mask, key),
108         .key_len = sizeof(struct fl_flow_key),
109         .head_offset = offsetof(struct fl_flow_mask, ht_node),
110         .automatic_shrinking = true,
111 };
112
113 static unsigned short int fl_mask_range(const struct fl_flow_mask *mask)
114 {
115         return mask->range.end - mask->range.start;
116 }
117
118 static void fl_mask_update_range(struct fl_flow_mask *mask)
119 {
120         const u8 *bytes = (const u8 *) &mask->key;
121         size_t size = sizeof(mask->key);
122         size_t i, first = 0, last;
123
124         for (i = 0; i < size; i++) {
125                 if (bytes[i]) {
126                         first = i;
127                         break;
128                 }
129         }
130         last = first;
131         for (i = size - 1; i != first; i--) {
132                 if (bytes[i]) {
133                         last = i;
134                         break;
135                 }
136         }
137         mask->range.start = rounddown(first, sizeof(long));
138         mask->range.end = roundup(last + 1, sizeof(long));
139 }
140
141 static void *fl_key_get_start(struct fl_flow_key *key,
142                               const struct fl_flow_mask *mask)
143 {
144         return (u8 *) key + mask->range.start;
145 }
146
147 static void fl_set_masked_key(struct fl_flow_key *mkey, struct fl_flow_key *key,
148                               struct fl_flow_mask *mask)
149 {
150         const long *lkey = fl_key_get_start(key, mask);
151         const long *lmask = fl_key_get_start(&mask->key, mask);
152         long *lmkey = fl_key_get_start(mkey, mask);
153         int i;
154
155         for (i = 0; i < fl_mask_range(mask); i += sizeof(long))
156                 *lmkey++ = *lkey++ & *lmask++;
157 }
158
159 static bool fl_mask_fits_tmplt(struct fl_flow_tmplt *tmplt,
160                                struct fl_flow_mask *mask)
161 {
162         const long *lmask = fl_key_get_start(&mask->key, mask);
163         const long *ltmplt;
164         int i;
165
166         if (!tmplt)
167                 return true;
168         ltmplt = fl_key_get_start(&tmplt->mask, mask);
169         for (i = 0; i < fl_mask_range(mask); i += sizeof(long)) {
170                 if (~*ltmplt++ & *lmask++)
171                         return false;
172         }
173         return true;
174 }
175
/* Zero the part of @key that lies inside the span covered by @mask. */
static void fl_clear_masked_range(struct fl_flow_key *key,
				  struct fl_flow_mask *mask)
{
	void *start = fl_key_get_start(key, mask);

	memset(start, 0, fl_mask_range(mask));
}
181
182 static struct cls_fl_filter *fl_lookup(struct fl_flow_mask *mask,
183                                        struct fl_flow_key *mkey)
184 {
185         return rhashtable_lookup_fast(&mask->ht, fl_key_get_start(mkey, mask),
186                                       mask->filter_ht_params);
187 }
188
189 static int fl_classify(struct sk_buff *skb, const struct tcf_proto *tp,
190                        struct tcf_result *res)
191 {
192         struct cls_fl_head *head = rcu_dereference_bh(tp->root);
193         struct cls_fl_filter *f;
194         struct fl_flow_mask *mask;
195         struct fl_flow_key skb_key;
196         struct fl_flow_key skb_mkey;
197
198         list_for_each_entry_rcu(mask, &head->masks, list) {
199                 fl_clear_masked_range(&skb_key, mask);
200
201                 skb_key.indev_ifindex = skb->skb_iif;
202                 /* skb_flow_dissect() does not set n_proto in case an unknown
203                  * protocol, so do it rather here.
204                  */
205                 skb_key.basic.n_proto = skb->protocol;
206                 skb_flow_dissect_tunnel_info(skb, &mask->dissector, &skb_key);
207                 skb_flow_dissect(skb, &mask->dissector, &skb_key, 0);
208
209                 fl_set_masked_key(&skb_mkey, &skb_key, mask);
210
211                 f = fl_lookup(mask, &skb_mkey);
212                 if (f && !tc_skip_sw(f->flags)) {
213                         *res = f->res;
214                         return tcf_exts_exec(skb, &f->exts, res);
215                 }
216         }
217         return -1;
218 }
219
220 static int fl_init(struct tcf_proto *tp)
221 {
222         struct cls_fl_head *head;
223
224         head = kzalloc(sizeof(*head), GFP_KERNEL);
225         if (!head)
226                 return -ENOBUFS;
227
228         INIT_LIST_HEAD_RCU(&head->masks);
229         rcu_assign_pointer(tp->root, head);
230         idr_init(&head->handle_idr);
231
232         return rhashtable_init(&head->ht, &mask_ht_params);
233 }
234
235 static void fl_mask_free(struct fl_flow_mask *mask)
236 {
237         rhashtable_destroy(&mask->ht);
238         kfree(mask);
239 }
240
241 static void fl_mask_free_work(struct work_struct *work)
242 {
243         struct fl_flow_mask *mask = container_of(to_rcu_work(work),
244                                                  struct fl_flow_mask, rwork);
245
246         fl_mask_free(mask);
247 }
248
249 static bool fl_mask_put(struct cls_fl_head *head, struct fl_flow_mask *mask,
250                         bool async)
251 {
252         if (!list_empty(&mask->filters))
253                 return false;
254
255         rhashtable_remove_fast(&head->ht, &mask->ht_node, mask_ht_params);
256         list_del_rcu(&mask->list);
257         if (async)
258                 tcf_queue_work(&mask->rwork, fl_mask_free_work);
259         else
260                 fl_mask_free(mask);
261
262         return true;
263 }
264
265 static void __fl_destroy_filter(struct cls_fl_filter *f)
266 {
267         tcf_exts_destroy(&f->exts);
268         tcf_exts_put_net(&f->exts);
269         kfree(f);
270 }
271
272 static void fl_destroy_filter_work(struct work_struct *work)
273 {
274         struct cls_fl_filter *f = container_of(to_rcu_work(work),
275                                         struct cls_fl_filter, rwork);
276
277         rtnl_lock();
278         __fl_destroy_filter(f);
279         rtnl_unlock();
280 }
281
282 static void fl_hw_destroy_filter(struct tcf_proto *tp, struct cls_fl_filter *f,
283                                  struct netlink_ext_ack *extack)
284 {
285         struct tc_cls_flower_offload cls_flower = {};
286         struct tcf_block *block = tp->chain->block;
287
288         tc_cls_common_offload_init(&cls_flower.common, tp, f->flags, extack);
289         cls_flower.command = TC_CLSFLOWER_DESTROY;
290         cls_flower.cookie = (unsigned long) f;
291
292         tc_setup_cb_call(block, &f->exts, TC_SETUP_CLSFLOWER,
293                          &cls_flower, false);
294         tcf_block_offload_dec(block, &f->flags);
295 }
296
297 static int fl_hw_replace_filter(struct tcf_proto *tp,
298                                 struct cls_fl_filter *f,
299                                 struct netlink_ext_ack *extack)
300 {
301         struct tc_cls_flower_offload cls_flower = {};
302         struct tcf_block *block = tp->chain->block;
303         bool skip_sw = tc_skip_sw(f->flags);
304         int err;
305
306         tc_cls_common_offload_init(&cls_flower.common, tp, f->flags, extack);
307         cls_flower.command = TC_CLSFLOWER_REPLACE;
308         cls_flower.cookie = (unsigned long) f;
309         cls_flower.dissector = &f->mask->dissector;
310         cls_flower.mask = &f->mask->key;
311         cls_flower.key = &f->mkey;
312         cls_flower.exts = &f->exts;
313         cls_flower.classid = f->res.classid;
314
315         err = tc_setup_cb_call(block, &f->exts, TC_SETUP_CLSFLOWER,
316                                &cls_flower, skip_sw);
317         if (err < 0) {
318                 fl_hw_destroy_filter(tp, f, NULL);
319                 return err;
320         } else if (err > 0) {
321                 f->in_hw_count = err;
322                 tcf_block_offload_inc(block, &f->flags);
323         }
324
325         if (skip_sw && !(f->flags & TCA_CLS_FLAGS_IN_HW))
326                 return -EINVAL;
327
328         return 0;
329 }
330
331 static void fl_hw_update_stats(struct tcf_proto *tp, struct cls_fl_filter *f)
332 {
333         struct tc_cls_flower_offload cls_flower = {};
334         struct tcf_block *block = tp->chain->block;
335
336         tc_cls_common_offload_init(&cls_flower.common, tp, f->flags, NULL);
337         cls_flower.command = TC_CLSFLOWER_STATS;
338         cls_flower.cookie = (unsigned long) f;
339         cls_flower.exts = &f->exts;
340         cls_flower.classid = f->res.classid;
341
342         tc_setup_cb_call(block, &f->exts, TC_SETUP_CLSFLOWER,
343                          &cls_flower, false);
344 }
345
346 static bool __fl_delete(struct tcf_proto *tp, struct cls_fl_filter *f,
347                         struct netlink_ext_ack *extack)
348 {
349         struct cls_fl_head *head = rtnl_dereference(tp->root);
350         bool async = tcf_exts_get_net(&f->exts);
351         bool last;
352
353         idr_remove(&head->handle_idr, f->handle);
354         list_del_rcu(&f->list);
355         last = fl_mask_put(head, f->mask, async);
356         if (!tc_skip_hw(f->flags))
357                 fl_hw_destroy_filter(tp, f, extack);
358         tcf_unbind_filter(tp, &f->res);
359         if (async)
360                 tcf_queue_work(&f->rwork, fl_destroy_filter_work);
361         else
362                 __fl_destroy_filter(f);
363
364         return last;
365 }
366
367 static void fl_destroy_sleepable(struct work_struct *work)
368 {
369         struct cls_fl_head *head = container_of(to_rcu_work(work),
370                                                 struct cls_fl_head,
371                                                 rwork);
372
373         rhashtable_destroy(&head->ht);
374         kfree(head);
375         module_put(THIS_MODULE);
376 }
377
378 static void fl_destroy(struct tcf_proto *tp, struct netlink_ext_ack *extack)
379 {
380         struct cls_fl_head *head = rtnl_dereference(tp->root);
381         struct fl_flow_mask *mask, *next_mask;
382         struct cls_fl_filter *f, *next;
383
384         list_for_each_entry_safe(mask, next_mask, &head->masks, list) {
385                 list_for_each_entry_safe(f, next, &mask->filters, list) {
386                         if (__fl_delete(tp, f, extack))
387                                 break;
388                 }
389         }
390         idr_destroy(&head->handle_idr);
391
392         __module_get(THIS_MODULE);
393         tcf_queue_work(&head->rwork, fl_destroy_sleepable);
394 }
395
396 static void *fl_get(struct tcf_proto *tp, u32 handle)
397 {
398         struct cls_fl_head *head = rtnl_dereference(tp->root);
399
400         return idr_find(&head->handle_idr, handle);
401 }
402
403 static const struct nla_policy fl_policy[TCA_FLOWER_MAX + 1] = {
404         [TCA_FLOWER_UNSPEC]             = { .type = NLA_UNSPEC },
405         [TCA_FLOWER_CLASSID]            = { .type = NLA_U32 },
406         [TCA_FLOWER_INDEV]              = { .type = NLA_STRING,
407                                             .len = IFNAMSIZ },
408         [TCA_FLOWER_KEY_ETH_DST]        = { .len = ETH_ALEN },
409         [TCA_FLOWER_KEY_ETH_DST_MASK]   = { .len = ETH_ALEN },
410         [TCA_FLOWER_KEY_ETH_SRC]        = { .len = ETH_ALEN },
411         [TCA_FLOWER_KEY_ETH_SRC_MASK]   = { .len = ETH_ALEN },
412         [TCA_FLOWER_KEY_ETH_TYPE]       = { .type = NLA_U16 },
413         [TCA_FLOWER_KEY_IP_PROTO]       = { .type = NLA_U8 },
414         [TCA_FLOWER_KEY_IPV4_SRC]       = { .type = NLA_U32 },
415         [TCA_FLOWER_KEY_IPV4_SRC_MASK]  = { .type = NLA_U32 },
416         [TCA_FLOWER_KEY_IPV4_DST]       = { .type = NLA_U32 },
417         [TCA_FLOWER_KEY_IPV4_DST_MASK]  = { .type = NLA_U32 },
418         [TCA_FLOWER_KEY_IPV6_SRC]       = { .len = sizeof(struct in6_addr) },
419         [TCA_FLOWER_KEY_IPV6_SRC_MASK]  = { .len = sizeof(struct in6_addr) },
420         [TCA_FLOWER_KEY_IPV6_DST]       = { .len = sizeof(struct in6_addr) },
421         [TCA_FLOWER_KEY_IPV6_DST_MASK]  = { .len = sizeof(struct in6_addr) },
422         [TCA_FLOWER_KEY_TCP_SRC]        = { .type = NLA_U16 },
423         [TCA_FLOWER_KEY_TCP_DST]        = { .type = NLA_U16 },
424         [TCA_FLOWER_KEY_UDP_SRC]        = { .type = NLA_U16 },
425         [TCA_FLOWER_KEY_UDP_DST]        = { .type = NLA_U16 },
426         [TCA_FLOWER_KEY_VLAN_ID]        = { .type = NLA_U16 },
427         [TCA_FLOWER_KEY_VLAN_PRIO]      = { .type = NLA_U8 },
428         [TCA_FLOWER_KEY_VLAN_ETH_TYPE]  = { .type = NLA_U16 },
429         [TCA_FLOWER_KEY_ENC_KEY_ID]     = { .type = NLA_U32 },
430         [TCA_FLOWER_KEY_ENC_IPV4_SRC]   = { .type = NLA_U32 },
431         [TCA_FLOWER_KEY_ENC_IPV4_SRC_MASK] = { .type = NLA_U32 },
432         [TCA_FLOWER_KEY_ENC_IPV4_DST]   = { .type = NLA_U32 },
433         [TCA_FLOWER_KEY_ENC_IPV4_DST_MASK] = { .type = NLA_U32 },
434         [TCA_FLOWER_KEY_ENC_IPV6_SRC]   = { .len = sizeof(struct in6_addr) },
435         [TCA_FLOWER_KEY_ENC_IPV6_SRC_MASK] = { .len = sizeof(struct in6_addr) },
436         [TCA_FLOWER_KEY_ENC_IPV6_DST]   = { .len = sizeof(struct in6_addr) },
437         [TCA_FLOWER_KEY_ENC_IPV6_DST_MASK] = { .len = sizeof(struct in6_addr) },
438         [TCA_FLOWER_KEY_TCP_SRC_MASK]   = { .type = NLA_U16 },
439         [TCA_FLOWER_KEY_TCP_DST_MASK]   = { .type = NLA_U16 },
440         [TCA_FLOWER_KEY_UDP_SRC_MASK]   = { .type = NLA_U16 },
441         [TCA_FLOWER_KEY_UDP_DST_MASK]   = { .type = NLA_U16 },
442         [TCA_FLOWER_KEY_SCTP_SRC_MASK]  = { .type = NLA_U16 },
443         [TCA_FLOWER_KEY_SCTP_DST_MASK]  = { .type = NLA_U16 },
444         [TCA_FLOWER_KEY_SCTP_SRC]       = { .type = NLA_U16 },
445         [TCA_FLOWER_KEY_SCTP_DST]       = { .type = NLA_U16 },
446         [TCA_FLOWER_KEY_ENC_UDP_SRC_PORT]       = { .type = NLA_U16 },
447         [TCA_FLOWER_KEY_ENC_UDP_SRC_PORT_MASK]  = { .type = NLA_U16 },
448         [TCA_FLOWER_KEY_ENC_UDP_DST_PORT]       = { .type = NLA_U16 },
449         [TCA_FLOWER_KEY_ENC_UDP_DST_PORT_MASK]  = { .type = NLA_U16 },
450         [TCA_FLOWER_KEY_FLAGS]          = { .type = NLA_U32 },
451         [TCA_FLOWER_KEY_FLAGS_MASK]     = { .type = NLA_U32 },
452         [TCA_FLOWER_KEY_ICMPV4_TYPE]    = { .type = NLA_U8 },
453         [TCA_FLOWER_KEY_ICMPV4_TYPE_MASK] = { .type = NLA_U8 },
454         [TCA_FLOWER_KEY_ICMPV4_CODE]    = { .type = NLA_U8 },
455         [TCA_FLOWER_KEY_ICMPV4_CODE_MASK] = { .type = NLA_U8 },
456         [TCA_FLOWER_KEY_ICMPV6_TYPE]    = { .type = NLA_U8 },
457         [TCA_FLOWER_KEY_ICMPV6_TYPE_MASK] = { .type = NLA_U8 },
458         [TCA_FLOWER_KEY_ICMPV6_CODE]    = { .type = NLA_U8 },
459         [TCA_FLOWER_KEY_ICMPV6_CODE_MASK] = { .type = NLA_U8 },
460         [TCA_FLOWER_KEY_ARP_SIP]        = { .type = NLA_U32 },
461         [TCA_FLOWER_KEY_ARP_SIP_MASK]   = { .type = NLA_U32 },
462         [TCA_FLOWER_KEY_ARP_TIP]        = { .type = NLA_U32 },
463         [TCA_FLOWER_KEY_ARP_TIP_MASK]   = { .type = NLA_U32 },
464         [TCA_FLOWER_KEY_ARP_OP]         = { .type = NLA_U8 },
465         [TCA_FLOWER_KEY_ARP_OP_MASK]    = { .type = NLA_U8 },
466         [TCA_FLOWER_KEY_ARP_SHA]        = { .len = ETH_ALEN },
467         [TCA_FLOWER_KEY_ARP_SHA_MASK]   = { .len = ETH_ALEN },
468         [TCA_FLOWER_KEY_ARP_THA]        = { .len = ETH_ALEN },
469         [TCA_FLOWER_KEY_ARP_THA_MASK]   = { .len = ETH_ALEN },
470         [TCA_FLOWER_KEY_MPLS_TTL]       = { .type = NLA_U8 },
471         [TCA_FLOWER_KEY_MPLS_BOS]       = { .type = NLA_U8 },
472         [TCA_FLOWER_KEY_MPLS_TC]        = { .type = NLA_U8 },
473         [TCA_FLOWER_KEY_MPLS_LABEL]     = { .type = NLA_U32 },
474         [TCA_FLOWER_KEY_TCP_FLAGS]      = { .type = NLA_U16 },
475         [TCA_FLOWER_KEY_TCP_FLAGS_MASK] = { .type = NLA_U16 },
476         [TCA_FLOWER_KEY_IP_TOS]         = { .type = NLA_U8 },
477         [TCA_FLOWER_KEY_IP_TOS_MASK]    = { .type = NLA_U8 },
478         [TCA_FLOWER_KEY_IP_TTL]         = { .type = NLA_U8 },
479         [TCA_FLOWER_KEY_IP_TTL_MASK]    = { .type = NLA_U8 },
480         [TCA_FLOWER_KEY_CVLAN_ID]       = { .type = NLA_U16 },
481         [TCA_FLOWER_KEY_CVLAN_PRIO]     = { .type = NLA_U8 },
482         [TCA_FLOWER_KEY_CVLAN_ETH_TYPE] = { .type = NLA_U16 },
483         [TCA_FLOWER_KEY_ENC_IP_TOS]     = { .type = NLA_U8 },
484         [TCA_FLOWER_KEY_ENC_IP_TOS_MASK] = { .type = NLA_U8 },
485         [TCA_FLOWER_KEY_ENC_IP_TTL]      = { .type = NLA_U8 },
486         [TCA_FLOWER_KEY_ENC_IP_TTL_MASK] = { .type = NLA_U8 },
487         [TCA_FLOWER_KEY_ENC_OPTS]       = { .type = NLA_NESTED },
488         [TCA_FLOWER_KEY_ENC_OPTS_MASK]  = { .type = NLA_NESTED },
489 };
490
491 static const struct nla_policy
492 enc_opts_policy[TCA_FLOWER_KEY_ENC_OPTS_MAX + 1] = {
493         [TCA_FLOWER_KEY_ENC_OPTS_GENEVE]        = { .type = NLA_NESTED },
494 };
495
496 static const struct nla_policy
497 geneve_opt_policy[TCA_FLOWER_KEY_ENC_OPT_GENEVE_MAX + 1] = {
498         [TCA_FLOWER_KEY_ENC_OPT_GENEVE_CLASS]      = { .type = NLA_U16 },
499         [TCA_FLOWER_KEY_ENC_OPT_GENEVE_TYPE]       = { .type = NLA_U8 },
500         [TCA_FLOWER_KEY_ENC_OPT_GENEVE_DATA]       = { .type = NLA_BINARY,
501                                                        .len = 128 },
502 };
503
504 static void fl_set_key_val(struct nlattr **tb,
505                            void *val, int val_type,
506                            void *mask, int mask_type, int len)
507 {
508         if (!tb[val_type])
509                 return;
510         memcpy(val, nla_data(tb[val_type]), len);
511         if (mask_type == TCA_FLOWER_UNSPEC || !tb[mask_type])
512                 memset(mask, 0xff, len);
513         else
514                 memcpy(mask, nla_data(tb[mask_type]), len);
515 }
516
517 static int fl_set_key_mpls(struct nlattr **tb,
518                            struct flow_dissector_key_mpls *key_val,
519                            struct flow_dissector_key_mpls *key_mask)
520 {
521         if (tb[TCA_FLOWER_KEY_MPLS_TTL]) {
522                 key_val->mpls_ttl = nla_get_u8(tb[TCA_FLOWER_KEY_MPLS_TTL]);
523                 key_mask->mpls_ttl = MPLS_TTL_MASK;
524         }
525         if (tb[TCA_FLOWER_KEY_MPLS_BOS]) {
526                 u8 bos = nla_get_u8(tb[TCA_FLOWER_KEY_MPLS_BOS]);
527
528                 if (bos & ~MPLS_BOS_MASK)
529                         return -EINVAL;
530                 key_val->mpls_bos = bos;
531                 key_mask->mpls_bos = MPLS_BOS_MASK;
532         }
533         if (tb[TCA_FLOWER_KEY_MPLS_TC]) {
534                 u8 tc = nla_get_u8(tb[TCA_FLOWER_KEY_MPLS_TC]);
535
536                 if (tc & ~MPLS_TC_MASK)
537                         return -EINVAL;
538                 key_val->mpls_tc = tc;
539                 key_mask->mpls_tc = MPLS_TC_MASK;
540         }
541         if (tb[TCA_FLOWER_KEY_MPLS_LABEL]) {
542                 u32 label = nla_get_u32(tb[TCA_FLOWER_KEY_MPLS_LABEL]);
543
544                 if (label & ~MPLS_LABEL_MASK)
545                         return -EINVAL;
546                 key_val->mpls_label = label;
547                 key_mask->mpls_label = MPLS_LABEL_MASK;
548         }
549         return 0;
550 }
551
552 static void fl_set_key_vlan(struct nlattr **tb,
553                             __be16 ethertype,
554                             int vlan_id_key, int vlan_prio_key,
555                             struct flow_dissector_key_vlan *key_val,
556                             struct flow_dissector_key_vlan *key_mask)
557 {
558 #define VLAN_PRIORITY_MASK      0x7
559
560         if (tb[vlan_id_key]) {
561                 key_val->vlan_id =
562                         nla_get_u16(tb[vlan_id_key]) & VLAN_VID_MASK;
563                 key_mask->vlan_id = VLAN_VID_MASK;
564         }
565         if (tb[vlan_prio_key]) {
566                 key_val->vlan_priority =
567                         nla_get_u8(tb[vlan_prio_key]) &
568                         VLAN_PRIORITY_MASK;
569                 key_mask->vlan_priority = VLAN_PRIORITY_MASK;
570         }
571         key_val->vlan_tpid = ethertype;
572         key_mask->vlan_tpid = cpu_to_be16(~0);
573 }
574
575 static void fl_set_key_flag(u32 flower_key, u32 flower_mask,
576                             u32 *dissector_key, u32 *dissector_mask,
577                             u32 flower_flag_bit, u32 dissector_flag_bit)
578 {
579         if (flower_mask & flower_flag_bit) {
580                 *dissector_mask |= dissector_flag_bit;
581                 if (flower_key & flower_flag_bit)
582                         *dissector_key |= dissector_flag_bit;
583         }
584 }
585
586 static int fl_set_key_flags(struct nlattr **tb,
587                             u32 *flags_key, u32 *flags_mask)
588 {
589         u32 key, mask;
590
591         /* mask is mandatory for flags */
592         if (!tb[TCA_FLOWER_KEY_FLAGS_MASK])
593                 return -EINVAL;
594
595         key = be32_to_cpu(nla_get_u32(tb[TCA_FLOWER_KEY_FLAGS]));
596         mask = be32_to_cpu(nla_get_u32(tb[TCA_FLOWER_KEY_FLAGS_MASK]));
597
598         *flags_key  = 0;
599         *flags_mask = 0;
600
601         fl_set_key_flag(key, mask, flags_key, flags_mask,
602                         TCA_FLOWER_KEY_FLAGS_IS_FRAGMENT, FLOW_DIS_IS_FRAGMENT);
603         fl_set_key_flag(key, mask, flags_key, flags_mask,
604                         TCA_FLOWER_KEY_FLAGS_FRAG_IS_FIRST,
605                         FLOW_DIS_FIRST_FRAG);
606
607         return 0;
608 }
609
610 static void fl_set_key_ip(struct nlattr **tb, bool encap,
611                           struct flow_dissector_key_ip *key,
612                           struct flow_dissector_key_ip *mask)
613 {
614         int tos_key = encap ? TCA_FLOWER_KEY_ENC_IP_TOS : TCA_FLOWER_KEY_IP_TOS;
615         int ttl_key = encap ? TCA_FLOWER_KEY_ENC_IP_TTL : TCA_FLOWER_KEY_IP_TTL;
616         int tos_mask = encap ? TCA_FLOWER_KEY_ENC_IP_TOS_MASK : TCA_FLOWER_KEY_IP_TOS_MASK;
617         int ttl_mask = encap ? TCA_FLOWER_KEY_ENC_IP_TTL_MASK : TCA_FLOWER_KEY_IP_TTL_MASK;
618
619         fl_set_key_val(tb, &key->tos, tos_key, &mask->tos, tos_mask, sizeof(key->tos));
620         fl_set_key_val(tb, &key->ttl, ttl_key, &mask->ttl, ttl_mask, sizeof(key->ttl));
621 }
622
623 static int fl_set_geneve_opt(const struct nlattr *nla, struct fl_flow_key *key,
624                              int depth, int option_len,
625                              struct netlink_ext_ack *extack)
626 {
627         struct nlattr *tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_MAX + 1];
628         struct nlattr *class = NULL, *type = NULL, *data = NULL;
629         struct geneve_opt *opt;
630         int err, data_len = 0;
631
632         if (option_len > sizeof(struct geneve_opt))
633                 data_len = option_len - sizeof(struct geneve_opt);
634
635         opt = (struct geneve_opt *)&key->enc_opts.data[key->enc_opts.len];
636         memset(opt, 0xff, option_len);
637         opt->length = data_len / 4;
638         opt->r1 = 0;
639         opt->r2 = 0;
640         opt->r3 = 0;
641
642         /* If no mask has been prodived we assume an exact match. */
643         if (!depth)
644                 return sizeof(struct geneve_opt) + data_len;
645
646         if (nla_type(nla) != TCA_FLOWER_KEY_ENC_OPTS_GENEVE) {
647                 NL_SET_ERR_MSG(extack, "Non-geneve option type for mask");
648                 return -EINVAL;
649         }
650
651         err = nla_parse_nested(tb, TCA_FLOWER_KEY_ENC_OPT_GENEVE_MAX,
652                                nla, geneve_opt_policy, extack);
653         if (err < 0)
654                 return err;
655
656         /* We are not allowed to omit any of CLASS, TYPE or DATA
657          * fields from the key.
658          */
659         if (!option_len &&
660             (!tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_CLASS] ||
661              !tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_TYPE] ||
662              !tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_DATA])) {
663                 NL_SET_ERR_MSG(extack, "Missing tunnel key geneve option class, type or data");
664                 return -EINVAL;
665         }
666
667         /* Omitting any of CLASS, TYPE or DATA fields is allowed
668          * for the mask.
669          */
670         if (tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_DATA]) {
671                 int new_len = key->enc_opts.len;
672
673                 data = tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_DATA];
674                 data_len = nla_len(data);
675                 if (data_len < 4) {
676                         NL_SET_ERR_MSG(extack, "Tunnel key geneve option data is less than 4 bytes long");
677                         return -ERANGE;
678                 }
679                 if (data_len % 4) {
680                         NL_SET_ERR_MSG(extack, "Tunnel key geneve option data is not a multiple of 4 bytes long");
681                         return -ERANGE;
682                 }
683
684                 new_len += sizeof(struct geneve_opt) + data_len;
685                 BUILD_BUG_ON(FLOW_DIS_TUN_OPTS_MAX != IP_TUNNEL_OPTS_MAX);
686                 if (new_len > FLOW_DIS_TUN_OPTS_MAX) {
687                         NL_SET_ERR_MSG(extack, "Tunnel options exceeds max size");
688                         return -ERANGE;
689                 }
690                 opt->length = data_len / 4;
691                 memcpy(opt->opt_data, nla_data(data), data_len);
692         }
693
694         if (tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_CLASS]) {
695                 class = tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_CLASS];
696                 opt->opt_class = nla_get_be16(class);
697         }
698
699         if (tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_TYPE]) {
700                 type = tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_TYPE];
701                 opt->type = nla_get_u8(type);
702         }
703
704         return sizeof(struct geneve_opt) + data_len;
705 }
706
707 static int fl_set_enc_opt(struct nlattr **tb, struct fl_flow_key *key,
708                           struct fl_flow_key *mask,
709                           struct netlink_ext_ack *extack)
710 {
711         const struct nlattr *nla_enc_key, *nla_opt_key, *nla_opt_msk = NULL;
712         int err, option_len, key_depth, msk_depth = 0;
713
714         err = nla_validate_nested(tb[TCA_FLOWER_KEY_ENC_OPTS],
715                                   TCA_FLOWER_KEY_ENC_OPTS_MAX,
716                                   enc_opts_policy, extack);
717         if (err)
718                 return err;
719
720         nla_enc_key = nla_data(tb[TCA_FLOWER_KEY_ENC_OPTS]);
721
722         if (tb[TCA_FLOWER_KEY_ENC_OPTS_MASK]) {
723                 err = nla_validate_nested(tb[TCA_FLOWER_KEY_ENC_OPTS_MASK],
724                                           TCA_FLOWER_KEY_ENC_OPTS_MAX,
725                                           enc_opts_policy, extack);
726                 if (err)
727                         return err;
728
729                 nla_opt_msk = nla_data(tb[TCA_FLOWER_KEY_ENC_OPTS_MASK]);
730                 msk_depth = nla_len(tb[TCA_FLOWER_KEY_ENC_OPTS_MASK]);
731         }
732
733         nla_for_each_attr(nla_opt_key, nla_enc_key,
734                           nla_len(tb[TCA_FLOWER_KEY_ENC_OPTS]), key_depth) {
735                 switch (nla_type(nla_opt_key)) {
736                 case TCA_FLOWER_KEY_ENC_OPTS_GENEVE:
737                         option_len = 0;
738                         key->enc_opts.dst_opt_type = TUNNEL_GENEVE_OPT;
739                         option_len = fl_set_geneve_opt(nla_opt_key, key,
740                                                        key_depth, option_len,
741                                                        extack);
742                         if (option_len < 0)
743                                 return option_len;
744
745                         key->enc_opts.len += option_len;
746                         /* At the same time we need to parse through the mask
747                          * in order to verify exact and mask attribute lengths.
748                          */
749                         mask->enc_opts.dst_opt_type = TUNNEL_GENEVE_OPT;
750                         option_len = fl_set_geneve_opt(nla_opt_msk, mask,
751                                                        msk_depth, option_len,
752                                                        extack);
753                         if (option_len < 0)
754                                 return option_len;
755
756                         mask->enc_opts.len += option_len;
757                         if (key->enc_opts.len != mask->enc_opts.len) {
758                                 NL_SET_ERR_MSG(extack, "Key and mask miss aligned");
759                                 return -EINVAL;
760                         }
761
762                         if (msk_depth)
763                                 nla_opt_msk = nla_next(nla_opt_msk, &msk_depth);
764                         break;
765                 default:
766                         NL_SET_ERR_MSG(extack, "Unknown tunnel option type");
767                         return -EINVAL;
768                 }
769         }
770
771         return 0;
772 }
773
774 static int fl_set_key(struct net *net, struct nlattr **tb,
775                       struct fl_flow_key *key, struct fl_flow_key *mask,
776                       struct netlink_ext_ack *extack)
777 {
778         __be16 ethertype;
779         int ret = 0;
780 #ifdef CONFIG_NET_CLS_IND
781         if (tb[TCA_FLOWER_INDEV]) {
782                 int err = tcf_change_indev(net, tb[TCA_FLOWER_INDEV], extack);
783                 if (err < 0)
784                         return err;
785                 key->indev_ifindex = err;
786                 mask->indev_ifindex = 0xffffffff;
787         }
788 #endif
789
790         fl_set_key_val(tb, key->eth.dst, TCA_FLOWER_KEY_ETH_DST,
791                        mask->eth.dst, TCA_FLOWER_KEY_ETH_DST_MASK,
792                        sizeof(key->eth.dst));
793         fl_set_key_val(tb, key->eth.src, TCA_FLOWER_KEY_ETH_SRC,
794                        mask->eth.src, TCA_FLOWER_KEY_ETH_SRC_MASK,
795                        sizeof(key->eth.src));
796
797         if (tb[TCA_FLOWER_KEY_ETH_TYPE]) {
798                 ethertype = nla_get_be16(tb[TCA_FLOWER_KEY_ETH_TYPE]);
799
800                 if (eth_type_vlan(ethertype)) {
801                         fl_set_key_vlan(tb, ethertype, TCA_FLOWER_KEY_VLAN_ID,
802                                         TCA_FLOWER_KEY_VLAN_PRIO, &key->vlan,
803                                         &mask->vlan);
804
805                         if (tb[TCA_FLOWER_KEY_VLAN_ETH_TYPE]) {
806                                 ethertype = nla_get_be16(tb[TCA_FLOWER_KEY_VLAN_ETH_TYPE]);
807                                 if (eth_type_vlan(ethertype)) {
808                                         fl_set_key_vlan(tb, ethertype,
809                                                         TCA_FLOWER_KEY_CVLAN_ID,
810                                                         TCA_FLOWER_KEY_CVLAN_PRIO,
811                                                         &key->cvlan, &mask->cvlan);
812                                         fl_set_key_val(tb, &key->basic.n_proto,
813                                                        TCA_FLOWER_KEY_CVLAN_ETH_TYPE,
814                                                        &mask->basic.n_proto,
815                                                        TCA_FLOWER_UNSPEC,
816                                                        sizeof(key->basic.n_proto));
817                                 } else {
818                                         key->basic.n_proto = ethertype;
819                                         mask->basic.n_proto = cpu_to_be16(~0);
820                                 }
821                         }
822                 } else {
823                         key->basic.n_proto = ethertype;
824                         mask->basic.n_proto = cpu_to_be16(~0);
825                 }
826         }
827
828         if (key->basic.n_proto == htons(ETH_P_IP) ||
829             key->basic.n_proto == htons(ETH_P_IPV6)) {
830                 fl_set_key_val(tb, &key->basic.ip_proto, TCA_FLOWER_KEY_IP_PROTO,
831                                &mask->basic.ip_proto, TCA_FLOWER_UNSPEC,
832                                sizeof(key->basic.ip_proto));
833                 fl_set_key_ip(tb, false, &key->ip, &mask->ip);
834         }
835
836         if (tb[TCA_FLOWER_KEY_IPV4_SRC] || tb[TCA_FLOWER_KEY_IPV4_DST]) {
837                 key->control.addr_type = FLOW_DISSECTOR_KEY_IPV4_ADDRS;
838                 mask->control.addr_type = ~0;
839                 fl_set_key_val(tb, &key->ipv4.src, TCA_FLOWER_KEY_IPV4_SRC,
840                                &mask->ipv4.src, TCA_FLOWER_KEY_IPV4_SRC_MASK,
841                                sizeof(key->ipv4.src));
842                 fl_set_key_val(tb, &key->ipv4.dst, TCA_FLOWER_KEY_IPV4_DST,
843                                &mask->ipv4.dst, TCA_FLOWER_KEY_IPV4_DST_MASK,
844                                sizeof(key->ipv4.dst));
845         } else if (tb[TCA_FLOWER_KEY_IPV6_SRC] || tb[TCA_FLOWER_KEY_IPV6_DST]) {
846                 key->control.addr_type = FLOW_DISSECTOR_KEY_IPV6_ADDRS;
847                 mask->control.addr_type = ~0;
848                 fl_set_key_val(tb, &key->ipv6.src, TCA_FLOWER_KEY_IPV6_SRC,
849                                &mask->ipv6.src, TCA_FLOWER_KEY_IPV6_SRC_MASK,
850                                sizeof(key->ipv6.src));
851                 fl_set_key_val(tb, &key->ipv6.dst, TCA_FLOWER_KEY_IPV6_DST,
852                                &mask->ipv6.dst, TCA_FLOWER_KEY_IPV6_DST_MASK,
853                                sizeof(key->ipv6.dst));
854         }
855
856         if (key->basic.ip_proto == IPPROTO_TCP) {
857                 fl_set_key_val(tb, &key->tp.src, TCA_FLOWER_KEY_TCP_SRC,
858                                &mask->tp.src, TCA_FLOWER_KEY_TCP_SRC_MASK,
859                                sizeof(key->tp.src));
860                 fl_set_key_val(tb, &key->tp.dst, TCA_FLOWER_KEY_TCP_DST,
861                                &mask->tp.dst, TCA_FLOWER_KEY_TCP_DST_MASK,
862                                sizeof(key->tp.dst));
863                 fl_set_key_val(tb, &key->tcp.flags, TCA_FLOWER_KEY_TCP_FLAGS,
864                                &mask->tcp.flags, TCA_FLOWER_KEY_TCP_FLAGS_MASK,
865                                sizeof(key->tcp.flags));
866         } else if (key->basic.ip_proto == IPPROTO_UDP) {
867                 fl_set_key_val(tb, &key->tp.src, TCA_FLOWER_KEY_UDP_SRC,
868                                &mask->tp.src, TCA_FLOWER_KEY_UDP_SRC_MASK,
869                                sizeof(key->tp.src));
870                 fl_set_key_val(tb, &key->tp.dst, TCA_FLOWER_KEY_UDP_DST,
871                                &mask->tp.dst, TCA_FLOWER_KEY_UDP_DST_MASK,
872                                sizeof(key->tp.dst));
873         } else if (key->basic.ip_proto == IPPROTO_SCTP) {
874                 fl_set_key_val(tb, &key->tp.src, TCA_FLOWER_KEY_SCTP_SRC,
875                                &mask->tp.src, TCA_FLOWER_KEY_SCTP_SRC_MASK,
876                                sizeof(key->tp.src));
877                 fl_set_key_val(tb, &key->tp.dst, TCA_FLOWER_KEY_SCTP_DST,
878                                &mask->tp.dst, TCA_FLOWER_KEY_SCTP_DST_MASK,
879                                sizeof(key->tp.dst));
880         } else if (key->basic.n_proto == htons(ETH_P_IP) &&
881                    key->basic.ip_proto == IPPROTO_ICMP) {
882                 fl_set_key_val(tb, &key->icmp.type, TCA_FLOWER_KEY_ICMPV4_TYPE,
883                                &mask->icmp.type,
884                                TCA_FLOWER_KEY_ICMPV4_TYPE_MASK,
885                                sizeof(key->icmp.type));
886                 fl_set_key_val(tb, &key->icmp.code, TCA_FLOWER_KEY_ICMPV4_CODE,
887                                &mask->icmp.code,
888                                TCA_FLOWER_KEY_ICMPV4_CODE_MASK,
889                                sizeof(key->icmp.code));
890         } else if (key->basic.n_proto == htons(ETH_P_IPV6) &&
891                    key->basic.ip_proto == IPPROTO_ICMPV6) {
892                 fl_set_key_val(tb, &key->icmp.type, TCA_FLOWER_KEY_ICMPV6_TYPE,
893                                &mask->icmp.type,
894                                TCA_FLOWER_KEY_ICMPV6_TYPE_MASK,
895                                sizeof(key->icmp.type));
896                 fl_set_key_val(tb, &key->icmp.code, TCA_FLOWER_KEY_ICMPV6_CODE,
897                                &mask->icmp.code,
898                                TCA_FLOWER_KEY_ICMPV6_CODE_MASK,
899                                sizeof(key->icmp.code));
900         } else if (key->basic.n_proto == htons(ETH_P_MPLS_UC) ||
901                    key->basic.n_proto == htons(ETH_P_MPLS_MC)) {
902                 ret = fl_set_key_mpls(tb, &key->mpls, &mask->mpls);
903                 if (ret)
904                         return ret;
905         } else if (key->basic.n_proto == htons(ETH_P_ARP) ||
906                    key->basic.n_proto == htons(ETH_P_RARP)) {
907                 fl_set_key_val(tb, &key->arp.sip, TCA_FLOWER_KEY_ARP_SIP,
908                                &mask->arp.sip, TCA_FLOWER_KEY_ARP_SIP_MASK,
909                                sizeof(key->arp.sip));
910                 fl_set_key_val(tb, &key->arp.tip, TCA_FLOWER_KEY_ARP_TIP,
911                                &mask->arp.tip, TCA_FLOWER_KEY_ARP_TIP_MASK,
912                                sizeof(key->arp.tip));
913                 fl_set_key_val(tb, &key->arp.op, TCA_FLOWER_KEY_ARP_OP,
914                                &mask->arp.op, TCA_FLOWER_KEY_ARP_OP_MASK,
915                                sizeof(key->arp.op));
916                 fl_set_key_val(tb, key->arp.sha, TCA_FLOWER_KEY_ARP_SHA,
917                                mask->arp.sha, TCA_FLOWER_KEY_ARP_SHA_MASK,
918                                sizeof(key->arp.sha));
919                 fl_set_key_val(tb, key->arp.tha, TCA_FLOWER_KEY_ARP_THA,
920                                mask->arp.tha, TCA_FLOWER_KEY_ARP_THA_MASK,
921                                sizeof(key->arp.tha));
922         }
923
924         if (tb[TCA_FLOWER_KEY_ENC_IPV4_SRC] ||
925             tb[TCA_FLOWER_KEY_ENC_IPV4_DST]) {
926                 key->enc_control.addr_type = FLOW_DISSECTOR_KEY_IPV4_ADDRS;
927                 mask->enc_control.addr_type = ~0;
928                 fl_set_key_val(tb, &key->enc_ipv4.src,
929                                TCA_FLOWER_KEY_ENC_IPV4_SRC,
930                                &mask->enc_ipv4.src,
931                                TCA_FLOWER_KEY_ENC_IPV4_SRC_MASK,
932                                sizeof(key->enc_ipv4.src));
933                 fl_set_key_val(tb, &key->enc_ipv4.dst,
934                                TCA_FLOWER_KEY_ENC_IPV4_DST,
935                                &mask->enc_ipv4.dst,
936                                TCA_FLOWER_KEY_ENC_IPV4_DST_MASK,
937                                sizeof(key->enc_ipv4.dst));
938         }
939
940         if (tb[TCA_FLOWER_KEY_ENC_IPV6_SRC] ||
941             tb[TCA_FLOWER_KEY_ENC_IPV6_DST]) {
942                 key->enc_control.addr_type = FLOW_DISSECTOR_KEY_IPV6_ADDRS;
943                 mask->enc_control.addr_type = ~0;
944                 fl_set_key_val(tb, &key->enc_ipv6.src,
945                                TCA_FLOWER_KEY_ENC_IPV6_SRC,
946                                &mask->enc_ipv6.src,
947                                TCA_FLOWER_KEY_ENC_IPV6_SRC_MASK,
948                                sizeof(key->enc_ipv6.src));
949                 fl_set_key_val(tb, &key->enc_ipv6.dst,
950                                TCA_FLOWER_KEY_ENC_IPV6_DST,
951                                &mask->enc_ipv6.dst,
952                                TCA_FLOWER_KEY_ENC_IPV6_DST_MASK,
953                                sizeof(key->enc_ipv6.dst));
954         }
955
956         fl_set_key_val(tb, &key->enc_key_id.keyid, TCA_FLOWER_KEY_ENC_KEY_ID,
957                        &mask->enc_key_id.keyid, TCA_FLOWER_UNSPEC,
958                        sizeof(key->enc_key_id.keyid));
959
960         fl_set_key_val(tb, &key->enc_tp.src, TCA_FLOWER_KEY_ENC_UDP_SRC_PORT,
961                        &mask->enc_tp.src, TCA_FLOWER_KEY_ENC_UDP_SRC_PORT_MASK,
962                        sizeof(key->enc_tp.src));
963
964         fl_set_key_val(tb, &key->enc_tp.dst, TCA_FLOWER_KEY_ENC_UDP_DST_PORT,
965                        &mask->enc_tp.dst, TCA_FLOWER_KEY_ENC_UDP_DST_PORT_MASK,
966                        sizeof(key->enc_tp.dst));
967
968         fl_set_key_ip(tb, true, &key->enc_ip, &mask->enc_ip);
969
970         if (tb[TCA_FLOWER_KEY_ENC_OPTS]) {
971                 ret = fl_set_enc_opt(tb, key, mask, extack);
972                 if (ret)
973                         return ret;
974         }
975
976         if (tb[TCA_FLOWER_KEY_FLAGS])
977                 ret = fl_set_key_flags(tb, &key->control.flags, &mask->control.flags);
978
979         return ret;
980 }
981
982 static void fl_mask_copy(struct fl_flow_mask *dst,
983                          struct fl_flow_mask *src)
984 {
985         const void *psrc = fl_key_get_start(&src->key, src);
986         void *pdst = fl_key_get_start(&dst->key, src);
987
988         memcpy(pdst, psrc, fl_mask_range(src));
989         dst->range = src->range;
990 }
991
992 static const struct rhashtable_params fl_ht_params = {
993         .key_offset = offsetof(struct cls_fl_filter, mkey), /* base offset */
994         .head_offset = offsetof(struct cls_fl_filter, ht_node),
995         .automatic_shrinking = true,
996 };
997
998 static int fl_init_mask_hashtable(struct fl_flow_mask *mask)
999 {
1000         mask->filter_ht_params = fl_ht_params;
1001         mask->filter_ht_params.key_len = fl_mask_range(mask);
1002         mask->filter_ht_params.key_offset += mask->range.start;
1003
1004         return rhashtable_init(&mask->ht, &mask->filter_ht_params);
1005 }
1006
/* Byte offset and size of @member inside struct fl_flow_key. */
#define FL_KEY_MEMBER_OFFSET(member) offsetof(struct fl_flow_key, member)
#define FL_KEY_MEMBER_SIZE(member) FIELD_SIZEOF(struct fl_flow_key, member)

/*
 * Evaluates to a non-NULL pointer when at least one byte of @member inside
 * the key pointed to by @mask is non-zero, and to NULL otherwise.
 */
#define FL_KEY_IS_MASKED(mask, member)						\
	memchr_inv(((char *)(mask)) + FL_KEY_MEMBER_OFFSET(member),		\
		   0, FL_KEY_MEMBER_SIZE(member))

/*
 * Append a dissector key description for @member to @keys and advance @cnt.
 *
 * The expansion deliberately has no trailing semicolon: the caller supplies
 * it, so the macro behaves like a single statement and can be used in an
 * un-braced if/else.
 */
#define FL_KEY_SET(keys, cnt, id, member)					\
	do {									\
		(keys)[(cnt)].key_id = (id);					\
		(keys)[(cnt)].offset = FL_KEY_MEMBER_OFFSET(member);		\
		(cnt)++;							\
	} while (0)

/* Same as FL_KEY_SET(), but only when @member is non-zero in @mask. */
#define FL_KEY_SET_IF_MASKED(mask, keys, cnt, id, member)			\
	do {									\
		if (FL_KEY_IS_MASKED(mask, member))				\
			FL_KEY_SET(keys, cnt, id, member);			\
	} while (0)
1026
1027 static void fl_init_dissector(struct flow_dissector *dissector,
1028                               struct fl_flow_key *mask)
1029 {
1030         struct flow_dissector_key keys[FLOW_DISSECTOR_KEY_MAX];
1031         size_t cnt = 0;
1032
1033         FL_KEY_SET(keys, cnt, FLOW_DISSECTOR_KEY_CONTROL, control);
1034         FL_KEY_SET(keys, cnt, FLOW_DISSECTOR_KEY_BASIC, basic);
1035         FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1036                              FLOW_DISSECTOR_KEY_ETH_ADDRS, eth);
1037         FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1038                              FLOW_DISSECTOR_KEY_IPV4_ADDRS, ipv4);
1039         FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1040                              FLOW_DISSECTOR_KEY_IPV6_ADDRS, ipv6);
1041         FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1042                              FLOW_DISSECTOR_KEY_PORTS, tp);
1043         FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1044                              FLOW_DISSECTOR_KEY_IP, ip);
1045         FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1046                              FLOW_DISSECTOR_KEY_TCP, tcp);
1047         FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1048                              FLOW_DISSECTOR_KEY_ICMP, icmp);
1049         FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1050                              FLOW_DISSECTOR_KEY_ARP, arp);
1051         FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1052                              FLOW_DISSECTOR_KEY_MPLS, mpls);
1053         FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1054                              FLOW_DISSECTOR_KEY_VLAN, vlan);
1055         FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1056                              FLOW_DISSECTOR_KEY_CVLAN, cvlan);
1057         FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1058                              FLOW_DISSECTOR_KEY_ENC_KEYID, enc_key_id);
1059         FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1060                              FLOW_DISSECTOR_KEY_ENC_IPV4_ADDRS, enc_ipv4);
1061         FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1062                              FLOW_DISSECTOR_KEY_ENC_IPV6_ADDRS, enc_ipv6);
1063         if (FL_KEY_IS_MASKED(mask, enc_ipv4) ||
1064             FL_KEY_IS_MASKED(mask, enc_ipv6))
1065                 FL_KEY_SET(keys, cnt, FLOW_DISSECTOR_KEY_ENC_CONTROL,
1066                            enc_control);
1067         FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1068                              FLOW_DISSECTOR_KEY_ENC_PORTS, enc_tp);
1069         FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1070                              FLOW_DISSECTOR_KEY_ENC_IP, enc_ip);
1071         FL_KEY_SET_IF_MASKED(mask, keys, cnt,
1072                              FLOW_DISSECTOR_KEY_ENC_OPTS, enc_opts);
1073
1074         skb_flow_dissector_init(dissector, keys, cnt);
1075 }
1076
1077 static struct fl_flow_mask *fl_create_new_mask(struct cls_fl_head *head,
1078                                                struct fl_flow_mask *mask)
1079 {
1080         struct fl_flow_mask *newmask;
1081         int err;
1082
1083         newmask = kzalloc(sizeof(*newmask), GFP_KERNEL);
1084         if (!newmask)
1085                 return ERR_PTR(-ENOMEM);
1086
1087         fl_mask_copy(newmask, mask);
1088
1089         err = fl_init_mask_hashtable(newmask);
1090         if (err)
1091                 goto errout_free;
1092
1093         fl_init_dissector(&newmask->dissector, &newmask->key);
1094
1095         INIT_LIST_HEAD_RCU(&newmask->filters);
1096
1097         err = rhashtable_insert_fast(&head->ht, &newmask->ht_node,
1098                                      mask_ht_params);
1099         if (err)
1100                 goto errout_destroy;
1101
1102         list_add_tail_rcu(&newmask->list, &head->masks);
1103
1104         return newmask;
1105
1106 errout_destroy:
1107         rhashtable_destroy(&newmask->ht);
1108 errout_free:
1109         kfree(newmask);
1110
1111         return ERR_PTR(err);
1112 }
1113
1114 static int fl_check_assign_mask(struct cls_fl_head *head,
1115                                 struct cls_fl_filter *fnew,
1116                                 struct cls_fl_filter *fold,
1117                                 struct fl_flow_mask *mask)
1118 {
1119         struct fl_flow_mask *newmask;
1120
1121         fnew->mask = rhashtable_lookup_fast(&head->ht, mask, mask_ht_params);
1122         if (!fnew->mask) {
1123                 if (fold)
1124                         return -EINVAL;
1125
1126                 newmask = fl_create_new_mask(head, mask);
1127                 if (IS_ERR(newmask))
1128                         return PTR_ERR(newmask);
1129
1130                 fnew->mask = newmask;
1131         } else if (fold && fold->mask != fnew->mask) {
1132                 return -EINVAL;
1133         }
1134
1135         return 0;
1136 }
1137
1138 static int fl_set_parms(struct net *net, struct tcf_proto *tp,
1139                         struct cls_fl_filter *f, struct fl_flow_mask *mask,
1140                         unsigned long base, struct nlattr **tb,
1141                         struct nlattr *est, bool ovr,
1142                         struct fl_flow_tmplt *tmplt,
1143                         struct netlink_ext_ack *extack)
1144 {
1145         int err;
1146
1147         err = tcf_exts_validate(net, tp, tb, est, &f->exts, ovr, extack);
1148         if (err < 0)
1149                 return err;
1150
1151         if (tb[TCA_FLOWER_CLASSID]) {
1152                 f->res.classid = nla_get_u32(tb[TCA_FLOWER_CLASSID]);
1153                 tcf_bind_filter(tp, &f->res, base);
1154         }
1155
1156         err = fl_set_key(net, tb, &f->key, &mask->key, extack);
1157         if (err)
1158                 return err;
1159
1160         fl_mask_update_range(mask);
1161         fl_set_masked_key(&f->mkey, &f->key, mask);
1162
1163         if (!fl_mask_fits_tmplt(tmplt, mask)) {
1164                 NL_SET_ERR_MSG_MOD(extack, "Mask does not fit the template");
1165                 return -EINVAL;
1166         }
1167
1168         return 0;
1169 }
1170
1171 static int fl_change(struct net *net, struct sk_buff *in_skb,
1172                      struct tcf_proto *tp, unsigned long base,
1173                      u32 handle, struct nlattr **tca,
1174                      void **arg, bool ovr, struct netlink_ext_ack *extack)
1175 {
1176         struct cls_fl_head *head = rtnl_dereference(tp->root);
1177         struct cls_fl_filter *fold = *arg;
1178         struct cls_fl_filter *fnew;
1179         struct nlattr **tb;
1180         struct fl_flow_mask mask = {};
1181         int err;
1182
1183         if (!tca[TCA_OPTIONS])
1184                 return -EINVAL;
1185
1186         tb = kcalloc(TCA_FLOWER_MAX + 1, sizeof(struct nlattr *), GFP_KERNEL);
1187         if (!tb)
1188                 return -ENOBUFS;
1189
1190         err = nla_parse_nested(tb, TCA_FLOWER_MAX, tca[TCA_OPTIONS],
1191                                fl_policy, NULL);
1192         if (err < 0)
1193                 goto errout_tb;
1194
1195         if (fold && handle && fold->handle != handle) {
1196                 err = -EINVAL;
1197                 goto errout_tb;
1198         }
1199
1200         fnew = kzalloc(sizeof(*fnew), GFP_KERNEL);
1201         if (!fnew) {
1202                 err = -ENOBUFS;
1203                 goto errout_tb;
1204         }
1205
1206         err = tcf_exts_init(&fnew->exts, TCA_FLOWER_ACT, 0);
1207         if (err < 0)
1208                 goto errout;
1209
1210         if (!handle) {
1211                 handle = 1;
1212                 err = idr_alloc_u32(&head->handle_idr, fnew, &handle,
1213                                     INT_MAX, GFP_KERNEL);
1214         } else if (!fold) {
1215                 /* user specifies a handle and it doesn't exist */
1216                 err = idr_alloc_u32(&head->handle_idr, fnew, &handle,
1217                                     handle, GFP_KERNEL);
1218         }
1219         if (err)
1220                 goto errout;
1221         fnew->handle = handle;
1222
1223         if (tb[TCA_FLOWER_FLAGS]) {
1224                 fnew->flags = nla_get_u32(tb[TCA_FLOWER_FLAGS]);
1225
1226                 if (!tc_flags_valid(fnew->flags)) {
1227                         err = -EINVAL;
1228                         goto errout_idr;
1229                 }
1230         }
1231
1232         err = fl_set_parms(net, tp, fnew, &mask, base, tb, tca[TCA_RATE], ovr,
1233                            tp->chain->tmplt_priv, extack);
1234         if (err)
1235                 goto errout_idr;
1236
1237         err = fl_check_assign_mask(head, fnew, fold, &mask);
1238         if (err)
1239                 goto errout_idr;
1240
1241         if (!fold && fl_lookup(fnew->mask, &fnew->mkey)) {
1242                 err = -EEXIST;
1243                 goto errout_mask;
1244         }
1245
1246         err = rhashtable_insert_fast(&fnew->mask->ht, &fnew->ht_node,
1247                                      fnew->mask->filter_ht_params);
1248         if (err)
1249                 goto errout_mask;
1250
1251         if (!tc_skip_hw(fnew->flags)) {
1252                 err = fl_hw_replace_filter(tp, fnew, extack);
1253                 if (err)
1254                         goto errout_mask;
1255         }
1256
1257         if (!tc_in_hw(fnew->flags))
1258                 fnew->flags |= TCA_CLS_FLAGS_NOT_IN_HW;
1259
1260         if (fold) {
1261                 rhashtable_remove_fast(&fold->mask->ht,
1262                                        &fold->ht_node,
1263                                        fold->mask->filter_ht_params);
1264                 if (!tc_skip_hw(fold->flags))
1265                         fl_hw_destroy_filter(tp, fold, NULL);
1266         }
1267
1268         *arg = fnew;
1269
1270         if (fold) {
1271                 idr_replace(&head->handle_idr, fnew, fnew->handle);
1272                 list_replace_rcu(&fold->list, &fnew->list);
1273                 tcf_unbind_filter(tp, &fold->res);
1274                 tcf_exts_get_net(&fold->exts);
1275                 tcf_queue_work(&fold->rwork, fl_destroy_filter_work);
1276         } else {
1277                 list_add_tail_rcu(&fnew->list, &fnew->mask->filters);
1278         }
1279
1280         kfree(tb);
1281         return 0;
1282
1283 errout_mask:
1284         fl_mask_put(head, fnew->mask, false);
1285
1286 errout_idr:
1287         if (!fold)
1288                 idr_remove(&head->handle_idr, fnew->handle);
1289 errout:
1290         tcf_exts_destroy(&fnew->exts);
1291         kfree(fnew);
1292 errout_tb:
1293         kfree(tb);
1294         return err;
1295 }
1296
1297 static int fl_delete(struct tcf_proto *tp, void *arg, bool *last,
1298                      struct netlink_ext_ack *extack)
1299 {
1300         struct cls_fl_head *head = rtnl_dereference(tp->root);
1301         struct cls_fl_filter *f = arg;
1302
1303         rhashtable_remove_fast(&f->mask->ht, &f->ht_node,
1304                                f->mask->filter_ht_params);
1305         __fl_delete(tp, f, extack);
1306         *last = list_empty(&head->masks);
1307         return 0;
1308 }
1309
1310 static void fl_walk(struct tcf_proto *tp, struct tcf_walker *arg)
1311 {
1312         struct cls_fl_head *head = rtnl_dereference(tp->root);
1313         struct cls_fl_filter *f;
1314
1315         arg->count = arg->skip;
1316
1317         while ((f = idr_get_next_ul(&head->handle_idr,
1318                                     &arg->cookie)) != NULL) {
1319                 if (arg->fn(tp, f, arg) < 0) {
1320                         arg->stop = 1;
1321                         break;
1322                 }
1323                 arg->cookie = f->handle + 1;
1324                 arg->count++;
1325         }
1326 }
1327
1328 static int fl_reoffload(struct tcf_proto *tp, bool add, tc_setup_cb_t *cb,
1329                         void *cb_priv, struct netlink_ext_ack *extack)
1330 {
1331         struct cls_fl_head *head = rtnl_dereference(tp->root);
1332         struct tc_cls_flower_offload cls_flower = {};
1333         struct tcf_block *block = tp->chain->block;
1334         struct fl_flow_mask *mask;
1335         struct cls_fl_filter *f;
1336         int err;
1337
1338         list_for_each_entry(mask, &head->masks, list) {
1339                 list_for_each_entry(f, &mask->filters, list) {
1340                         if (tc_skip_hw(f->flags))
1341                                 continue;
1342
1343                         tc_cls_common_offload_init(&cls_flower.common, tp,
1344                                                    f->flags, extack);
1345                         cls_flower.command = add ?
1346                                 TC_CLSFLOWER_REPLACE : TC_CLSFLOWER_DESTROY;
1347                         cls_flower.cookie = (unsigned long)f;
1348                         cls_flower.dissector = &mask->dissector;
1349                         cls_flower.mask = &mask->key;
1350                         cls_flower.key = &f->mkey;
1351                         cls_flower.exts = &f->exts;
1352                         cls_flower.classid = f->res.classid;
1353
1354                         err = cb(TC_SETUP_CLSFLOWER, &cls_flower, cb_priv);
1355                         if (err) {
1356                                 if (add && tc_skip_sw(f->flags))
1357                                         return err;
1358                                 continue;
1359                         }
1360
1361                         tc_cls_offload_cnt_update(block, &f->in_hw_count,
1362                                                   &f->flags, add);
1363                 }
1364         }
1365
1366         return 0;
1367 }
1368
1369 static void fl_hw_create_tmplt(struct tcf_chain *chain,
1370                                struct fl_flow_tmplt *tmplt)
1371 {
1372         struct tc_cls_flower_offload cls_flower = {};
1373         struct tcf_block *block = chain->block;
1374         struct tcf_exts dummy_exts = { 0, };
1375
1376         cls_flower.common.chain_index = chain->index;
1377         cls_flower.command = TC_CLSFLOWER_TMPLT_CREATE;
1378         cls_flower.cookie = (unsigned long) tmplt;
1379         cls_flower.dissector = &tmplt->dissector;
1380         cls_flower.mask = &tmplt->mask;
1381         cls_flower.key = &tmplt->dummy_key;
1382         cls_flower.exts = &dummy_exts;
1383
1384         /* We don't care if driver (any of them) fails to handle this
1385          * call. It serves just as a hint for it.
1386          */
1387         tc_setup_cb_call(block, NULL, TC_SETUP_CLSFLOWER,
1388                          &cls_flower, false);
1389 }
1390
1391 static void fl_hw_destroy_tmplt(struct tcf_chain *chain,
1392                                 struct fl_flow_tmplt *tmplt)
1393 {
1394         struct tc_cls_flower_offload cls_flower = {};
1395         struct tcf_block *block = chain->block;
1396
1397         cls_flower.common.chain_index = chain->index;
1398         cls_flower.command = TC_CLSFLOWER_TMPLT_DESTROY;
1399         cls_flower.cookie = (unsigned long) tmplt;
1400
1401         tc_setup_cb_call(block, NULL, TC_SETUP_CLSFLOWER,
1402                          &cls_flower, false);
1403 }
1404
1405 static void *fl_tmplt_create(struct net *net, struct tcf_chain *chain,
1406                              struct nlattr **tca,
1407                              struct netlink_ext_ack *extack)
1408 {
1409         struct fl_flow_tmplt *tmplt;
1410         struct nlattr **tb;
1411         int err;
1412
1413         if (!tca[TCA_OPTIONS])
1414                 return ERR_PTR(-EINVAL);
1415
1416         tb = kcalloc(TCA_FLOWER_MAX + 1, sizeof(struct nlattr *), GFP_KERNEL);
1417         if (!tb)
1418                 return ERR_PTR(-ENOBUFS);
1419         err = nla_parse_nested(tb, TCA_FLOWER_MAX, tca[TCA_OPTIONS],
1420                                fl_policy, NULL);
1421         if (err)
1422                 goto errout_tb;
1423
1424         tmplt = kzalloc(sizeof(*tmplt), GFP_KERNEL);
1425         if (!tmplt) {
1426                 err = -ENOMEM;
1427                 goto errout_tb;
1428         }
1429         tmplt->chain = chain;
1430         err = fl_set_key(net, tb, &tmplt->dummy_key, &tmplt->mask, extack);
1431         if (err)
1432                 goto errout_tmplt;
1433         kfree(tb);
1434
1435         fl_init_dissector(&tmplt->dissector, &tmplt->mask);
1436
1437         fl_hw_create_tmplt(chain, tmplt);
1438
1439         return tmplt;
1440
1441 errout_tmplt:
1442         kfree(tmplt);
1443 errout_tb:
1444         kfree(tb);
1445         return ERR_PTR(err);
1446 }
1447
1448 static void fl_tmplt_destroy(void *tmplt_priv)
1449 {
1450         struct fl_flow_tmplt *tmplt = tmplt_priv;
1451
1452         fl_hw_destroy_tmplt(tmplt->chain, tmplt);
1453         kfree(tmplt);
1454 }
1455
1456 static int fl_dump_key_val(struct sk_buff *skb,
1457                            void *val, int val_type,
1458                            void *mask, int mask_type, int len)
1459 {
1460         int err;
1461
1462         if (!memchr_inv(mask, 0, len))
1463                 return 0;
1464         err = nla_put(skb, val_type, len, val);
1465         if (err)
1466                 return err;
1467         if (mask_type != TCA_FLOWER_UNSPEC) {
1468                 err = nla_put(skb, mask_type, len, mask);
1469                 if (err)
1470                         return err;
1471         }
1472         return 0;
1473 }
1474
1475 static int fl_dump_key_mpls(struct sk_buff *skb,
1476                             struct flow_dissector_key_mpls *mpls_key,
1477                             struct flow_dissector_key_mpls *mpls_mask)
1478 {
1479         int err;
1480
1481         if (!memchr_inv(mpls_mask, 0, sizeof(*mpls_mask)))
1482                 return 0;
1483         if (mpls_mask->mpls_ttl) {
1484                 err = nla_put_u8(skb, TCA_FLOWER_KEY_MPLS_TTL,
1485                                  mpls_key->mpls_ttl);
1486                 if (err)
1487                         return err;
1488         }
1489         if (mpls_mask->mpls_tc) {
1490                 err = nla_put_u8(skb, TCA_FLOWER_KEY_MPLS_TC,
1491                                  mpls_key->mpls_tc);
1492                 if (err)
1493                         return err;
1494         }
1495         if (mpls_mask->mpls_label) {
1496                 err = nla_put_u32(skb, TCA_FLOWER_KEY_MPLS_LABEL,
1497                                   mpls_key->mpls_label);
1498                 if (err)
1499                         return err;
1500         }
1501         if (mpls_mask->mpls_bos) {
1502                 err = nla_put_u8(skb, TCA_FLOWER_KEY_MPLS_BOS,
1503                                  mpls_key->mpls_bos);
1504                 if (err)
1505                         return err;
1506         }
1507         return 0;
1508 }
1509
1510 static int fl_dump_key_ip(struct sk_buff *skb, bool encap,
1511                           struct flow_dissector_key_ip *key,
1512                           struct flow_dissector_key_ip *mask)
1513 {
1514         int tos_key = encap ? TCA_FLOWER_KEY_ENC_IP_TOS : TCA_FLOWER_KEY_IP_TOS;
1515         int ttl_key = encap ? TCA_FLOWER_KEY_ENC_IP_TTL : TCA_FLOWER_KEY_IP_TTL;
1516         int tos_mask = encap ? TCA_FLOWER_KEY_ENC_IP_TOS_MASK : TCA_FLOWER_KEY_IP_TOS_MASK;
1517         int ttl_mask = encap ? TCA_FLOWER_KEY_ENC_IP_TTL_MASK : TCA_FLOWER_KEY_IP_TTL_MASK;
1518
1519         if (fl_dump_key_val(skb, &key->tos, tos_key, &mask->tos, tos_mask, sizeof(key->tos)) ||
1520             fl_dump_key_val(skb, &key->ttl, ttl_key, &mask->ttl, ttl_mask, sizeof(key->ttl)))
1521                 return -1;
1522
1523         return 0;
1524 }
1525
1526 static int fl_dump_key_vlan(struct sk_buff *skb,
1527                             int vlan_id_key, int vlan_prio_key,
1528                             struct flow_dissector_key_vlan *vlan_key,
1529                             struct flow_dissector_key_vlan *vlan_mask)
1530 {
1531         int err;
1532
1533         if (!memchr_inv(vlan_mask, 0, sizeof(*vlan_mask)))
1534                 return 0;
1535         if (vlan_mask->vlan_id) {
1536                 err = nla_put_u16(skb, vlan_id_key,
1537                                   vlan_key->vlan_id);
1538                 if (err)
1539                         return err;
1540         }
1541         if (vlan_mask->vlan_priority) {
1542                 err = nla_put_u8(skb, vlan_prio_key,
1543                                  vlan_key->vlan_priority);
1544                 if (err)
1545                         return err;
1546         }
1547         return 0;
1548 }
1549
1550 static void fl_get_key_flag(u32 dissector_key, u32 dissector_mask,
1551                             u32 *flower_key, u32 *flower_mask,
1552                             u32 flower_flag_bit, u32 dissector_flag_bit)
1553 {
1554         if (dissector_mask & dissector_flag_bit) {
1555                 *flower_mask |= flower_flag_bit;
1556                 if (dissector_key & dissector_flag_bit)
1557                         *flower_key |= flower_flag_bit;
1558         }
1559 }
1560
1561 static int fl_dump_key_flags(struct sk_buff *skb, u32 flags_key, u32 flags_mask)
1562 {
1563         u32 key, mask;
1564         __be32 _key, _mask;
1565         int err;
1566
1567         if (!memchr_inv(&flags_mask, 0, sizeof(flags_mask)))
1568                 return 0;
1569
1570         key = 0;
1571         mask = 0;
1572
1573         fl_get_key_flag(flags_key, flags_mask, &key, &mask,
1574                         TCA_FLOWER_KEY_FLAGS_IS_FRAGMENT, FLOW_DIS_IS_FRAGMENT);
1575         fl_get_key_flag(flags_key, flags_mask, &key, &mask,
1576                         TCA_FLOWER_KEY_FLAGS_FRAG_IS_FIRST,
1577                         FLOW_DIS_FIRST_FRAG);
1578
1579         _key = cpu_to_be32(key);
1580         _mask = cpu_to_be32(mask);
1581
1582         err = nla_put(skb, TCA_FLOWER_KEY_FLAGS, 4, &_key);
1583         if (err)
1584                 return err;
1585
1586         return nla_put(skb, TCA_FLOWER_KEY_FLAGS_MASK, 4, &_mask);
1587 }
1588
1589 static int fl_dump_key_geneve_opt(struct sk_buff *skb,
1590                                   struct flow_dissector_key_enc_opts *enc_opts)
1591 {
1592         struct geneve_opt *opt;
1593         struct nlattr *nest;
1594         int opt_off = 0;
1595
1596         nest = nla_nest_start(skb, TCA_FLOWER_KEY_ENC_OPTS_GENEVE);
1597         if (!nest)
1598                 goto nla_put_failure;
1599
1600         while (enc_opts->len > opt_off) {
1601                 opt = (struct geneve_opt *)&enc_opts->data[opt_off];
1602
1603                 if (nla_put_be16(skb, TCA_FLOWER_KEY_ENC_OPT_GENEVE_CLASS,
1604                                  opt->opt_class))
1605                         goto nla_put_failure;
1606                 if (nla_put_u8(skb, TCA_FLOWER_KEY_ENC_OPT_GENEVE_TYPE,
1607                                opt->type))
1608                         goto nla_put_failure;
1609                 if (nla_put(skb, TCA_FLOWER_KEY_ENC_OPT_GENEVE_DATA,
1610                             opt->length * 4, opt->opt_data))
1611                         goto nla_put_failure;
1612
1613                 opt_off += sizeof(struct geneve_opt) + opt->length * 4;
1614         }
1615         nla_nest_end(skb, nest);
1616         return 0;
1617
1618 nla_put_failure:
1619         nla_nest_cancel(skb, nest);
1620         return -EMSGSIZE;
1621 }
1622
1623 static int fl_dump_key_options(struct sk_buff *skb, int enc_opt_type,
1624                                struct flow_dissector_key_enc_opts *enc_opts)
1625 {
1626         struct nlattr *nest;
1627         int err;
1628
1629         if (!enc_opts->len)
1630                 return 0;
1631
1632         nest = nla_nest_start(skb, enc_opt_type);
1633         if (!nest)
1634                 goto nla_put_failure;
1635
1636         switch (enc_opts->dst_opt_type) {
1637         case TUNNEL_GENEVE_OPT:
1638                 err = fl_dump_key_geneve_opt(skb, enc_opts);
1639                 if (err)
1640                         goto nla_put_failure;
1641                 break;
1642         default:
1643                 goto nla_put_failure;
1644         }
1645         nla_nest_end(skb, nest);
1646         return 0;
1647
1648 nla_put_failure:
1649         nla_nest_cancel(skb, nest);
1650         return -EMSGSIZE;
1651 }
1652
1653 static int fl_dump_key_enc_opt(struct sk_buff *skb,
1654                                struct flow_dissector_key_enc_opts *key_opts,
1655                                struct flow_dissector_key_enc_opts *msk_opts)
1656 {
1657         int err;
1658
1659         err = fl_dump_key_options(skb, TCA_FLOWER_KEY_ENC_OPTS, key_opts);
1660         if (err)
1661                 return err;
1662
1663         return fl_dump_key_options(skb, TCA_FLOWER_KEY_ENC_OPTS_MASK, msk_opts);
1664 }
1665
1666 static int fl_dump_key(struct sk_buff *skb, struct net *net,
1667                        struct fl_flow_key *key, struct fl_flow_key *mask)
1668 {
1669         if (mask->indev_ifindex) {
1670                 struct net_device *dev;
1671
1672                 dev = __dev_get_by_index(net, key->indev_ifindex);
1673                 if (dev && nla_put_string(skb, TCA_FLOWER_INDEV, dev->name))
1674                         goto nla_put_failure;
1675         }
1676
1677         if (fl_dump_key_val(skb, key->eth.dst, TCA_FLOWER_KEY_ETH_DST,
1678                             mask->eth.dst, TCA_FLOWER_KEY_ETH_DST_MASK,
1679                             sizeof(key->eth.dst)) ||
1680             fl_dump_key_val(skb, key->eth.src, TCA_FLOWER_KEY_ETH_SRC,
1681                             mask->eth.src, TCA_FLOWER_KEY_ETH_SRC_MASK,
1682                             sizeof(key->eth.src)) ||
1683             fl_dump_key_val(skb, &key->basic.n_proto, TCA_FLOWER_KEY_ETH_TYPE,
1684                             &mask->basic.n_proto, TCA_FLOWER_UNSPEC,
1685                             sizeof(key->basic.n_proto)))
1686                 goto nla_put_failure;
1687
1688         if (fl_dump_key_mpls(skb, &key->mpls, &mask->mpls))
1689                 goto nla_put_failure;
1690
1691         if (fl_dump_key_vlan(skb, TCA_FLOWER_KEY_VLAN_ID,
1692                              TCA_FLOWER_KEY_VLAN_PRIO, &key->vlan, &mask->vlan))
1693                 goto nla_put_failure;
1694
1695         if (fl_dump_key_vlan(skb, TCA_FLOWER_KEY_CVLAN_ID,
1696                              TCA_FLOWER_KEY_CVLAN_PRIO,
1697                              &key->cvlan, &mask->cvlan) ||
1698             (mask->cvlan.vlan_tpid &&
1699              nla_put_be16(skb, TCA_FLOWER_KEY_VLAN_ETH_TYPE,
1700                           key->cvlan.vlan_tpid)))
1701                 goto nla_put_failure;
1702
1703         if (mask->basic.n_proto) {
1704                 if (mask->cvlan.vlan_tpid) {
1705                         if (nla_put_be16(skb, TCA_FLOWER_KEY_CVLAN_ETH_TYPE,
1706                                          key->basic.n_proto))
1707                                 goto nla_put_failure;
1708                 } else if (mask->vlan.vlan_tpid) {
1709                         if (nla_put_be16(skb, TCA_FLOWER_KEY_VLAN_ETH_TYPE,
1710                                          key->basic.n_proto))
1711                                 goto nla_put_failure;
1712                 }
1713         }
1714
1715         if ((key->basic.n_proto == htons(ETH_P_IP) ||
1716              key->basic.n_proto == htons(ETH_P_IPV6)) &&
1717             (fl_dump_key_val(skb, &key->basic.ip_proto, TCA_FLOWER_KEY_IP_PROTO,
1718                             &mask->basic.ip_proto, TCA_FLOWER_UNSPEC,
1719                             sizeof(key->basic.ip_proto)) ||
1720             fl_dump_key_ip(skb, false, &key->ip, &mask->ip)))
1721                 goto nla_put_failure;
1722
1723         if (key->control.addr_type == FLOW_DISSECTOR_KEY_IPV4_ADDRS &&
1724             (fl_dump_key_val(skb, &key->ipv4.src, TCA_FLOWER_KEY_IPV4_SRC,
1725                              &mask->ipv4.src, TCA_FLOWER_KEY_IPV4_SRC_MASK,
1726                              sizeof(key->ipv4.src)) ||
1727              fl_dump_key_val(skb, &key->ipv4.dst, TCA_FLOWER_KEY_IPV4_DST,
1728                              &mask->ipv4.dst, TCA_FLOWER_KEY_IPV4_DST_MASK,
1729                              sizeof(key->ipv4.dst))))
1730                 goto nla_put_failure;
1731         else if (key->control.addr_type == FLOW_DISSECTOR_KEY_IPV6_ADDRS &&
1732                  (fl_dump_key_val(skb, &key->ipv6.src, TCA_FLOWER_KEY_IPV6_SRC,
1733                                   &mask->ipv6.src, TCA_FLOWER_KEY_IPV6_SRC_MASK,
1734                                   sizeof(key->ipv6.src)) ||
1735                   fl_dump_key_val(skb, &key->ipv6.dst, TCA_FLOWER_KEY_IPV6_DST,
1736                                   &mask->ipv6.dst, TCA_FLOWER_KEY_IPV6_DST_MASK,
1737                                   sizeof(key->ipv6.dst))))
1738                 goto nla_put_failure;
1739
1740         if (key->basic.ip_proto == IPPROTO_TCP &&
1741             (fl_dump_key_val(skb, &key->tp.src, TCA_FLOWER_KEY_TCP_SRC,
1742                              &mask->tp.src, TCA_FLOWER_KEY_TCP_SRC_MASK,
1743                              sizeof(key->tp.src)) ||
1744              fl_dump_key_val(skb, &key->tp.dst, TCA_FLOWER_KEY_TCP_DST,
1745                              &mask->tp.dst, TCA_FLOWER_KEY_TCP_DST_MASK,
1746                              sizeof(key->tp.dst)) ||
1747              fl_dump_key_val(skb, &key->tcp.flags, TCA_FLOWER_KEY_TCP_FLAGS,
1748                              &mask->tcp.flags, TCA_FLOWER_KEY_TCP_FLAGS_MASK,
1749                              sizeof(key->tcp.flags))))
1750                 goto nla_put_failure;
1751         else if (key->basic.ip_proto == IPPROTO_UDP &&
1752                  (fl_dump_key_val(skb, &key->tp.src, TCA_FLOWER_KEY_UDP_SRC,
1753                                   &mask->tp.src, TCA_FLOWER_KEY_UDP_SRC_MASK,
1754                                   sizeof(key->tp.src)) ||
1755                   fl_dump_key_val(skb, &key->tp.dst, TCA_FLOWER_KEY_UDP_DST,
1756                                   &mask->tp.dst, TCA_FLOWER_KEY_UDP_DST_MASK,
1757                                   sizeof(key->tp.dst))))
1758                 goto nla_put_failure;
1759         else if (key->basic.ip_proto == IPPROTO_SCTP &&
1760                  (fl_dump_key_val(skb, &key->tp.src, TCA_FLOWER_KEY_SCTP_SRC,
1761                                   &mask->tp.src, TCA_FLOWER_KEY_SCTP_SRC_MASK,
1762                                   sizeof(key->tp.src)) ||
1763                   fl_dump_key_val(skb, &key->tp.dst, TCA_FLOWER_KEY_SCTP_DST,
1764                                   &mask->tp.dst, TCA_FLOWER_KEY_SCTP_DST_MASK,
1765                                   sizeof(key->tp.dst))))
1766                 goto nla_put_failure;
1767         else if (key->basic.n_proto == htons(ETH_P_IP) &&
1768                  key->basic.ip_proto == IPPROTO_ICMP &&
1769                  (fl_dump_key_val(skb, &key->icmp.type,
1770                                   TCA_FLOWER_KEY_ICMPV4_TYPE, &mask->icmp.type,
1771                                   TCA_FLOWER_KEY_ICMPV4_TYPE_MASK,
1772                                   sizeof(key->icmp.type)) ||
1773                   fl_dump_key_val(skb, &key->icmp.code,
1774                                   TCA_FLOWER_KEY_ICMPV4_CODE, &mask->icmp.code,
1775                                   TCA_FLOWER_KEY_ICMPV4_CODE_MASK,
1776                                   sizeof(key->icmp.code))))
1777                 goto nla_put_failure;
1778         else if (key->basic.n_proto == htons(ETH_P_IPV6) &&
1779                  key->basic.ip_proto == IPPROTO_ICMPV6 &&
1780                  (fl_dump_key_val(skb, &key->icmp.type,
1781                                   TCA_FLOWER_KEY_ICMPV6_TYPE, &mask->icmp.type,
1782                                   TCA_FLOWER_KEY_ICMPV6_TYPE_MASK,
1783                                   sizeof(key->icmp.type)) ||
1784                   fl_dump_key_val(skb, &key->icmp.code,
1785                                   TCA_FLOWER_KEY_ICMPV6_CODE, &mask->icmp.code,
1786                                   TCA_FLOWER_KEY_ICMPV6_CODE_MASK,
1787                                   sizeof(key->icmp.code))))
1788                 goto nla_put_failure;
1789         else if ((key->basic.n_proto == htons(ETH_P_ARP) ||
1790                   key->basic.n_proto == htons(ETH_P_RARP)) &&
1791                  (fl_dump_key_val(skb, &key->arp.sip,
1792                                   TCA_FLOWER_KEY_ARP_SIP, &mask->arp.sip,
1793                                   TCA_FLOWER_KEY_ARP_SIP_MASK,
1794                                   sizeof(key->arp.sip)) ||
1795                   fl_dump_key_val(skb, &key->arp.tip,
1796                                   TCA_FLOWER_KEY_ARP_TIP, &mask->arp.tip,
1797                                   TCA_FLOWER_KEY_ARP_TIP_MASK,
1798                                   sizeof(key->arp.tip)) ||
1799                   fl_dump_key_val(skb, &key->arp.op,
1800                                   TCA_FLOWER_KEY_ARP_OP, &mask->arp.op,
1801                                   TCA_FLOWER_KEY_ARP_OP_MASK,
1802                                   sizeof(key->arp.op)) ||
1803                   fl_dump_key_val(skb, key->arp.sha, TCA_FLOWER_KEY_ARP_SHA,
1804                                   mask->arp.sha, TCA_FLOWER_KEY_ARP_SHA_MASK,
1805                                   sizeof(key->arp.sha)) ||
1806                   fl_dump_key_val(skb, key->arp.tha, TCA_FLOWER_KEY_ARP_THA,
1807                                   mask->arp.tha, TCA_FLOWER_KEY_ARP_THA_MASK,
1808                                   sizeof(key->arp.tha))))
1809                 goto nla_put_failure;
1810
1811         if (key->enc_control.addr_type == FLOW_DISSECTOR_KEY_IPV4_ADDRS &&
1812             (fl_dump_key_val(skb, &key->enc_ipv4.src,
1813                             TCA_FLOWER_KEY_ENC_IPV4_SRC, &mask->enc_ipv4.src,
1814                             TCA_FLOWER_KEY_ENC_IPV4_SRC_MASK,
1815                             sizeof(key->enc_ipv4.src)) ||
1816              fl_dump_key_val(skb, &key->enc_ipv4.dst,
1817                              TCA_FLOWER_KEY_ENC_IPV4_DST, &mask->enc_ipv4.dst,
1818                              TCA_FLOWER_KEY_ENC_IPV4_DST_MASK,
1819                              sizeof(key->enc_ipv4.dst))))
1820                 goto nla_put_failure;
1821         else if (key->enc_control.addr_type == FLOW_DISSECTOR_KEY_IPV6_ADDRS &&
1822                  (fl_dump_key_val(skb, &key->enc_ipv6.src,
1823                             TCA_FLOWER_KEY_ENC_IPV6_SRC, &mask->enc_ipv6.src,
1824                             TCA_FLOWER_KEY_ENC_IPV6_SRC_MASK,
1825                             sizeof(key->enc_ipv6.src)) ||
1826                  fl_dump_key_val(skb, &key->enc_ipv6.dst,
1827                                  TCA_FLOWER_KEY_ENC_IPV6_DST,
1828                                  &mask->enc_ipv6.dst,
1829                                  TCA_FLOWER_KEY_ENC_IPV6_DST_MASK,
1830                             sizeof(key->enc_ipv6.dst))))
1831                 goto nla_put_failure;
1832
1833         if (fl_dump_key_val(skb, &key->enc_key_id, TCA_FLOWER_KEY_ENC_KEY_ID,
1834                             &mask->enc_key_id, TCA_FLOWER_UNSPEC,
1835                             sizeof(key->enc_key_id)) ||
1836             fl_dump_key_val(skb, &key->enc_tp.src,
1837                             TCA_FLOWER_KEY_ENC_UDP_SRC_PORT,
1838                             &mask->enc_tp.src,
1839                             TCA_FLOWER_KEY_ENC_UDP_SRC_PORT_MASK,
1840                             sizeof(key->enc_tp.src)) ||
1841             fl_dump_key_val(skb, &key->enc_tp.dst,
1842                             TCA_FLOWER_KEY_ENC_UDP_DST_PORT,
1843                             &mask->enc_tp.dst,
1844                             TCA_FLOWER_KEY_ENC_UDP_DST_PORT_MASK,
1845                             sizeof(key->enc_tp.dst)) ||
1846             fl_dump_key_ip(skb, true, &key->enc_ip, &mask->enc_ip) ||
1847             fl_dump_key_enc_opt(skb, &key->enc_opts, &mask->enc_opts))
1848                 goto nla_put_failure;
1849
1850         if (fl_dump_key_flags(skb, key->control.flags, mask->control.flags))
1851                 goto nla_put_failure;
1852
1853         return 0;
1854
1855 nla_put_failure:
1856         return -EMSGSIZE;
1857 }
1858
1859 static int fl_dump(struct net *net, struct tcf_proto *tp, void *fh,
1860                    struct sk_buff *skb, struct tcmsg *t)
1861 {
1862         struct cls_fl_filter *f = fh;
1863         struct nlattr *nest;
1864         struct fl_flow_key *key, *mask;
1865
1866         if (!f)
1867                 return skb->len;
1868
1869         t->tcm_handle = f->handle;
1870
1871         nest = nla_nest_start(skb, TCA_OPTIONS);
1872         if (!nest)
1873                 goto nla_put_failure;
1874
1875         if (f->res.classid &&
1876             nla_put_u32(skb, TCA_FLOWER_CLASSID, f->res.classid))
1877                 goto nla_put_failure;
1878
1879         key = &f->key;
1880         mask = &f->mask->key;
1881
1882         if (fl_dump_key(skb, net, key, mask))
1883                 goto nla_put_failure;
1884
1885         if (!tc_skip_hw(f->flags))
1886                 fl_hw_update_stats(tp, f);
1887
1888         if (f->flags && nla_put_u32(skb, TCA_FLOWER_FLAGS, f->flags))
1889                 goto nla_put_failure;
1890
1891         if (nla_put_u32(skb, TCA_FLOWER_IN_HW_COUNT, f->in_hw_count))
1892                 goto nla_put_failure;
1893
1894         if (tcf_exts_dump(skb, &f->exts))
1895                 goto nla_put_failure;
1896
1897         nla_nest_end(skb, nest);
1898
1899         if (tcf_exts_dump_stats(skb, &f->exts) < 0)
1900                 goto nla_put_failure;
1901
1902         return skb->len;
1903
1904 nla_put_failure:
1905         nla_nest_cancel(skb, nest);
1906         return -1;
1907 }
1908
1909 static int fl_tmplt_dump(struct sk_buff *skb, struct net *net, void *tmplt_priv)
1910 {
1911         struct fl_flow_tmplt *tmplt = tmplt_priv;
1912         struct fl_flow_key *key, *mask;
1913         struct nlattr *nest;
1914
1915         nest = nla_nest_start(skb, TCA_OPTIONS);
1916         if (!nest)
1917                 goto nla_put_failure;
1918
1919         key = &tmplt->dummy_key;
1920         mask = &tmplt->mask;
1921
1922         if (fl_dump_key(skb, net, key, mask))
1923                 goto nla_put_failure;
1924
1925         nla_nest_end(skb, nest);
1926
1927         return skb->len;
1928
1929 nla_put_failure:
1930         nla_nest_cancel(skb, nest);
1931         return -EMSGSIZE;
1932 }
1933
1934 static void fl_bind_class(void *fh, u32 classid, unsigned long cl)
1935 {
1936         struct cls_fl_filter *f = fh;
1937
1938         if (f && f->res.classid == classid)
1939                 f->res.class = cl;
1940 }
1941
1942 static struct tcf_proto_ops cls_fl_ops __read_mostly = {
1943         .kind           = "flower",
1944         .classify       = fl_classify,
1945         .init           = fl_init,
1946         .destroy        = fl_destroy,
1947         .get            = fl_get,
1948         .change         = fl_change,
1949         .delete         = fl_delete,
1950         .walk           = fl_walk,
1951         .reoffload      = fl_reoffload,
1952         .dump           = fl_dump,
1953         .bind_class     = fl_bind_class,
1954         .tmplt_create   = fl_tmplt_create,
1955         .tmplt_destroy  = fl_tmplt_destroy,
1956         .tmplt_dump     = fl_tmplt_dump,
1957         .owner          = THIS_MODULE,
1958 };
1959
1960 static int __init cls_fl_init(void)
1961 {
1962         return register_tcf_proto_ops(&cls_fl_ops);
1963 }
1964
1965 static void __exit cls_fl_exit(void)
1966 {
1967         unregister_tcf_proto_ops(&cls_fl_ops);
1968 }
1969
1970 module_init(cls_fl_init);
1971 module_exit(cls_fl_exit);
1972
1973 MODULE_AUTHOR("Jiri Pirko <jiri@resnulli.us>");
1974 MODULE_DESCRIPTION("Flower classifier");
1975 MODULE_LICENSE("GPL v2");