Merge branch 'for-5.0' of https://git.kernel.org/pub/scm/linux/kernel/git/broonie...
[linux-2.6-microblaze.git] / kernel / bpf / offload.c
1 /*
2  * Copyright (C) 2017-2018 Netronome Systems, Inc.
3  *
4  * This software is licensed under the GNU General License Version 2,
5  * June 1991 as shown in the file COPYING in the top-level directory of this
6  * source tree.
7  *
8  * THE COPYRIGHT HOLDERS AND/OR OTHER PARTIES PROVIDE THE PROGRAM "AS IS"
9  * WITHOUT WARRANTY OF ANY KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING,
10  * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
11  * FOR A PARTICULAR PURPOSE. THE ENTIRE RISK AS TO THE QUALITY AND PERFORMANCE
12  * OF THE PROGRAM IS WITH YOU. SHOULD THE PROGRAM PROVE DEFECTIVE, YOU ASSUME
13  * THE COST OF ALL NECESSARY SERVICING, REPAIR OR CORRECTION.
14  */
15
16 #include <linux/bpf.h>
17 #include <linux/bpf_verifier.h>
18 #include <linux/bug.h>
19 #include <linux/kdev_t.h>
20 #include <linux/list.h>
21 #include <linux/lockdep.h>
22 #include <linux/netdevice.h>
23 #include <linux/printk.h>
24 #include <linux/proc_ns.h>
25 #include <linux/rhashtable.h>
26 #include <linux/rtnetlink.h>
27 #include <linux/rwsem.h>
28
29 /* Protects offdevs, members of bpf_offload_netdev and offload members
30  * of all progs.
31  * RTNL lock cannot be taken when holding this lock.
32  */
33 static DECLARE_RWSEM(bpf_devs_lock);
34
35 struct bpf_offload_dev {
36         const struct bpf_prog_offload_ops *ops;
37         struct list_head netdevs;
38 };
39
40 struct bpf_offload_netdev {
41         struct rhash_head l;
42         struct net_device *netdev;
43         struct bpf_offload_dev *offdev;
44         struct list_head progs;
45         struct list_head maps;
46         struct list_head offdev_netdevs;
47 };
48
49 static const struct rhashtable_params offdevs_params = {
50         .nelem_hint             = 4,
51         .key_len                = sizeof(struct net_device *),
52         .key_offset             = offsetof(struct bpf_offload_netdev, netdev),
53         .head_offset            = offsetof(struct bpf_offload_netdev, l),
54         .automatic_shrinking    = true,
55 };
56
57 static struct rhashtable offdevs;
58 static bool offdevs_inited;
59
60 static int bpf_dev_offload_check(struct net_device *netdev)
61 {
62         if (!netdev)
63                 return -EINVAL;
64         if (!netdev->netdev_ops->ndo_bpf)
65                 return -EOPNOTSUPP;
66         return 0;
67 }
68
69 static struct bpf_offload_netdev *
70 bpf_offload_find_netdev(struct net_device *netdev)
71 {
72         lockdep_assert_held(&bpf_devs_lock);
73
74         if (!offdevs_inited)
75                 return NULL;
76         return rhashtable_lookup_fast(&offdevs, &netdev, offdevs_params);
77 }
78
79 int bpf_prog_offload_init(struct bpf_prog *prog, union bpf_attr *attr)
80 {
81         struct bpf_offload_netdev *ondev;
82         struct bpf_prog_offload *offload;
83         int err;
84
85         if (attr->prog_type != BPF_PROG_TYPE_SCHED_CLS &&
86             attr->prog_type != BPF_PROG_TYPE_XDP)
87                 return -EINVAL;
88
89         if (attr->prog_flags)
90                 return -EINVAL;
91
92         offload = kzalloc(sizeof(*offload), GFP_USER);
93         if (!offload)
94                 return -ENOMEM;
95
96         offload->prog = prog;
97
98         offload->netdev = dev_get_by_index(current->nsproxy->net_ns,
99                                            attr->prog_ifindex);
100         err = bpf_dev_offload_check(offload->netdev);
101         if (err)
102                 goto err_maybe_put;
103
104         down_write(&bpf_devs_lock);
105         ondev = bpf_offload_find_netdev(offload->netdev);
106         if (!ondev) {
107                 err = -EINVAL;
108                 goto err_unlock;
109         }
110         offload->offdev = ondev->offdev;
111         prog->aux->offload = offload;
112         list_add_tail(&offload->offloads, &ondev->progs);
113         dev_put(offload->netdev);
114         up_write(&bpf_devs_lock);
115
116         return 0;
117 err_unlock:
118         up_write(&bpf_devs_lock);
119 err_maybe_put:
120         if (offload->netdev)
121                 dev_put(offload->netdev);
122         kfree(offload);
123         return err;
124 }
125
126 int bpf_prog_offload_verifier_prep(struct bpf_prog *prog)
127 {
128         struct bpf_prog_offload *offload;
129         int ret = -ENODEV;
130
131         down_read(&bpf_devs_lock);
132         offload = prog->aux->offload;
133         if (offload) {
134                 ret = offload->offdev->ops->prepare(prog);
135                 offload->dev_state = !ret;
136         }
137         up_read(&bpf_devs_lock);
138
139         return ret;
140 }
141
142 int bpf_prog_offload_verify_insn(struct bpf_verifier_env *env,
143                                  int insn_idx, int prev_insn_idx)
144 {
145         struct bpf_prog_offload *offload;
146         int ret = -ENODEV;
147
148         down_read(&bpf_devs_lock);
149         offload = env->prog->aux->offload;
150         if (offload)
151                 ret = offload->offdev->ops->insn_hook(env, insn_idx,
152                                                       prev_insn_idx);
153         up_read(&bpf_devs_lock);
154
155         return ret;
156 }
157
158 int bpf_prog_offload_finalize(struct bpf_verifier_env *env)
159 {
160         struct bpf_prog_offload *offload;
161         int ret = -ENODEV;
162
163         down_read(&bpf_devs_lock);
164         offload = env->prog->aux->offload;
165         if (offload) {
166                 if (offload->offdev->ops->finalize)
167                         ret = offload->offdev->ops->finalize(env);
168                 else
169                         ret = 0;
170         }
171         up_read(&bpf_devs_lock);
172
173         return ret;
174 }
175
176 static void __bpf_prog_offload_destroy(struct bpf_prog *prog)
177 {
178         struct bpf_prog_offload *offload = prog->aux->offload;
179
180         if (offload->dev_state)
181                 offload->offdev->ops->destroy(prog);
182
183         /* Make sure BPF_PROG_GET_NEXT_ID can't find this dead program */
184         bpf_prog_free_id(prog, true);
185
186         list_del_init(&offload->offloads);
187         kfree(offload);
188         prog->aux->offload = NULL;
189 }
190
191 void bpf_prog_offload_destroy(struct bpf_prog *prog)
192 {
193         down_write(&bpf_devs_lock);
194         if (prog->aux->offload)
195                 __bpf_prog_offload_destroy(prog);
196         up_write(&bpf_devs_lock);
197 }
198
199 static int bpf_prog_offload_translate(struct bpf_prog *prog)
200 {
201         struct bpf_prog_offload *offload;
202         int ret = -ENODEV;
203
204         down_read(&bpf_devs_lock);
205         offload = prog->aux->offload;
206         if (offload)
207                 ret = offload->offdev->ops->translate(prog);
208         up_read(&bpf_devs_lock);
209
210         return ret;
211 }
212
213 static unsigned int bpf_prog_warn_on_exec(const void *ctx,
214                                           const struct bpf_insn *insn)
215 {
216         WARN(1, "attempt to execute device eBPF program on the host!");
217         return 0;
218 }
219
220 int bpf_prog_offload_compile(struct bpf_prog *prog)
221 {
222         prog->bpf_func = bpf_prog_warn_on_exec;
223
224         return bpf_prog_offload_translate(prog);
225 }
226
227 struct ns_get_path_bpf_prog_args {
228         struct bpf_prog *prog;
229         struct bpf_prog_info *info;
230 };
231
232 static struct ns_common *bpf_prog_offload_info_fill_ns(void *private_data)
233 {
234         struct ns_get_path_bpf_prog_args *args = private_data;
235         struct bpf_prog_aux *aux = args->prog->aux;
236         struct ns_common *ns;
237         struct net *net;
238
239         rtnl_lock();
240         down_read(&bpf_devs_lock);
241
242         if (aux->offload) {
243                 args->info->ifindex = aux->offload->netdev->ifindex;
244                 net = dev_net(aux->offload->netdev);
245                 get_net(net);
246                 ns = &net->ns;
247         } else {
248                 args->info->ifindex = 0;
249                 ns = NULL;
250         }
251
252         up_read(&bpf_devs_lock);
253         rtnl_unlock();
254
255         return ns;
256 }
257
258 int bpf_prog_offload_info_fill(struct bpf_prog_info *info,
259                                struct bpf_prog *prog)
260 {
261         struct ns_get_path_bpf_prog_args args = {
262                 .prog   = prog,
263                 .info   = info,
264         };
265         struct bpf_prog_aux *aux = prog->aux;
266         struct inode *ns_inode;
267         struct path ns_path;
268         char __user *uinsns;
269         void *res;
270         u32 ulen;
271
272         res = ns_get_path_cb(&ns_path, bpf_prog_offload_info_fill_ns, &args);
273         if (IS_ERR(res)) {
274                 if (!info->ifindex)
275                         return -ENODEV;
276                 return PTR_ERR(res);
277         }
278
279         down_read(&bpf_devs_lock);
280
281         if (!aux->offload) {
282                 up_read(&bpf_devs_lock);
283                 return -ENODEV;
284         }
285
286         ulen = info->jited_prog_len;
287         info->jited_prog_len = aux->offload->jited_len;
288         if (info->jited_prog_len & ulen) {
289                 uinsns = u64_to_user_ptr(info->jited_prog_insns);
290                 ulen = min_t(u32, info->jited_prog_len, ulen);
291                 if (copy_to_user(uinsns, aux->offload->jited_image, ulen)) {
292                         up_read(&bpf_devs_lock);
293                         return -EFAULT;
294                 }
295         }
296
297         up_read(&bpf_devs_lock);
298
299         ns_inode = ns_path.dentry->d_inode;
300         info->netns_dev = new_encode_dev(ns_inode->i_sb->s_dev);
301         info->netns_ino = ns_inode->i_ino;
302         path_put(&ns_path);
303
304         return 0;
305 }
306
307 const struct bpf_prog_ops bpf_offload_prog_ops = {
308 };
309
310 static int bpf_map_offload_ndo(struct bpf_offloaded_map *offmap,
311                                enum bpf_netdev_command cmd)
312 {
313         struct netdev_bpf data = {};
314         struct net_device *netdev;
315
316         ASSERT_RTNL();
317
318         data.command = cmd;
319         data.offmap = offmap;
320         /* Caller must make sure netdev is valid */
321         netdev = offmap->netdev;
322
323         return netdev->netdev_ops->ndo_bpf(netdev, &data);
324 }
325
326 struct bpf_map *bpf_map_offload_map_alloc(union bpf_attr *attr)
327 {
328         struct net *net = current->nsproxy->net_ns;
329         struct bpf_offload_netdev *ondev;
330         struct bpf_offloaded_map *offmap;
331         int err;
332
333         if (!capable(CAP_SYS_ADMIN))
334                 return ERR_PTR(-EPERM);
335         if (attr->map_type != BPF_MAP_TYPE_ARRAY &&
336             attr->map_type != BPF_MAP_TYPE_HASH)
337                 return ERR_PTR(-EINVAL);
338
339         offmap = kzalloc(sizeof(*offmap), GFP_USER);
340         if (!offmap)
341                 return ERR_PTR(-ENOMEM);
342
343         bpf_map_init_from_attr(&offmap->map, attr);
344
345         rtnl_lock();
346         down_write(&bpf_devs_lock);
347         offmap->netdev = __dev_get_by_index(net, attr->map_ifindex);
348         err = bpf_dev_offload_check(offmap->netdev);
349         if (err)
350                 goto err_unlock;
351
352         ondev = bpf_offload_find_netdev(offmap->netdev);
353         if (!ondev) {
354                 err = -EINVAL;
355                 goto err_unlock;
356         }
357
358         err = bpf_map_offload_ndo(offmap, BPF_OFFLOAD_MAP_ALLOC);
359         if (err)
360                 goto err_unlock;
361
362         list_add_tail(&offmap->offloads, &ondev->maps);
363         up_write(&bpf_devs_lock);
364         rtnl_unlock();
365
366         return &offmap->map;
367
368 err_unlock:
369         up_write(&bpf_devs_lock);
370         rtnl_unlock();
371         kfree(offmap);
372         return ERR_PTR(err);
373 }
374
375 static void __bpf_map_offload_destroy(struct bpf_offloaded_map *offmap)
376 {
377         WARN_ON(bpf_map_offload_ndo(offmap, BPF_OFFLOAD_MAP_FREE));
378         /* Make sure BPF_MAP_GET_NEXT_ID can't find this dead map */
379         bpf_map_free_id(&offmap->map, true);
380         list_del_init(&offmap->offloads);
381         offmap->netdev = NULL;
382 }
383
384 void bpf_map_offload_map_free(struct bpf_map *map)
385 {
386         struct bpf_offloaded_map *offmap = map_to_offmap(map);
387
388         rtnl_lock();
389         down_write(&bpf_devs_lock);
390         if (offmap->netdev)
391                 __bpf_map_offload_destroy(offmap);
392         up_write(&bpf_devs_lock);
393         rtnl_unlock();
394
395         kfree(offmap);
396 }
397
398 int bpf_map_offload_lookup_elem(struct bpf_map *map, void *key, void *value)
399 {
400         struct bpf_offloaded_map *offmap = map_to_offmap(map);
401         int ret = -ENODEV;
402
403         down_read(&bpf_devs_lock);
404         if (offmap->netdev)
405                 ret = offmap->dev_ops->map_lookup_elem(offmap, key, value);
406         up_read(&bpf_devs_lock);
407
408         return ret;
409 }
410
411 int bpf_map_offload_update_elem(struct bpf_map *map,
412                                 void *key, void *value, u64 flags)
413 {
414         struct bpf_offloaded_map *offmap = map_to_offmap(map);
415         int ret = -ENODEV;
416
417         if (unlikely(flags > BPF_EXIST))
418                 return -EINVAL;
419
420         down_read(&bpf_devs_lock);
421         if (offmap->netdev)
422                 ret = offmap->dev_ops->map_update_elem(offmap, key, value,
423                                                        flags);
424         up_read(&bpf_devs_lock);
425
426         return ret;
427 }
428
429 int bpf_map_offload_delete_elem(struct bpf_map *map, void *key)
430 {
431         struct bpf_offloaded_map *offmap = map_to_offmap(map);
432         int ret = -ENODEV;
433
434         down_read(&bpf_devs_lock);
435         if (offmap->netdev)
436                 ret = offmap->dev_ops->map_delete_elem(offmap, key);
437         up_read(&bpf_devs_lock);
438
439         return ret;
440 }
441
442 int bpf_map_offload_get_next_key(struct bpf_map *map, void *key, void *next_key)
443 {
444         struct bpf_offloaded_map *offmap = map_to_offmap(map);
445         int ret = -ENODEV;
446
447         down_read(&bpf_devs_lock);
448         if (offmap->netdev)
449                 ret = offmap->dev_ops->map_get_next_key(offmap, key, next_key);
450         up_read(&bpf_devs_lock);
451
452         return ret;
453 }
454
455 struct ns_get_path_bpf_map_args {
456         struct bpf_offloaded_map *offmap;
457         struct bpf_map_info *info;
458 };
459
460 static struct ns_common *bpf_map_offload_info_fill_ns(void *private_data)
461 {
462         struct ns_get_path_bpf_map_args *args = private_data;
463         struct ns_common *ns;
464         struct net *net;
465
466         rtnl_lock();
467         down_read(&bpf_devs_lock);
468
469         if (args->offmap->netdev) {
470                 args->info->ifindex = args->offmap->netdev->ifindex;
471                 net = dev_net(args->offmap->netdev);
472                 get_net(net);
473                 ns = &net->ns;
474         } else {
475                 args->info->ifindex = 0;
476                 ns = NULL;
477         }
478
479         up_read(&bpf_devs_lock);
480         rtnl_unlock();
481
482         return ns;
483 }
484
485 int bpf_map_offload_info_fill(struct bpf_map_info *info, struct bpf_map *map)
486 {
487         struct ns_get_path_bpf_map_args args = {
488                 .offmap = map_to_offmap(map),
489                 .info   = info,
490         };
491         struct inode *ns_inode;
492         struct path ns_path;
493         void *res;
494
495         res = ns_get_path_cb(&ns_path, bpf_map_offload_info_fill_ns, &args);
496         if (IS_ERR(res)) {
497                 if (!info->ifindex)
498                         return -ENODEV;
499                 return PTR_ERR(res);
500         }
501
502         ns_inode = ns_path.dentry->d_inode;
503         info->netns_dev = new_encode_dev(ns_inode->i_sb->s_dev);
504         info->netns_ino = ns_inode->i_ino;
505         path_put(&ns_path);
506
507         return 0;
508 }
509
510 static bool __bpf_offload_dev_match(struct bpf_prog *prog,
511                                     struct net_device *netdev)
512 {
513         struct bpf_offload_netdev *ondev1, *ondev2;
514         struct bpf_prog_offload *offload;
515
516         if (!bpf_prog_is_dev_bound(prog->aux))
517                 return false;
518
519         offload = prog->aux->offload;
520         if (!offload)
521                 return false;
522         if (offload->netdev == netdev)
523                 return true;
524
525         ondev1 = bpf_offload_find_netdev(offload->netdev);
526         ondev2 = bpf_offload_find_netdev(netdev);
527
528         return ondev1 && ondev2 && ondev1->offdev == ondev2->offdev;
529 }
530
531 bool bpf_offload_dev_match(struct bpf_prog *prog, struct net_device *netdev)
532 {
533         bool ret;
534
535         down_read(&bpf_devs_lock);
536         ret = __bpf_offload_dev_match(prog, netdev);
537         up_read(&bpf_devs_lock);
538
539         return ret;
540 }
541 EXPORT_SYMBOL_GPL(bpf_offload_dev_match);
542
543 bool bpf_offload_prog_map_match(struct bpf_prog *prog, struct bpf_map *map)
544 {
545         struct bpf_offloaded_map *offmap;
546         bool ret;
547
548         if (!bpf_map_is_dev_bound(map))
549                 return bpf_map_offload_neutral(map);
550         offmap = map_to_offmap(map);
551
552         down_read(&bpf_devs_lock);
553         ret = __bpf_offload_dev_match(prog, offmap->netdev);
554         up_read(&bpf_devs_lock);
555
556         return ret;
557 }
558
559 int bpf_offload_dev_netdev_register(struct bpf_offload_dev *offdev,
560                                     struct net_device *netdev)
561 {
562         struct bpf_offload_netdev *ondev;
563         int err;
564
565         ondev = kzalloc(sizeof(*ondev), GFP_KERNEL);
566         if (!ondev)
567                 return -ENOMEM;
568
569         ondev->netdev = netdev;
570         ondev->offdev = offdev;
571         INIT_LIST_HEAD(&ondev->progs);
572         INIT_LIST_HEAD(&ondev->maps);
573
574         down_write(&bpf_devs_lock);
575         err = rhashtable_insert_fast(&offdevs, &ondev->l, offdevs_params);
576         if (err) {
577                 netdev_warn(netdev, "failed to register for BPF offload\n");
578                 goto err_unlock_free;
579         }
580
581         list_add(&ondev->offdev_netdevs, &offdev->netdevs);
582         up_write(&bpf_devs_lock);
583         return 0;
584
585 err_unlock_free:
586         up_write(&bpf_devs_lock);
587         kfree(ondev);
588         return err;
589 }
590 EXPORT_SYMBOL_GPL(bpf_offload_dev_netdev_register);
591
592 void bpf_offload_dev_netdev_unregister(struct bpf_offload_dev *offdev,
593                                        struct net_device *netdev)
594 {
595         struct bpf_offload_netdev *ondev, *altdev;
596         struct bpf_offloaded_map *offmap, *mtmp;
597         struct bpf_prog_offload *offload, *ptmp;
598
599         ASSERT_RTNL();
600
601         down_write(&bpf_devs_lock);
602         ondev = rhashtable_lookup_fast(&offdevs, &netdev, offdevs_params);
603         if (WARN_ON(!ondev))
604                 goto unlock;
605
606         WARN_ON(rhashtable_remove_fast(&offdevs, &ondev->l, offdevs_params));
607         list_del(&ondev->offdev_netdevs);
608
609         /* Try to move the objects to another netdev of the device */
610         altdev = list_first_entry_or_null(&offdev->netdevs,
611                                           struct bpf_offload_netdev,
612                                           offdev_netdevs);
613         if (altdev) {
614                 list_for_each_entry(offload, &ondev->progs, offloads)
615                         offload->netdev = altdev->netdev;
616                 list_splice_init(&ondev->progs, &altdev->progs);
617
618                 list_for_each_entry(offmap, &ondev->maps, offloads)
619                         offmap->netdev = altdev->netdev;
620                 list_splice_init(&ondev->maps, &altdev->maps);
621         } else {
622                 list_for_each_entry_safe(offload, ptmp, &ondev->progs, offloads)
623                         __bpf_prog_offload_destroy(offload->prog);
624                 list_for_each_entry_safe(offmap, mtmp, &ondev->maps, offloads)
625                         __bpf_map_offload_destroy(offmap);
626         }
627
628         WARN_ON(!list_empty(&ondev->progs));
629         WARN_ON(!list_empty(&ondev->maps));
630         kfree(ondev);
631 unlock:
632         up_write(&bpf_devs_lock);
633 }
634 EXPORT_SYMBOL_GPL(bpf_offload_dev_netdev_unregister);
635
636 struct bpf_offload_dev *
637 bpf_offload_dev_create(const struct bpf_prog_offload_ops *ops)
638 {
639         struct bpf_offload_dev *offdev;
640         int err;
641
642         down_write(&bpf_devs_lock);
643         if (!offdevs_inited) {
644                 err = rhashtable_init(&offdevs, &offdevs_params);
645                 if (err)
646                         return ERR_PTR(err);
647                 offdevs_inited = true;
648         }
649         up_write(&bpf_devs_lock);
650
651         offdev = kzalloc(sizeof(*offdev), GFP_KERNEL);
652         if (!offdev)
653                 return ERR_PTR(-ENOMEM);
654
655         offdev->ops = ops;
656         INIT_LIST_HEAD(&offdev->netdevs);
657
658         return offdev;
659 }
660 EXPORT_SYMBOL_GPL(bpf_offload_dev_create);
661
662 void bpf_offload_dev_destroy(struct bpf_offload_dev *offdev)
663 {
664         WARN_ON(!list_empty(&offdev->netdevs));
665         kfree(offdev);
666 }
667 EXPORT_SYMBOL_GPL(bpf_offload_dev_destroy);