net: Special handling for IP & MPLS.
[linux-2.6-microblaze.git] / drivers / net / bareudp.c
1 // SPDX-License-Identifier: GPL-2.0
/* Bareudp: UDP tunnel encapsulation for different payload types like
3  * MPLS, NSH, IP, etc.
4  * Copyright (c) 2019 Nokia, Inc.
5  * Authors:  Martin Varghese, <martin.varghese@nokia.com>
6  */
7
8 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
9
10 #include <linux/kernel.h>
11 #include <linux/module.h>
12 #include <linux/etherdevice.h>
13 #include <linux/hash.h>
14 #include <net/dst_metadata.h>
15 #include <net/gro_cells.h>
16 #include <net/rtnetlink.h>
17 #include <net/protocol.h>
18 #include <net/ip6_tunnel.h>
19 #include <net/ip_tunnels.h>
20 #include <net/udp_tunnel.h>
21 #include <net/bareudp.h>
22
/* Length of the bareudp encapsulation itself: a UDP header and nothing else. */
#define BAREUDP_BASE_HLEN sizeof(struct udphdr)
/* Outer IPv4 header plus the UDP header. */
#define BAREUDP_IPV4_HLEN (sizeof(struct iphdr) + \
                           sizeof(struct udphdr))
/* Outer IPv6 header plus the UDP header. */
#define BAREUDP_IPV6_HLEN (sizeof(struct ipv6hdr) + \
                           sizeof(struct udphdr))
28
/* When true, the receive path emits a rate-limited message for packets whose
 * ECN decapsulation reports an error. Exposed as a module parameter with
 * mode 0644.
 */
static bool log_ecn_error = true;
module_param(log_ecn_error, bool, 0644);
MODULE_PARM_DESC(log_ecn_error, "Log packets received with corrupted ECN");
32
/* per-network namespace private data for this module */

/* Id handed to net_generic() to look up this module's struct bareudp_net. */
static unsigned int bareudp_net_id;

struct bareudp_net {
        /* All bareudp devices configured in this namespace. */
        struct list_head        bareudp_list;
};
40
/* Pseudo network device */
struct bareudp_dev {
        struct net         *net;        /* netns for packet i/o */
        struct net_device  *dev;        /* netdev for bareudp tunnel */
        __be16             ethertype;   /* configured payload ethertype */
        __be16             port;        /* UDP port: bound locally, used as dst port on xmit */
        u16                sport_min;   /* lower bound given to udp_flow_src_port() */
        bool               multi_proto_mode; /* also accept the sibling protocol
                                              * (IPv6 with IP, MPLS_MC with MPLS_UC)
                                              */
        struct socket      __rcu *sock; /* tunnel socket; set on open, NULL after stop */
        struct list_head   next;        /* bareudp node  on namespace list */
        struct gro_cells   gro_cells;   /* receive queue fed by the encap_rcv handler */
};
53
54 static int bareudp_udp_encap_recv(struct sock *sk, struct sk_buff *skb)
55 {
56         struct metadata_dst *tun_dst = NULL;
57         struct pcpu_sw_netstats *stats;
58         struct bareudp_dev *bareudp;
59         unsigned short family;
60         unsigned int len;
61         __be16 proto;
62         void *oiph;
63         int err;
64
65         bareudp = rcu_dereference_sk_user_data(sk);
66         if (!bareudp)
67                 goto drop;
68
69         if (skb->protocol ==  htons(ETH_P_IP))
70                 family = AF_INET;
71         else
72                 family = AF_INET6;
73
74         if (bareudp->ethertype == htons(ETH_P_IP)) {
75                 struct iphdr *iphdr;
76
77                 iphdr = (struct iphdr *)(skb->data + BAREUDP_BASE_HLEN);
78                 if (iphdr->version == 4) {
79                         proto = bareudp->ethertype;
80                 } else if (bareudp->multi_proto_mode && (iphdr->version == 6)) {
81                         proto = htons(ETH_P_IPV6);
82                 } else {
83                         bareudp->dev->stats.rx_dropped++;
84                         goto drop;
85                 }
86         } else if (bareudp->ethertype == htons(ETH_P_MPLS_UC)) {
87                 struct iphdr *tunnel_hdr;
88
89                 tunnel_hdr = (struct iphdr *)skb_network_header(skb);
90                 if (tunnel_hdr->version == 4) {
91                         if (!ipv4_is_multicast(tunnel_hdr->daddr)) {
92                                 proto = bareudp->ethertype;
93                         } else if (bareudp->multi_proto_mode &&
94                                    ipv4_is_multicast(tunnel_hdr->daddr)) {
95                                 proto = htons(ETH_P_MPLS_MC);
96                         } else {
97                                 bareudp->dev->stats.rx_dropped++;
98                                 goto drop;
99                         }
100                 } else {
101                         int addr_type;
102                         struct ipv6hdr *tunnel_hdr_v6;
103
104                         tunnel_hdr_v6 = (struct ipv6hdr *)skb_network_header(skb);
105                         addr_type =
106                         ipv6_addr_type((struct in6_addr *)&tunnel_hdr_v6->daddr);
107                         if (!(addr_type & IPV6_ADDR_MULTICAST)) {
108                                 proto = bareudp->ethertype;
109                         } else if (bareudp->multi_proto_mode &&
110                                    (addr_type & IPV6_ADDR_MULTICAST)) {
111                                 proto = htons(ETH_P_MPLS_MC);
112                         } else {
113                                 bareudp->dev->stats.rx_dropped++;
114                                 goto drop;
115                         }
116                 }
117         } else {
118                 proto = bareudp->ethertype;
119         }
120
121         if (iptunnel_pull_header(skb, BAREUDP_BASE_HLEN,
122                                  proto,
123                                  !net_eq(bareudp->net,
124                                  dev_net(bareudp->dev)))) {
125                 bareudp->dev->stats.rx_dropped++;
126                 goto drop;
127         }
128
129         tun_dst = udp_tun_rx_dst(skb, family, TUNNEL_KEY, 0, 0);
130         if (!tun_dst) {
131                 bareudp->dev->stats.rx_dropped++;
132                 goto drop;
133         }
134         skb_dst_set(skb, &tun_dst->dst);
135         skb->dev = bareudp->dev;
136         oiph = skb_network_header(skb);
137         skb_reset_network_header(skb);
138
139         if (family == AF_INET)
140                 err = IP_ECN_decapsulate(oiph, skb);
141 #if IS_ENABLED(CONFIG_IPV6)
142         else
143                 err = IP6_ECN_decapsulate(oiph, skb);
144 #endif
145
146         if (unlikely(err)) {
147                 if (log_ecn_error) {
148                         if  (family == AF_INET)
149                                 net_info_ratelimited("non-ECT from %pI4 "
150                                                      "with TOS=%#x\n",
151                                                      &((struct iphdr *)oiph)->saddr,
152                                                      ((struct iphdr *)oiph)->tos);
153 #if IS_ENABLED(CONFIG_IPV6)
154                         else
155                                 net_info_ratelimited("non-ECT from %pI6\n",
156                                                      &((struct ipv6hdr *)oiph)->saddr);
157 #endif
158                 }
159                 if (err > 1) {
160                         ++bareudp->dev->stats.rx_frame_errors;
161                         ++bareudp->dev->stats.rx_errors;
162                         goto drop;
163                 }
164         }
165
166         len = skb->len;
167         err = gro_cells_receive(&bareudp->gro_cells, skb);
168         if (likely(err == NET_RX_SUCCESS)) {
169                 stats = this_cpu_ptr(bareudp->dev->tstats);
170                 u64_stats_update_begin(&stats->syncp);
171                 stats->rx_packets++;
172                 stats->rx_bytes += len;
173                 u64_stats_update_end(&stats->syncp);
174         }
175         return 0;
176 drop:
177         /* Consume bad packet */
178         kfree_skb(skb);
179
180         return 0;
181 }
182
/* encap_err_lookup handler for the tunnel socket; unconditionally returns 0. */
static int bareudp_err_lookup(struct sock *sk, struct sk_buff *skb)
{
        return 0;
}
187
188 static int bareudp_init(struct net_device *dev)
189 {
190         struct bareudp_dev *bareudp = netdev_priv(dev);
191         int err;
192
193         dev->tstats = netdev_alloc_pcpu_stats(struct pcpu_sw_netstats);
194         if (!dev->tstats)
195                 return -ENOMEM;
196
197         err = gro_cells_init(&bareudp->gro_cells, dev);
198         if (err) {
199                 free_percpu(dev->tstats);
200                 return err;
201         }
202         return 0;
203 }
204
205 static void bareudp_uninit(struct net_device *dev)
206 {
207         struct bareudp_dev *bareudp = netdev_priv(dev);
208
209         gro_cells_destroy(&bareudp->gro_cells);
210         free_percpu(dev->tstats);
211 }
212
213 static struct socket *bareudp_create_sock(struct net *net, __be16 port)
214 {
215         struct udp_port_cfg udp_conf;
216         struct socket *sock;
217         int err;
218
219         memset(&udp_conf, 0, sizeof(udp_conf));
220 #if IS_ENABLED(CONFIG_IPV6)
221         udp_conf.family = AF_INET6;
222 #else
223         udp_conf.family = AF_INET;
224 #endif
225         udp_conf.local_udp_port = port;
226         /* Open UDP socket */
227         err = udp_sock_create(net, &udp_conf, &sock);
228         if (err < 0)
229                 return ERR_PTR(err);
230
231         return sock;
232 }
233
234 /* Create new listen socket if needed */
235 static int bareudp_socket_create(struct bareudp_dev *bareudp, __be16 port)
236 {
237         struct udp_tunnel_sock_cfg tunnel_cfg;
238         struct socket *sock;
239
240         sock = bareudp_create_sock(bareudp->net, port);
241         if (IS_ERR(sock))
242                 return PTR_ERR(sock);
243
244         /* Mark socket as an encapsulation socket */
245         memset(&tunnel_cfg, 0, sizeof(tunnel_cfg));
246         tunnel_cfg.sk_user_data = bareudp;
247         tunnel_cfg.encap_type = 1;
248         tunnel_cfg.encap_rcv = bareudp_udp_encap_recv;
249         tunnel_cfg.encap_err_lookup = bareudp_err_lookup;
250         tunnel_cfg.encap_destroy = NULL;
251         setup_udp_tunnel_sock(bareudp->net, sock, &tunnel_cfg);
252
253         if (sock->sk->sk_family == AF_INET6)
254                 udp_encap_enable();
255
256         rcu_assign_pointer(bareudp->sock, sock);
257         return 0;
258 }
259
260 static int bareudp_open(struct net_device *dev)
261 {
262         struct bareudp_dev *bareudp = netdev_priv(dev);
263         int ret = 0;
264
265         ret =  bareudp_socket_create(bareudp, bareudp->port);
266         return ret;
267 }
268
269 static void bareudp_sock_release(struct bareudp_dev *bareudp)
270 {
271         struct socket *sock;
272
273         sock = bareudp->sock;
274         rcu_assign_pointer(bareudp->sock, NULL);
275         synchronize_net();
276         udp_tunnel_sock_release(sock);
277 }
278
/* ndo_stop: tear down the tunnel socket. Always returns 0. */
static int bareudp_stop(struct net_device *dev)
{
        bareudp_sock_release(netdev_priv(dev));

        return 0;
}
286
287 static int bareudp_xmit_skb(struct sk_buff *skb, struct net_device *dev,
288                             struct bareudp_dev *bareudp,
289                             const struct ip_tunnel_info *info)
290 {
291         bool xnet = !net_eq(bareudp->net, dev_net(bareudp->dev));
292         bool use_cache = ip_tunnel_dst_cache_usable(skb, info);
293         struct socket *sock = rcu_dereference(bareudp->sock);
294         bool udp_sum = !!(info->key.tun_flags & TUNNEL_CSUM);
295         const struct ip_tunnel_key *key = &info->key;
296         struct rtable *rt;
297         __be16 sport, df;
298         int min_headroom;
299         __u8 tos, ttl;
300         __be32 saddr;
301         int err;
302
303         if (!sock)
304                 return -ESHUTDOWN;
305
306         rt = ip_route_output_tunnel(skb, dev, bareudp->net, &saddr, info,
307                                     IPPROTO_UDP, use_cache);
308
309         if (IS_ERR(rt))
310                 return PTR_ERR(rt);
311
312         skb_tunnel_check_pmtu(skb, &rt->dst,
313                               BAREUDP_IPV4_HLEN + info->options_len);
314
315         sport = udp_flow_src_port(bareudp->net, skb,
316                                   bareudp->sport_min, USHRT_MAX,
317                                   true);
318         tos = ip_tunnel_ecn_encap(key->tos, ip_hdr(skb), skb);
319         ttl = key->ttl;
320         df = key->tun_flags & TUNNEL_DONT_FRAGMENT ? htons(IP_DF) : 0;
321         skb_scrub_packet(skb, xnet);
322
323         if (!skb_pull(skb, skb_network_offset(skb)))
324                 goto free_dst;
325
326         min_headroom = LL_RESERVED_SPACE(rt->dst.dev) + rt->dst.header_len +
327                 BAREUDP_BASE_HLEN + info->options_len + sizeof(struct iphdr);
328
329         err = skb_cow_head(skb, min_headroom);
330         if (unlikely(err))
331                 goto free_dst;
332
333         err = udp_tunnel_handle_offloads(skb, udp_sum);
334         if (err)
335                 goto free_dst;
336
337         skb_set_inner_protocol(skb, bareudp->ethertype);
338         udp_tunnel_xmit_skb(rt, sock->sk, skb, saddr, info->key.u.ipv4.dst,
339                             tos, ttl, df, sport, bareudp->port,
340                             !net_eq(bareudp->net, dev_net(bareudp->dev)),
341                             !(info->key.tun_flags & TUNNEL_CSUM));
342         return 0;
343
344 free_dst:
345         dst_release(&rt->dst);
346         return err;
347 }
348
349 #if IS_ENABLED(CONFIG_IPV6)
350 static int bareudp6_xmit_skb(struct sk_buff *skb, struct net_device *dev,
351                              struct bareudp_dev *bareudp,
352                              const struct ip_tunnel_info *info)
353 {
354         bool xnet = !net_eq(bareudp->net, dev_net(bareudp->dev));
355         bool use_cache = ip_tunnel_dst_cache_usable(skb, info);
356         struct socket *sock  = rcu_dereference(bareudp->sock);
357         bool udp_sum = !!(info->key.tun_flags & TUNNEL_CSUM);
358         const struct ip_tunnel_key *key = &info->key;
359         struct dst_entry *dst = NULL;
360         struct in6_addr saddr, daddr;
361         int min_headroom;
362         __u8 prio, ttl;
363         __be16 sport;
364         int err;
365
366         if (!sock)
367                 return -ESHUTDOWN;
368
369         dst = ip6_dst_lookup_tunnel(skb, dev, bareudp->net, sock, &saddr, info,
370                                     IPPROTO_UDP, use_cache);
371         if (IS_ERR(dst))
372                 return PTR_ERR(dst);
373
374         skb_tunnel_check_pmtu(skb, dst, BAREUDP_IPV6_HLEN + info->options_len);
375
376         sport = udp_flow_src_port(bareudp->net, skb,
377                                   bareudp->sport_min, USHRT_MAX,
378                                   true);
379         prio = ip_tunnel_ecn_encap(key->tos, ip_hdr(skb), skb);
380         ttl = key->ttl;
381
382         skb_scrub_packet(skb, xnet);
383
384         if (!skb_pull(skb, skb_network_offset(skb)))
385                 goto free_dst;
386
387         min_headroom = LL_RESERVED_SPACE(dst->dev) + dst->header_len +
388                 BAREUDP_BASE_HLEN + info->options_len + sizeof(struct iphdr);
389
390         err = skb_cow_head(skb, min_headroom);
391         if (unlikely(err))
392                 goto free_dst;
393
394         err = udp_tunnel_handle_offloads(skb, udp_sum);
395         if (err)
396                 goto free_dst;
397
398         daddr = info->key.u.ipv6.dst;
399         udp_tunnel6_xmit_skb(dst, sock->sk, skb, dev,
400                              &saddr, &daddr, prio, ttl,
401                              info->key.label, sport, bareudp->port,
402                              !(info->key.tun_flags & TUNNEL_CSUM));
403         return 0;
404
405 free_dst:
406         dst_release(dst);
407         return err;
408 }
409 #endif
410
411 static netdev_tx_t bareudp_xmit(struct sk_buff *skb, struct net_device *dev)
412 {
413         struct bareudp_dev *bareudp = netdev_priv(dev);
414         struct ip_tunnel_info *info = NULL;
415         int err;
416
417         if (skb->protocol != bareudp->ethertype) {
418                 if (!bareudp->multi_proto_mode ||
419                     (skb->protocol !=  htons(ETH_P_MPLS_MC) &&
420                      skb->protocol !=  htons(ETH_P_IPV6))) {
421                         err = -EINVAL;
422                         goto tx_error;
423                 }
424         }
425
426         info = skb_tunnel_info(skb);
427         if (unlikely(!info || !(info->mode & IP_TUNNEL_INFO_TX))) {
428                 err = -EINVAL;
429                 goto tx_error;
430         }
431
432         rcu_read_lock();
433 #if IS_ENABLED(CONFIG_IPV6)
434         if (info->mode & IP_TUNNEL_INFO_IPV6)
435                 err = bareudp6_xmit_skb(skb, dev, bareudp, info);
436         else
437 #endif
438                 err = bareudp_xmit_skb(skb, dev, bareudp, info);
439
440         rcu_read_unlock();
441
442         if (likely(!err))
443                 return NETDEV_TX_OK;
444 tx_error:
445         dev_kfree_skb(skb);
446
447         if (err == -ELOOP)
448                 dev->stats.collisions++;
449         else if (err == -ENETUNREACH)
450                 dev->stats.tx_carrier_errors++;
451
452         dev->stats.tx_errors++;
453         return NETDEV_TX_OK;
454 }
455
456 static int bareudp_fill_metadata_dst(struct net_device *dev,
457                                      struct sk_buff *skb)
458 {
459         struct ip_tunnel_info *info = skb_tunnel_info(skb);
460         struct bareudp_dev *bareudp = netdev_priv(dev);
461         bool use_cache;
462
463         use_cache = ip_tunnel_dst_cache_usable(skb, info);
464
465         if (ip_tunnel_info_af(info) == AF_INET) {
466                 struct rtable *rt;
467                 __be32 saddr;
468
469                 rt = ip_route_output_tunnel(skb, dev, bareudp->net, &saddr,
470                                             info, IPPROTO_UDP, use_cache);
471                 if (IS_ERR(rt))
472                         return PTR_ERR(rt);
473
474                 ip_rt_put(rt);
475                 info->key.u.ipv4.src = saddr;
476 #if IS_ENABLED(CONFIG_IPV6)
477         } else if (ip_tunnel_info_af(info) == AF_INET6) {
478                 struct dst_entry *dst;
479                 struct in6_addr saddr;
480                 struct socket *sock = rcu_dereference(bareudp->sock);
481
482                 dst = ip6_dst_lookup_tunnel(skb, dev, bareudp->net, sock,
483                                             &saddr, info, IPPROTO_UDP,
484                                             use_cache);
485                 if (IS_ERR(dst))
486                         return PTR_ERR(dst);
487
488                 dst_release(dst);
489                 info->key.u.ipv6.src = saddr;
490 #endif
491         } else {
492                 return -EINVAL;
493         }
494
495         info->key.tp_src = udp_flow_src_port(bareudp->net, skb,
496                                              bareudp->sport_min,
497                         USHRT_MAX, true);
498         info->key.tp_dst = bareudp->port;
499         return 0;
500 }
501
/* Net device operations for bareudp devices; installed by bareudp_setup(). */
static const struct net_device_ops bareudp_netdev_ops = {
        .ndo_init               = bareudp_init,
        .ndo_uninit             = bareudp_uninit,
        .ndo_open               = bareudp_open,
        .ndo_stop               = bareudp_stop,
        .ndo_start_xmit         = bareudp_xmit,
        .ndo_get_stats64        = ip_tunnel_get_stats64,
        .ndo_fill_metadata_dst  = bareudp_fill_metadata_dst,
};
511
/* Netlink attribute policy for IFLA_BAREUDP_* link attributes. */
static const struct nla_policy bareudp_policy[IFLA_BAREUDP_MAX + 1] = {
        [IFLA_BAREUDP_PORT]                = { .type = NLA_U16 },
        [IFLA_BAREUDP_ETHERTYPE]           = { .type = NLA_U16 },
        [IFLA_BAREUDP_SRCPORT_MIN]         = { .type = NLA_U16 },
        [IFLA_BAREUDP_MULTIPROTO_MODE]     = { .type = NLA_FLAG },
};
518
/* Info for udev, that this is a virtual tunnel endpoint.
 * Attached to each device via SET_NETDEV_DEVTYPE() in bareudp_setup().
 */
static struct device_type bareudp_type = {
        .name = "bareudp",
};
523
524 /* Initialize the device structure. */
525 static void bareudp_setup(struct net_device *dev)
526 {
527         dev->netdev_ops = &bareudp_netdev_ops;
528         dev->needs_free_netdev = true;
529         SET_NETDEV_DEVTYPE(dev, &bareudp_type);
530         dev->features    |= NETIF_F_SG | NETIF_F_HW_CSUM;
531         dev->features    |= NETIF_F_RXCSUM;
532         dev->features    |= NETIF_F_GSO_SOFTWARE;
533         dev->hw_features |= NETIF_F_SG | NETIF_F_HW_CSUM | NETIF_F_RXCSUM;
534         dev->hw_features |= NETIF_F_GSO_SOFTWARE;
535         dev->hard_header_len = 0;
536         dev->addr_len = 0;
537         dev->mtu = ETH_DATA_LEN;
538         dev->min_mtu = IPV4_MIN_MTU;
539         dev->max_mtu = IP_MAX_MTU - BAREUDP_BASE_HLEN;
540         dev->type = ARPHRD_NONE;
541         netif_keep_dst(dev);
542         dev->priv_flags |= IFF_NO_QUEUE;
543         dev->flags = IFF_POINTOPOINT | IFF_NOARP | IFF_MULTICAST;
544 }
545
546 static int bareudp_validate(struct nlattr *tb[], struct nlattr *data[],
547                             struct netlink_ext_ack *extack)
548 {
549         if (!data) {
550                 NL_SET_ERR_MSG(extack,
551                                "Not enough attributes provided to perform the operation");
552                 return -EINVAL;
553         }
554         return 0;
555 }
556
557 static int bareudp2info(struct nlattr *data[], struct bareudp_conf *conf)
558 {
559         if (!data[IFLA_BAREUDP_PORT] || !data[IFLA_BAREUDP_ETHERTYPE])
560                 return -EINVAL;
561
562         if (data[IFLA_BAREUDP_PORT])
563                 conf->port =  nla_get_u16(data[IFLA_BAREUDP_PORT]);
564
565         if (data[IFLA_BAREUDP_ETHERTYPE])
566                 conf->ethertype =  nla_get_u16(data[IFLA_BAREUDP_ETHERTYPE]);
567
568         if (data[IFLA_BAREUDP_SRCPORT_MIN])
569                 conf->sport_min =  nla_get_u16(data[IFLA_BAREUDP_SRCPORT_MIN]);
570
571         return 0;
572 }
573
574 static struct bareudp_dev *bareudp_find_dev(struct bareudp_net *bn,
575                                             const struct bareudp_conf *conf)
576 {
577         struct bareudp_dev *bareudp, *t = NULL;
578
579         list_for_each_entry(bareudp, &bn->bareudp_list, next) {
580                 if (conf->port == bareudp->port)
581                         t = bareudp;
582         }
583         return t;
584 }
585
586 static int bareudp_configure(struct net *net, struct net_device *dev,
587                              struct bareudp_conf *conf)
588 {
589         struct bareudp_net *bn = net_generic(net, bareudp_net_id);
590         struct bareudp_dev *t, *bareudp = netdev_priv(dev);
591         int err;
592
593         bareudp->net = net;
594         bareudp->dev = dev;
595         t = bareudp_find_dev(bn, conf);
596         if (t)
597                 return -EBUSY;
598
599         if (conf->multi_proto_mode &&
600             (conf->ethertype != htons(ETH_P_MPLS_UC) &&
601              conf->ethertype != htons(ETH_P_IP)))
602                 return -EINVAL;
603
604         bareudp->port = conf->port;
605         bareudp->ethertype = conf->ethertype;
606         bareudp->sport_min = conf->sport_min;
607         bareudp->multi_proto_mode = conf->multi_proto_mode;
608         err = register_netdevice(dev);
609         if (err)
610                 return err;
611
612         list_add(&bareudp->next, &bn->bareudp_list);
613         return 0;
614 }
615
616 static int bareudp_link_config(struct net_device *dev,
617                                struct nlattr *tb[])
618 {
619         int err;
620
621         if (tb[IFLA_MTU]) {
622                 err = dev_set_mtu(dev, nla_get_u32(tb[IFLA_MTU]));
623                 if (err)
624                         return err;
625         }
626         return 0;
627 }
628
629 static int bareudp_newlink(struct net *net, struct net_device *dev,
630                            struct nlattr *tb[], struct nlattr *data[],
631                            struct netlink_ext_ack *extack)
632 {
633         struct bareudp_conf conf;
634         int err;
635
636         err = bareudp2info(data, &conf);
637         if (err)
638                 return err;
639
640         err = bareudp_configure(net, dev, &conf);
641         if (err)
642                 return err;
643
644         err = bareudp_link_config(dev, tb);
645         if (err)
646                 return err;
647
648         return 0;
649 }
650
651 static void bareudp_dellink(struct net_device *dev, struct list_head *head)
652 {
653         struct bareudp_dev *bareudp = netdev_priv(dev);
654
655         list_del(&bareudp->next);
656         unregister_netdevice_queue(dev, head);
657 }
658
659 static size_t bareudp_get_size(const struct net_device *dev)
660 {
661         return  nla_total_size(sizeof(__be16)) +  /* IFLA_BAREUDP_PORT */
662                 nla_total_size(sizeof(__be16)) +  /* IFLA_BAREUDP_ETHERTYPE */
663                 nla_total_size(sizeof(__u16))  +  /* IFLA_BAREUDP_SRCPORT_MIN */
664                 nla_total_size(0)              +  /* IFLA_BAREUDP_MULTIPROTO_MODE */
665                 0;
666 }
667
668 static int bareudp_fill_info(struct sk_buff *skb, const struct net_device *dev)
669 {
670         struct bareudp_dev *bareudp = netdev_priv(dev);
671
672         if (nla_put_be16(skb, IFLA_BAREUDP_PORT, bareudp->port))
673                 goto nla_put_failure;
674         if (nla_put_be16(skb, IFLA_BAREUDP_ETHERTYPE, bareudp->ethertype))
675                 goto nla_put_failure;
676         if (nla_put_u16(skb, IFLA_BAREUDP_SRCPORT_MIN, bareudp->sport_min))
677                 goto nla_put_failure;
678         if (bareudp->multi_proto_mode &&
679             nla_put_flag(skb, IFLA_BAREUDP_MULTIPROTO_MODE))
680                 goto nla_put_failure;
681
682         return 0;
683
684 nla_put_failure:
685         return -EMSGSIZE;
686 }
687
/* rtnetlink link operations for the "bareudp" link kind; registered in
 * bareudp_init_module() and also used by bareudp_dev_create().
 */
static struct rtnl_link_ops bareudp_link_ops __read_mostly = {
        .kind           = "bareudp",
        .maxtype        = IFLA_BAREUDP_MAX,
        .policy         = bareudp_policy,
        .priv_size      = sizeof(struct bareudp_dev),
        .setup          = bareudp_setup,
        .validate       = bareudp_validate,
        .newlink        = bareudp_newlink,
        .dellink        = bareudp_dellink,
        .get_size       = bareudp_get_size,
        .fill_info      = bareudp_fill_info,
};
700
701 struct net_device *bareudp_dev_create(struct net *net, const char *name,
702                                       u8 name_assign_type,
703                                       struct bareudp_conf *conf)
704 {
705         struct nlattr *tb[IFLA_MAX + 1];
706         struct net_device *dev;
707         LIST_HEAD(list_kill);
708         int err;
709
710         memset(tb, 0, sizeof(tb));
711         dev = rtnl_create_link(net, name, name_assign_type,
712                                &bareudp_link_ops, tb, NULL);
713         if (IS_ERR(dev))
714                 return dev;
715
716         err = bareudp_configure(net, dev, conf);
717         if (err) {
718                 free_netdev(dev);
719                 return ERR_PTR(err);
720         }
721         err = dev_set_mtu(dev, IP_MAX_MTU - BAREUDP_BASE_HLEN);
722         if (err)
723                 goto err;
724
725         err = rtnl_configure_link(dev, NULL);
726         if (err < 0)
727                 goto err;
728
729         return dev;
730 err:
731         bareudp_dellink(dev, &list_kill);
732         unregister_netdevice_many(&list_kill);
733         return ERR_PTR(err);
734 }
735 EXPORT_SYMBOL_GPL(bareudp_dev_create);
736
737 static __net_init int bareudp_init_net(struct net *net)
738 {
739         struct bareudp_net *bn = net_generic(net, bareudp_net_id);
740
741         INIT_LIST_HEAD(&bn->bareudp_list);
742         return 0;
743 }
744
745 static void bareudp_destroy_tunnels(struct net *net, struct list_head *head)
746 {
747         struct bareudp_net *bn = net_generic(net, bareudp_net_id);
748         struct bareudp_dev *bareudp, *next;
749
750         list_for_each_entry_safe(bareudp, next, &bn->bareudp_list, next)
751                 unregister_netdevice_queue(bareudp->dev, head);
752 }
753
754 static void __net_exit bareudp_exit_batch_net(struct list_head *net_list)
755 {
756         struct net *net;
757         LIST_HEAD(list);
758
759         rtnl_lock();
760         list_for_each_entry(net, net_list, exit_list)
761                 bareudp_destroy_tunnels(net, &list);
762
763         /* unregister the devices gathered above */
764         unregister_netdevice_many(&list);
765         rtnl_unlock();
766 }
767
/* Per-network-namespace hooks; .id and .size describe the per-namespace
 * struct bareudp_net that net_generic() returns for bareudp_net_id.
 */
static struct pernet_operations bareudp_net_ops = {
        .init = bareudp_init_net,
        .exit_batch = bareudp_exit_batch_net,
        .id   = &bareudp_net_id,
        .size = sizeof(struct bareudp_net),
};
774
775 static int __init bareudp_init_module(void)
776 {
777         int rc;
778
779         rc = register_pernet_subsys(&bareudp_net_ops);
780         if (rc)
781                 goto out1;
782
783         rc = rtnl_link_register(&bareudp_link_ops);
784         if (rc)
785                 goto out2;
786
787         return 0;
788 out2:
789         unregister_pernet_subsys(&bareudp_net_ops);
790 out1:
791         return rc;
792 }
793 late_initcall(bareudp_init_module);
794
795 static void __exit bareudp_cleanup_module(void)
796 {
797         rtnl_link_unregister(&bareudp_link_ops);
798         unregister_pernet_subsys(&bareudp_net_ops);
799 }
800 module_exit(bareudp_cleanup_module);
801
802 MODULE_LICENSE("GPL");
803 MODULE_AUTHOR("Martin Varghese <martin.varghese@nokia.com>");
804 MODULE_DESCRIPTION("Interface driver for UDP encapsulated traffic");