2 #include <linux/igmp.h>
3 #include <linux/kernel.h>
4 #include <linux/netdevice.h>
5 #include <linux/rculist.h>
6 #include <linux/skbuff.h>
7 #include <linux/if_ether.h>
9 #include <net/netlink.h>
10 #include <net/switchdev.h>
11 #if IS_ENABLED(CONFIG_IPV6)
13 #include <net/addrconf.h>
16 #include "br_private.h"
/*
 * br_rports_fill_info - append the bridge's multicast router ports to @skb.
 *
 * Opens an MDBA_ROUTER nest and, for each port found on br->router_list,
 * a nested MDBA_ROUTER_PORT attribute holding the port's ifindex, its
 * router timer value and its multicast_router type.
 *
 * @skb: netlink message being built
 * @cb:  dump callback state (not referenced on the lines visible here)
 * @dev: bridge device; netdev_priv(@dev) is used as the struct net_bridge
 *
 * NOTE(review): the return statements and the error label are not visible
 * in this listing; br_mdb_dump() treats a negative return as failure.
 */
18 static int br_rports_fill_info(struct sk_buff *skb, struct netlink_callback *cb,
19 struct net_device *dev)
21 struct net_bridge *br = netdev_priv(dev);
22 struct net_bridge_port *p;
23 struct nlattr *nest, *port_nest;
/* Guard: bridge multicast_router is zero or the router list is empty. */
25 if (!br->multicast_router || hlist_empty(&br->router_list))
28 nest = nla_nest_start(skb, MDBA_ROUTER);
/* One MDBA_ROUTER_PORT nest per listed port, walked with the RCU iterator. */
32 hlist_for_each_entry_rcu(p, &br->router_list, rlist) {
35 port_nest = nla_nest_start(skb, MDBA_ROUTER_PORT);
/*
 * The ifindex goes in first via nla_put_nohdr(); the timer and the router
 * type follow as MDBA_ROUTER_PATTR_* attributes.
 */
38 if (nla_put_nohdr(skb, sizeof(u32), &p->dev->ifindex) ||
39 nla_put_u32(skb, MDBA_ROUTER_PATTR_TIMER,
40 br_timer_value(&p->multicast_router_timer)) ||
41 nla_put_u8(skb, MDBA_ROUTER_PATTR_TYPE,
42 p->multicast_router)) {
/* A put failed: discard the partially built port nest. */
43 nla_nest_cancel(skb, port_nest);
46 nla_nest_end(skb, port_nest);
49 nla_nest_end(skb, nest);
/* Rolls back the outer MDBA_ROUTER nest (presumably the failure path). */
52 nla_nest_cancel(skb, nest);
/*
 * Translate port-group flag bits into a br_mdb_entry: ->state receives
 * @flags masked with MDB_PG_FLAGS_PERMANENT, and MDB_FLAGS_OFFLOAD is OR-ed
 * into ->flags when @flags carries MDB_PG_FLAGS_OFFLOAD.
 *
 * NOTE(review): ->flags is only OR-ed on the visible lines; confirm it is
 * cleared beforehand (no such line appears in this listing).
 */
56 static void __mdb_entry_fill_flags(struct br_mdb_entry *e, unsigned char flags)
58 e->state = flags & MDB_PG_FLAGS_PERMANENT;
60 if (flags & MDB_PG_FLAGS_OFFLOAD)
61 e->flags |= MDB_FLAGS_OFFLOAD;
/*
 * Build a struct br_ip from a br_mdb_entry.
 *
 * @ip is zeroed in full first, then the protocol is copied, followed by the
 * IPv4 address when the protocol is ETH_P_IP. The IPv6 address copy is only
 * compiled when CONFIG_IPV6 is enabled.
 */
64 static void __mdb_entry_to_br_ip(struct br_mdb_entry *entry, struct br_ip *ip)
/* Clear every byte so fields not assigned below start out as zero. */
66 memset(ip, 0, sizeof(struct br_ip));
68 ip->proto = entry->addr.proto;
/* proto is compared against htons(), i.e. it is kept in network order. */
69 if (ip->proto == htons(ETH_P_IP))
70 ip->u.ip4 = entry->addr.u.ip4;
71 #if IS_ENABLED(CONFIG_IPV6)
73 ip->u.ip6 = entry->addr.u.ip6;
/*
 * br_mdb_fill_info - append the bridge's multicast database to @skb.
 *
 * Layout produced by the visible lines:
 *   MDBA_MDB
 *     MDBA_MDB_ENTRY            (one per hash-table entry)
 *       MDBA_MDB_ENTRY_INFO     (one per port group of that entry)
 *         struct br_mdb_entry   (written with nla_put_nohdr())
 *         MDBA_MDB_EATTR_TIMER  (port group timer value)
 *
 * @skb: netlink message being built
 * @cb:  dump callback state; cb->args[1] is read as the starting index
 * @dev: bridge device; netdev_priv(@dev) is used as the struct net_bridge
 *
 * NOTE(review): the table is accessed through rcu_dereference() and the RCU
 * list iterator, so the caller is presumably inside an RCU read-side
 * section -- confirm against br_mdb_dump().
 */
77 static int br_mdb_fill_info(struct sk_buff *skb, struct netlink_callback *cb,
78 struct net_device *dev)
80 struct net_bridge *br = netdev_priv(dev);
81 struct net_bridge_mdb_htable *mdb;
82 struct nlattr *nest, *nest2;
/* s_idx: index taken from the dump state (presumably the resume point). */
84 int idx = 0, s_idx = cb->args[1];
/* Guard: multicast handling is disabled on this bridge. */
86 if (br->multicast_disabled)
89 mdb = rcu_dereference(br->mdb);
93 nest = nla_nest_start(skb, MDBA_MDB);
/* Visit every bucket of the hash table. */
97 for (i = 0; i < mdb->max; i++) {
98 struct net_bridge_mdb_entry *mp;
99 struct net_bridge_port_group *p;
100 struct net_bridge_port_group __rcu **pp;
101 struct net_bridge_port *port;
/* hlist[] is indexed by mdb->ver to select the list linkage to follow. */
103 hlist_for_each_entry_rcu(mp, &mdb->mhash[i], hlist[mdb->ver]) {
107 nest2 = nla_nest_start(skb, MDBA_MDB_ENTRY);
/* Walk the entry's chain of port groups, starting at mp->ports. */
113 for (pp = &mp->ports;
114 (p = rcu_dereference(*pp)) != NULL;
116 struct nlattr *nest_ent;
117 struct br_mdb_entry e;
/* Zero the whole struct; it is copied verbatim into the message below. */
123 memset(&e, 0, sizeof(e));
124 e.ifindex = port->dev->ifindex;
126 __mdb_entry_fill_flags(&e, p->flags);
127 if (p->addr.proto == htons(ETH_P_IP))
128 e.addr.u.ip4 = p->addr.u.ip4;
129 #if IS_ENABLED(CONFIG_IPV6)
130 if (p->addr.proto == htons(ETH_P_IPV6))
131 e.addr.u.ip6 = p->addr.u.ip6;
133 e.addr.proto = p->addr.proto;
134 nest_ent = nla_nest_start(skb,
135 MDBA_MDB_ENTRY_INFO);
/* Presumably taken when nest_ent could not be started: drop the entry nest. */
137 nla_nest_cancel(skb, nest2);
/* Entry struct first, then its timer; on failure unwind both inner nests. */
141 if (nla_put_nohdr(skb, sizeof(e), &e) ||
143 MDBA_MDB_EATTR_TIMER,
144 br_timer_value(&p->timer))) {
145 nla_nest_cancel(skb, nest_ent);
146 nla_nest_cancel(skb, nest2);
150 nla_nest_end(skb, nest_ent);
152 nla_nest_end(skb, nest2);
160 nla_nest_end(skb, nest);
/*
 * br_mdb_dump - dump callback registered for RTM_GETMDB in br_mdb_init().
 *
 * For every device in the socket's network namespace that has IFF_EBRIDGE
 * set, one RTM_GETMDB message flagged NLM_F_MULTI is started with a zeroed
 * struct br_port_msg header carrying the bridge ifindex; the MDB entries and
 * then the router ports are appended to it.
 *
 * @skb: reply buffer being filled
 * @cb:  netlink dump state (request header, sequence tracking, args[])
 */
164 static int br_mdb_dump(struct sk_buff *skb, struct netlink_callback *cb)
166 struct net_device *dev;
167 struct net *net = sock_net(skb->sk);
168 struct nlmsghdr *nlh = NULL;
/* Dump sequence: sum of the namespace device sequence and the MDB rehash one. */
175 /* In theory this could be wrapped to 0... */
176 cb->seq = net->dev_base_seq + br_mdb_rehash_seq;
178 for_each_netdev_rcu(net, dev) {
/* Only bridge devices are of interest. */
179 if (dev->priv_flags & IFF_EBRIDGE) {
180 struct br_port_msg *bpm;
185 nlh = nlmsg_put(skb, NETLINK_CB(cb->skb).portid,
186 cb->nlh->nlmsg_seq, RTM_GETMDB,
187 sizeof(*bpm), NLM_F_MULTI);
191 bpm = nlmsg_data(nlh);
192 memset(bpm, 0, sizeof(*bpm));
193 bpm->ifindex = dev->ifindex;
/* A negative return from either fill helper is treated as a failure. */
194 if (br_mdb_fill_info(skb, cb, dev) < 0)
196 if (br_rports_fill_info(skb, cb, dev) < 0)
/*
 * nlmsg_populate_mdb_fill - build one MDB notification message in @skb.
 *
 * The message starts with a zeroed struct br_port_msg (family AF_BRIDGE,
 * ifindex of @dev) followed by MDBA_MDB > MDBA_MDB_ENTRY nests containing a
 * single MDBA_MDB_ENTRY_INFO attribute that carries a copy of *@entry.
 *
 * @skb:   buffer to build the message in
 * @dev:   bridge device the notification is about
 * @entry: MDB entry to report
 * @pid:   netlink port id for the header
 * @seq:   sequence number for the header
 * @type:  message type for the header
 * @flags: NOTE(review): not referenced on the visible lines -- nlmsg_put()
 *         is passed a literal 0; confirm this is intended
 */
214 static int nlmsg_populate_mdb_fill(struct sk_buff *skb,
215 struct net_device *dev,
216 struct br_mdb_entry *entry, u32 pid,
217 u32 seq, int type, unsigned int flags)
219 struct nlmsghdr *nlh;
220 struct br_port_msg *bpm;
221 struct nlattr *nest, *nest2;
223 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*bpm), 0);
227 bpm = nlmsg_data(nlh);
228 memset(bpm, 0, sizeof(*bpm));
229 bpm->family = AF_BRIDGE;
230 bpm->ifindex = dev->ifindex;
231 nest = nla_nest_start(skb, MDBA_MDB);
234 nest2 = nla_nest_start(skb, MDBA_MDB_ENTRY);
/* Unlike the dump path, the entry is a regular attribute with a header. */
238 if (nla_put(skb, MDBA_MDB_ENTRY_INFO, sizeof(*entry), entry))
/* Success path: close the nests innermost first. */
241 nla_nest_end(skb, nest2);
242 nla_nest_end(skb, nest);
/* Presumably the unwind path: close the outer nest, then drop the message. */
247 nla_nest_end(skb, nest);
249 nlmsg_cancel(skb, nlh);
/*
 * Size passed to nlmsg_new() for an MDB notification: the aligned
 * struct br_port_msg header plus one attribute holding a struct br_mdb_entry.
 *
 * NOTE(review): nlmsg_populate_mdb_fill() also opens two nests (MDBA_MDB and
 * MDBA_MDB_ENTRY) whose attribute headers are not counted here -- confirm
 * the allocation leaves enough room.
 */
253 static inline size_t rtnl_mdb_nlmsg_size(void)
255 return NLMSG_ALIGN(sizeof(struct br_port_msg))
256 + nla_total_size(sizeof(struct br_mdb_entry));
/*
 * Context attached to a switchdev MDB object as complete_priv and read back
 * in br_mdb_complete().
 *
 * NOTE(review): code in this file also accesses an `ip` member (data->ip,
 * complete_info->ip) that is not visible in this listing.
 */
259 struct br_mdb_complete_info {
/* Bridge port the MDB entry was added for. */
260 struct net_bridge_port *port;
/*
 * br_mdb_complete - completion callback installed on the switchdev MDB object
 * by __br_mdb_notify().
 *
 * Under br->multicast_lock, looks up the MDB entry for data->ip and sets
 * MDB_PG_FLAGS_OFFLOAD on a port group found in that entry's port list.
 *
 * @dev:  device the object was applied to (unused on the visible lines)
 * @err:  result reported for the operation (its check is not visible here)
 * @priv: struct br_mdb_complete_info supplied when the object was queued
 *
 * NOTE(review): the port-matching test inside the loop and the release of
 * @priv are not visible in this listing -- confirm both exist.
 */
264 static void br_mdb_complete(struct net_device *dev, int err, void *priv)
266 struct br_mdb_complete_info *data = priv;
267 struct net_bridge_port_group __rcu **pp;
268 struct net_bridge_port_group *p;
269 struct net_bridge_mdb_htable *mdb;
270 struct net_bridge_mdb_entry *mp;
271 struct net_bridge_port *port = data->port;
272 struct net_bridge *br = port->br;
/* The MDB and its port-group lists are accessed under multicast_lock. */
277 spin_lock_bh(&br->multicast_lock);
278 mdb = mlock_dereference(br->mdb, br);
279 mp = br_mdb_ip_get(mdb, &data->ip);
282 for (pp = &mp->ports; (p = mlock_dereference(*pp, br)) != NULL;
/* Record on the port group that the entry has been offloaded. */
286 p->flags |= MDB_PG_FLAGS_OFFLOAD;
289 spin_unlock_bh(&br->multicast_lock);
/*
 * __br_mdb_notify - push an MDB change to switchdev and to netlink listeners.
 *
 * 1. Maps the group address in @entry to an Ethernet multicast address and
 *    adds (RTM_NEWMDB) or deletes (RTM_DELMDB) a SWITCHDEV_OBJ_ID_PORT_MDB
 *    object on the port device named by entry->ifindex.
 * 2. Builds an MDB message and sends it to the RTNLGRP_MDB group; on the
 *    error path the group is told via rtnl_set_sk_err().
 *
 * @dev:   bridge device
 * @p:     bridge port the entry belongs to
 * @entry: MDB entry being added or removed
 * @type:  RTM_NEWMDB or RTM_DELMDB
 *
 * All allocations here use GFP_ATOMIC.
 */
294 static void __br_mdb_notify(struct net_device *dev, struct net_bridge_port *p,
295 struct br_mdb_entry *entry, int type)
297 struct br_mdb_complete_info *complete_info;
/* The object is flagged SWITCHDEV_F_DEFER (presumably processed later). */
298 struct switchdev_obj_port_mdb mdb = {
300 .id = SWITCHDEV_OBJ_ID_PORT_MDB,
301 .flags = SWITCHDEV_F_DEFER,
305 struct net_device *port_dev;
306 struct net *net = dev_net(dev);
/* May yield NULL; the branches below test port_dev before using it. */
310 port_dev = __dev_get_by_index(net, entry->ifindex);
/* Derive the Ethernet multicast address matching the IP group address. */
311 if (entry->addr.proto == htons(ETH_P_IP))
312 ip_eth_mc_map(entry->addr.u.ip4, mdb.addr);
313 #if IS_ENABLED(CONFIG_IPV6)
315 ipv6_eth_mc_map(&entry->addr.u.ip6, mdb.addr);
318 mdb.obj.orig_dev = port_dev;
319 if (port_dev && type == RTM_NEWMDB) {
/*
 * Context for br_mdb_complete(), which flags the port group as offloaded.
 * NOTE(review): the check of the kmalloc() result is not visible in this
 * listing -- confirm it exists.
 */
320 complete_info = kmalloc(sizeof(*complete_info), GFP_ATOMIC);
322 complete_info->port = p;
323 __mdb_entry_to_br_ip(entry, &complete_info->ip);
324 mdb.obj.complete_priv = complete_info;
325 mdb.obj.complete = br_mdb_complete;
/*
 * NOTE(review): the return value is discarded. If the add can fail without
 * the completion callback running, complete_info may never be freed --
 * confirm and free it on failure if so.
 */
326 switchdev_port_obj_add(port_dev, &mdb.obj);
328 } else if (port_dev && type == RTM_DELMDB) {
329 switchdev_port_obj_del(port_dev, &mdb.obj);
/* Netlink notification part. */
332 skb = nlmsg_new(rtnl_mdb_nlmsg_size(), GFP_ATOMIC);
/* pid and seq are 0 for this kernel-originated notification. */
336 err = nlmsg_populate_mdb_fill(skb, dev, entry, 0, 0, type, NTF_SELF);
342 rtnl_notify(skb, net, 0, RTNLGRP_MDB, NULL, GFP_ATOMIC);
/* Presumably the error path: report err to RTNLGRP_MDB listeners. */
345 rtnl_set_sk_err(net, RTNLGRP_MDB, err);
/*
 * br_mdb_notify - report an MDB change for @group on @port.
 *
 * Builds a zeroed struct br_mdb_entry on the stack from the port's ifindex,
 * the group's protocol, address and VLAN id, and @flags, then hands it to
 * __br_mdb_notify().
 *
 * @dev:   bridge device
 * @port:  bridge port the group membership is on
 * @group: multicast group address, protocol and VLAN
 * @type:  message type forwarded unchanged to __br_mdb_notify()
 * @flags: port-group flags, converted by __mdb_entry_fill_flags()
 */
348 void br_mdb_notify(struct net_device *dev, struct net_bridge_port *port,
349 struct br_ip *group, int type, u8 flags)
351 struct br_mdb_entry entry;
353 memset(&entry, 0, sizeof(entry));
354 entry.ifindex = port->dev->ifindex;
355 entry.addr.proto = group->proto;
/*
 * Both address copies are unconditional on the visible lines; the IPv6 one
 * is only compiled when CONFIG_IPV6 is enabled.
 */
356 entry.addr.u.ip4 = group->u.ip4;
357 #if IS_ENABLED(CONFIG_IPV6)
358 entry.addr.u.ip6 = group->u.ip6;
360 entry.vid = group->vid;
361 __mdb_entry_fill_flags(&entry, flags);
362 __br_mdb_notify(dev, port, &entry, type);
/*
 * nlmsg_populate_rtr_fill - build one router-port notification in @skb.
 *
 * The message starts with a zeroed struct br_port_msg (family AF_BRIDGE,
 * ifindex of @dev) followed by an MDBA_ROUTER nest holding a single u32
 * MDBA_ROUTER_PORT attribute set to @ifindex.
 *
 * @skb:     buffer to build the message in
 * @dev:     bridge device
 * @ifindex: value reported as the router port
 * @pid:     netlink port id for the header
 * @seq:     sequence number for the header
 * @type:    message type for the header
 * @flags:   NOTE(review): not referenced on the visible lines -- nlmsg_put()
 *           is passed NLM_F_MULTI instead; confirm this is intended
 */
365 static int nlmsg_populate_rtr_fill(struct sk_buff *skb,
366 struct net_device *dev,
367 int ifindex, u32 pid,
368 u32 seq, int type, unsigned int flags)
370 struct br_port_msg *bpm;
371 struct nlmsghdr *nlh;
374 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*bpm), NLM_F_MULTI);
378 bpm = nlmsg_data(nlh);
379 memset(bpm, 0, sizeof(*bpm));
380 bpm->family = AF_BRIDGE;
381 bpm->ifindex = dev->ifindex;
382 nest = nla_nest_start(skb, MDBA_ROUTER);
386 if (nla_put_u32(skb, MDBA_ROUTER_PORT, ifindex))
/* Success path: close the nest. */
389 nla_nest_end(skb, nest);
/* Presumably the unwind path: close the nest, then drop the message. */
394 nla_nest_end(skb, nest);
396 nlmsg_cancel(skb, nlh);
/*
 * Size passed to nlmsg_new() for a router-port notification: the aligned
 * struct br_port_msg header plus one attribute holding a __u32.
 */
400 static inline size_t rtnl_rtr_nlmsg_size(void)
402 return NLMSG_ALIGN(sizeof(struct br_port_msg))
403 + nla_total_size(sizeof(__u32));
/*
 * br_rtr_notify - send a router-port notification to RTNLGRP_MDB listeners.
 *
 * @dev:  bridge device
 * @port: bridge port concerned; when NULL, ifindex 0 is reported
 *
 * The remainder of the parameter list (the body uses `type`) is on a line
 * not visible in this listing.
 */
406 void br_rtr_notify(struct net_device *dev, struct net_bridge_port *port,
409 struct net *net = dev_net(dev);
/* A NULL port is allowed and is reported as ifindex 0. */
414 ifindex = port ? port->dev->ifindex : 0;
415 skb = nlmsg_new(rtnl_rtr_nlmsg_size(), GFP_ATOMIC);
/* pid and seq are 0 for this kernel-originated notification. */
419 err = nlmsg_populate_rtr_fill(skb, dev, ifindex, 0, 0, type, NTF_SELF);
425 rtnl_notify(skb, net, 0, RTNLGRP_MDB, NULL, GFP_ATOMIC);
/* Presumably the error path: report err to RTNLGRP_MDB listeners. */
429 rtnl_set_sk_err(net, RTNLGRP_MDB, err);
/*
 * is_valid_mdb_entry - check a br_mdb_entry taken from a netlink request.
 *
 * Conditions tested on the visible lines (each presumably rejects the entry;
 * the return statements are not visible in this listing):
 *   - ifindex is 0
 *   - IPv4: address is not multicast, or is local multicast
 *   - IPv6 (CONFIG_IPV6 only): address is the link-local all-nodes address
 *   - state is neither MDB_PERMANENT nor MDB_TEMPORARY
 *   - vid is greater than or equal to VLAN_VID_MASK
 */
432 static bool is_valid_mdb_entry(struct br_mdb_entry *entry)
434 if (entry->ifindex == 0)
437 if (entry->addr.proto == htons(ETH_P_IP)) {
438 if (!ipv4_is_multicast(entry->addr.u.ip4))
440 if (ipv4_is_local_multicast(entry->addr.u.ip4))
442 #if IS_ENABLED(CONFIG_IPV6)
443 } else if (entry->addr.proto == htons(ETH_P_IPV6)) {
444 if (ipv6_addr_is_ll_all_nodes(&entry->addr.u.ip6))
449 if (entry->state != MDB_PERMANENT && entry->state != MDB_TEMPORARY)
451 if (entry->vid >= VLAN_VID_MASK)
/*
 * br_mdb_parse - parse and validate an MDB add/delete request.
 *
 * Parses the attributes that follow the struct br_port_msg header, resolves
 * bpm->ifindex to a device that must be a bridge (IFF_EBRIDGE), and checks
 * that MDBA_SET_ENTRY is present, is exactly sizeof(struct br_mdb_entry)
 * long and passes is_valid_mdb_entry(). Each rejection logs a pr_info()
 * message.
 *
 * @skb:    request skb; its socket selects the network namespace
 * @nlh:    request netlink header
 * @pdev:   out: bridge device (presumably set on success; the assignment is
 *          not visible in this listing)
 * @pentry: out: pointer to the entry inside the request payload (presumably
 *          set on success; the assignment is not visible in this listing)
 */
457 static int br_mdb_parse(struct sk_buff *skb, struct nlmsghdr *nlh,
458 struct net_device **pdev, struct br_mdb_entry **pentry)
460 struct net *net = sock_net(skb->sk);
461 struct br_mdb_entry *entry;
462 struct br_port_msg *bpm;
463 struct nlattr *tb[MDBA_SET_ENTRY_MAX+1];
464 struct net_device *dev;
467 err = nlmsg_parse(nlh, sizeof(*bpm), tb, MDBA_SET_ENTRY_MAX, NULL,
472 bpm = nlmsg_data(nlh);
473 if (bpm->ifindex == 0) {
474 pr_info("PF_BRIDGE: br_mdb_parse() with invalid ifindex\n");
478 dev = __dev_get_by_index(net, bpm->ifindex);
480 pr_info("PF_BRIDGE: br_mdb_parse() with unknown ifindex\n");
484 if (!(dev->priv_flags & IFF_EBRIDGE)) {
485 pr_info("PF_BRIDGE: br_mdb_parse() with non-bridge\n");
/* The attribute must exist and match the struct size exactly. */
491 if (!tb[MDBA_SET_ENTRY] ||
492 nla_len(tb[MDBA_SET_ENTRY]) != sizeof(struct br_mdb_entry)) {
493 pr_info("PF_BRIDGE: br_mdb_parse() with invalid attr\n");
/* entry points into the request message; it is not copied here. */
497 entry = nla_data(tb[MDBA_SET_ENTRY]);
498 if (!is_valid_mdb_entry(entry)) {
499 pr_info("PF_BRIDGE: br_mdb_parse() with invalid entry\n");
/*
 * br_mdb_add_group - add @port to the MDB entry for @group.
 *
 * Looks the group up in the bridge's MDB, creating it through
 * br_multicast_new_group() if needed, walks the entry's port-group list to
 * find the insertion point, then allocates a new port group and links it in
 * with rcu_assign_pointer(). For MDB_TEMPORARY entries the port-group timer
 * is armed for br->multicast_membership_interval from now.
 *
 * @br:    bridge
 * @port:  bridge port joining the group
 * @group: group address, protocol and VLAN
 * @state: MDB_PERMANENT or MDB_TEMPORARY
 *
 * The visible caller, __br_mdb_add(), holds br->multicast_lock around this
 * call; the mlock_dereference() accesses rely on that.
 */
507 static int br_mdb_add_group(struct net_bridge *br, struct net_bridge_port *port,
508 struct br_ip *group, unsigned char state)
510 struct net_bridge_mdb_entry *mp;
511 struct net_bridge_port_group *p;
512 struct net_bridge_port_group __rcu **pp;
513 struct net_bridge_mdb_htable *mdb;
514 unsigned long now = jiffies;
517 mdb = mlock_dereference(br->mdb, br);
518 mp = br_mdb_ip_get(mdb, group);
/* Creates the group (presumably only when the lookup above found none). */
520 mp = br_multicast_new_group(br, port, group);
521 err = PTR_ERR_OR_ZERO(mp);
526 for (pp = &mp->ports;
527 (p = mlock_dereference(*pp, br)) != NULL;
/* Ports are compared by pointer value to locate the insertion point. */
531 if ((unsigned long)p->port < (unsigned long)port)
/* The new group's next pointer is the current *pp, i.e. it goes in at pp. */
535 p = br_multicast_new_port_group(port, group, *pp, state, NULL);
538 rcu_assign_pointer(*pp, p);
/* Only temporary entries get a timer armed here. */
539 if (state == MDB_TEMPORARY)
540 mod_timer(&p->timer, now + br->multicast_membership_interval);
/*
 * __br_mdb_add - validate the target port and add one MDB entry.
 *
 * Conditions tested on the visible lines before the add: the bridge device
 * is running with multicast enabled, and entry->ifindex resolves to a port
 * of this bridge that is not in BR_STATE_DISABLED. The add itself runs
 * under br->multicast_lock.
 *
 * @net:   network namespace used to resolve entry->ifindex
 * @br:    bridge to add the entry to
 * @entry: entry from the netlink request
 */
545 static int __br_mdb_add(struct net *net, struct net_bridge *br,
546 struct br_mdb_entry *entry)
549 struct net_device *dev;
550 struct net_bridge_port *p;
553 if (!netif_running(br->dev) || br->multicast_disabled)
556 dev = __dev_get_by_index(net, entry->ifindex);
/* The _rtnl accessor suggests RTNL is held by the caller -- TODO confirm. */
560 p = br_port_get_rtnl(dev);
561 if (!p || p->br != br || p->state == BR_STATE_DISABLED)
/* Convert the request's entry into the bridge's internal group key. */
564 __mdb_entry_to_br_ip(entry, &ip);
566 spin_lock_bh(&br->multicast_lock);
567 ret = br_mdb_add_group(br, p, &ip, entry->state);
568 spin_unlock_bh(&br->multicast_lock);
/*
 * br_mdb_add - handler registered for RTM_NEWMDB in br_mdb_init().
 *
 * Parses the request with br_mdb_parse(), resolves entry->ifindex to a port
 * that must belong to the parsed bridge and not be in BR_STATE_DISABLED,
 * then adds the entry and emits an RTM_NEWMDB notification.
 *
 * When VLAN filtering is enabled on the bridge, the port has a VLAN group
 * and the request carries vid 0, the add/notify pair runs once per VLAN on
 * the port's vlan_list; otherwise it runs once for the entry as given.
 * NOTE(review): the per-VLAN update of entry->vid is not visible in this
 * listing.
 *
 * @skb:    request skb
 * @nlh:    request netlink header
 * @extack: extended ack (not referenced on the visible lines)
 */
572 static int br_mdb_add(struct sk_buff *skb, struct nlmsghdr *nlh,
573 struct netlink_ext_ack *extack)
575 struct net *net = sock_net(skb->sk);
576 struct net_bridge_vlan_group *vg;
577 struct net_device *dev, *pdev;
578 struct br_mdb_entry *entry;
579 struct net_bridge_port *p;
580 struct net_bridge_vlan *v;
581 struct net_bridge *br;
/* dev is the bridge; entry points into the request payload. */
584 err = br_mdb_parse(skb, nlh, &dev, &entry);
588 br = netdev_priv(dev);
590 /* If vlan filtering is enabled and VLAN is not specified
591 * install mdb entry on all vlans configured on the port.
593 pdev = __dev_get_by_index(net, entry->ifindex);
597 p = br_port_get_rtnl(pdev);
598 if (!p || p->br != br || p->state == BR_STATE_DISABLED)
601 vg = nbp_vlan_group(p);
602 if (br_vlan_enabled(br->dev) && vg && entry->vid == 0) {
603 list_for_each_entry(v, &vg->vlan_list, vlist) {
605 err = __br_mdb_add(net, br, entry);
608 __br_mdb_notify(dev, p, entry, RTM_NEWMDB);
611 err = __br_mdb_add(net, br, entry);
613 __br_mdb_notify(dev, p, entry, RTM_NEWMDB);
/*
 * __br_mdb_del - remove one port's membership from an MDB entry.
 *
 * With the bridge running and multicast enabled, takes br->multicast_lock,
 * looks up the group described by @entry and walks its port-group list for
 * the group whose port has entry->ifindex. That port group is unlinked,
 * its timer deleted and its memory released through call_rcu_bh(). If the
 * entry is then left with no ports and no mglist, its timer is set to
 * expire at the current jiffies.
 *
 * @br:    bridge to delete from
 * @entry: entry from the request; its state/flags are updated from the
 *         removed port group via __mdb_entry_fill_flags()
 */
619 static int __br_mdb_del(struct net_bridge *br, struct br_mdb_entry *entry)
621 struct net_bridge_mdb_htable *mdb;
622 struct net_bridge_mdb_entry *mp;
623 struct net_bridge_port_group *p;
624 struct net_bridge_port_group __rcu **pp;
628 if (!netif_running(br->dev) || br->multicast_disabled)
631 __mdb_entry_to_br_ip(entry, &ip);
633 spin_lock_bh(&br->multicast_lock);
634 mdb = mlock_dereference(br->mdb, br);
636 mp = br_mdb_ip_get(mdb, &ip);
640 for (pp = &mp->ports;
641 (p = mlock_dereference(*pp, br)) != NULL;
/* Not the requested port (presumably skipped; the action is not visible). */
643 if (!p->port || p->port->dev->ifindex != entry->ifindex)
646 if (p->port->state == BR_STATE_DISABLED)
/* Capture the group's flags for the notification, then unlink and free it. */
649 __mdb_entry_fill_flags(entry, p->flags);
650 rcu_assign_pointer(*pp, p->next);
651 hlist_del_init(&p->mglist);
652 del_timer(&p->timer);
/* Freed through call_rcu_bh() rather than immediately. */
653 call_rcu_bh(&p->rcu, br_multicast_free_pg);
/* Entry has no members left: set its timer to expire now. */
656 if (!mp->ports && !mp->mglist &&
657 netif_running(br->dev))
658 mod_timer(&mp->timer, jiffies);
663 spin_unlock_bh(&br->multicast_lock);
/*
 * br_mdb_del - handler registered for RTM_DELMDB in br_mdb_init().
 *
 * Parses the request with br_mdb_parse(), resolves entry->ifindex to a port
 * that must belong to the parsed bridge and not be in BR_STATE_DISABLED,
 * then deletes the entry and emits an RTM_DELMDB notification.
 *
 * When VLAN filtering is enabled on the bridge, the port has a VLAN group
 * and the request carries vid 0, the delete/notify pair runs once per VLAN
 * on the port's vlan_list; otherwise it runs once for the entry as given.
 * NOTE(review): the per-VLAN update of entry->vid and the checks of err
 * before notifying are not visible in this listing.
 *
 * @skb:    request skb
 * @nlh:    request netlink header
 * @extack: extended ack (not referenced on the visible lines)
 */
667 static int br_mdb_del(struct sk_buff *skb, struct nlmsghdr *nlh,
668 struct netlink_ext_ack *extack)
670 struct net *net = sock_net(skb->sk);
671 struct net_bridge_vlan_group *vg;
672 struct net_device *dev, *pdev;
673 struct br_mdb_entry *entry;
674 struct net_bridge_port *p;
675 struct net_bridge_vlan *v;
676 struct net_bridge *br;
/* dev is the bridge; entry points into the request payload. */
679 err = br_mdb_parse(skb, nlh, &dev, &entry);
683 br = netdev_priv(dev);
685 /* If vlan filtering is enabled and VLAN is not specified
686 * delete mdb entry on all vlans configured on the port.
688 pdev = __dev_get_by_index(net, entry->ifindex);
692 p = br_port_get_rtnl(pdev);
693 if (!p || p->br != br || p->state == BR_STATE_DISABLED)
696 vg = nbp_vlan_group(p);
697 if (br_vlan_enabled(br->dev) && vg && entry->vid == 0) {
698 list_for_each_entry(v, &vg->vlan_list, vlist) {
700 err = __br_mdb_del(br, entry);
702 __br_mdb_notify(dev, p, entry, RTM_DELMDB);
705 err = __br_mdb_del(br, entry);
707 __br_mdb_notify(dev, p, entry, RTM_DELMDB);
/*
 * br_mdb_init - register the PF_BRIDGE rtnetlink handlers for the MDB:
 * RTM_GETMDB is served by the dump callback br_mdb_dump(), RTM_NEWMDB and
 * RTM_DELMDB by the doit callbacks br_mdb_add() and br_mdb_del().
 */
713 void br_mdb_init(void)
715 rtnl_register(PF_BRIDGE, RTM_GETMDB, NULL, br_mdb_dump, NULL);
716 rtnl_register(PF_BRIDGE, RTM_NEWMDB, br_mdb_add, NULL, NULL);
717 rtnl_register(PF_BRIDGE, RTM_DELMDB, br_mdb_del, NULL, NULL);
/*
 * br_mdb_uninit - unregister the three PF_BRIDGE message types that
 * br_mdb_init() registered.
 */
720 void br_mdb_uninit(void)
722 rtnl_unregister(PF_BRIDGE, RTM_GETMDB);
723 rtnl_unregister(PF_BRIDGE, RTM_NEWMDB);
724 rtnl_unregister(PF_BRIDGE, RTM_DELMDB);