bridge: fix rcu check warning in multicast port group
[cascardo/linux.git] / net / bridge / br_mdb.c
1 #include <linux/err.h>
2 #include <linux/igmp.h>
3 #include <linux/kernel.h>
4 #include <linux/netdevice.h>
5 #include <linux/rculist.h>
6 #include <linux/skbuff.h>
7 #include <linux/if_ether.h>
8 #include <net/ip.h>
9 #include <net/netlink.h>
10 #if IS_ENABLED(CONFIG_IPV6)
11 #include <net/ipv6.h>
12 #endif
13
14 #include "br_private.h"
15
16 static int br_rports_fill_info(struct sk_buff *skb, struct netlink_callback *cb,
17                                struct net_device *dev)
18 {
19         struct net_bridge *br = netdev_priv(dev);
20         struct net_bridge_port *p;
21         struct nlattr *nest;
22
23         if (!br->multicast_router || hlist_empty(&br->router_list))
24                 return 0;
25
26         nest = nla_nest_start(skb, MDBA_ROUTER);
27         if (nest == NULL)
28                 return -EMSGSIZE;
29
30         hlist_for_each_entry_rcu(p, &br->router_list, rlist) {
31                 if (p && nla_put_u32(skb, MDBA_ROUTER_PORT, p->dev->ifindex))
32                         goto fail;
33         }
34
35         nla_nest_end(skb, nest);
36         return 0;
37 fail:
38         nla_nest_cancel(skb, nest);
39         return -EMSGSIZE;
40 }
41
42 static int br_mdb_fill_info(struct sk_buff *skb, struct netlink_callback *cb,
43                             struct net_device *dev)
44 {
45         struct net_bridge *br = netdev_priv(dev);
46         struct net_bridge_mdb_htable *mdb;
47         struct nlattr *nest, *nest2;
48         int i, err = 0;
49         int idx = 0, s_idx = cb->args[1];
50
51         if (br->multicast_disabled)
52                 return 0;
53
54         mdb = rcu_dereference(br->mdb);
55         if (!mdb)
56                 return 0;
57
58         nest = nla_nest_start(skb, MDBA_MDB);
59         if (nest == NULL)
60                 return -EMSGSIZE;
61
62         for (i = 0; i < mdb->max; i++) {
63                 struct net_bridge_mdb_entry *mp;
64                 struct net_bridge_port_group *p;
65                 struct net_bridge_port_group __rcu **pp;
66                 struct net_bridge_port *port;
67
68                 hlist_for_each_entry_rcu(mp, &mdb->mhash[i], hlist[mdb->ver]) {
69                         if (idx < s_idx)
70                                 goto skip;
71
72                         nest2 = nla_nest_start(skb, MDBA_MDB_ENTRY);
73                         if (nest2 == NULL) {
74                                 err = -EMSGSIZE;
75                                 goto out;
76                         }
77
78                         for (pp = &mp->ports;
79                              (p = rcu_dereference(*pp)) != NULL;
80                               pp = &p->next) {
81                                 port = p->port;
82                                 if (port) {
83                                         struct br_mdb_entry e;
84                                         memset(&e, 0, sizeof(e));
85                                         e.ifindex = port->dev->ifindex;
86                                         e.state = p->state;
87                                         if (p->addr.proto == htons(ETH_P_IP))
88                                                 e.addr.u.ip4 = p->addr.u.ip4;
89 #if IS_ENABLED(CONFIG_IPV6)
90                                         if (p->addr.proto == htons(ETH_P_IPV6))
91                                                 e.addr.u.ip6 = p->addr.u.ip6;
92 #endif
93                                         e.addr.proto = p->addr.proto;
94                                         if (nla_put(skb, MDBA_MDB_ENTRY_INFO, sizeof(e), &e)) {
95                                                 nla_nest_cancel(skb, nest2);
96                                                 err = -EMSGSIZE;
97                                                 goto out;
98                                         }
99                                 }
100                         }
101                         nla_nest_end(skb, nest2);
102                 skip:
103                         idx++;
104                 }
105         }
106
107 out:
108         cb->args[1] = idx;
109         nla_nest_end(skb, nest);
110         return err;
111 }
112
113 static int br_mdb_dump(struct sk_buff *skb, struct netlink_callback *cb)
114 {
115         struct net_device *dev;
116         struct net *net = sock_net(skb->sk);
117         struct nlmsghdr *nlh = NULL;
118         int idx = 0, s_idx;
119
120         s_idx = cb->args[0];
121
122         rcu_read_lock();
123
124         /* In theory this could be wrapped to 0... */
125         cb->seq = net->dev_base_seq + br_mdb_rehash_seq;
126
127         for_each_netdev_rcu(net, dev) {
128                 if (dev->priv_flags & IFF_EBRIDGE) {
129                         struct br_port_msg *bpm;
130
131                         if (idx < s_idx)
132                                 goto skip;
133
134                         nlh = nlmsg_put(skb, NETLINK_CB(cb->skb).portid,
135                                         cb->nlh->nlmsg_seq, RTM_GETMDB,
136                                         sizeof(*bpm), NLM_F_MULTI);
137                         if (nlh == NULL)
138                                 break;
139
140                         bpm = nlmsg_data(nlh);
141                         memset(bpm, 0, sizeof(*bpm));
142                         bpm->ifindex = dev->ifindex;
143                         if (br_mdb_fill_info(skb, cb, dev) < 0)
144                                 goto out;
145                         if (br_rports_fill_info(skb, cb, dev) < 0)
146                                 goto out;
147
148                         cb->args[1] = 0;
149                         nlmsg_end(skb, nlh);
150                 skip:
151                         idx++;
152                 }
153         }
154
155 out:
156         if (nlh)
157                 nlmsg_end(skb, nlh);
158         rcu_read_unlock();
159         cb->args[0] = idx;
160         return skb->len;
161 }
162
163 static int nlmsg_populate_mdb_fill(struct sk_buff *skb,
164                                    struct net_device *dev,
165                                    struct br_mdb_entry *entry, u32 pid,
166                                    u32 seq, int type, unsigned int flags)
167 {
168         struct nlmsghdr *nlh;
169         struct br_port_msg *bpm;
170         struct nlattr *nest, *nest2;
171
172         nlh = nlmsg_put(skb, pid, seq, type, sizeof(*bpm), NLM_F_MULTI);
173         if (!nlh)
174                 return -EMSGSIZE;
175
176         bpm = nlmsg_data(nlh);
177         memset(bpm, 0, sizeof(*bpm));
178         bpm->family  = AF_BRIDGE;
179         bpm->ifindex = dev->ifindex;
180         nest = nla_nest_start(skb, MDBA_MDB);
181         if (nest == NULL)
182                 goto cancel;
183         nest2 = nla_nest_start(skb, MDBA_MDB_ENTRY);
184         if (nest2 == NULL)
185                 goto end;
186
187         if (nla_put(skb, MDBA_MDB_ENTRY_INFO, sizeof(*entry), entry))
188                 goto end;
189
190         nla_nest_end(skb, nest2);
191         nla_nest_end(skb, nest);
192         return nlmsg_end(skb, nlh);
193
194 end:
195         nla_nest_end(skb, nest);
196 cancel:
197         nlmsg_cancel(skb, nlh);
198         return -EMSGSIZE;
199 }
200
201 static inline size_t rtnl_mdb_nlmsg_size(void)
202 {
203         return NLMSG_ALIGN(sizeof(struct br_port_msg))
204                 + nla_total_size(sizeof(struct br_mdb_entry));
205 }
206
207 static void __br_mdb_notify(struct net_device *dev, struct br_mdb_entry *entry,
208                             int type)
209 {
210         struct net *net = dev_net(dev);
211         struct sk_buff *skb;
212         int err = -ENOBUFS;
213
214         skb = nlmsg_new(rtnl_mdb_nlmsg_size(), GFP_ATOMIC);
215         if (!skb)
216                 goto errout;
217
218         err = nlmsg_populate_mdb_fill(skb, dev, entry, 0, 0, type, NTF_SELF);
219         if (err < 0) {
220                 kfree_skb(skb);
221                 goto errout;
222         }
223
224         rtnl_notify(skb, net, 0, RTNLGRP_MDB, NULL, GFP_ATOMIC);
225         return;
226 errout:
227         rtnl_set_sk_err(net, RTNLGRP_MDB, err);
228 }
229
230 void br_mdb_notify(struct net_device *dev, struct net_bridge_port *port,
231                    struct br_ip *group, int type)
232 {
233         struct br_mdb_entry entry;
234
235         memset(&entry, 0, sizeof(entry));
236         entry.ifindex = port->dev->ifindex;
237         entry.addr.proto = group->proto;
238         entry.addr.u.ip4 = group->u.ip4;
239 #if IS_ENABLED(CONFIG_IPV6)
240         entry.addr.u.ip6 = group->u.ip6;
241 #endif
242         __br_mdb_notify(dev, &entry, type);
243 }
244
245 static bool is_valid_mdb_entry(struct br_mdb_entry *entry)
246 {
247         if (entry->ifindex == 0)
248                 return false;
249
250         if (entry->addr.proto == htons(ETH_P_IP)) {
251                 if (!ipv4_is_multicast(entry->addr.u.ip4))
252                         return false;
253                 if (ipv4_is_local_multicast(entry->addr.u.ip4))
254                         return false;
255 #if IS_ENABLED(CONFIG_IPV6)
256         } else if (entry->addr.proto == htons(ETH_P_IPV6)) {
257                 if (!ipv6_is_transient_multicast(&entry->addr.u.ip6))
258                         return false;
259 #endif
260         } else
261                 return false;
262         if (entry->state != MDB_PERMANENT && entry->state != MDB_TEMPORARY)
263                 return false;
264
265         return true;
266 }
267
268 static int br_mdb_parse(struct sk_buff *skb, struct nlmsghdr *nlh,
269                         struct net_device **pdev, struct br_mdb_entry **pentry)
270 {
271         struct net *net = sock_net(skb->sk);
272         struct br_mdb_entry *entry;
273         struct br_port_msg *bpm;
274         struct nlattr *tb[MDBA_SET_ENTRY_MAX+1];
275         struct net_device *dev;
276         int err;
277
278         err = nlmsg_parse(nlh, sizeof(*bpm), tb, MDBA_SET_ENTRY, NULL);
279         if (err < 0)
280                 return err;
281
282         bpm = nlmsg_data(nlh);
283         if (bpm->ifindex == 0) {
284                 pr_info("PF_BRIDGE: br_mdb_parse() with invalid ifindex\n");
285                 return -EINVAL;
286         }
287
288         dev = __dev_get_by_index(net, bpm->ifindex);
289         if (dev == NULL) {
290                 pr_info("PF_BRIDGE: br_mdb_parse() with unknown ifindex\n");
291                 return -ENODEV;
292         }
293
294         if (!(dev->priv_flags & IFF_EBRIDGE)) {
295                 pr_info("PF_BRIDGE: br_mdb_parse() with non-bridge\n");
296                 return -EOPNOTSUPP;
297         }
298
299         *pdev = dev;
300
301         if (!tb[MDBA_SET_ENTRY] ||
302             nla_len(tb[MDBA_SET_ENTRY]) != sizeof(struct br_mdb_entry)) {
303                 pr_info("PF_BRIDGE: br_mdb_parse() with invalid attr\n");
304                 return -EINVAL;
305         }
306
307         entry = nla_data(tb[MDBA_SET_ENTRY]);
308         if (!is_valid_mdb_entry(entry)) {
309                 pr_info("PF_BRIDGE: br_mdb_parse() with invalid entry\n");
310                 return -EINVAL;
311         }
312
313         *pentry = entry;
314         return 0;
315 }
316
317 static int br_mdb_add_group(struct net_bridge *br, struct net_bridge_port *port,
318                             struct br_ip *group, unsigned char state)
319 {
320         struct net_bridge_mdb_entry *mp;
321         struct net_bridge_port_group *p;
322         struct net_bridge_port_group __rcu **pp;
323         struct net_bridge_mdb_htable *mdb;
324         int err;
325
326         mdb = mlock_dereference(br->mdb, br);
327         mp = br_mdb_ip_get(mdb, group);
328         if (!mp) {
329                 mp = br_multicast_new_group(br, port, group);
330                 err = PTR_ERR(mp);
331                 if (IS_ERR(mp))
332                         return err;
333         }
334
335         for (pp = &mp->ports;
336              (p = mlock_dereference(*pp, br)) != NULL;
337              pp = &p->next) {
338                 if (p->port == port)
339                         return -EEXIST;
340                 if ((unsigned long)p->port < (unsigned long)port)
341                         break;
342         }
343
344         p = br_multicast_new_port_group(port, group, *pp, state);
345         if (unlikely(!p))
346                 return -ENOMEM;
347         rcu_assign_pointer(*pp, p);
348
349         br_mdb_notify(br->dev, port, group, RTM_NEWMDB);
350         return 0;
351 }
352
353 static int __br_mdb_add(struct net *net, struct net_bridge *br,
354                         struct br_mdb_entry *entry)
355 {
356         struct br_ip ip;
357         struct net_device *dev;
358         struct net_bridge_port *p;
359         int ret;
360
361         if (!netif_running(br->dev) || br->multicast_disabled)
362                 return -EINVAL;
363
364         dev = __dev_get_by_index(net, entry->ifindex);
365         if (!dev)
366                 return -ENODEV;
367
368         p = br_port_get_rtnl(dev);
369         if (!p || p->br != br || p->state == BR_STATE_DISABLED)
370                 return -EINVAL;
371
372         ip.proto = entry->addr.proto;
373         if (ip.proto == htons(ETH_P_IP))
374                 ip.u.ip4 = entry->addr.u.ip4;
375 #if IS_ENABLED(CONFIG_IPV6)
376         else
377                 ip.u.ip6 = entry->addr.u.ip6;
378 #endif
379
380         spin_lock_bh(&br->multicast_lock);
381         ret = br_mdb_add_group(br, p, &ip, entry->state);
382         spin_unlock_bh(&br->multicast_lock);
383         return ret;
384 }
385
386 static int br_mdb_add(struct sk_buff *skb, struct nlmsghdr *nlh)
387 {
388         struct net *net = sock_net(skb->sk);
389         struct br_mdb_entry *entry;
390         struct net_device *dev;
391         struct net_bridge *br;
392         int err;
393
394         err = br_mdb_parse(skb, nlh, &dev, &entry);
395         if (err < 0)
396                 return err;
397
398         br = netdev_priv(dev);
399
400         err = __br_mdb_add(net, br, entry);
401         if (!err)
402                 __br_mdb_notify(dev, entry, RTM_NEWMDB);
403         return err;
404 }
405
406 static int __br_mdb_del(struct net_bridge *br, struct br_mdb_entry *entry)
407 {
408         struct net_bridge_mdb_htable *mdb;
409         struct net_bridge_mdb_entry *mp;
410         struct net_bridge_port_group *p;
411         struct net_bridge_port_group __rcu **pp;
412         struct br_ip ip;
413         int err = -EINVAL;
414
415         if (!netif_running(br->dev) || br->multicast_disabled)
416                 return -EINVAL;
417
418         if (timer_pending(&br->multicast_querier_timer))
419                 return -EBUSY;
420
421         ip.proto = entry->addr.proto;
422         if (ip.proto == htons(ETH_P_IP))
423                 ip.u.ip4 = entry->addr.u.ip4;
424 #if IS_ENABLED(CONFIG_IPV6)
425         else
426                 ip.u.ip6 = entry->addr.u.ip6;
427 #endif
428
429         spin_lock_bh(&br->multicast_lock);
430         mdb = mlock_dereference(br->mdb, br);
431
432         mp = br_mdb_ip_get(mdb, &ip);
433         if (!mp)
434                 goto unlock;
435
436         for (pp = &mp->ports;
437              (p = mlock_dereference(*pp, br)) != NULL;
438              pp = &p->next) {
439                 if (!p->port || p->port->dev->ifindex != entry->ifindex)
440                         continue;
441
442                 if (p->port->state == BR_STATE_DISABLED)
443                         goto unlock;
444
445                 rcu_assign_pointer(*pp, p->next);
446                 hlist_del_init(&p->mglist);
447                 del_timer(&p->timer);
448                 call_rcu_bh(&p->rcu, br_multicast_free_pg);
449                 err = 0;
450
451                 if (!mp->ports && !mp->mglist && mp->timer_armed &&
452                     netif_running(br->dev))
453                         mod_timer(&mp->timer, jiffies);
454                 break;
455         }
456
457 unlock:
458         spin_unlock_bh(&br->multicast_lock);
459         return err;
460 }
461
462 static int br_mdb_del(struct sk_buff *skb, struct nlmsghdr *nlh)
463 {
464         struct net_device *dev;
465         struct br_mdb_entry *entry;
466         struct net_bridge *br;
467         int err;
468
469         err = br_mdb_parse(skb, nlh, &dev, &entry);
470         if (err < 0)
471                 return err;
472
473         br = netdev_priv(dev);
474
475         err = __br_mdb_del(br, entry);
476         if (!err)
477                 __br_mdb_notify(dev, entry, RTM_DELMDB);
478         return err;
479 }
480
481 void br_mdb_init(void)
482 {
483         rtnl_register(PF_BRIDGE, RTM_GETMDB, NULL, br_mdb_dump, NULL);
484         rtnl_register(PF_BRIDGE, RTM_NEWMDB, br_mdb_add, NULL, NULL);
485         rtnl_register(PF_BRIDGE, RTM_DELMDB, br_mdb_del, NULL, NULL);
486 }
487
488 void br_mdb_uninit(void)
489 {
490         rtnl_unregister(PF_BRIDGE, RTM_GETMDB);
491         rtnl_unregister(PF_BRIDGE, RTM_NEWMDB);
492         rtnl_unregister(PF_BRIDGE, RTM_DELMDB);
493 }