]> asedeno.scripts.mit.edu Git - linux.git/blob - net/bridge/br_multicast.c
Merge tag 'vla-v4.20-rc1' of git://git.kernel.org/pub/scm/linux/kernel/git/kees/linux
[linux.git] / net / bridge / br_multicast.c
1 /*
2  * Bridge multicast support.
3  *
4  * Copyright (c) 2010 Herbert Xu <herbert@gondor.apana.org.au>
5  *
6  * This program is free software; you can redistribute it and/or modify it
7  * under the terms of the GNU General Public License as published by the Free
8  * Software Foundation; either version 2 of the License, or (at your option)
9  * any later version.
10  *
11  */
12
13 #include <linux/err.h>
14 #include <linux/export.h>
15 #include <linux/if_ether.h>
16 #include <linux/igmp.h>
17 #include <linux/jhash.h>
18 #include <linux/kernel.h>
19 #include <linux/log2.h>
20 #include <linux/netdevice.h>
21 #include <linux/netfilter_bridge.h>
22 #include <linux/random.h>
23 #include <linux/rculist.h>
24 #include <linux/skbuff.h>
25 #include <linux/slab.h>
26 #include <linux/timer.h>
27 #include <linux/inetdevice.h>
28 #include <linux/mroute.h>
29 #include <net/ip.h>
30 #include <net/switchdev.h>
31 #if IS_ENABLED(CONFIG_IPV6)
32 #include <net/ipv6.h>
33 #include <net/mld.h>
34 #include <net/ip6_checksum.h>
35 #include <net/addrconf.h>
36 #endif
37
38 #include "br_private.h"
39
40 static void br_multicast_start_querier(struct net_bridge *br,
41                                        struct bridge_mcast_own_query *query);
42 static void br_multicast_add_router(struct net_bridge *br,
43                                     struct net_bridge_port *port);
44 static void br_ip4_multicast_leave_group(struct net_bridge *br,
45                                          struct net_bridge_port *port,
46                                          __be32 group,
47                                          __u16 vid,
48                                          const unsigned char *src);
49
50 static void __del_port_router(struct net_bridge_port *p);
51 #if IS_ENABLED(CONFIG_IPV6)
52 static void br_ip6_multicast_leave_group(struct net_bridge *br,
53                                          struct net_bridge_port *port,
54                                          const struct in6_addr *group,
55                                          __u16 vid, const unsigned char *src);
56 #endif
/*
 * Rehash generation counter: br_mdb_rehash() increments it each time an
 * existing multicast hash table is replaced by a freshly built copy.
 */
57 unsigned int br_mdb_rehash_seq;
58
59 static inline int br_ip_equal(const struct br_ip *a, const struct br_ip *b)
60 {
61         if (a->proto != b->proto)
62                 return 0;
63         if (a->vid != b->vid)
64                 return 0;
65         switch (a->proto) {
66         case htons(ETH_P_IP):
67                 return a->u.ip4 == b->u.ip4;
68 #if IS_ENABLED(CONFIG_IPV6)
69         case htons(ETH_P_IPV6):
70                 return ipv6_addr_equal(&a->u.ip6, &b->u.ip6);
71 #endif
72         }
73         return 0;
74 }
75
76 static inline int __br_ip4_hash(struct net_bridge_mdb_htable *mdb, __be32 ip,
77                                 __u16 vid)
78 {
79         return jhash_2words((__force u32)ip, vid, mdb->secret) & (mdb->max - 1);
80 }
81
82 #if IS_ENABLED(CONFIG_IPV6)
83 static inline int __br_ip6_hash(struct net_bridge_mdb_htable *mdb,
84                                 const struct in6_addr *ip,
85                                 __u16 vid)
86 {
87         return jhash_2words(ipv6_addr_hash(ip), vid,
88                             mdb->secret) & (mdb->max - 1);
89 }
90 #endif
91
92 static inline int br_ip_hash(struct net_bridge_mdb_htable *mdb,
93                              struct br_ip *ip)
94 {
95         switch (ip->proto) {
96         case htons(ETH_P_IP):
97                 return __br_ip4_hash(mdb, ip->u.ip4, ip->vid);
98 #if IS_ENABLED(CONFIG_IPV6)
99         case htons(ETH_P_IPV6):
100                 return __br_ip6_hash(mdb, &ip->u.ip6, ip->vid);
101 #endif
102         }
103         return 0;
104 }
105
106 static struct net_bridge_mdb_entry *__br_mdb_ip_get(
107         struct net_bridge_mdb_htable *mdb, struct br_ip *dst, int hash)
108 {
109         struct net_bridge_mdb_entry *mp;
110
111         hlist_for_each_entry_rcu(mp, &mdb->mhash[hash], hlist[mdb->ver]) {
112                 if (br_ip_equal(&mp->addr, dst))
113                         return mp;
114         }
115
116         return NULL;
117 }
118
119 struct net_bridge_mdb_entry *br_mdb_ip_get(struct net_bridge_mdb_htable *mdb,
120                                            struct br_ip *dst)
121 {
122         if (!mdb)
123                 return NULL;
124
125         return __br_mdb_ip_get(mdb, dst, br_ip_hash(mdb, dst));
126 }
127
128 static struct net_bridge_mdb_entry *br_mdb_ip4_get(
129         struct net_bridge_mdb_htable *mdb, __be32 dst, __u16 vid)
130 {
131         struct br_ip br_dst;
132
133         br_dst.u.ip4 = dst;
134         br_dst.proto = htons(ETH_P_IP);
135         br_dst.vid = vid;
136
137         return br_mdb_ip_get(mdb, &br_dst);
138 }
139
140 #if IS_ENABLED(CONFIG_IPV6)
141 static struct net_bridge_mdb_entry *br_mdb_ip6_get(
142         struct net_bridge_mdb_htable *mdb, const struct in6_addr *dst,
143         __u16 vid)
144 {
145         struct br_ip br_dst;
146
147         br_dst.u.ip6 = *dst;
148         br_dst.proto = htons(ETH_P_IPV6);
149         br_dst.vid = vid;
150
151         return br_mdb_ip_get(mdb, &br_dst);
152 }
153 #endif
154
155 struct net_bridge_mdb_entry *br_mdb_get(struct net_bridge *br,
156                                         struct sk_buff *skb, u16 vid)
157 {
158         struct net_bridge_mdb_htable *mdb = rcu_dereference(br->mdb);
159         struct br_ip ip;
160
161         if (!br_opt_get(br, BROPT_MULTICAST_ENABLED))
162                 return NULL;
163
164         if (BR_INPUT_SKB_CB(skb)->igmp)
165                 return NULL;
166
167         ip.proto = skb->protocol;
168         ip.vid = vid;
169
170         switch (skb->protocol) {
171         case htons(ETH_P_IP):
172                 ip.u.ip4 = ip_hdr(skb)->daddr;
173                 break;
174 #if IS_ENABLED(CONFIG_IPV6)
175         case htons(ETH_P_IPV6):
176                 ip.u.ip6 = ipv6_hdr(skb)->daddr;
177                 break;
178 #endif
179         default:
180                 return NULL;
181         }
182
183         return br_mdb_ip_get(mdb, &ip);
184 }
185
186 static void br_mdb_free(struct rcu_head *head)
187 {
188         struct net_bridge_mdb_htable *mdb =
189                 container_of(head, struct net_bridge_mdb_htable, rcu);
190         struct net_bridge_mdb_htable *old = mdb->old;
191
192         mdb->old = NULL;
193         kfree(old->mhash);
194         kfree(old);
195 }
196
197 static int br_mdb_copy(struct net_bridge_mdb_htable *new,
198                        struct net_bridge_mdb_htable *old,
199                        int elasticity)
200 {
201         struct net_bridge_mdb_entry *mp;
202         int maxlen;
203         int len;
204         int i;
205
206         for (i = 0; i < old->max; i++)
207                 hlist_for_each_entry(mp, &old->mhash[i], hlist[old->ver])
208                         hlist_add_head(&mp->hlist[new->ver],
209                                        &new->mhash[br_ip_hash(new, &mp->addr)]);
210
211         if (!elasticity)
212                 return 0;
213
214         maxlen = 0;
215         for (i = 0; i < new->max; i++) {
216                 len = 0;
217                 hlist_for_each_entry(mp, &new->mhash[i], hlist[new->ver])
218                         len++;
219                 if (len > maxlen)
220                         maxlen = len;
221         }
222
223         return maxlen > elasticity ? -EINVAL : 0;
224 }
225
226 void br_multicast_free_pg(struct rcu_head *head)
227 {
228         struct net_bridge_port_group *p =
229                 container_of(head, struct net_bridge_port_group, rcu);
230
231         kfree(p);
232 }
233
234 static void br_multicast_free_group(struct rcu_head *head)
235 {
236         struct net_bridge_mdb_entry *mp =
237                 container_of(head, struct net_bridge_mdb_entry, rcu);
238
239         kfree(mp);
240 }
241
242 static void br_multicast_group_expired(struct timer_list *t)
243 {
244         struct net_bridge_mdb_entry *mp = from_timer(mp, t, timer);
245         struct net_bridge *br = mp->br;
246         struct net_bridge_mdb_htable *mdb;
247
248         spin_lock(&br->multicast_lock);
249         if (!netif_running(br->dev) || timer_pending(&mp->timer))
250                 goto out;
251
252         mp->host_joined = false;
253         br_mdb_notify(br->dev, NULL, &mp->addr, RTM_DELMDB, 0);
254
255         if (mp->ports)
256                 goto out;
257
258         mdb = mlock_dereference(br->mdb, br);
259
260         hlist_del_rcu(&mp->hlist[mdb->ver]);
261         mdb->size--;
262
263         call_rcu_bh(&mp->rcu, br_multicast_free_group);
264
265 out:
266         spin_unlock(&br->multicast_lock);
267 }
268
269 static void br_multicast_del_pg(struct net_bridge *br,
270                                 struct net_bridge_port_group *pg)
271 {
272         struct net_bridge_mdb_htable *mdb;
273         struct net_bridge_mdb_entry *mp;
274         struct net_bridge_port_group *p;
275         struct net_bridge_port_group __rcu **pp;
276
277         mdb = mlock_dereference(br->mdb, br);
278
279         mp = br_mdb_ip_get(mdb, &pg->addr);
280         if (WARN_ON(!mp))
281                 return;
282
283         for (pp = &mp->ports;
284              (p = mlock_dereference(*pp, br)) != NULL;
285              pp = &p->next) {
286                 if (p != pg)
287                         continue;
288
289                 rcu_assign_pointer(*pp, p->next);
290                 hlist_del_init(&p->mglist);
291                 del_timer(&p->timer);
292                 br_mdb_notify(br->dev, p->port, &pg->addr, RTM_DELMDB,
293                               p->flags);
294                 call_rcu_bh(&p->rcu, br_multicast_free_pg);
295
296                 if (!mp->ports && !mp->host_joined &&
297                     netif_running(br->dev))
298                         mod_timer(&mp->timer, jiffies);
299
300                 return;
301         }
302
303         WARN_ON(1);
304 }
305
306 static void br_multicast_port_group_expired(struct timer_list *t)
307 {
308         struct net_bridge_port_group *pg = from_timer(pg, t, timer);
309         struct net_bridge *br = pg->port->br;
310
311         spin_lock(&br->multicast_lock);
312         if (!netif_running(br->dev) || timer_pending(&pg->timer) ||
313             hlist_unhashed(&pg->mglist) || pg->flags & MDB_PG_FLAGS_PERMANENT)
314                 goto out;
315
316         br_multicast_del_pg(br, pg);
317
318 out:
319         spin_unlock(&br->multicast_lock);
320 }
321
322 static int br_mdb_rehash(struct net_bridge_mdb_htable __rcu **mdbp, int max,
323                          int elasticity)
324 {
325         struct net_bridge_mdb_htable *old = rcu_dereference_protected(*mdbp, 1);
326         struct net_bridge_mdb_htable *mdb;
327         int err;
328
329         mdb = kmalloc(sizeof(*mdb), GFP_ATOMIC);
330         if (!mdb)
331                 return -ENOMEM;
332
333         mdb->max = max;
334         mdb->old = old;
335
336         mdb->mhash = kcalloc(max, sizeof(*mdb->mhash), GFP_ATOMIC);
337         if (!mdb->mhash) {
338                 kfree(mdb);
339                 return -ENOMEM;
340         }
341
342         mdb->size = old ? old->size : 0;
343         mdb->ver = old ? old->ver ^ 1 : 0;
344
345         if (!old || elasticity)
346                 get_random_bytes(&mdb->secret, sizeof(mdb->secret));
347         else
348                 mdb->secret = old->secret;
349
350         if (!old)
351                 goto out;
352
353         err = br_mdb_copy(mdb, old, elasticity);
354         if (err) {
355                 kfree(mdb->mhash);
356                 kfree(mdb);
357                 return err;
358         }
359
360         br_mdb_rehash_seq++;
361         call_rcu_bh(&mdb->rcu, br_mdb_free);
362
363 out:
364         rcu_assign_pointer(*mdbp, mdb);
365
366         return 0;
367 }
368
369 static struct sk_buff *br_ip4_multicast_alloc_query(struct net_bridge *br,
370                                                     __be32 group,
371                                                     u8 *igmp_type)
372 {
373         struct igmpv3_query *ihv3;
374         size_t igmp_hdr_size;
375         struct sk_buff *skb;
376         struct igmphdr *ih;
377         struct ethhdr *eth;
378         struct iphdr *iph;
379
380         igmp_hdr_size = sizeof(*ih);
381         if (br->multicast_igmp_version == 3)
382                 igmp_hdr_size = sizeof(*ihv3);
383         skb = netdev_alloc_skb_ip_align(br->dev, sizeof(*eth) + sizeof(*iph) +
384                                                  igmp_hdr_size + 4);
385         if (!skb)
386                 goto out;
387
388         skb->protocol = htons(ETH_P_IP);
389
390         skb_reset_mac_header(skb);
391         eth = eth_hdr(skb);
392
393         ether_addr_copy(eth->h_source, br->dev->dev_addr);
394         eth->h_dest[0] = 1;
395         eth->h_dest[1] = 0;
396         eth->h_dest[2] = 0x5e;
397         eth->h_dest[3] = 0;
398         eth->h_dest[4] = 0;
399         eth->h_dest[5] = 1;
400         eth->h_proto = htons(ETH_P_IP);
401         skb_put(skb, sizeof(*eth));
402
403         skb_set_network_header(skb, skb->len);
404         iph = ip_hdr(skb);
405
406         iph->version = 4;
407         iph->ihl = 6;
408         iph->tos = 0xc0;
409         iph->tot_len = htons(sizeof(*iph) + igmp_hdr_size + 4);
410         iph->id = 0;
411         iph->frag_off = htons(IP_DF);
412         iph->ttl = 1;
413         iph->protocol = IPPROTO_IGMP;
414         iph->saddr = br_opt_get(br, BROPT_MULTICAST_QUERY_USE_IFADDR) ?
415                      inet_select_addr(br->dev, 0, RT_SCOPE_LINK) : 0;
416         iph->daddr = htonl(INADDR_ALLHOSTS_GROUP);
417         ((u8 *)&iph[1])[0] = IPOPT_RA;
418         ((u8 *)&iph[1])[1] = 4;
419         ((u8 *)&iph[1])[2] = 0;
420         ((u8 *)&iph[1])[3] = 0;
421         ip_send_check(iph);
422         skb_put(skb, 24);
423
424         skb_set_transport_header(skb, skb->len);
425         *igmp_type = IGMP_HOST_MEMBERSHIP_QUERY;
426
427         switch (br->multicast_igmp_version) {
428         case 2:
429                 ih = igmp_hdr(skb);
430                 ih->type = IGMP_HOST_MEMBERSHIP_QUERY;
431                 ih->code = (group ? br->multicast_last_member_interval :
432                                     br->multicast_query_response_interval) /
433                            (HZ / IGMP_TIMER_SCALE);
434                 ih->group = group;
435                 ih->csum = 0;
436                 ih->csum = ip_compute_csum((void *)ih, sizeof(*ih));
437                 break;
438         case 3:
439                 ihv3 = igmpv3_query_hdr(skb);
440                 ihv3->type = IGMP_HOST_MEMBERSHIP_QUERY;
441                 ihv3->code = (group ? br->multicast_last_member_interval :
442                                       br->multicast_query_response_interval) /
443                              (HZ / IGMP_TIMER_SCALE);
444                 ihv3->group = group;
445                 ihv3->qqic = br->multicast_query_interval / HZ;
446                 ihv3->nsrcs = 0;
447                 ihv3->resv = 0;
448                 ihv3->suppress = 0;
449                 ihv3->qrv = 2;
450                 ihv3->csum = 0;
451                 ihv3->csum = ip_compute_csum((void *)ihv3, sizeof(*ihv3));
452                 break;
453         }
454
455         skb_put(skb, igmp_hdr_size);
456         __skb_pull(skb, sizeof(*eth));
457
458 out:
459         return skb;
460 }
461
462 #if IS_ENABLED(CONFIG_IPV6)
463 static struct sk_buff *br_ip6_multicast_alloc_query(struct net_bridge *br,
464                                                     const struct in6_addr *grp,
465                                                     u8 *igmp_type)
466 {
467         struct mld2_query *mld2q;
468         unsigned long interval;
469         struct ipv6hdr *ip6h;
470         struct mld_msg *mldq;
471         size_t mld_hdr_size;
472         struct sk_buff *skb;
473         struct ethhdr *eth;
474         u8 *hopopt;
475
476         mld_hdr_size = sizeof(*mldq);
477         if (br->multicast_mld_version == 2)
478                 mld_hdr_size = sizeof(*mld2q);
479         skb = netdev_alloc_skb_ip_align(br->dev, sizeof(*eth) + sizeof(*ip6h) +
480                                                  8 + mld_hdr_size);
481         if (!skb)
482                 goto out;
483
484         skb->protocol = htons(ETH_P_IPV6);
485
486         /* Ethernet header */
487         skb_reset_mac_header(skb);
488         eth = eth_hdr(skb);
489
490         ether_addr_copy(eth->h_source, br->dev->dev_addr);
491         eth->h_proto = htons(ETH_P_IPV6);
492         skb_put(skb, sizeof(*eth));
493
494         /* IPv6 header + HbH option */
495         skb_set_network_header(skb, skb->len);
496         ip6h = ipv6_hdr(skb);
497
498         *(__force __be32 *)ip6h = htonl(0x60000000);
499         ip6h->payload_len = htons(8 + mld_hdr_size);
500         ip6h->nexthdr = IPPROTO_HOPOPTS;
501         ip6h->hop_limit = 1;
502         ipv6_addr_set(&ip6h->daddr, htonl(0xff020000), 0, 0, htonl(1));
503         if (ipv6_dev_get_saddr(dev_net(br->dev), br->dev, &ip6h->daddr, 0,
504                                &ip6h->saddr)) {
505                 kfree_skb(skb);
506                 br_opt_toggle(br, BROPT_HAS_IPV6_ADDR, false);
507                 return NULL;
508         }
509
510         br_opt_toggle(br, BROPT_HAS_IPV6_ADDR, true);
511         ipv6_eth_mc_map(&ip6h->daddr, eth->h_dest);
512
513         hopopt = (u8 *)(ip6h + 1);
514         hopopt[0] = IPPROTO_ICMPV6;             /* next hdr */
515         hopopt[1] = 0;                          /* length of HbH */
516         hopopt[2] = IPV6_TLV_ROUTERALERT;       /* Router Alert */
517         hopopt[3] = 2;                          /* Length of RA Option */
518         hopopt[4] = 0;                          /* Type = 0x0000 (MLD) */
519         hopopt[5] = 0;
520         hopopt[6] = IPV6_TLV_PAD1;              /* Pad1 */
521         hopopt[7] = IPV6_TLV_PAD1;              /* Pad1 */
522
523         skb_put(skb, sizeof(*ip6h) + 8);
524
525         /* ICMPv6 */
526         skb_set_transport_header(skb, skb->len);
527         interval = ipv6_addr_any(grp) ?
528                         br->multicast_query_response_interval :
529                         br->multicast_last_member_interval;
530         *igmp_type = ICMPV6_MGM_QUERY;
531         switch (br->multicast_mld_version) {
532         case 1:
533                 mldq = (struct mld_msg *)icmp6_hdr(skb);
534                 mldq->mld_type = ICMPV6_MGM_QUERY;
535                 mldq->mld_code = 0;
536                 mldq->mld_cksum = 0;
537                 mldq->mld_maxdelay = htons((u16)jiffies_to_msecs(interval));
538                 mldq->mld_reserved = 0;
539                 mldq->mld_mca = *grp;
540                 mldq->mld_cksum = csum_ipv6_magic(&ip6h->saddr, &ip6h->daddr,
541                                                   sizeof(*mldq), IPPROTO_ICMPV6,
542                                                   csum_partial(mldq,
543                                                                sizeof(*mldq),
544                                                                0));
545                 break;
546         case 2:
547                 mld2q = (struct mld2_query *)icmp6_hdr(skb);
548                 mld2q->mld2q_mrc = htons((u16)jiffies_to_msecs(interval));
549                 mld2q->mld2q_type = ICMPV6_MGM_QUERY;
550                 mld2q->mld2q_code = 0;
551                 mld2q->mld2q_cksum = 0;
552                 mld2q->mld2q_resv1 = 0;
553                 mld2q->mld2q_resv2 = 0;
554                 mld2q->mld2q_suppress = 0;
555                 mld2q->mld2q_qrv = 2;
556                 mld2q->mld2q_nsrcs = 0;
557                 mld2q->mld2q_qqic = br->multicast_query_interval / HZ;
558                 mld2q->mld2q_mca = *grp;
559                 mld2q->mld2q_cksum = csum_ipv6_magic(&ip6h->saddr, &ip6h->daddr,
560                                                      sizeof(*mld2q),
561                                                      IPPROTO_ICMPV6,
562                                                      csum_partial(mld2q,
563                                                                   sizeof(*mld2q),
564                                                                   0));
565                 break;
566         }
567         skb_put(skb, mld_hdr_size);
568
569         __skb_pull(skb, sizeof(*eth));
570
571 out:
572         return skb;
573 }
574 #endif
575
576 static struct sk_buff *br_multicast_alloc_query(struct net_bridge *br,
577                                                 struct br_ip *addr,
578                                                 u8 *igmp_type)
579 {
580         switch (addr->proto) {
581         case htons(ETH_P_IP):
582                 return br_ip4_multicast_alloc_query(br, addr->u.ip4, igmp_type);
583 #if IS_ENABLED(CONFIG_IPV6)
584         case htons(ETH_P_IPV6):
585                 return br_ip6_multicast_alloc_query(br, &addr->u.ip6,
586                                                     igmp_type);
587 #endif
588         }
589         return NULL;
590 }
591
592 static struct net_bridge_mdb_entry *br_multicast_get_group(
593         struct net_bridge *br, struct net_bridge_port *port,
594         struct br_ip *group, int hash)
595 {
596         struct net_bridge_mdb_htable *mdb;
597         struct net_bridge_mdb_entry *mp;
598         unsigned int count = 0;
599         unsigned int max;
600         int elasticity;
601         int err;
602
603         mdb = rcu_dereference_protected(br->mdb, 1);
604         hlist_for_each_entry(mp, &mdb->mhash[hash], hlist[mdb->ver]) {
605                 count++;
606                 if (unlikely(br_ip_equal(group, &mp->addr)))
607                         return mp;
608         }
609
610         elasticity = 0;
611         max = mdb->max;
612
613         if (unlikely(count > br->hash_elasticity && count)) {
614                 if (net_ratelimit())
615                         br_info(br, "Multicast hash table "
616                                 "chain limit reached: %s\n",
617                                 port ? port->dev->name : br->dev->name);
618
619                 elasticity = br->hash_elasticity;
620         }
621
622         if (mdb->size >= max) {
623                 max *= 2;
624                 if (unlikely(max > br->hash_max)) {
625                         br_warn(br, "Multicast hash table maximum of %d "
626                                 "reached, disabling snooping: %s\n",
627                                 br->hash_max,
628                                 port ? port->dev->name : br->dev->name);
629                         err = -E2BIG;
630 disable:
631                         br_opt_toggle(br, BROPT_MULTICAST_ENABLED, false);
632                         goto err;
633                 }
634         }
635
636         if (max > mdb->max || elasticity) {
637                 if (mdb->old) {
638                         if (net_ratelimit())
639                                 br_info(br, "Multicast hash table "
640                                         "on fire: %s\n",
641                                         port ? port->dev->name : br->dev->name);
642                         err = -EEXIST;
643                         goto err;
644                 }
645
646                 err = br_mdb_rehash(&br->mdb, max, elasticity);
647                 if (err) {
648                         br_warn(br, "Cannot rehash multicast "
649                                 "hash table, disabling snooping: %s, %d, %d\n",
650                                 port ? port->dev->name : br->dev->name,
651                                 mdb->size, err);
652                         goto disable;
653                 }
654
655                 err = -EAGAIN;
656                 goto err;
657         }
658
659         return NULL;
660
661 err:
662         mp = ERR_PTR(err);
663         return mp;
664 }
665
666 struct net_bridge_mdb_entry *br_multicast_new_group(struct net_bridge *br,
667                                                     struct net_bridge_port *p,
668                                                     struct br_ip *group)
669 {
670         struct net_bridge_mdb_htable *mdb;
671         struct net_bridge_mdb_entry *mp;
672         int hash;
673         int err;
674
675         mdb = rcu_dereference_protected(br->mdb, 1);
676         if (!mdb) {
677                 err = br_mdb_rehash(&br->mdb, BR_HASH_SIZE, 0);
678                 if (err)
679                         return ERR_PTR(err);
680                 goto rehash;
681         }
682
683         hash = br_ip_hash(mdb, group);
684         mp = br_multicast_get_group(br, p, group, hash);
685         switch (PTR_ERR(mp)) {
686         case 0:
687                 break;
688
689         case -EAGAIN:
690 rehash:
691                 mdb = rcu_dereference_protected(br->mdb, 1);
692                 hash = br_ip_hash(mdb, group);
693                 break;
694
695         default:
696                 goto out;
697         }
698
699         mp = kzalloc(sizeof(*mp), GFP_ATOMIC);
700         if (unlikely(!mp))
701                 return ERR_PTR(-ENOMEM);
702
703         mp->br = br;
704         mp->addr = *group;
705         timer_setup(&mp->timer, br_multicast_group_expired, 0);
706
707         hlist_add_head_rcu(&mp->hlist[mdb->ver], &mdb->mhash[hash]);
708         mdb->size++;
709
710 out:
711         return mp;
712 }
713
714 struct net_bridge_port_group *br_multicast_new_port_group(
715                         struct net_bridge_port *port,
716                         struct br_ip *group,
717                         struct net_bridge_port_group __rcu *next,
718                         unsigned char flags,
719                         const unsigned char *src)
720 {
721         struct net_bridge_port_group *p;
722
723         p = kzalloc(sizeof(*p), GFP_ATOMIC);
724         if (unlikely(!p))
725                 return NULL;
726
727         p->addr = *group;
728         p->port = port;
729         p->flags = flags;
730         rcu_assign_pointer(p->next, next);
731         hlist_add_head(&p->mglist, &port->mglist);
732         timer_setup(&p->timer, br_multicast_port_group_expired, 0);
733
734         if (src)
735                 memcpy(p->eth_addr, src, ETH_ALEN);
736         else
737                 memset(p->eth_addr, 0xff, ETH_ALEN);
738
739         return p;
740 }
741
742 static bool br_port_group_equal(struct net_bridge_port_group *p,
743                                 struct net_bridge_port *port,
744                                 const unsigned char *src)
745 {
746         if (p->port != port)
747                 return false;
748
749         if (!(port->flags & BR_MULTICAST_TO_UNICAST))
750                 return true;
751
752         return ether_addr_equal(src, p->eth_addr);
753 }
754
755 static int br_multicast_add_group(struct net_bridge *br,
756                                   struct net_bridge_port *port,
757                                   struct br_ip *group,
758                                   const unsigned char *src)
759 {
760         struct net_bridge_port_group __rcu **pp;
761         struct net_bridge_port_group *p;
762         struct net_bridge_mdb_entry *mp;
763         unsigned long now = jiffies;
764         int err;
765
766         spin_lock(&br->multicast_lock);
767         if (!netif_running(br->dev) ||
768             (port && port->state == BR_STATE_DISABLED))
769                 goto out;
770
771         mp = br_multicast_new_group(br, port, group);
772         err = PTR_ERR(mp);
773         if (IS_ERR(mp))
774                 goto err;
775
776         if (!port) {
777                 if (!mp->host_joined) {
778                         mp->host_joined = true;
779                         br_mdb_notify(br->dev, NULL, &mp->addr, RTM_NEWMDB, 0);
780                 }
781                 mod_timer(&mp->timer, now + br->multicast_membership_interval);
782                 goto out;
783         }
784
785         for (pp = &mp->ports;
786              (p = mlock_dereference(*pp, br)) != NULL;
787              pp = &p->next) {
788                 if (br_port_group_equal(p, port, src))
789                         goto found;
790                 if ((unsigned long)p->port < (unsigned long)port)
791                         break;
792         }
793
794         p = br_multicast_new_port_group(port, group, *pp, 0, src);
795         if (unlikely(!p))
796                 goto err;
797         rcu_assign_pointer(*pp, p);
798         br_mdb_notify(br->dev, port, group, RTM_NEWMDB, 0);
799
800 found:
801         mod_timer(&p->timer, now + br->multicast_membership_interval);
802 out:
803         err = 0;
804
805 err:
806         spin_unlock(&br->multicast_lock);
807         return err;
808 }
809
810 static int br_ip4_multicast_add_group(struct net_bridge *br,
811                                       struct net_bridge_port *port,
812                                       __be32 group,
813                                       __u16 vid,
814                                       const unsigned char *src)
815 {
816         struct br_ip br_group;
817
818         if (ipv4_is_local_multicast(group))
819                 return 0;
820
821         br_group.u.ip4 = group;
822         br_group.proto = htons(ETH_P_IP);
823         br_group.vid = vid;
824
825         return br_multicast_add_group(br, port, &br_group, src);
826 }
827
828 #if IS_ENABLED(CONFIG_IPV6)
829 static int br_ip6_multicast_add_group(struct net_bridge *br,
830                                       struct net_bridge_port *port,
831                                       const struct in6_addr *group,
832                                       __u16 vid,
833                                       const unsigned char *src)
834 {
835         struct br_ip br_group;
836
837         if (ipv6_addr_is_ll_all_nodes(group))
838                 return 0;
839
840         br_group.u.ip6 = *group;
841         br_group.proto = htons(ETH_P_IPV6);
842         br_group.vid = vid;
843
844         return br_multicast_add_group(br, port, &br_group, src);
845 }
846 #endif
847
848 static void br_multicast_router_expired(struct timer_list *t)
849 {
850         struct net_bridge_port *port =
851                         from_timer(port, t, multicast_router_timer);
852         struct net_bridge *br = port->br;
853
854         spin_lock(&br->multicast_lock);
855         if (port->multicast_router == MDB_RTR_TYPE_DISABLED ||
856             port->multicast_router == MDB_RTR_TYPE_PERM ||
857             timer_pending(&port->multicast_router_timer))
858                 goto out;
859
860         __del_port_router(port);
861 out:
862         spin_unlock(&br->multicast_lock);
863 }
864
865 static void br_mc_router_state_change(struct net_bridge *p,
866                                       bool is_mc_router)
867 {
868         struct switchdev_attr attr = {
869                 .orig_dev = p->dev,
870                 .id = SWITCHDEV_ATTR_ID_BRIDGE_MROUTER,
871                 .flags = SWITCHDEV_F_DEFER,
872                 .u.mrouter = is_mc_router,
873         };
874
875         switchdev_port_attr_set(p->dev, &attr);
876 }
877
878 static void br_multicast_local_router_expired(struct timer_list *t)
879 {
880         struct net_bridge *br = from_timer(br, t, multicast_router_timer);
881
882         spin_lock(&br->multicast_lock);
883         if (br->multicast_router == MDB_RTR_TYPE_DISABLED ||
884             br->multicast_router == MDB_RTR_TYPE_PERM ||
885             timer_pending(&br->multicast_router_timer))
886                 goto out;
887
888         br_mc_router_state_change(br, false);
889 out:
890         spin_unlock(&br->multicast_lock);
891 }
892
893 static void br_multicast_querier_expired(struct net_bridge *br,
894                                          struct bridge_mcast_own_query *query)
895 {
896         spin_lock(&br->multicast_lock);
897         if (!netif_running(br->dev) || !br_opt_get(br, BROPT_MULTICAST_ENABLED))
898                 goto out;
899
900         br_multicast_start_querier(br, query);
901
902 out:
903         spin_unlock(&br->multicast_lock);
904 }
905
906 static void br_ip4_multicast_querier_expired(struct timer_list *t)
907 {
908         struct net_bridge *br = from_timer(br, t, ip4_other_query.timer);
909
910         br_multicast_querier_expired(br, &br->ip4_own_query);
911 }
912
913 #if IS_ENABLED(CONFIG_IPV6)
914 static void br_ip6_multicast_querier_expired(struct timer_list *t)
915 {
916         struct net_bridge *br = from_timer(br, t, ip6_other_query.timer);
917
918         br_multicast_querier_expired(br, &br->ip6_own_query);
919 }
920 #endif
921
922 static void br_multicast_select_own_querier(struct net_bridge *br,
923                                             struct br_ip *ip,
924                                             struct sk_buff *skb)
925 {
926         if (ip->proto == htons(ETH_P_IP))
927                 br->ip4_querier.addr.u.ip4 = ip_hdr(skb)->saddr;
928 #if IS_ENABLED(CONFIG_IPV6)
929         else
930                 br->ip6_querier.addr.u.ip6 = ipv6_hdr(skb)->saddr;
931 #endif
932 }
933
934 static void __br_multicast_send_query(struct net_bridge *br,
935                                       struct net_bridge_port *port,
936                                       struct br_ip *ip)
937 {
938         struct sk_buff *skb;
939         u8 igmp_type;
940
941         skb = br_multicast_alloc_query(br, ip, &igmp_type);
942         if (!skb)
943                 return;
944
945         if (port) {
946                 skb->dev = port->dev;
947                 br_multicast_count(br, port, skb, igmp_type,
948                                    BR_MCAST_DIR_TX);
949                 NF_HOOK(NFPROTO_BRIDGE, NF_BR_LOCAL_OUT,
950                         dev_net(port->dev), NULL, skb, NULL, skb->dev,
951                         br_dev_queue_push_xmit);
952         } else {
953                 br_multicast_select_own_querier(br, ip, skb);
954                 br_multicast_count(br, port, skb, igmp_type,
955                                    BR_MCAST_DIR_RX);
956                 netif_rx(skb);
957         }
958 }
959
960 static void br_multicast_send_query(struct net_bridge *br,
961                                     struct net_bridge_port *port,
962                                     struct bridge_mcast_own_query *own_query)
963 {
964         struct bridge_mcast_other_query *other_query = NULL;
965         struct br_ip br_group;
966         unsigned long time;
967
968         if (!netif_running(br->dev) ||
969             !br_opt_get(br, BROPT_MULTICAST_ENABLED) ||
970             !br_opt_get(br, BROPT_MULTICAST_QUERIER))
971                 return;
972
973         memset(&br_group.u, 0, sizeof(br_group.u));
974
975         if (port ? (own_query == &port->ip4_own_query) :
976                    (own_query == &br->ip4_own_query)) {
977                 other_query = &br->ip4_other_query;
978                 br_group.proto = htons(ETH_P_IP);
979 #if IS_ENABLED(CONFIG_IPV6)
980         } else {
981                 other_query = &br->ip6_other_query;
982                 br_group.proto = htons(ETH_P_IPV6);
983 #endif
984         }
985
986         if (!other_query || timer_pending(&other_query->timer))
987                 return;
988
989         __br_multicast_send_query(br, port, &br_group);
990
991         time = jiffies;
992         time += own_query->startup_sent < br->multicast_startup_query_count ?
993                 br->multicast_startup_query_interval :
994                 br->multicast_query_interval;
995         mod_timer(&own_query->timer, time);
996 }
997
998 static void
999 br_multicast_port_query_expired(struct net_bridge_port *port,
1000                                 struct bridge_mcast_own_query *query)
1001 {
1002         struct net_bridge *br = port->br;
1003
1004         spin_lock(&br->multicast_lock);
1005         if (port->state == BR_STATE_DISABLED ||
1006             port->state == BR_STATE_BLOCKING)
1007                 goto out;
1008
1009         if (query->startup_sent < br->multicast_startup_query_count)
1010                 query->startup_sent++;
1011
1012         br_multicast_send_query(port->br, port, query);
1013
1014 out:
1015         spin_unlock(&br->multicast_lock);
1016 }
1017
1018 static void br_ip4_multicast_port_query_expired(struct timer_list *t)
1019 {
1020         struct net_bridge_port *port = from_timer(port, t, ip4_own_query.timer);
1021
1022         br_multicast_port_query_expired(port, &port->ip4_own_query);
1023 }
1024
1025 #if IS_ENABLED(CONFIG_IPV6)
1026 static void br_ip6_multicast_port_query_expired(struct timer_list *t)
1027 {
1028         struct net_bridge_port *port = from_timer(port, t, ip6_own_query.timer);
1029
1030         br_multicast_port_query_expired(port, &port->ip6_own_query);
1031 }
1032 #endif
1033
1034 static void br_mc_disabled_update(struct net_device *dev, bool value)
1035 {
1036         struct switchdev_attr attr = {
1037                 .orig_dev = dev,
1038                 .id = SWITCHDEV_ATTR_ID_BRIDGE_MC_DISABLED,
1039                 .flags = SWITCHDEV_F_DEFER,
1040                 .u.mc_disabled = !value,
1041         };
1042
1043         switchdev_port_attr_set(dev, &attr);
1044 }
1045
1046 int br_multicast_add_port(struct net_bridge_port *port)
1047 {
1048         port->multicast_router = MDB_RTR_TYPE_TEMP_QUERY;
1049
1050         timer_setup(&port->multicast_router_timer,
1051                     br_multicast_router_expired, 0);
1052         timer_setup(&port->ip4_own_query.timer,
1053                     br_ip4_multicast_port_query_expired, 0);
1054 #if IS_ENABLED(CONFIG_IPV6)
1055         timer_setup(&port->ip6_own_query.timer,
1056                     br_ip6_multicast_port_query_expired, 0);
1057 #endif
1058         br_mc_disabled_update(port->dev,
1059                               br_opt_get(port->br, BROPT_MULTICAST_ENABLED));
1060
1061         port->mcast_stats = netdev_alloc_pcpu_stats(struct bridge_mcast_stats);
1062         if (!port->mcast_stats)
1063                 return -ENOMEM;
1064
1065         return 0;
1066 }
1067
1068 void br_multicast_del_port(struct net_bridge_port *port)
1069 {
1070         struct net_bridge *br = port->br;
1071         struct net_bridge_port_group *pg;
1072         struct hlist_node *n;
1073
1074         /* Take care of the remaining groups, only perm ones should be left */
1075         spin_lock_bh(&br->multicast_lock);
1076         hlist_for_each_entry_safe(pg, n, &port->mglist, mglist)
1077                 br_multicast_del_pg(br, pg);
1078         spin_unlock_bh(&br->multicast_lock);
1079         del_timer_sync(&port->multicast_router_timer);
1080         free_percpu(port->mcast_stats);
1081 }
1082
1083 static void br_multicast_enable(struct bridge_mcast_own_query *query)
1084 {
1085         query->startup_sent = 0;
1086
1087         if (try_to_del_timer_sync(&query->timer) >= 0 ||
1088             del_timer(&query->timer))
1089                 mod_timer(&query->timer, jiffies);
1090 }
1091
1092 static void __br_multicast_enable_port(struct net_bridge_port *port)
1093 {
1094         struct net_bridge *br = port->br;
1095
1096         if (!br_opt_get(br, BROPT_MULTICAST_ENABLED) || !netif_running(br->dev))
1097                 return;
1098
1099         br_multicast_enable(&port->ip4_own_query);
1100 #if IS_ENABLED(CONFIG_IPV6)
1101         br_multicast_enable(&port->ip6_own_query);
1102 #endif
1103         if (port->multicast_router == MDB_RTR_TYPE_PERM &&
1104             hlist_unhashed(&port->rlist))
1105                 br_multicast_add_router(br, port);
1106 }
1107
1108 void br_multicast_enable_port(struct net_bridge_port *port)
1109 {
1110         struct net_bridge *br = port->br;
1111
1112         spin_lock(&br->multicast_lock);
1113         __br_multicast_enable_port(port);
1114         spin_unlock(&br->multicast_lock);
1115 }
1116
1117 void br_multicast_disable_port(struct net_bridge_port *port)
1118 {
1119         struct net_bridge *br = port->br;
1120         struct net_bridge_port_group *pg;
1121         struct hlist_node *n;
1122
1123         spin_lock(&br->multicast_lock);
1124         hlist_for_each_entry_safe(pg, n, &port->mglist, mglist)
1125                 if (!(pg->flags & MDB_PG_FLAGS_PERMANENT))
1126                         br_multicast_del_pg(br, pg);
1127
1128         __del_port_router(port);
1129
1130         del_timer(&port->multicast_router_timer);
1131         del_timer(&port->ip4_own_query.timer);
1132 #if IS_ENABLED(CONFIG_IPV6)
1133         del_timer(&port->ip6_own_query.timer);
1134 #endif
1135         spin_unlock(&br->multicast_lock);
1136 }
1137
1138 static int br_ip4_multicast_igmp3_report(struct net_bridge *br,
1139                                          struct net_bridge_port *port,
1140                                          struct sk_buff *skb,
1141                                          u16 vid)
1142 {
1143         const unsigned char *src;
1144         struct igmpv3_report *ih;
1145         struct igmpv3_grec *grec;
1146         int i;
1147         int len;
1148         int num;
1149         int type;
1150         int err = 0;
1151         __be32 group;
1152
1153         ih = igmpv3_report_hdr(skb);
1154         num = ntohs(ih->ngrec);
1155         len = skb_transport_offset(skb) + sizeof(*ih);
1156
1157         for (i = 0; i < num; i++) {
1158                 len += sizeof(*grec);
1159                 if (!pskb_may_pull(skb, len))
1160                         return -EINVAL;
1161
1162                 grec = (void *)(skb->data + len - sizeof(*grec));
1163                 group = grec->grec_mca;
1164                 type = grec->grec_type;
1165
1166                 len += ntohs(grec->grec_nsrcs) * 4;
1167                 if (!pskb_may_pull(skb, len))
1168                         return -EINVAL;
1169
1170                 /* We treat this as an IGMPv2 report for now. */
1171                 switch (type) {
1172                 case IGMPV3_MODE_IS_INCLUDE:
1173                 case IGMPV3_MODE_IS_EXCLUDE:
1174                 case IGMPV3_CHANGE_TO_INCLUDE:
1175                 case IGMPV3_CHANGE_TO_EXCLUDE:
1176                 case IGMPV3_ALLOW_NEW_SOURCES:
1177                 case IGMPV3_BLOCK_OLD_SOURCES:
1178                         break;
1179
1180                 default:
1181                         continue;
1182                 }
1183
1184                 src = eth_hdr(skb)->h_source;
1185                 if ((type == IGMPV3_CHANGE_TO_INCLUDE ||
1186                      type == IGMPV3_MODE_IS_INCLUDE) &&
1187                     ntohs(grec->grec_nsrcs) == 0) {
1188                         br_ip4_multicast_leave_group(br, port, group, vid, src);
1189                 } else {
1190                         err = br_ip4_multicast_add_group(br, port, group, vid,
1191                                                          src);
1192                         if (err)
1193                                 break;
1194                 }
1195         }
1196
1197         return err;
1198 }
1199
1200 #if IS_ENABLED(CONFIG_IPV6)
1201 static int br_ip6_multicast_mld2_report(struct net_bridge *br,
1202                                         struct net_bridge_port *port,
1203                                         struct sk_buff *skb,
1204                                         u16 vid)
1205 {
1206         const unsigned char *src;
1207         struct icmp6hdr *icmp6h;
1208         struct mld2_grec *grec;
1209         int i;
1210         int len;
1211         int num;
1212         int err = 0;
1213
1214         if (!pskb_may_pull(skb, sizeof(*icmp6h)))
1215                 return -EINVAL;
1216
1217         icmp6h = icmp6_hdr(skb);
1218         num = ntohs(icmp6h->icmp6_dataun.un_data16[1]);
1219         len = skb_transport_offset(skb) + sizeof(*icmp6h);
1220
1221         for (i = 0; i < num; i++) {
1222                 __be16 *nsrcs, _nsrcs;
1223
1224                 nsrcs = skb_header_pointer(skb,
1225                                            len + offsetof(struct mld2_grec,
1226                                                           grec_nsrcs),
1227                                            sizeof(_nsrcs), &_nsrcs);
1228                 if (!nsrcs)
1229                         return -EINVAL;
1230
1231                 if (!pskb_may_pull(skb,
1232                                    len + sizeof(*grec) +
1233                                    sizeof(struct in6_addr) * ntohs(*nsrcs)))
1234                         return -EINVAL;
1235
1236                 grec = (struct mld2_grec *)(skb->data + len);
1237                 len += sizeof(*grec) +
1238                        sizeof(struct in6_addr) * ntohs(*nsrcs);
1239
1240                 /* We treat these as MLDv1 reports for now. */
1241                 switch (grec->grec_type) {
1242                 case MLD2_MODE_IS_INCLUDE:
1243                 case MLD2_MODE_IS_EXCLUDE:
1244                 case MLD2_CHANGE_TO_INCLUDE:
1245                 case MLD2_CHANGE_TO_EXCLUDE:
1246                 case MLD2_ALLOW_NEW_SOURCES:
1247                 case MLD2_BLOCK_OLD_SOURCES:
1248                         break;
1249
1250                 default:
1251                         continue;
1252                 }
1253
1254                 src = eth_hdr(skb)->h_source;
1255                 if ((grec->grec_type == MLD2_CHANGE_TO_INCLUDE ||
1256                      grec->grec_type == MLD2_MODE_IS_INCLUDE) &&
1257                     ntohs(*nsrcs) == 0) {
1258                         br_ip6_multicast_leave_group(br, port, &grec->grec_mca,
1259                                                      vid, src);
1260                 } else {
1261                         err = br_ip6_multicast_add_group(br, port,
1262                                                          &grec->grec_mca, vid,
1263                                                          src);
1264                         if (err)
1265                                 break;
1266                 }
1267         }
1268
1269         return err;
1270 }
1271 #endif
1272
1273 static bool br_ip4_multicast_select_querier(struct net_bridge *br,
1274                                             struct net_bridge_port *port,
1275                                             __be32 saddr)
1276 {
1277         if (!timer_pending(&br->ip4_own_query.timer) &&
1278             !timer_pending(&br->ip4_other_query.timer))
1279                 goto update;
1280
1281         if (!br->ip4_querier.addr.u.ip4)
1282                 goto update;
1283
1284         if (ntohl(saddr) <= ntohl(br->ip4_querier.addr.u.ip4))
1285                 goto update;
1286
1287         return false;
1288
1289 update:
1290         br->ip4_querier.addr.u.ip4 = saddr;
1291
1292         /* update protected by general multicast_lock by caller */
1293         rcu_assign_pointer(br->ip4_querier.port, port);
1294
1295         return true;
1296 }
1297
1298 #if IS_ENABLED(CONFIG_IPV6)
1299 static bool br_ip6_multicast_select_querier(struct net_bridge *br,
1300                                             struct net_bridge_port *port,
1301                                             struct in6_addr *saddr)
1302 {
1303         if (!timer_pending(&br->ip6_own_query.timer) &&
1304             !timer_pending(&br->ip6_other_query.timer))
1305                 goto update;
1306
1307         if (ipv6_addr_cmp(saddr, &br->ip6_querier.addr.u.ip6) <= 0)
1308                 goto update;
1309
1310         return false;
1311
1312 update:
1313         br->ip6_querier.addr.u.ip6 = *saddr;
1314
1315         /* update protected by general multicast_lock by caller */
1316         rcu_assign_pointer(br->ip6_querier.port, port);
1317
1318         return true;
1319 }
1320 #endif
1321
1322 static bool br_multicast_select_querier(struct net_bridge *br,
1323                                         struct net_bridge_port *port,
1324                                         struct br_ip *saddr)
1325 {
1326         switch (saddr->proto) {
1327         case htons(ETH_P_IP):
1328                 return br_ip4_multicast_select_querier(br, port, saddr->u.ip4);
1329 #if IS_ENABLED(CONFIG_IPV6)
1330         case htons(ETH_P_IPV6):
1331                 return br_ip6_multicast_select_querier(br, port, &saddr->u.ip6);
1332 #endif
1333         }
1334
1335         return false;
1336 }
1337
1338 static void
1339 br_multicast_update_query_timer(struct net_bridge *br,
1340                                 struct bridge_mcast_other_query *query,
1341                                 unsigned long max_delay)
1342 {
1343         if (!timer_pending(&query->timer))
1344                 query->delay_time = jiffies + max_delay;
1345
1346         mod_timer(&query->timer, jiffies + br->multicast_querier_interval);
1347 }
1348
1349 static void br_port_mc_router_state_change(struct net_bridge_port *p,
1350                                            bool is_mc_router)
1351 {
1352         struct switchdev_attr attr = {
1353                 .orig_dev = p->dev,
1354                 .id = SWITCHDEV_ATTR_ID_PORT_MROUTER,
1355                 .flags = SWITCHDEV_F_DEFER,
1356                 .u.mrouter = is_mc_router,
1357         };
1358
1359         switchdev_port_attr_set(p->dev, &attr);
1360 }
1361
1362 /*
1363  * Add port to router_list
1364  *  list is maintained ordered by pointer value
1365  *  and locked by br->multicast_lock and RCU
1366  */
1367 static void br_multicast_add_router(struct net_bridge *br,
1368                                     struct net_bridge_port *port)
1369 {
1370         struct net_bridge_port *p;
1371         struct hlist_node *slot = NULL;
1372
1373         if (!hlist_unhashed(&port->rlist))
1374                 return;
1375
1376         hlist_for_each_entry(p, &br->router_list, rlist) {
1377                 if ((unsigned long) port >= (unsigned long) p)
1378                         break;
1379                 slot = &p->rlist;
1380         }
1381
1382         if (slot)
1383                 hlist_add_behind_rcu(&port->rlist, slot);
1384         else
1385                 hlist_add_head_rcu(&port->rlist, &br->router_list);
1386         br_rtr_notify(br->dev, port, RTM_NEWMDB);
1387         br_port_mc_router_state_change(port, true);
1388 }
1389
1390 static void br_multicast_mark_router(struct net_bridge *br,
1391                                      struct net_bridge_port *port)
1392 {
1393         unsigned long now = jiffies;
1394
1395         if (!port) {
1396                 if (br->multicast_router == MDB_RTR_TYPE_TEMP_QUERY) {
1397                         if (!timer_pending(&br->multicast_router_timer))
1398                                 br_mc_router_state_change(br, true);
1399                         mod_timer(&br->multicast_router_timer,
1400                                   now + br->multicast_querier_interval);
1401                 }
1402                 return;
1403         }
1404
1405         if (port->multicast_router == MDB_RTR_TYPE_DISABLED ||
1406             port->multicast_router == MDB_RTR_TYPE_PERM)
1407                 return;
1408
1409         br_multicast_add_router(br, port);
1410
1411         mod_timer(&port->multicast_router_timer,
1412                   now + br->multicast_querier_interval);
1413 }
1414
1415 static void br_multicast_query_received(struct net_bridge *br,
1416                                         struct net_bridge_port *port,
1417                                         struct bridge_mcast_other_query *query,
1418                                         struct br_ip *saddr,
1419                                         unsigned long max_delay)
1420 {
1421         if (!br_multicast_select_querier(br, port, saddr))
1422                 return;
1423
1424         br_multicast_update_query_timer(br, query, max_delay);
1425
1426         /* Based on RFC4541, section 2.1.1 IGMP Forwarding Rules,
1427          * the arrival port for IGMP Queries where the source address
1428          * is 0.0.0.0 should not be added to router port list.
1429          */
1430         if ((saddr->proto == htons(ETH_P_IP) && saddr->u.ip4) ||
1431             (saddr->proto == htons(ETH_P_IPV6) &&
1432              !ipv6_addr_any(&saddr->u.ip6)))
1433                 br_multicast_mark_router(br, port);
1434 }
1435
/* Handle a received IGMP query.
 *
 * @br:   bridge the query arrived on
 * @port: ingress port, or NULL
 * @skb:  the query packet
 * @vid:  VLAN id used for the MDB lookup
 *
 * General queries (group == 0) feed querier election via
 * br_multicast_query_received().  Group-specific queries shorten the
 * membership timers of the matching MDB entry and its port groups.
 * All work is done under br->multicast_lock.
 */
static void br_ip4_multicast_query(struct net_bridge *br,
                                   struct net_bridge_port *port,
                                   struct sk_buff *skb,
                                   u16 vid)
{
        const struct iphdr *iph = ip_hdr(skb);
        struct igmphdr *ih = igmp_hdr(skb);
        struct net_bridge_mdb_entry *mp;
        struct igmpv3_query *ih3;
        struct net_bridge_port_group *p;
        struct net_bridge_port_group __rcu **pp;
        struct br_ip saddr;
        unsigned long max_delay;
        unsigned long now = jiffies;
        unsigned int offset = skb_transport_offset(skb);
        __be32 group;

        spin_lock(&br->multicast_lock);
        /* Ignore queries while the bridge is down or the port is disabled. */
        if (!netif_running(br->dev) ||
            (port && port->state == BR_STATE_DISABLED))
                goto out;

        group = ih->group;

        if (skb->len == offset + sizeof(*ih)) {
                /* Payload is exactly one struct igmphdr. */
                max_delay = ih->code * (HZ / IGMP_TIMER_SCALE);

                /* A zero code is handled as a general query with a fixed
                 * 10 second delay (presumably an IGMPv1 query).
                 */
                if (!max_delay) {
                        max_delay = 10 * HZ;
                        group = 0;
                }
        } else if (skb->len >= offset + sizeof(*ih3)) {
                /* Long enough to carry a struct igmpv3_query. */
                ih3 = igmpv3_query_hdr(skb);
                /* Queries that list sources are not handled. */
                if (ih3->nsrcs)
                        goto out;

                max_delay = ih3->code ?
                            IGMPV3_MRC(ih3->code) * (HZ / IGMP_TIMER_SCALE) : 1;
        } else {
                /* Any other length is ignored. */
                goto out;
        }

        if (!group) {
                /* General query: run querier election with the IP source. */
                saddr.proto = htons(ETH_P_IP);
                saddr.u.ip4 = iph->saddr;

                br_multicast_query_received(br, port, &br->ip4_other_query,
                                            &saddr, max_delay);
                goto out;
        }

        /* Group-specific query: nothing to do if the group is unknown. */
        mp = br_mdb_ip4_get(mlock_dereference(br->mdb, br), group, vid);
        if (!mp)
                goto out;

        max_delay *= br->multicast_last_member_count;

        /* Only ever shorten a timer: re-arm it when it is pending and would
         * expire later than now + max_delay, or when it is not pending and
         * try_to_del_timer_sync() does not report failure.
         */
        if (mp->host_joined &&
            (timer_pending(&mp->timer) ?
             time_after(mp->timer.expires, now + max_delay) :
             try_to_del_timer_sync(&mp->timer) >= 0))
                mod_timer(&mp->timer, now + max_delay);

        /* Apply the same rule to every port group of the entry. */
        for (pp = &mp->ports;
             (p = mlock_dereference(*pp, br)) != NULL;
             pp = &p->next) {
                if (timer_pending(&p->timer) ?
                    time_after(p->timer.expires, now + max_delay) :
                    try_to_del_timer_sync(&p->timer) >= 0)
                        mod_timer(&p->timer, now + max_delay);
        }

out:
        spin_unlock(&br->multicast_lock);
}
1511
1512 #if IS_ENABLED(CONFIG_IPV6)
1513 static int br_ip6_multicast_query(struct net_bridge *br,
1514                                   struct net_bridge_port *port,
1515                                   struct sk_buff *skb,
1516                                   u16 vid)
1517 {
1518         const struct ipv6hdr *ip6h = ipv6_hdr(skb);
1519         struct mld_msg *mld;
1520         struct net_bridge_mdb_entry *mp;
1521         struct mld2_query *mld2q;
1522         struct net_bridge_port_group *p;
1523         struct net_bridge_port_group __rcu **pp;
1524         struct br_ip saddr;
1525         unsigned long max_delay;
1526         unsigned long now = jiffies;
1527         unsigned int offset = skb_transport_offset(skb);
1528         const struct in6_addr *group = NULL;
1529         bool is_general_query;
1530         int err = 0;
1531
1532         spin_lock(&br->multicast_lock);
1533         if (!netif_running(br->dev) ||
1534             (port && port->state == BR_STATE_DISABLED))
1535                 goto out;
1536
1537         if (skb->len == offset + sizeof(*mld)) {
1538                 if (!pskb_may_pull(skb, offset + sizeof(*mld))) {
1539                         err = -EINVAL;
1540                         goto out;
1541                 }
1542                 mld = (struct mld_msg *) icmp6_hdr(skb);
1543                 max_delay = msecs_to_jiffies(ntohs(mld->mld_maxdelay));
1544                 if (max_delay)
1545                         group = &mld->mld_mca;
1546         } else {
1547                 if (!pskb_may_pull(skb, offset + sizeof(*mld2q))) {
1548                         err = -EINVAL;
1549                         goto out;
1550                 }
1551                 mld2q = (struct mld2_query *)icmp6_hdr(skb);
1552                 if (!mld2q->mld2q_nsrcs)
1553                         group = &mld2q->mld2q_mca;
1554
1555                 max_delay = max(msecs_to_jiffies(mldv2_mrc(mld2q)), 1UL);
1556         }
1557
1558         is_general_query = group && ipv6_addr_any(group);
1559
1560         if (is_general_query) {
1561                 saddr.proto = htons(ETH_P_IPV6);
1562                 saddr.u.ip6 = ip6h->saddr;
1563
1564                 br_multicast_query_received(br, port, &br->ip6_other_query,
1565                                             &saddr, max_delay);
1566                 goto out;
1567         } else if (!group) {
1568                 goto out;
1569         }
1570
1571         mp = br_mdb_ip6_get(mlock_dereference(br->mdb, br), group, vid);
1572         if (!mp)
1573                 goto out;
1574
1575         max_delay *= br->multicast_last_member_count;
1576         if (mp->host_joined &&
1577             (timer_pending(&mp->timer) ?
1578              time_after(mp->timer.expires, now + max_delay) :
1579              try_to_del_timer_sync(&mp->timer) >= 0))
1580                 mod_timer(&mp->timer, now + max_delay);
1581
1582         for (pp = &mp->ports;
1583              (p = mlock_dereference(*pp, br)) != NULL;
1584              pp = &p->next) {
1585                 if (timer_pending(&p->timer) ?
1586                     time_after(p->timer.expires, now + max_delay) :
1587                     try_to_del_timer_sync(&p->timer) >= 0)
1588                         mod_timer(&p->timer, now + max_delay);
1589         }
1590
1591 out:
1592         spin_unlock(&br->multicast_lock);
1593         return err;
1594 }
1595 #endif
1596
/* Common leave handling for IGMP and MLD.
 *
 * @br:          bridge the leave was seen on
 * @port:        port the leave arrived on, or NULL
 * @group:       group being left (protocol, address and vid)
 * @other_query: "other querier present" state for the group's family
 * @own_query:   our own query state (port's or bridge's) for that family
 * @src:         source MAC address of the leaving host
 *
 * Runs entirely under br->multicast_lock.  With fast-leave enabled on the
 * port the matching port group is removed immediately.  Otherwise, unless
 * another querier is active, the relevant membership timer is shortened to
 * last_member_count * last_member_interval, and a group query is sent
 * first when we are the querier.
 */
static void
br_multicast_leave_group(struct net_bridge *br,
                         struct net_bridge_port *port,
                         struct br_ip *group,
                         struct bridge_mcast_other_query *other_query,
                         struct bridge_mcast_own_query *own_query,
                         const unsigned char *src)
{
        struct net_bridge_mdb_htable *mdb;
        struct net_bridge_mdb_entry *mp;
        struct net_bridge_port_group *p;
        unsigned long now;
        unsigned long time;

        spin_lock(&br->multicast_lock);
        /* Ignore leaves while the bridge is down or the port is disabled. */
        if (!netif_running(br->dev) ||
            (port && port->state == BR_STATE_DISABLED))
                goto out;

        mdb = mlock_dereference(br->mdb, br);
        mp = br_mdb_ip_get(mdb, group);
        if (!mp)
                goto out;

        /* Fast leave: drop the matching port group(s) right away. */
        if (port && (port->flags & BR_MULTICAST_FAST_LEAVE)) {
                struct net_bridge_port_group __rcu **pp;

                for (pp = &mp->ports;
                     (p = mlock_dereference(*pp, br)) != NULL;
                     pp = &p->next) {
                        if (!br_port_group_equal(p, port, src))
                                continue;

                        /* Unlink from the entry's port list and the port's
                         * group list, stop the timer and defer the free to
                         * RCU.
                         */
                        rcu_assign_pointer(*pp, p->next);
                        hlist_del_init(&p->mglist);
                        del_timer(&p->timer);
                        call_rcu_bh(&p->rcu, br_multicast_free_pg);
                        br_mdb_notify(br->dev, port, group, RTM_DELMDB,
                                      p->flags);

                        /* No ports and no host membership left: fire the
                         * entry's timer immediately.
                         */
                        if (!mp->ports && !mp->host_joined &&
                            netif_running(br->dev))
                                mod_timer(&mp->timer, jiffies);
                }
                goto out;
        }

        /* Another querier is active; nothing more is done here. */
        if (timer_pending(&other_query->timer))
                goto out;

        if (br_opt_get(br, BROPT_MULTICAST_QUERIER)) {
                /* We are the querier: send a query for this group. */
                __br_multicast_send_query(br, port, &mp->addr);

                time = jiffies + br->multicast_last_member_count *
                                 br->multicast_last_member_interval;

                mod_timer(&own_query->timer, time);

                /* Shorten the timer of the first matching port group, but
                 * only if that makes it expire earlier.
                 */
                for (p = mlock_dereference(mp->ports, br);
                     p != NULL;
                     p = mlock_dereference(p->next, br)) {
                        if (!br_port_group_equal(p, port, src))
                                continue;

                        if (!hlist_unhashed(&p->mglist) &&
                            (timer_pending(&p->timer) ?
                             time_after(p->timer.expires, time) :
                             try_to_del_timer_sync(&p->timer) >= 0)) {
                                mod_timer(&p->timer, time);
                        }

                        break;
                }
        }

        now = jiffies;
        time = now + br->multicast_last_member_count *
                     br->multicast_last_member_interval;

        if (!port) {
                /* Leave without a port: shorten the host membership timer. */
                if (mp->host_joined &&
                    (timer_pending(&mp->timer) ?
                     time_after(mp->timer.expires, time) :
                     try_to_del_timer_sync(&mp->timer) >= 0)) {
                        mod_timer(&mp->timer, time);
                }

                goto out;
        }

        /* Shorten the timer of the first port group that belongs to @port
         * (matched on the port only, not on the source MAC).
         */
        for (p = mlock_dereference(mp->ports, br);
             p != NULL;
             p = mlock_dereference(p->next, br)) {
                if (p->port != port)
                        continue;

                if (!hlist_unhashed(&p->mglist) &&
                    (timer_pending(&p->timer) ?
                     time_after(p->timer.expires, time) :
                     try_to_del_timer_sync(&p->timer) >= 0)) {
                        mod_timer(&p->timer, time);
                }

                break;
        }
out:
        spin_unlock(&br->multicast_lock);
}
1705
1706 static void br_ip4_multicast_leave_group(struct net_bridge *br,
1707                                          struct net_bridge_port *port,
1708                                          __be32 group,
1709                                          __u16 vid,
1710                                          const unsigned char *src)
1711 {
1712         struct br_ip br_group;
1713         struct bridge_mcast_own_query *own_query;
1714
1715         if (ipv4_is_local_multicast(group))
1716                 return;
1717
1718         own_query = port ? &port->ip4_own_query : &br->ip4_own_query;
1719
1720         br_group.u.ip4 = group;
1721         br_group.proto = htons(ETH_P_IP);
1722         br_group.vid = vid;
1723
1724         br_multicast_leave_group(br, port, &br_group, &br->ip4_other_query,
1725                                  own_query, src);
1726 }
1727
1728 #if IS_ENABLED(CONFIG_IPV6)
1729 static void br_ip6_multicast_leave_group(struct net_bridge *br,
1730                                          struct net_bridge_port *port,
1731                                          const struct in6_addr *group,
1732                                          __u16 vid,
1733                                          const unsigned char *src)
1734 {
1735         struct br_ip br_group;
1736         struct bridge_mcast_own_query *own_query;
1737
1738         if (ipv6_addr_is_ll_all_nodes(group))
1739                 return;
1740
1741         own_query = port ? &port->ip6_own_query : &br->ip6_own_query;
1742
1743         br_group.u.ip6 = *group;
1744         br_group.proto = htons(ETH_P_IPV6);
1745         br_group.vid = vid;
1746
1747         br_multicast_leave_group(br, port, &br_group, &br->ip6_other_query,
1748                                  own_query, src);
1749 }
1750 #endif
1751
1752 static void br_multicast_err_count(const struct net_bridge *br,
1753                                    const struct net_bridge_port *p,
1754                                    __be16 proto)
1755 {
1756         struct bridge_mcast_stats __percpu *stats;
1757         struct bridge_mcast_stats *pstats;
1758
1759         if (!br_opt_get(br, BROPT_MULTICAST_STATS_ENABLED))
1760                 return;
1761
1762         if (p)
1763                 stats = p->mcast_stats;
1764         else
1765                 stats = br->mcast_stats;
1766         if (WARN_ON(!stats))
1767                 return;
1768
1769         pstats = this_cpu_ptr(stats);
1770
1771         u64_stats_update_begin(&pstats->syncp);
1772         switch (proto) {
1773         case htons(ETH_P_IP):
1774                 pstats->mstats.igmp_parse_errors++;
1775                 break;
1776 #if IS_ENABLED(CONFIG_IPV6)
1777         case htons(ETH_P_IPV6):
1778                 pstats->mstats.mld_parse_errors++;
1779                 break;
1780 #endif
1781         }
1782         u64_stats_update_end(&pstats->syncp);
1783 }
1784
1785 static void br_multicast_pim(struct net_bridge *br,
1786                              struct net_bridge_port *port,
1787                              const struct sk_buff *skb)
1788 {
1789         unsigned int offset = skb_transport_offset(skb);
1790         struct pimhdr *pimhdr, _pimhdr;
1791
1792         pimhdr = skb_header_pointer(skb, offset, sizeof(_pimhdr), &_pimhdr);
1793         if (!pimhdr || pim_hdr_version(pimhdr) != PIM_VERSION ||
1794             pim_hdr_type(pimhdr) != PIM_TYPE_HELLO)
1795                 return;
1796
1797         br_multicast_mark_router(br, port);
1798 }
1799
1800 static int br_multicast_ipv4_rcv(struct net_bridge *br,
1801                                  struct net_bridge_port *port,
1802                                  struct sk_buff *skb,
1803                                  u16 vid)
1804 {
1805         struct sk_buff *skb_trimmed = NULL;
1806         const unsigned char *src;
1807         struct igmphdr *ih;
1808         int err;
1809
1810         err = ip_mc_check_igmp(skb, &skb_trimmed);
1811
1812         if (err == -ENOMSG) {
1813                 if (!ipv4_is_local_multicast(ip_hdr(skb)->daddr)) {
1814                         BR_INPUT_SKB_CB(skb)->mrouters_only = 1;
1815                 } else if (pim_ipv4_all_pim_routers(ip_hdr(skb)->daddr)) {
1816                         if (ip_hdr(skb)->protocol == IPPROTO_PIM)
1817                                 br_multicast_pim(br, port, skb);
1818                 }
1819                 return 0;
1820         } else if (err < 0) {
1821                 br_multicast_err_count(br, port, skb->protocol);
1822                 return err;
1823         }
1824
1825         ih = igmp_hdr(skb);
1826         src = eth_hdr(skb)->h_source;
1827         BR_INPUT_SKB_CB(skb)->igmp = ih->type;
1828
1829         switch (ih->type) {
1830         case IGMP_HOST_MEMBERSHIP_REPORT:
1831         case IGMPV2_HOST_MEMBERSHIP_REPORT:
1832                 BR_INPUT_SKB_CB(skb)->mrouters_only = 1;
1833                 err = br_ip4_multicast_add_group(br, port, ih->group, vid, src);
1834                 break;
1835         case IGMPV3_HOST_MEMBERSHIP_REPORT:
1836                 err = br_ip4_multicast_igmp3_report(br, port, skb_trimmed, vid);
1837                 break;
1838         case IGMP_HOST_MEMBERSHIP_QUERY:
1839                 br_ip4_multicast_query(br, port, skb_trimmed, vid);
1840                 break;
1841         case IGMP_HOST_LEAVE_MESSAGE:
1842                 br_ip4_multicast_leave_group(br, port, ih->group, vid, src);
1843                 break;
1844         }
1845
1846         if (skb_trimmed && skb_trimmed != skb)
1847                 kfree_skb(skb_trimmed);
1848
1849         br_multicast_count(br, port, skb, BR_INPUT_SKB_CB(skb)->igmp,
1850                            BR_MCAST_DIR_RX);
1851
1852         return err;
1853 }
1854
1855 #if IS_ENABLED(CONFIG_IPV6)
1856 static int br_multicast_ipv6_rcv(struct net_bridge *br,
1857                                  struct net_bridge_port *port,
1858                                  struct sk_buff *skb,
1859                                  u16 vid)
1860 {
1861         struct sk_buff *skb_trimmed = NULL;
1862         const unsigned char *src;
1863         struct mld_msg *mld;
1864         int err;
1865
1866         err = ipv6_mc_check_mld(skb, &skb_trimmed);
1867
1868         if (err == -ENOMSG) {
1869                 if (!ipv6_addr_is_ll_all_nodes(&ipv6_hdr(skb)->daddr))
1870                         BR_INPUT_SKB_CB(skb)->mrouters_only = 1;
1871                 return 0;
1872         } else if (err < 0) {
1873                 br_multicast_err_count(br, port, skb->protocol);
1874                 return err;
1875         }
1876
1877         mld = (struct mld_msg *)skb_transport_header(skb);
1878         BR_INPUT_SKB_CB(skb)->igmp = mld->mld_type;
1879
1880         switch (mld->mld_type) {
1881         case ICMPV6_MGM_REPORT:
1882                 src = eth_hdr(skb)->h_source;
1883                 BR_INPUT_SKB_CB(skb)->mrouters_only = 1;
1884                 err = br_ip6_multicast_add_group(br, port, &mld->mld_mca, vid,
1885                                                  src);
1886                 break;
1887         case ICMPV6_MLD2_REPORT:
1888                 err = br_ip6_multicast_mld2_report(br, port, skb_trimmed, vid);
1889                 break;
1890         case ICMPV6_MGM_QUERY:
1891                 err = br_ip6_multicast_query(br, port, skb_trimmed, vid);
1892                 break;
1893         case ICMPV6_MGM_REDUCTION:
1894                 src = eth_hdr(skb)->h_source;
1895                 br_ip6_multicast_leave_group(br, port, &mld->mld_mca, vid, src);
1896                 break;
1897         }
1898
1899         if (skb_trimmed && skb_trimmed != skb)
1900                 kfree_skb(skb_trimmed);
1901
1902         br_multicast_count(br, port, skb, BR_INPUT_SKB_CB(skb)->igmp,
1903                            BR_MCAST_DIR_RX);
1904
1905         return err;
1906 }
1907 #endif
1908
1909 int br_multicast_rcv(struct net_bridge *br, struct net_bridge_port *port,
1910                      struct sk_buff *skb, u16 vid)
1911 {
1912         int ret = 0;
1913
1914         BR_INPUT_SKB_CB(skb)->igmp = 0;
1915         BR_INPUT_SKB_CB(skb)->mrouters_only = 0;
1916
1917         if (!br_opt_get(br, BROPT_MULTICAST_ENABLED))
1918                 return 0;
1919
1920         switch (skb->protocol) {
1921         case htons(ETH_P_IP):
1922                 ret = br_multicast_ipv4_rcv(br, port, skb, vid);
1923                 break;
1924 #if IS_ENABLED(CONFIG_IPV6)
1925         case htons(ETH_P_IPV6):
1926                 ret = br_multicast_ipv6_rcv(br, port, skb, vid);
1927                 break;
1928 #endif
1929         }
1930
1931         return ret;
1932 }
1933
1934 static void br_multicast_query_expired(struct net_bridge *br,
1935                                        struct bridge_mcast_own_query *query,
1936                                        struct bridge_mcast_querier *querier)
1937 {
1938         spin_lock(&br->multicast_lock);
1939         if (query->startup_sent < br->multicast_startup_query_count)
1940                 query->startup_sent++;
1941
1942         RCU_INIT_POINTER(querier->port, NULL);
1943         br_multicast_send_query(br, NULL, query);
1944         spin_unlock(&br->multicast_lock);
1945 }
1946
1947 static void br_ip4_multicast_query_expired(struct timer_list *t)
1948 {
1949         struct net_bridge *br = from_timer(br, t, ip4_own_query.timer);
1950
1951         br_multicast_query_expired(br, &br->ip4_own_query, &br->ip4_querier);
1952 }
1953
1954 #if IS_ENABLED(CONFIG_IPV6)
1955 static void br_ip6_multicast_query_expired(struct timer_list *t)
1956 {
1957         struct net_bridge *br = from_timer(br, t, ip6_own_query.timer);
1958
1959         br_multicast_query_expired(br, &br->ip6_own_query, &br->ip6_querier);
1960 }
1961 #endif
1962
1963 void br_multicast_init(struct net_bridge *br)
1964 {
1965         br->hash_elasticity = 4;
1966         br->hash_max = 512;
1967
1968         br->multicast_router = MDB_RTR_TYPE_TEMP_QUERY;
1969         br->multicast_last_member_count = 2;
1970         br->multicast_startup_query_count = 2;
1971
1972         br->multicast_last_member_interval = HZ;
1973         br->multicast_query_response_interval = 10 * HZ;
1974         br->multicast_startup_query_interval = 125 * HZ / 4;
1975         br->multicast_query_interval = 125 * HZ;
1976         br->multicast_querier_interval = 255 * HZ;
1977         br->multicast_membership_interval = 260 * HZ;
1978
1979         br->ip4_other_query.delay_time = 0;
1980         br->ip4_querier.port = NULL;
1981         br->multicast_igmp_version = 2;
1982 #if IS_ENABLED(CONFIG_IPV6)
1983         br->multicast_mld_version = 1;
1984         br->ip6_other_query.delay_time = 0;
1985         br->ip6_querier.port = NULL;
1986 #endif
1987         br_opt_toggle(br, BROPT_MULTICAST_ENABLED, true);
1988         br_opt_toggle(br, BROPT_HAS_IPV6_ADDR, true);
1989
1990         spin_lock_init(&br->multicast_lock);
1991         timer_setup(&br->multicast_router_timer,
1992                     br_multicast_local_router_expired, 0);
1993         timer_setup(&br->ip4_other_query.timer,
1994                     br_ip4_multicast_querier_expired, 0);
1995         timer_setup(&br->ip4_own_query.timer,
1996                     br_ip4_multicast_query_expired, 0);
1997 #if IS_ENABLED(CONFIG_IPV6)
1998         timer_setup(&br->ip6_other_query.timer,
1999                     br_ip6_multicast_querier_expired, 0);
2000         timer_setup(&br->ip6_own_query.timer,
2001                     br_ip6_multicast_query_expired, 0);
2002 #endif
2003 }
2004
2005 static void __br_multicast_open(struct net_bridge *br,
2006                                 struct bridge_mcast_own_query *query)
2007 {
2008         query->startup_sent = 0;
2009
2010         if (!br_opt_get(br, BROPT_MULTICAST_ENABLED))
2011                 return;
2012
2013         mod_timer(&query->timer, jiffies);
2014 }
2015
2016 void br_multicast_open(struct net_bridge *br)
2017 {
2018         __br_multicast_open(br, &br->ip4_own_query);
2019 #if IS_ENABLED(CONFIG_IPV6)
2020         __br_multicast_open(br, &br->ip6_own_query);
2021 #endif
2022 }
2023
2024 void br_multicast_stop(struct net_bridge *br)
2025 {
2026         del_timer_sync(&br->multicast_router_timer);
2027         del_timer_sync(&br->ip4_other_query.timer);
2028         del_timer_sync(&br->ip4_own_query.timer);
2029 #if IS_ENABLED(CONFIG_IPV6)
2030         del_timer_sync(&br->ip6_other_query.timer);
2031         del_timer_sync(&br->ip6_own_query.timer);
2032 #endif
2033 }
2034
2035 void br_multicast_dev_del(struct net_bridge *br)
2036 {
2037         struct net_bridge_mdb_htable *mdb;
2038         struct net_bridge_mdb_entry *mp;
2039         struct hlist_node *n;
2040         u32 ver;
2041         int i;
2042
2043         spin_lock_bh(&br->multicast_lock);
2044         mdb = mlock_dereference(br->mdb, br);
2045         if (!mdb)
2046                 goto out;
2047
2048         br->mdb = NULL;
2049
2050         ver = mdb->ver;
2051         for (i = 0; i < mdb->max; i++) {
2052                 hlist_for_each_entry_safe(mp, n, &mdb->mhash[i],
2053                                           hlist[ver]) {
2054                         del_timer(&mp->timer);
2055                         call_rcu_bh(&mp->rcu, br_multicast_free_group);
2056                 }
2057         }
2058
2059         if (mdb->old) {
2060                 spin_unlock_bh(&br->multicast_lock);
2061                 rcu_barrier_bh();
2062                 spin_lock_bh(&br->multicast_lock);
2063                 WARN_ON(mdb->old);
2064         }
2065
2066         mdb->old = mdb;
2067         call_rcu_bh(&mdb->rcu, br_mdb_free);
2068
2069 out:
2070         spin_unlock_bh(&br->multicast_lock);
2071 }
2072
2073 int br_multicast_set_router(struct net_bridge *br, unsigned long val)
2074 {
2075         int err = -EINVAL;
2076
2077         spin_lock_bh(&br->multicast_lock);
2078
2079         switch (val) {
2080         case MDB_RTR_TYPE_DISABLED:
2081         case MDB_RTR_TYPE_PERM:
2082                 br_mc_router_state_change(br, val == MDB_RTR_TYPE_PERM);
2083                 del_timer(&br->multicast_router_timer);
2084                 br->multicast_router = val;
2085                 err = 0;
2086                 break;
2087         case MDB_RTR_TYPE_TEMP_QUERY:
2088                 if (br->multicast_router != MDB_RTR_TYPE_TEMP_QUERY)
2089                         br_mc_router_state_change(br, false);
2090                 br->multicast_router = val;
2091                 err = 0;
2092                 break;
2093         }
2094
2095         spin_unlock_bh(&br->multicast_lock);
2096
2097         return err;
2098 }
2099
2100 static void __del_port_router(struct net_bridge_port *p)
2101 {
2102         if (hlist_unhashed(&p->rlist))
2103                 return;
2104         hlist_del_init_rcu(&p->rlist);
2105         br_rtr_notify(p->br->dev, p, RTM_DELMDB);
2106         br_port_mc_router_state_change(p, false);
2107
2108         /* don't allow timer refresh */
2109         if (p->multicast_router == MDB_RTR_TYPE_TEMP)
2110                 p->multicast_router = MDB_RTR_TYPE_TEMP_QUERY;
2111 }
2112
2113 int br_multicast_set_port_router(struct net_bridge_port *p, unsigned long val)
2114 {
2115         struct net_bridge *br = p->br;
2116         unsigned long now = jiffies;
2117         int err = -EINVAL;
2118
2119         spin_lock(&br->multicast_lock);
2120         if (p->multicast_router == val) {
2121                 /* Refresh the temp router port timer */
2122                 if (p->multicast_router == MDB_RTR_TYPE_TEMP)
2123                         mod_timer(&p->multicast_router_timer,
2124                                   now + br->multicast_querier_interval);
2125                 err = 0;
2126                 goto unlock;
2127         }
2128         switch (val) {
2129         case MDB_RTR_TYPE_DISABLED:
2130                 p->multicast_router = MDB_RTR_TYPE_DISABLED;
2131                 __del_port_router(p);
2132                 del_timer(&p->multicast_router_timer);
2133                 break;
2134         case MDB_RTR_TYPE_TEMP_QUERY:
2135                 p->multicast_router = MDB_RTR_TYPE_TEMP_QUERY;
2136                 __del_port_router(p);
2137                 break;
2138         case MDB_RTR_TYPE_PERM:
2139                 p->multicast_router = MDB_RTR_TYPE_PERM;
2140                 del_timer(&p->multicast_router_timer);
2141                 br_multicast_add_router(br, p);
2142                 break;
2143         case MDB_RTR_TYPE_TEMP:
2144                 p->multicast_router = MDB_RTR_TYPE_TEMP;
2145                 br_multicast_mark_router(br, p);
2146                 break;
2147         default:
2148                 goto unlock;
2149         }
2150         err = 0;
2151 unlock:
2152         spin_unlock(&br->multicast_lock);
2153
2154         return err;
2155 }
2156
2157 static void br_multicast_start_querier(struct net_bridge *br,
2158                                        struct bridge_mcast_own_query *query)
2159 {
2160         struct net_bridge_port *port;
2161
2162         __br_multicast_open(br, query);
2163
2164         list_for_each_entry(port, &br->port_list, list) {
2165                 if (port->state == BR_STATE_DISABLED ||
2166                     port->state == BR_STATE_BLOCKING)
2167                         continue;
2168
2169                 if (query == &br->ip4_own_query)
2170                         br_multicast_enable(&port->ip4_own_query);
2171 #if IS_ENABLED(CONFIG_IPV6)
2172                 else
2173                         br_multicast_enable(&port->ip6_own_query);
2174 #endif
2175         }
2176 }
2177
2178 int br_multicast_toggle(struct net_bridge *br, unsigned long val)
2179 {
2180         struct net_bridge_mdb_htable *mdb;
2181         struct net_bridge_port *port;
2182         int err = 0;
2183
2184         spin_lock_bh(&br->multicast_lock);
2185         if (!!br_opt_get(br, BROPT_MULTICAST_ENABLED) == !!val)
2186                 goto unlock;
2187
2188         br_mc_disabled_update(br->dev, val);
2189         br_opt_toggle(br, BROPT_MULTICAST_ENABLED, !!val);
2190         if (!br_opt_get(br, BROPT_MULTICAST_ENABLED))
2191                 goto unlock;
2192
2193         if (!netif_running(br->dev))
2194                 goto unlock;
2195
2196         mdb = mlock_dereference(br->mdb, br);
2197         if (mdb) {
2198                 if (mdb->old) {
2199                         err = -EEXIST;
2200 rollback:
2201                         br_opt_toggle(br, BROPT_MULTICAST_ENABLED, false);
2202                         goto unlock;
2203                 }
2204
2205                 err = br_mdb_rehash(&br->mdb, mdb->max,
2206                                     br->hash_elasticity);
2207                 if (err)
2208                         goto rollback;
2209         }
2210
2211         br_multicast_open(br);
2212         list_for_each_entry(port, &br->port_list, list)
2213                 __br_multicast_enable_port(port);
2214
2215 unlock:
2216         spin_unlock_bh(&br->multicast_lock);
2217
2218         return err;
2219 }
2220
2221 bool br_multicast_enabled(const struct net_device *dev)
2222 {
2223         struct net_bridge *br = netdev_priv(dev);
2224
2225         return !!br_opt_get(br, BROPT_MULTICAST_ENABLED);
2226 }
2227 EXPORT_SYMBOL_GPL(br_multicast_enabled);
2228
2229 bool br_multicast_router(const struct net_device *dev)
2230 {
2231         struct net_bridge *br = netdev_priv(dev);
2232         bool is_router;
2233
2234         spin_lock_bh(&br->multicast_lock);
2235         is_router = br_multicast_is_router(br);
2236         spin_unlock_bh(&br->multicast_lock);
2237         return is_router;
2238 }
2239 EXPORT_SYMBOL_GPL(br_multicast_router);
2240
2241 int br_multicast_set_querier(struct net_bridge *br, unsigned long val)
2242 {
2243         unsigned long max_delay;
2244
2245         val = !!val;
2246
2247         spin_lock_bh(&br->multicast_lock);
2248         if (br_opt_get(br, BROPT_MULTICAST_QUERIER) == val)
2249                 goto unlock;
2250
2251         br_opt_toggle(br, BROPT_MULTICAST_QUERIER, !!val);
2252         if (!val)
2253                 goto unlock;
2254
2255         max_delay = br->multicast_query_response_interval;
2256
2257         if (!timer_pending(&br->ip4_other_query.timer))
2258                 br->ip4_other_query.delay_time = jiffies + max_delay;
2259
2260         br_multicast_start_querier(br, &br->ip4_own_query);
2261
2262 #if IS_ENABLED(CONFIG_IPV6)
2263         if (!timer_pending(&br->ip6_other_query.timer))
2264                 br->ip6_other_query.delay_time = jiffies + max_delay;
2265
2266         br_multicast_start_querier(br, &br->ip6_own_query);
2267 #endif
2268
2269 unlock:
2270         spin_unlock_bh(&br->multicast_lock);
2271
2272         return 0;
2273 }
2274
2275 int br_multicast_set_hash_max(struct net_bridge *br, unsigned long val)
2276 {
2277         int err = -EINVAL;
2278         u32 old;
2279         struct net_bridge_mdb_htable *mdb;
2280
2281         spin_lock_bh(&br->multicast_lock);
2282         if (!is_power_of_2(val))
2283                 goto unlock;
2284
2285         mdb = mlock_dereference(br->mdb, br);
2286         if (mdb && val < mdb->size)
2287                 goto unlock;
2288
2289         err = 0;
2290
2291         old = br->hash_max;
2292         br->hash_max = val;
2293
2294         if (mdb) {
2295                 if (mdb->old) {
2296                         err = -EEXIST;
2297 rollback:
2298                         br->hash_max = old;
2299                         goto unlock;
2300                 }
2301
2302                 err = br_mdb_rehash(&br->mdb, br->hash_max,
2303                                     br->hash_elasticity);
2304                 if (err)
2305                         goto rollback;
2306         }
2307
2308 unlock:
2309         spin_unlock_bh(&br->multicast_lock);
2310
2311         return err;
2312 }
2313
2314 int br_multicast_set_igmp_version(struct net_bridge *br, unsigned long val)
2315 {
2316         /* Currently we support only version 2 and 3 */
2317         switch (val) {
2318         case 2:
2319         case 3:
2320                 break;
2321         default:
2322                 return -EINVAL;
2323         }
2324
2325         spin_lock_bh(&br->multicast_lock);
2326         br->multicast_igmp_version = val;
2327         spin_unlock_bh(&br->multicast_lock);
2328
2329         return 0;
2330 }
2331
2332 #if IS_ENABLED(CONFIG_IPV6)
2333 int br_multicast_set_mld_version(struct net_bridge *br, unsigned long val)
2334 {
2335         /* Currently we support version 1 and 2 */
2336         switch (val) {
2337         case 1:
2338         case 2:
2339                 break;
2340         default:
2341                 return -EINVAL;
2342         }
2343
2344         spin_lock_bh(&br->multicast_lock);
2345         br->multicast_mld_version = val;
2346         spin_unlock_bh(&br->multicast_lock);
2347
2348         return 0;
2349 }
2350 #endif
2351
2352 /**
2353  * br_multicast_list_adjacent - Returns snooped multicast addresses
2354  * @dev:        The bridge port adjacent to which to retrieve addresses
2355  * @br_ip_list: The list to store found, snooped multicast IP addresses in
2356  *
2357  * Creates a list of IP addresses (struct br_ip_list) sensed by the multicast
2358  * snooping feature on all bridge ports of dev's bridge device, excluding
2359  * the addresses from dev itself.
2360  *
2361  * Returns the number of items added to br_ip_list.
2362  *
2363  * Notes:
2364  * - br_ip_list needs to be initialized by caller
2365  * - br_ip_list might contain duplicates in the end
2366  *   (needs to be taken care of by caller)
2367  * - br_ip_list needs to be freed by caller
2368  */
2369 int br_multicast_list_adjacent(struct net_device *dev,
2370                                struct list_head *br_ip_list)
2371 {
2372         struct net_bridge *br;
2373         struct net_bridge_port *port;
2374         struct net_bridge_port_group *group;
2375         struct br_ip_list *entry;
2376         int count = 0;
2377
2378         rcu_read_lock();
2379         if (!br_ip_list || !br_port_exists(dev))
2380                 goto unlock;
2381
2382         port = br_port_get_rcu(dev);
2383         if (!port || !port->br)
2384                 goto unlock;
2385
2386         br = port->br;
2387
2388         list_for_each_entry_rcu(port, &br->port_list, list) {
2389                 if (!port->dev || port->dev == dev)
2390                         continue;
2391
2392                 hlist_for_each_entry_rcu(group, &port->mglist, mglist) {
2393                         entry = kmalloc(sizeof(*entry), GFP_ATOMIC);
2394                         if (!entry)
2395                                 goto unlock;
2396
2397                         entry->addr = group->addr;
2398                         list_add(&entry->list, br_ip_list);
2399                         count++;
2400                 }
2401         }
2402
2403 unlock:
2404         rcu_read_unlock();
2405         return count;
2406 }
2407 EXPORT_SYMBOL_GPL(br_multicast_list_adjacent);
2408
2409 /**
2410  * br_multicast_has_querier_anywhere - Checks for a querier on a bridge
2411  * @dev: The bridge port providing the bridge on which to check for a querier
2412  * @proto: The protocol family to check for: IGMP -> ETH_P_IP, MLD -> ETH_P_IPV6
2413  *
2414  * Checks whether the given interface has a bridge on top and if so returns
2415  * true if a valid querier exists anywhere on the bridged link layer.
2416  * Otherwise returns false.
2417  */
2418 bool br_multicast_has_querier_anywhere(struct net_device *dev, int proto)
2419 {
2420         struct net_bridge *br;
2421         struct net_bridge_port *port;
2422         struct ethhdr eth;
2423         bool ret = false;
2424
2425         rcu_read_lock();
2426         if (!br_port_exists(dev))
2427                 goto unlock;
2428
2429         port = br_port_get_rcu(dev);
2430         if (!port || !port->br)
2431                 goto unlock;
2432
2433         br = port->br;
2434
2435         memset(&eth, 0, sizeof(eth));
2436         eth.h_proto = htons(proto);
2437
2438         ret = br_multicast_querier_exists(br, &eth);
2439
2440 unlock:
2441         rcu_read_unlock();
2442         return ret;
2443 }
2444 EXPORT_SYMBOL_GPL(br_multicast_has_querier_anywhere);
2445
2446 /**
2447  * br_multicast_has_querier_adjacent - Checks for a querier behind a bridge port
2448  * @dev: The bridge port adjacent to which to check for a querier
2449  * @proto: The protocol family to check for: IGMP -> ETH_P_IP, MLD -> ETH_P_IPV6
2450  *
2451  * Checks whether the given interface has a bridge on top and if so returns
2452  * true if a selected querier is behind one of the other ports of this
2453  * bridge. Otherwise returns false.
2454  */
2455 bool br_multicast_has_querier_adjacent(struct net_device *dev, int proto)
2456 {
2457         struct net_bridge *br;
2458         struct net_bridge_port *port;
2459         bool ret = false;
2460
2461         rcu_read_lock();
2462         if (!br_port_exists(dev))
2463                 goto unlock;
2464
2465         port = br_port_get_rcu(dev);
2466         if (!port || !port->br)
2467                 goto unlock;
2468
2469         br = port->br;
2470
2471         switch (proto) {
2472         case ETH_P_IP:
2473                 if (!timer_pending(&br->ip4_other_query.timer) ||
2474                     rcu_dereference(br->ip4_querier.port) == port)
2475                         goto unlock;
2476                 break;
2477 #if IS_ENABLED(CONFIG_IPV6)
2478         case ETH_P_IPV6:
2479                 if (!timer_pending(&br->ip6_other_query.timer) ||
2480                     rcu_dereference(br->ip6_querier.port) == port)
2481                         goto unlock;
2482                 break;
2483 #endif
2484         default:
2485                 goto unlock;
2486         }
2487
2488         ret = true;
2489 unlock:
2490         rcu_read_unlock();
2491         return ret;
2492 }
2493 EXPORT_SYMBOL_GPL(br_multicast_has_querier_adjacent);
2494
2495 static void br_mcast_stats_add(struct bridge_mcast_stats __percpu *stats,
2496                                const struct sk_buff *skb, u8 type, u8 dir)
2497 {
2498         struct bridge_mcast_stats *pstats = this_cpu_ptr(stats);
2499         __be16 proto = skb->protocol;
2500         unsigned int t_len;
2501
2502         u64_stats_update_begin(&pstats->syncp);
2503         switch (proto) {
2504         case htons(ETH_P_IP):
2505                 t_len = ntohs(ip_hdr(skb)->tot_len) - ip_hdrlen(skb);
2506                 switch (type) {
2507                 case IGMP_HOST_MEMBERSHIP_REPORT:
2508                         pstats->mstats.igmp_v1reports[dir]++;
2509                         break;
2510                 case IGMPV2_HOST_MEMBERSHIP_REPORT:
2511                         pstats->mstats.igmp_v2reports[dir]++;
2512                         break;
2513                 case IGMPV3_HOST_MEMBERSHIP_REPORT:
2514                         pstats->mstats.igmp_v3reports[dir]++;
2515                         break;
2516                 case IGMP_HOST_MEMBERSHIP_QUERY:
2517                         if (t_len != sizeof(struct igmphdr)) {
2518                                 pstats->mstats.igmp_v3queries[dir]++;
2519                         } else {
2520                                 unsigned int offset = skb_transport_offset(skb);
2521                                 struct igmphdr *ih, _ihdr;
2522
2523                                 ih = skb_header_pointer(skb, offset,
2524                                                         sizeof(_ihdr), &_ihdr);
2525                                 if (!ih)
2526                                         break;
2527                                 if (!ih->code)
2528                                         pstats->mstats.igmp_v1queries[dir]++;
2529                                 else
2530                                         pstats->mstats.igmp_v2queries[dir]++;
2531                         }
2532                         break;
2533                 case IGMP_HOST_LEAVE_MESSAGE:
2534                         pstats->mstats.igmp_leaves[dir]++;
2535                         break;
2536                 }
2537                 break;
2538 #if IS_ENABLED(CONFIG_IPV6)
2539         case htons(ETH_P_IPV6):
2540                 t_len = ntohs(ipv6_hdr(skb)->payload_len) +
2541                         sizeof(struct ipv6hdr);
2542                 t_len -= skb_network_header_len(skb);
2543                 switch (type) {
2544                 case ICMPV6_MGM_REPORT:
2545                         pstats->mstats.mld_v1reports[dir]++;
2546                         break;
2547                 case ICMPV6_MLD2_REPORT:
2548                         pstats->mstats.mld_v2reports[dir]++;
2549                         break;
2550                 case ICMPV6_MGM_QUERY:
2551                         if (t_len != sizeof(struct mld_msg))
2552                                 pstats->mstats.mld_v2queries[dir]++;
2553                         else
2554                                 pstats->mstats.mld_v1queries[dir]++;
2555                         break;
2556                 case ICMPV6_MGM_REDUCTION:
2557                         pstats->mstats.mld_leaves[dir]++;
2558                         break;
2559                 }
2560                 break;
2561 #endif /* CONFIG_IPV6 */
2562         }
2563         u64_stats_update_end(&pstats->syncp);
2564 }
2565
2566 void br_multicast_count(struct net_bridge *br, const struct net_bridge_port *p,
2567                         const struct sk_buff *skb, u8 type, u8 dir)
2568 {
2569         struct bridge_mcast_stats __percpu *stats;
2570
2571         /* if multicast_disabled is true then igmp type can't be set */
2572         if (!type || !br_opt_get(br, BROPT_MULTICAST_STATS_ENABLED))
2573                 return;
2574
2575         if (p)
2576                 stats = p->mcast_stats;
2577         else
2578                 stats = br->mcast_stats;
2579         if (WARN_ON(!stats))
2580                 return;
2581
2582         br_mcast_stats_add(stats, skb, type, dir);
2583 }
2584
2585 int br_multicast_init_stats(struct net_bridge *br)
2586 {
2587         br->mcast_stats = netdev_alloc_pcpu_stats(struct bridge_mcast_stats);
2588         if (!br->mcast_stats)
2589                 return -ENOMEM;
2590
2591         return 0;
2592 }
2593
2594 void br_multicast_uninit_stats(struct net_bridge *br)
2595 {
2596         free_percpu(br->mcast_stats);
2597 }
2598
2599 static void mcast_stats_add_dir(u64 *dst, u64 *src)
2600 {
2601         dst[BR_MCAST_DIR_RX] += src[BR_MCAST_DIR_RX];
2602         dst[BR_MCAST_DIR_TX] += src[BR_MCAST_DIR_TX];
2603 }
2604
2605 void br_multicast_get_stats(const struct net_bridge *br,
2606                             const struct net_bridge_port *p,
2607                             struct br_mcast_stats *dest)
2608 {
2609         struct bridge_mcast_stats __percpu *stats;
2610         struct br_mcast_stats tdst;
2611         int i;
2612
2613         memset(dest, 0, sizeof(*dest));
2614         if (p)
2615                 stats = p->mcast_stats;
2616         else
2617                 stats = br->mcast_stats;
2618         if (WARN_ON(!stats))
2619                 return;
2620
2621         memset(&tdst, 0, sizeof(tdst));
2622         for_each_possible_cpu(i) {
2623                 struct bridge_mcast_stats *cpu_stats = per_cpu_ptr(stats, i);
2624                 struct br_mcast_stats temp;
2625                 unsigned int start;
2626
2627                 do {
2628                         start = u64_stats_fetch_begin_irq(&cpu_stats->syncp);
2629                         memcpy(&temp, &cpu_stats->mstats, sizeof(temp));
2630                 } while (u64_stats_fetch_retry_irq(&cpu_stats->syncp, start));
2631
2632                 mcast_stats_add_dir(tdst.igmp_v1queries, temp.igmp_v1queries);
2633                 mcast_stats_add_dir(tdst.igmp_v2queries, temp.igmp_v2queries);
2634                 mcast_stats_add_dir(tdst.igmp_v3queries, temp.igmp_v3queries);
2635                 mcast_stats_add_dir(tdst.igmp_leaves, temp.igmp_leaves);
2636                 mcast_stats_add_dir(tdst.igmp_v1reports, temp.igmp_v1reports);
2637                 mcast_stats_add_dir(tdst.igmp_v2reports, temp.igmp_v2reports);
2638                 mcast_stats_add_dir(tdst.igmp_v3reports, temp.igmp_v3reports);
2639                 tdst.igmp_parse_errors += temp.igmp_parse_errors;
2640
2641                 mcast_stats_add_dir(tdst.mld_v1queries, temp.mld_v1queries);
2642                 mcast_stats_add_dir(tdst.mld_v2queries, temp.mld_v2queries);
2643                 mcast_stats_add_dir(tdst.mld_leaves, temp.mld_leaves);
2644                 mcast_stats_add_dir(tdst.mld_v1reports, temp.mld_v1reports);
2645                 mcast_stats_add_dir(tdst.mld_v2reports, temp.mld_v2reports);
2646                 tdst.mld_parse_errors += temp.mld_parse_errors;
2647         }
2648         memcpy(dest, &tdst, sizeof(*dest));
2649 }