Linux Audio

Check our new training course

Loading...
v3.1
   1/*
   2 *	Linux NET3:	Internet Group Management Protocol  [IGMP]
   3 *
   4 *	This code implements the IGMP protocol as defined in RFC1112. There has
   5 *	been a further revision of this protocol since which is now supported.
   6 *
   7 *	If you have trouble with this module be careful what gcc you have used,
   8 *	the older version didn't come out right using gcc 2.5.8, the newer one
   9 *	seems to fall out with gcc 2.6.2.
  10 *
  11 *	Authors:
  12 *		Alan Cox <alan@lxorguk.ukuu.org.uk>
  13 *
  14 *	This program is free software; you can redistribute it and/or
  15 *	modify it under the terms of the GNU General Public License
  16 *	as published by the Free Software Foundation; either version
  17 *	2 of the License, or (at your option) any later version.
  18 *
  19 *	Fixes:
  20 *
  21 *		Alan Cox	:	Added lots of __inline__ to optimise
  22 *					the memory usage of all the tiny little
  23 *					functions.
  24 *		Alan Cox	:	Dumped the header building experiment.
  25 *		Alan Cox	:	Minor tweaks ready for multicast routing
  26 *					and extended IGMP protocol.
  27 *		Alan Cox	:	Removed a load of inline directives. Gcc 2.5.8
  28 *					writes utterly bogus code otherwise (sigh)
  29 *					fixed IGMP loopback to behave in the manner
  30 *					desired by mrouted, fixed the fact it has been
  31 *					broken since 1.3.6 and cleaned up a few minor
  32 *					points.
  33 *
  34 *		Chih-Jen Chang	:	Tried to revise IGMP to Version 2
  35 *		Tsu-Sheng Tsao		E-mail: chihjenc@scf.usc.edu and tsusheng@scf.usc.edu
  36 *					The enhancements are mainly based on Steve Deering's
  37 * 					ipmulti-3.5 source code.
  38 *		Chih-Jen Chang	:	Added the igmp_get_mrouter_info and
  39 *		Tsu-Sheng Tsao		igmp_set_mrouter_info to keep track of
  40 *					the mrouted version on that device.
  41 *		Chih-Jen Chang	:	Added the max_resp_time parameter to
  42 *		Tsu-Sheng Tsao		igmp_heard_query(). Using this parameter
  43 *					to identify the multicast router version
  44 *					and do what the IGMP version 2 specified.
  45 *		Chih-Jen Chang	:	Added a timer to revert to IGMP V2 router
  46 *		Tsu-Sheng Tsao		if the specified time expired.
  47 *		Alan Cox	:	Stop IGMP from 0.0.0.0 being accepted.
  48 *		Alan Cox	:	Use GFP_ATOMIC in the right places.
  49 *		Christian Daudt :	igmp timer wasn't set for local group
  50 *					memberships but was being deleted,
  51 *					which caused a "del_timer() called
  52 *					from %p with timer not initialized\n"
  53 *					message (960131).
  54 *		Christian Daudt :	removed del_timer from
  55 *					igmp_timer_expire function (960205).
  56 *             Christian Daudt :       igmp_heard_report now only calls
  57 *                                     igmp_timer_expire if tm->running is
  58 *                                     true (960216).
  59 *		Malcolm Beattie :	ttl comparison wrong in igmp_rcv made
  60 *					igmp_heard_query never trigger. Expiry
  61 *					miscalculation fixed in igmp_heard_query
  62 *					and random() made to return unsigned to
  63 *					prevent negative expiry times.
  64 *		Alexey Kuznetsov:	Wrong group leaving behaviour, backport
  65 *					fix from pending 2.1.x patches.
  66 *		Alan Cox:		Forgot to enable FDDI support earlier.
  67 *		Alexey Kuznetsov:	Fixed leaving groups on device down.
  68 *		Alexey Kuznetsov:	Accordance to igmp-v2-06 draft.
  69 *		David L Stevens:	IGMPv3 support, with help from
  70 *					Vinay Kulkarni
  71 */
  72
  73#include <linux/module.h>
  74#include <linux/slab.h>
  75#include <asm/uaccess.h>
  76#include <asm/system.h>
  77#include <linux/types.h>
  78#include <linux/kernel.h>
  79#include <linux/jiffies.h>
  80#include <linux/string.h>
  81#include <linux/socket.h>
  82#include <linux/sockios.h>
  83#include <linux/in.h>
  84#include <linux/inet.h>
  85#include <linux/netdevice.h>
  86#include <linux/skbuff.h>
  87#include <linux/inetdevice.h>
  88#include <linux/igmp.h>
  89#include <linux/if_arp.h>
  90#include <linux/rtnetlink.h>
  91#include <linux/times.h>
  92
  93#include <net/net_namespace.h>
  94#include <net/arp.h>
  95#include <net/ip.h>
  96#include <net/protocol.h>
  97#include <net/route.h>
  98#include <net/sock.h>
  99#include <net/checksum.h>
 100#include <linux/netfilter_ipv4.h>
 101#ifdef CONFIG_IP_MROUTE
 102#include <linux/mroute.h>
 103#endif
 104#ifdef CONFIG_PROC_FS
 105#include <linux/proc_fs.h>
 106#include <linux/seq_file.h>
 107#endif
 108
  /* Numeric limits; neither is referenced in this part of the file.
   * NOTE(review): presumably caps on per-socket group memberships and on
   * source-filter entries - confirm at the use sites.
   */
  109#define IP_MAX_MEMBERSHIPS	20
  110#define IP_MAX_MSF		10
 111
 112#ifdef CONFIG_IP_MULTICAST
 113/* Parameter names and values are taken from igmp-v2-06 draft */
 114
  /* Timing parameters, all expressed in jiffies (multiples of HZ) except
   * IGMP_Unsolicited_Report_Count, which is a plain count.
   */
  115#define IGMP_V1_Router_Present_Timeout		(400*HZ)
  116#define IGMP_V2_Router_Present_Timeout		(400*HZ)
  117#define IGMP_Unsolicited_Report_Interval	(10*HZ)
  118#define IGMP_Query_Response_Interval		(10*HZ)
  119#define IGMP_Unsolicited_Report_Count		2
  120
  121
  122#define IGMP_Initial_Report_Delay		(1)
  123
  124/* IGMP_Initial_Report_Delay does not come from the IGMP specs!
  125 * The specs require membership to be reported immediately after
  126 * joining a group, but we delay the first report by a
  127 * small interval. This seems more natural and still does not
  128 * contradict the specs, provided the delay is small enough.
  129 */
 130
  /* IGMP_Vn_SEEN(in_dev) is true when the FORCE_IGMP_VERSION setting
   * (either the namespace-wide "all" value or the per-device value)
   * equals n, or when in_dev->mr_vn_seen is non-zero and still lies in
   * the future relative to jiffies. The mr_vn_seen stamps are written by
   * igmp_heard_query() when a query of that version is received.
   */
  131#define IGMP_V1_SEEN(in_dev) \
  132	(IPV4_DEVCONF_ALL(dev_net(in_dev->dev), FORCE_IGMP_VERSION) == 1 || \
  133	 IN_DEV_CONF_GET((in_dev), FORCE_IGMP_VERSION) == 1 || \
  134	 ((in_dev)->mr_v1_seen && \
  135	  time_before(jiffies, (in_dev)->mr_v1_seen)))
  136#define IGMP_V2_SEEN(in_dev) \
  137	(IPV4_DEVCONF_ALL(dev_net(in_dev->dev), FORCE_IGMP_VERSION) == 2 || \
  138	 IN_DEV_CONF_GET((in_dev), FORCE_IGMP_VERSION) == 2 || \
  139	 ((in_dev)->mr_v2_seen && \
  140	  time_before(jiffies, (in_dev)->mr_v2_seen)))
 141
  /* Forward declarations of helpers that are used before their
   * definitions. The ones above the #endif sit inside the
   * CONFIG_IP_MULTICAST section opened earlier; the two after it are
   * declared unconditionally.
   */
  142static void igmpv3_add_delrec(struct in_device *in_dev, struct ip_mc_list *im);
  143static void igmpv3_del_delrec(struct in_device *in_dev, __be32 multiaddr);
  144static void igmpv3_clear_delrec(struct in_device *in_dev);
  145static int sf_setstate(struct ip_mc_list *pmc);
  146static void sf_markstate(struct ip_mc_list *pmc);
  147#endif
  148static void ip_mc_clear_src(struct ip_mc_list *pmc);
  149static int ip_mc_add_src(struct in_device *in_dev, __be32 *pmca, int sfmode,
  150			 int sfcount, __be32 *psfsrc, int delta);
 151
 152static void ip_ma_put(struct ip_mc_list *im)
 153{
 154	if (atomic_dec_and_test(&im->refcnt)) {
 155		in_dev_put(im->interface);
 156		kfree_rcu(im, rcu);
 157	}
 158}
 159
  /* Iterate pmc over in_dev->mc_list by following the next_rcu links.
   * The two variants differ only in the accessor used to load each
   * pointer: rcu_dereference() versus rtnl_dereference().
   */
  160#define for_each_pmc_rcu(in_dev, pmc)				\
  161	for (pmc = rcu_dereference(in_dev->mc_list);		\
  162	     pmc != NULL;					\
  163	     pmc = rcu_dereference(pmc->next_rcu))
  164
  165#define for_each_pmc_rtnl(in_dev, pmc)				\
  166	for (pmc = rtnl_dereference(in_dev->mc_list);		\
  167	     pmc != NULL;					\
  168	     pmc = rtnl_dereference(pmc->next_rcu))
 169
 170#ifdef CONFIG_IP_MULTICAST
 171
 172/*
 173 *	Timer management
 174 */
 175
 176static void igmp_stop_timer(struct ip_mc_list *im)
 177{
 178	spin_lock_bh(&im->lock);
 179	if (del_timer(&im->timer))
 180		atomic_dec(&im->refcnt);
 181	im->tm_running = 0;
 182	im->reporter = 0;
 183	im->unsolicit_count = 0;
 184	spin_unlock_bh(&im->lock);
 185}
 186
 187/* It must be called with locked im->lock */
 188static void igmp_start_timer(struct ip_mc_list *im, int max_delay)
 189{
 190	int tv = net_random() % max_delay;
 191
 192	im->tm_running = 1;
 193	if (!mod_timer(&im->timer, jiffies+tv+2))
 194		atomic_inc(&im->refcnt);
 195}
 196
 197static void igmp_gq_start_timer(struct in_device *in_dev)
 198{
 199	int tv = net_random() % in_dev->mr_maxdelay;
 200
 201	in_dev->mr_gq_running = 1;
 202	if (!mod_timer(&in_dev->mr_gq_timer, jiffies+tv+2))
 203		in_dev_hold(in_dev);
 204}
 205
 206static void igmp_ifc_start_timer(struct in_device *in_dev, int delay)
 207{
 208	int tv = net_random() % delay;
 209
 210	if (!mod_timer(&in_dev->mr_ifc_timer, jiffies+tv+2))
 211		in_dev_hold(in_dev);
 212}
 213
 214static void igmp_mod_timer(struct ip_mc_list *im, int max_delay)
 215{
 216	spin_lock_bh(&im->lock);
 217	im->unsolicit_count = 0;
 218	if (del_timer(&im->timer)) {
 219		if ((long)(im->timer.expires-jiffies) < max_delay) {
 220			add_timer(&im->timer);
 221			im->tm_running = 1;
 222			spin_unlock_bh(&im->lock);
 223			return;
 224		}
 225		atomic_dec(&im->refcnt);
 226	}
 227	igmp_start_timer(im, max_delay);
 228	spin_unlock_bh(&im->lock);
 229}
 230
 231
 232/*
 233 *	Send an IGMP report.
 234 */
 235
  /* Bytes needed for an IGMP header plus an IP header plus 4 extra
   * bytes; igmp_send_report() uses those 4 bytes for the Router Alert
   * IP option it appends to the IP header.
   */
  236#define IGMP_SIZE (sizeof(struct igmphdr)+sizeof(struct iphdr)+4)
 237
 238
 239static int is_in(struct ip_mc_list *pmc, struct ip_sf_list *psf, int type,
 240	int gdeleted, int sdeleted)
 241{
 242	switch (type) {
 243	case IGMPV3_MODE_IS_INCLUDE:
 244	case IGMPV3_MODE_IS_EXCLUDE:
 245		if (gdeleted || sdeleted)
 246			return 0;
 247		if (!(pmc->gsquery && !psf->sf_gsresp)) {
 248			if (pmc->sfmode == MCAST_INCLUDE)
 249				return 1;
 250			/* don't include if this source is excluded
 251			 * in all filters
 252			 */
 253			if (psf->sf_count[MCAST_INCLUDE])
 254				return type == IGMPV3_MODE_IS_INCLUDE;
 255			return pmc->sfcount[MCAST_EXCLUDE] ==
 256				psf->sf_count[MCAST_EXCLUDE];
 257		}
 258		return 0;
 259	case IGMPV3_CHANGE_TO_INCLUDE:
 260		if (gdeleted || sdeleted)
 261			return 0;
 262		return psf->sf_count[MCAST_INCLUDE] != 0;
 263	case IGMPV3_CHANGE_TO_EXCLUDE:
 264		if (gdeleted || sdeleted)
 265			return 0;
 266		if (pmc->sfcount[MCAST_EXCLUDE] == 0 ||
 267		    psf->sf_count[MCAST_INCLUDE])
 268			return 0;
 269		return pmc->sfcount[MCAST_EXCLUDE] ==
 270			psf->sf_count[MCAST_EXCLUDE];
 271	case IGMPV3_ALLOW_NEW_SOURCES:
 272		if (gdeleted || !psf->sf_crcount)
 273			return 0;
 274		return (pmc->sfmode == MCAST_INCLUDE) ^ sdeleted;
 275	case IGMPV3_BLOCK_OLD_SOURCES:
 276		if (pmc->sfmode == MCAST_INCLUDE)
 277			return gdeleted || (psf->sf_crcount && sdeleted);
 278		return psf->sf_crcount && !gdeleted && !sdeleted;
 279	}
 280	return 0;
 281}
 282
 283static int
 284igmp_scount(struct ip_mc_list *pmc, int type, int gdeleted, int sdeleted)
 285{
 286	struct ip_sf_list *psf;
 287	int scount = 0;
 288
 289	for (psf=pmc->sources; psf; psf=psf->sf_next) {
 290		if (!is_in(pmc, psf, type, gdeleted, sdeleted))
 291			continue;
 292		scount++;
 293	}
 294	return scount;
 295}
 296
  /* Lvalue accessor for an unsigned int stored at the start of skb->cb.
   * igmpv3_newpack() records the payload size it managed to allocate
   * there, and AVAILABLE() reads it back.
   */
  297#define igmp_skb_size(skb) (*(unsigned int *)((skb)->cb))
 298
 299static struct sk_buff *igmpv3_newpack(struct net_device *dev, int size)
 300{
 301	struct sk_buff *skb;
 302	struct rtable *rt;
 303	struct iphdr *pip;
 304	struct igmpv3_report *pig;
 305	struct net *net = dev_net(dev);
 306	struct flowi4 fl4;
 
 
 307
 308	while (1) {
 309		skb = alloc_skb(size + LL_ALLOCATED_SPACE(dev),
 310				GFP_ATOMIC | __GFP_NOWARN);
 311		if (skb)
 312			break;
 313		size >>= 1;
 314		if (size < 256)
 315			return NULL;
 316	}
 317	igmp_skb_size(skb) = size;
 318
 319	rt = ip_route_output_ports(net, &fl4, NULL, IGMPV3_ALL_MCR, 0,
 320				   0, 0,
 321				   IPPROTO_IGMP, 0, dev->ifindex);
 322	if (IS_ERR(rt)) {
 323		kfree_skb(skb);
 324		return NULL;
 325	}
 326
 327	skb_dst_set(skb, &rt->dst);
 328	skb->dev = dev;
 329
 330	skb_reserve(skb, LL_RESERVED_SPACE(dev));
 331
 332	skb_reset_network_header(skb);
 333	pip = ip_hdr(skb);
 334	skb_put(skb, sizeof(struct iphdr) + 4);
 335
 336	pip->version  = 4;
 337	pip->ihl      = (sizeof(struct iphdr)+4)>>2;
 338	pip->tos      = 0xc0;
 339	pip->frag_off = htons(IP_DF);
 340	pip->ttl      = 1;
 341	pip->daddr    = fl4.daddr;
 342	pip->saddr    = fl4.saddr;
 343	pip->protocol = IPPROTO_IGMP;
 344	pip->tot_len  = 0;	/* filled in later */
 345	ip_select_ident(pip, &rt->dst, NULL);
 346	((u8*)&pip[1])[0] = IPOPT_RA;
 347	((u8*)&pip[1])[1] = 4;
 348	((u8*)&pip[1])[2] = 0;
 349	((u8*)&pip[1])[3] = 0;
 350
 351	skb->transport_header = skb->network_header + sizeof(struct iphdr) + 4;
 352	skb_put(skb, sizeof(*pig));
 353	pig = igmpv3_report_hdr(skb);
 354	pig->type = IGMPV3_HOST_MEMBERSHIP_REPORT;
 355	pig->resv1 = 0;
 356	pig->csum = 0;
 357	pig->resv2 = 0;
 358	pig->ngrec = 0;
 359	return skb;
 360}
 361
 362static int igmpv3_sendpack(struct sk_buff *skb)
 363{
 364	struct igmphdr *pig = igmp_hdr(skb);
 365	const int igmplen = skb->tail - skb->transport_header;
 366
 367	pig->csum = ip_compute_csum(igmp_hdr(skb), igmplen);
 368
 369	return ip_local_out(skb);
 370}
 371
 372static int grec_size(struct ip_mc_list *pmc, int type, int gdel, int sdel)
 373{
 374	return sizeof(struct igmpv3_grec) + 4*igmp_scount(pmc, type, gdel, sdel);
 375}
 376
 377static struct sk_buff *add_grhead(struct sk_buff *skb, struct ip_mc_list *pmc,
 378	int type, struct igmpv3_grec **ppgr)
 379{
 380	struct net_device *dev = pmc->interface->dev;
 381	struct igmpv3_report *pih;
 382	struct igmpv3_grec *pgr;
 383
 384	if (!skb)
 385		skb = igmpv3_newpack(dev, dev->mtu);
 386	if (!skb)
 387		return NULL;
 388	pgr = (struct igmpv3_grec *)skb_put(skb, sizeof(struct igmpv3_grec));
 389	pgr->grec_type = type;
 390	pgr->grec_auxwords = 0;
 391	pgr->grec_nsrcs = 0;
 392	pgr->grec_mca = pmc->multiaddr;
 393	pih = igmpv3_report_hdr(skb);
 394	pih->ngrec = htons(ntohs(pih->ngrec)+1);
 395	*ppgr = pgr;
 396	return skb;
 397}
 398
  /* Bytes that may still be appended to skb: 0 for a NULL skb; for an
   * skb whose ->dev is set, the size recorded by igmp_skb_size() minus
   * the bytes already in the packet; otherwise skb_tailroom().
   */
  399#define AVAILABLE(skb) ((skb) ? ((skb)->dev ? igmp_skb_size(skb) - (skb)->len : \
  400	skb_tailroom(skb)) : 0)
 401
 402static struct sk_buff *add_grec(struct sk_buff *skb, struct ip_mc_list *pmc,
 403	int type, int gdeleted, int sdeleted)
 404{
 405	struct net_device *dev = pmc->interface->dev;
 406	struct igmpv3_report *pih;
 407	struct igmpv3_grec *pgr = NULL;
 408	struct ip_sf_list *psf, *psf_next, *psf_prev, **psf_list;
 409	int scount, stotal, first, isquery, truncate;
 410
 411	if (pmc->multiaddr == IGMP_ALL_HOSTS)
 412		return skb;
 413
 414	isquery = type == IGMPV3_MODE_IS_INCLUDE ||
 415		  type == IGMPV3_MODE_IS_EXCLUDE;
 416	truncate = type == IGMPV3_MODE_IS_EXCLUDE ||
 417		    type == IGMPV3_CHANGE_TO_EXCLUDE;
 418
 419	stotal = scount = 0;
 420
 421	psf_list = sdeleted ? &pmc->tomb : &pmc->sources;
 422
 423	if (!*psf_list)
 424		goto empty_source;
 425
 426	pih = skb ? igmpv3_report_hdr(skb) : NULL;
 427
 428	/* EX and TO_EX get a fresh packet, if needed */
 429	if (truncate) {
 430		if (pih && pih->ngrec &&
 431		    AVAILABLE(skb) < grec_size(pmc, type, gdeleted, sdeleted)) {
 432			if (skb)
 433				igmpv3_sendpack(skb);
 434			skb = igmpv3_newpack(dev, dev->mtu);
 435		}
 436	}
 437	first = 1;
 438	psf_prev = NULL;
 439	for (psf=*psf_list; psf; psf=psf_next) {
 440		__be32 *psrc;
 441
 442		psf_next = psf->sf_next;
 443
 444		if (!is_in(pmc, psf, type, gdeleted, sdeleted)) {
 445			psf_prev = psf;
 446			continue;
 447		}
 448
 449		/* clear marks on query responses */
 450		if (isquery)
 451			psf->sf_gsresp = 0;
 452
 453		if (AVAILABLE(skb) < sizeof(__be32) +
 454		    first*sizeof(struct igmpv3_grec)) {
 455			if (truncate && !first)
 456				break;	 /* truncate these */
 457			if (pgr)
 458				pgr->grec_nsrcs = htons(scount);
 459			if (skb)
 460				igmpv3_sendpack(skb);
 461			skb = igmpv3_newpack(dev, dev->mtu);
 462			first = 1;
 463			scount = 0;
 464		}
 465		if (first) {
 466			skb = add_grhead(skb, pmc, type, &pgr);
 467			first = 0;
 468		}
 469		if (!skb)
 470			return NULL;
 471		psrc = (__be32 *)skb_put(skb, sizeof(__be32));
 472		*psrc = psf->sf_inaddr;
 473		scount++; stotal++;
 474		if ((type == IGMPV3_ALLOW_NEW_SOURCES ||
 475		     type == IGMPV3_BLOCK_OLD_SOURCES) && psf->sf_crcount) {
 476			psf->sf_crcount--;
 477			if ((sdeleted || gdeleted) && psf->sf_crcount == 0) {
 478				if (psf_prev)
 479					psf_prev->sf_next = psf->sf_next;
 480				else
 481					*psf_list = psf->sf_next;
 482				kfree(psf);
 483				continue;
 484			}
 485		}
 486		psf_prev = psf;
 487	}
 488
 489empty_source:
 490	if (!stotal) {
 491		if (type == IGMPV3_ALLOW_NEW_SOURCES ||
 492		    type == IGMPV3_BLOCK_OLD_SOURCES)
 493			return skb;
 494		if (pmc->crcount || isquery) {
 495			/* make sure we have room for group header */
 496			if (skb && AVAILABLE(skb)<sizeof(struct igmpv3_grec)) {
 497				igmpv3_sendpack(skb);
 498				skb = NULL; /* add_grhead will get a new one */
 499			}
 500			skb = add_grhead(skb, pmc, type, &pgr);
 501		}
 502	}
 503	if (pgr)
 504		pgr->grec_nsrcs = htons(scount);
 505
 506	if (isquery)
 507		pmc->gsquery = 0;	/* clear query state on report */
 508	return skb;
 509}
 510
 511static int igmpv3_send_report(struct in_device *in_dev, struct ip_mc_list *pmc)
 512{
 513	struct sk_buff *skb = NULL;
 514	int type;
 515
 516	if (!pmc) {
 517		rcu_read_lock();
 518		for_each_pmc_rcu(in_dev, pmc) {
 519			if (pmc->multiaddr == IGMP_ALL_HOSTS)
 520				continue;
 521			spin_lock_bh(&pmc->lock);
 522			if (pmc->sfcount[MCAST_EXCLUDE])
 523				type = IGMPV3_MODE_IS_EXCLUDE;
 524			else
 525				type = IGMPV3_MODE_IS_INCLUDE;
 526			skb = add_grec(skb, pmc, type, 0, 0);
 527			spin_unlock_bh(&pmc->lock);
 528		}
 529		rcu_read_unlock();
 530	} else {
 531		spin_lock_bh(&pmc->lock);
 532		if (pmc->sfcount[MCAST_EXCLUDE])
 533			type = IGMPV3_MODE_IS_EXCLUDE;
 534		else
 535			type = IGMPV3_MODE_IS_INCLUDE;
 536		skb = add_grec(skb, pmc, type, 0, 0);
 537		spin_unlock_bh(&pmc->lock);
 538	}
 539	if (!skb)
 540		return 0;
 541	return igmpv3_sendpack(skb);
 542}
 543
 544/*
 545 * remove zero-count source records from a source filter list
 546 */
 547static void igmpv3_clear_zeros(struct ip_sf_list **ppsf)
 548{
 549	struct ip_sf_list *psf_prev, *psf_next, *psf;
 550
 551	psf_prev = NULL;
 552	for (psf=*ppsf; psf; psf = psf_next) {
 553		psf_next = psf->sf_next;
 554		if (psf->sf_crcount == 0) {
 555			if (psf_prev)
 556				psf_prev->sf_next = psf->sf_next;
 557			else
 558				*ppsf = psf->sf_next;
 559			kfree(psf);
 560		} else
 561			psf_prev = psf;
 562	}
 563}
 564
 565static void igmpv3_send_cr(struct in_device *in_dev)
 566{
 567	struct ip_mc_list *pmc, *pmc_prev, *pmc_next;
 568	struct sk_buff *skb = NULL;
 569	int type, dtype;
 570
 571	rcu_read_lock();
 572	spin_lock_bh(&in_dev->mc_tomb_lock);
 573
 574	/* deleted MCA's */
 575	pmc_prev = NULL;
 576	for (pmc=in_dev->mc_tomb; pmc; pmc=pmc_next) {
 577		pmc_next = pmc->next;
 578		if (pmc->sfmode == MCAST_INCLUDE) {
 579			type = IGMPV3_BLOCK_OLD_SOURCES;
 580			dtype = IGMPV3_BLOCK_OLD_SOURCES;
 581			skb = add_grec(skb, pmc, type, 1, 0);
 582			skb = add_grec(skb, pmc, dtype, 1, 1);
 583		}
 584		if (pmc->crcount) {
 585			if (pmc->sfmode == MCAST_EXCLUDE) {
 586				type = IGMPV3_CHANGE_TO_INCLUDE;
 587				skb = add_grec(skb, pmc, type, 1, 0);
 588			}
 589			pmc->crcount--;
 590			if (pmc->crcount == 0) {
 591				igmpv3_clear_zeros(&pmc->tomb);
 592				igmpv3_clear_zeros(&pmc->sources);
 593			}
 594		}
 595		if (pmc->crcount == 0 && !pmc->tomb && !pmc->sources) {
 596			if (pmc_prev)
 597				pmc_prev->next = pmc_next;
 598			else
 599				in_dev->mc_tomb = pmc_next;
 600			in_dev_put(pmc->interface);
 601			kfree(pmc);
 602		} else
 603			pmc_prev = pmc;
 604	}
 605	spin_unlock_bh(&in_dev->mc_tomb_lock);
 606
 607	/* change recs */
 608	for_each_pmc_rcu(in_dev, pmc) {
 609		spin_lock_bh(&pmc->lock);
 610		if (pmc->sfcount[MCAST_EXCLUDE]) {
 611			type = IGMPV3_BLOCK_OLD_SOURCES;
 612			dtype = IGMPV3_ALLOW_NEW_SOURCES;
 613		} else {
 614			type = IGMPV3_ALLOW_NEW_SOURCES;
 615			dtype = IGMPV3_BLOCK_OLD_SOURCES;
 616		}
 617		skb = add_grec(skb, pmc, type, 0, 0);
 618		skb = add_grec(skb, pmc, dtype, 0, 1);	/* deleted sources */
 619
 620		/* filter mode changes */
 621		if (pmc->crcount) {
 622			if (pmc->sfmode == MCAST_EXCLUDE)
 623				type = IGMPV3_CHANGE_TO_EXCLUDE;
 624			else
 625				type = IGMPV3_CHANGE_TO_INCLUDE;
 626			skb = add_grec(skb, pmc, type, 0, 0);
 627			pmc->crcount--;
 628		}
 629		spin_unlock_bh(&pmc->lock);
 630	}
 631	rcu_read_unlock();
 632
 633	if (!skb)
 634		return;
 635	(void) igmpv3_sendpack(skb);
 636}
 637
 638static int igmp_send_report(struct in_device *in_dev, struct ip_mc_list *pmc,
 639	int type)
 640{
 641	struct sk_buff *skb;
 642	struct iphdr *iph;
 643	struct igmphdr *ih;
 644	struct rtable *rt;
 645	struct net_device *dev = in_dev->dev;
 646	struct net *net = dev_net(dev);
 647	__be32	group = pmc ? pmc->multiaddr : 0;
 648	struct flowi4 fl4;
 649	__be32	dst;
 
 650
 651	if (type == IGMPV3_HOST_MEMBERSHIP_REPORT)
 652		return igmpv3_send_report(in_dev, pmc);
 653	else if (type == IGMP_HOST_LEAVE_MESSAGE)
 654		dst = IGMP_ALL_ROUTER;
 655	else
 656		dst = group;
 657
 658	rt = ip_route_output_ports(net, &fl4, NULL, dst, 0,
 659				   0, 0,
 660				   IPPROTO_IGMP, 0, dev->ifindex);
 661	if (IS_ERR(rt))
 662		return -1;
 663
 664	skb = alloc_skb(IGMP_SIZE+LL_ALLOCATED_SPACE(dev), GFP_ATOMIC);
 
 
 665	if (skb == NULL) {
 666		ip_rt_put(rt);
 667		return -1;
 668	}
 669
 670	skb_dst_set(skb, &rt->dst);
 671
 672	skb_reserve(skb, LL_RESERVED_SPACE(dev));
 673
 674	skb_reset_network_header(skb);
 675	iph = ip_hdr(skb);
 676	skb_put(skb, sizeof(struct iphdr) + 4);
 677
 678	iph->version  = 4;
 679	iph->ihl      = (sizeof(struct iphdr)+4)>>2;
 680	iph->tos      = 0xc0;
 681	iph->frag_off = htons(IP_DF);
 682	iph->ttl      = 1;
 683	iph->daddr    = dst;
 684	iph->saddr    = fl4.saddr;
 685	iph->protocol = IPPROTO_IGMP;
 686	ip_select_ident(iph, &rt->dst, NULL);
 687	((u8*)&iph[1])[0] = IPOPT_RA;
 688	((u8*)&iph[1])[1] = 4;
 689	((u8*)&iph[1])[2] = 0;
 690	((u8*)&iph[1])[3] = 0;
 691
 692	ih = (struct igmphdr *)skb_put(skb, sizeof(struct igmphdr));
 693	ih->type = type;
 694	ih->code = 0;
 695	ih->csum = 0;
 696	ih->group = group;
 697	ih->csum = ip_compute_csum((void *)ih, sizeof(struct igmphdr));
 698
 699	return ip_local_out(skb);
 700}
 701
 702static void igmp_gq_timer_expire(unsigned long data)
 703{
 704	struct in_device *in_dev = (struct in_device *)data;
 705
 706	in_dev->mr_gq_running = 0;
 707	igmpv3_send_report(in_dev, NULL);
 708	__in_dev_put(in_dev);
 709}
 710
 711static void igmp_ifc_timer_expire(unsigned long data)
 712{
 713	struct in_device *in_dev = (struct in_device *)data;
 714
 715	igmpv3_send_cr(in_dev);
 716	if (in_dev->mr_ifc_count) {
 717		in_dev->mr_ifc_count--;
 718		igmp_ifc_start_timer(in_dev, IGMP_Unsolicited_Report_Interval);
 719	}
 720	__in_dev_put(in_dev);
 721}
 722
 723static void igmp_ifc_event(struct in_device *in_dev)
 724{
 725	if (IGMP_V1_SEEN(in_dev) || IGMP_V2_SEEN(in_dev))
 726		return;
 727	in_dev->mr_ifc_count = in_dev->mr_qrv ? in_dev->mr_qrv :
 728		IGMP_Unsolicited_Report_Count;
 729	igmp_ifc_start_timer(in_dev, 1);
 730}
 731
 732
 733static void igmp_timer_expire(unsigned long data)
 734{
 735	struct ip_mc_list *im=(struct ip_mc_list *)data;
 736	struct in_device *in_dev = im->interface;
 737
 738	spin_lock(&im->lock);
 739	im->tm_running = 0;
 740
 741	if (im->unsolicit_count) {
 742		im->unsolicit_count--;
 743		igmp_start_timer(im, IGMP_Unsolicited_Report_Interval);
 744	}
 745	im->reporter = 1;
 746	spin_unlock(&im->lock);
 747
 748	if (IGMP_V1_SEEN(in_dev))
 749		igmp_send_report(in_dev, im, IGMP_HOST_MEMBERSHIP_REPORT);
 750	else if (IGMP_V2_SEEN(in_dev))
 751		igmp_send_report(in_dev, im, IGMPV2_HOST_MEMBERSHIP_REPORT);
 752	else
 753		igmp_send_report(in_dev, im, IGMPV3_HOST_MEMBERSHIP_REPORT);
 754
 755	ip_ma_put(im);
 756}
 757
 758/* mark EXCLUDE-mode sources */
 759static int igmp_xmarksources(struct ip_mc_list *pmc, int nsrcs, __be32 *srcs)
 760{
 761	struct ip_sf_list *psf;
 762	int i, scount;
 763
 764	scount = 0;
 765	for (psf=pmc->sources; psf; psf=psf->sf_next) {
 766		if (scount == nsrcs)
 767			break;
 768		for (i=0; i<nsrcs; i++) {
 769			/* skip inactive filters */
 770			if (psf->sf_count[MCAST_INCLUDE] ||
 771			    pmc->sfcount[MCAST_EXCLUDE] !=
 772			    psf->sf_count[MCAST_EXCLUDE])
 773				continue;
 774			if (srcs[i] == psf->sf_inaddr) {
 775				scount++;
 776				break;
 777			}
 778		}
 779	}
 780	pmc->gsquery = 0;
 781	if (scount == nsrcs)	/* all sources excluded */
 782		return 0;
 783	return 1;
 784}
 785
 786static int igmp_marksources(struct ip_mc_list *pmc, int nsrcs, __be32 *srcs)
 787{
 788	struct ip_sf_list *psf;
 789	int i, scount;
 790
 791	if (pmc->sfmode == MCAST_EXCLUDE)
 792		return igmp_xmarksources(pmc, nsrcs, srcs);
 793
 794	/* mark INCLUDE-mode sources */
 795	scount = 0;
 796	for (psf=pmc->sources; psf; psf=psf->sf_next) {
 797		if (scount == nsrcs)
 798			break;
 799		for (i=0; i<nsrcs; i++)
 800			if (srcs[i] == psf->sf_inaddr) {
 801				psf->sf_gsresp = 1;
 802				scount++;
 803				break;
 804			}
 805	}
 806	if (!scount) {
 807		pmc->gsquery = 0;
 808		return 0;
 809	}
 810	pmc->gsquery = 1;
 811	return 1;
 812}
 813
 814static void igmp_heard_report(struct in_device *in_dev, __be32 group)
 815{
 816	struct ip_mc_list *im;
 817
 818	/* Timers are only set for non-local groups */
 819
 820	if (group == IGMP_ALL_HOSTS)
 821		return;
 822
 823	rcu_read_lock();
 824	for_each_pmc_rcu(in_dev, im) {
 825		if (im->multiaddr == group) {
 826			igmp_stop_timer(im);
 827			break;
 828		}
 829	}
 830	rcu_read_unlock();
 831}
 832
 833static void igmp_heard_query(struct in_device *in_dev, struct sk_buff *skb,
 834	int len)
 835{
 836	struct igmphdr 		*ih = igmp_hdr(skb);
 837	struct igmpv3_query *ih3 = igmpv3_query_hdr(skb);
 838	struct ip_mc_list	*im;
 839	__be32			group = ih->group;
 840	int			max_delay;
 841	int			mark = 0;
 842
 843
 844	if (len == 8) {
 845		if (ih->code == 0) {
 846			/* Alas, old v1 router presents here. */
 847
 848			max_delay = IGMP_Query_Response_Interval;
 849			in_dev->mr_v1_seen = jiffies +
 850				IGMP_V1_Router_Present_Timeout;
 851			group = 0;
 852		} else {
 853			/* v2 router present */
 854			max_delay = ih->code*(HZ/IGMP_TIMER_SCALE);
 855			in_dev->mr_v2_seen = jiffies +
 856				IGMP_V2_Router_Present_Timeout;
 857		}
 858		/* cancel the interface change timer */
 859		in_dev->mr_ifc_count = 0;
 860		if (del_timer(&in_dev->mr_ifc_timer))
 861			__in_dev_put(in_dev);
 862		/* clear deleted report items */
 863		igmpv3_clear_delrec(in_dev);
 864	} else if (len < 12) {
 865		return;	/* ignore bogus packet; freed by caller */
 866	} else if (IGMP_V1_SEEN(in_dev)) {
 867		/* This is a v3 query with v1 queriers present */
 868		max_delay = IGMP_Query_Response_Interval;
 869		group = 0;
 870	} else if (IGMP_V2_SEEN(in_dev)) {
 871		/* this is a v3 query with v2 queriers present;
 872		 * Interpretation of the max_delay code is problematic here.
 873		 * A real v2 host would use ih_code directly, while v3 has a
 874		 * different encoding. We use the v3 encoding as more likely
 875		 * to be intended in a v3 query.
 876		 */
 877		max_delay = IGMPV3_MRC(ih3->code)*(HZ/IGMP_TIMER_SCALE);
 
 
 878	} else { /* v3 */
 879		if (!pskb_may_pull(skb, sizeof(struct igmpv3_query)))
 880			return;
 881
 882		ih3 = igmpv3_query_hdr(skb);
 883		if (ih3->nsrcs) {
 884			if (!pskb_may_pull(skb, sizeof(struct igmpv3_query)
 885					   + ntohs(ih3->nsrcs)*sizeof(__be32)))
 886				return;
 887			ih3 = igmpv3_query_hdr(skb);
 888		}
 889
 890		max_delay = IGMPV3_MRC(ih3->code)*(HZ/IGMP_TIMER_SCALE);
 891		if (!max_delay)
 892			max_delay = 1;	/* can't mod w/ 0 */
 893		in_dev->mr_maxdelay = max_delay;
 894		if (ih3->qrv)
 895			in_dev->mr_qrv = ih3->qrv;
 896		if (!group) { /* general query */
 897			if (ih3->nsrcs)
 898				return;	/* no sources allowed */
 899			igmp_gq_start_timer(in_dev);
 900			return;
 901		}
 902		/* mark sources to include, if group & source-specific */
 903		mark = ih3->nsrcs != 0;
 904	}
 905
 906	/*
 907	 * - Start the timers in all of our membership records
 908	 *   that the query applies to for the interface on
 909	 *   which the query arrived excl. those that belong
 910	 *   to a "local" group (224.0.0.X)
 911	 * - For timers already running check if they need to
 912	 *   be reset.
 913	 * - Use the igmp->igmp_code field as the maximum
 914	 *   delay possible
 915	 */
 916	rcu_read_lock();
 917	for_each_pmc_rcu(in_dev, im) {
 918		int changed;
 919
 920		if (group && group != im->multiaddr)
 921			continue;
 922		if (im->multiaddr == IGMP_ALL_HOSTS)
 923			continue;
 924		spin_lock_bh(&im->lock);
 925		if (im->tm_running)
 926			im->gsquery = im->gsquery && mark;
 927		else
 928			im->gsquery = mark;
 929		changed = !im->gsquery ||
 930			igmp_marksources(im, ntohs(ih3->nsrcs), ih3->srcs);
 931		spin_unlock_bh(&im->lock);
 932		if (changed)
 933			igmp_mod_timer(im, max_delay);
 934	}
 935	rcu_read_unlock();
 936}
 937
 938/* called in rcu_read_lock() section */
 939int igmp_rcv(struct sk_buff *skb)
 940{
 941	/* This basically follows the spec line by line -- see RFC1112 */
 942	struct igmphdr *ih;
 943	struct in_device *in_dev = __in_dev_get_rcu(skb->dev);
 944	int len = skb->len;
 945
 946	if (in_dev == NULL)
 947		goto drop;
 948
 949	if (!pskb_may_pull(skb, sizeof(struct igmphdr)))
 950		goto drop;
 951
 952	switch (skb->ip_summed) {
 953	case CHECKSUM_COMPLETE:
 954		if (!csum_fold(skb->csum))
 955			break;
 956		/* fall through */
 957	case CHECKSUM_NONE:
 958		skb->csum = 0;
 959		if (__skb_checksum_complete(skb))
 960			goto drop;
 961	}
 962
 963	ih = igmp_hdr(skb);
 964	switch (ih->type) {
 965	case IGMP_HOST_MEMBERSHIP_QUERY:
 966		igmp_heard_query(in_dev, skb, len);
 967		break;
 968	case IGMP_HOST_MEMBERSHIP_REPORT:
 969	case IGMPV2_HOST_MEMBERSHIP_REPORT:
 970		/* Is it our report looped back? */
 971		if (rt_is_output_route(skb_rtable(skb)))
 972			break;
 973		/* don't rely on MC router hearing unicast reports */
 974		if (skb->pkt_type == PACKET_MULTICAST ||
 975		    skb->pkt_type == PACKET_BROADCAST)
 976			igmp_heard_report(in_dev, ih->group);
 977		break;
 978	case IGMP_PIM:
 979#ifdef CONFIG_IP_PIMSM_V1
 980		return pim_rcv_v1(skb);
 981#endif
 982	case IGMPV3_HOST_MEMBERSHIP_REPORT:
 983	case IGMP_DVMRP:
 984	case IGMP_TRACE:
 985	case IGMP_HOST_LEAVE_MESSAGE:
 986	case IGMP_MTRACE:
 987	case IGMP_MTRACE_RESP:
 988		break;
 989	default:
 990		break;
 991	}
 992
 993drop:
 994	kfree_skb(skb);
 995	return 0;
 996}
 997
 998#endif
 999
1000
1001/*
1002 *	Add a filter to a device
1003 */
1004
1005static void ip_mc_filter_add(struct in_device *in_dev, __be32 addr)
1006{
1007	char buf[MAX_ADDR_LEN];
1008	struct net_device *dev = in_dev->dev;
1009
1010	/* Checking for IFF_MULTICAST here is WRONG-WRONG-WRONG.
1011	   We will get multicast token leakage, when IFF_MULTICAST
1012	   is changed. This check should be done in dev->set_multicast_list
1013	   routine. Something sort of:
1014	   if (dev->mc_list && dev->flags&IFF_MULTICAST) { do it; }
1015	   --ANK
1016	   */
1017	if (arp_mc_map(addr, buf, dev, 0) == 0)
1018		dev_mc_add(dev, buf);
1019}
1020
1021/*
1022 *	Remove a filter from a device
1023 */
1024
1025static void ip_mc_filter_del(struct in_device *in_dev, __be32 addr)
1026{
1027	char buf[MAX_ADDR_LEN];
1028	struct net_device *dev = in_dev->dev;
1029
1030	if (arp_mc_map(addr, buf, dev, 0) == 0)
1031		dev_mc_del(dev, buf);
1032}
1033
1034#ifdef CONFIG_IP_MULTICAST
1035/*
1036 * deleted ip_mc_list manipulation
1037 */
1038static void igmpv3_add_delrec(struct in_device *in_dev, struct ip_mc_list *im)
1039{
1040	struct ip_mc_list *pmc;
1041
1042	/* this is an "ip_mc_list" for convenience; only the fields below
1043	 * are actually used. In particular, the refcnt and users are not
1044	 * used for management of the delete list. Using the same structure
1045	 * for deleted items allows change reports to use common code with
1046	 * non-deleted or query-response MCA's.
1047	 */
1048	pmc = kzalloc(sizeof(*pmc), GFP_KERNEL);
1049	if (!pmc)
1050		return;
1051	spin_lock_bh(&im->lock);
1052	pmc->interface = im->interface;
1053	in_dev_hold(in_dev);
1054	pmc->multiaddr = im->multiaddr;
1055	pmc->crcount = in_dev->mr_qrv ? in_dev->mr_qrv :
1056		IGMP_Unsolicited_Report_Count;
1057	pmc->sfmode = im->sfmode;
1058	if (pmc->sfmode == MCAST_INCLUDE) {
1059		struct ip_sf_list *psf;
1060
1061		pmc->tomb = im->tomb;
1062		pmc->sources = im->sources;
1063		im->tomb = im->sources = NULL;
1064		for (psf=pmc->sources; psf; psf=psf->sf_next)
1065			psf->sf_crcount = pmc->crcount;
1066	}
1067	spin_unlock_bh(&im->lock);
1068
1069	spin_lock_bh(&in_dev->mc_tomb_lock);
1070	pmc->next = in_dev->mc_tomb;
1071	in_dev->mc_tomb = pmc;
1072	spin_unlock_bh(&in_dev->mc_tomb_lock);
1073}
1074
1075static void igmpv3_del_delrec(struct in_device *in_dev, __be32 multiaddr)
1076{
1077	struct ip_mc_list *pmc, *pmc_prev;
1078	struct ip_sf_list *psf, *psf_next;
1079
1080	spin_lock_bh(&in_dev->mc_tomb_lock);
1081	pmc_prev = NULL;
1082	for (pmc=in_dev->mc_tomb; pmc; pmc=pmc->next) {
1083		if (pmc->multiaddr == multiaddr)
1084			break;
1085		pmc_prev = pmc;
1086	}
1087	if (pmc) {
1088		if (pmc_prev)
1089			pmc_prev->next = pmc->next;
1090		else
1091			in_dev->mc_tomb = pmc->next;
1092	}
1093	spin_unlock_bh(&in_dev->mc_tomb_lock);
1094	if (pmc) {
1095		for (psf=pmc->tomb; psf; psf=psf_next) {
1096			psf_next = psf->sf_next;
1097			kfree(psf);
1098		}
1099		in_dev_put(pmc->interface);
1100		kfree(pmc);
1101	}
1102}
1103
1104static void igmpv3_clear_delrec(struct in_device *in_dev)
1105{
1106	struct ip_mc_list *pmc, *nextpmc;
1107
1108	spin_lock_bh(&in_dev->mc_tomb_lock);
1109	pmc = in_dev->mc_tomb;
1110	in_dev->mc_tomb = NULL;
1111	spin_unlock_bh(&in_dev->mc_tomb_lock);
1112
1113	for (; pmc; pmc = nextpmc) {
1114		nextpmc = pmc->next;
1115		ip_mc_clear_src(pmc);
1116		in_dev_put(pmc->interface);
1117		kfree(pmc);
1118	}
1119	/* clear dead sources, too */
1120	rcu_read_lock();
1121	for_each_pmc_rcu(in_dev, pmc) {
1122		struct ip_sf_list *psf, *psf_next;
1123
1124		spin_lock_bh(&pmc->lock);
1125		psf = pmc->tomb;
1126		pmc->tomb = NULL;
1127		spin_unlock_bh(&pmc->lock);
1128		for (; psf; psf=psf_next) {
1129			psf_next = psf->sf_next;
1130			kfree(psf);
1131		}
1132	}
1133	rcu_read_unlock();
1134}
1135#endif
1136
1137static void igmp_group_dropped(struct ip_mc_list *im)
1138{
1139	struct in_device *in_dev = im->interface;
1140#ifdef CONFIG_IP_MULTICAST
1141	int reporter;
1142#endif
1143
1144	if (im->loaded) {
1145		im->loaded = 0;
1146		ip_mc_filter_del(in_dev, im->multiaddr);
1147	}
1148
1149#ifdef CONFIG_IP_MULTICAST
1150	if (im->multiaddr == IGMP_ALL_HOSTS)
1151		return;
1152
1153	reporter = im->reporter;
1154	igmp_stop_timer(im);
1155
1156	if (!in_dev->dead) {
1157		if (IGMP_V1_SEEN(in_dev))
1158			return;
1159		if (IGMP_V2_SEEN(in_dev)) {
1160			if (reporter)
1161				igmp_send_report(in_dev, im, IGMP_HOST_LEAVE_MESSAGE);
1162			return;
1163		}
1164		/* IGMPv3 */
1165		igmpv3_add_delrec(in_dev, im);
1166
1167		igmp_ifc_event(in_dev);
1168	}
1169#endif
1170}
1171
1172static void igmp_group_added(struct ip_mc_list *im)
1173{
1174	struct in_device *in_dev = im->interface;
1175
1176	if (im->loaded == 0) {
1177		im->loaded = 1;
1178		ip_mc_filter_add(in_dev, im->multiaddr);
1179	}
1180
1181#ifdef CONFIG_IP_MULTICAST
1182	if (im->multiaddr == IGMP_ALL_HOSTS)
1183		return;
1184
1185	if (in_dev->dead)
1186		return;
1187	if (IGMP_V1_SEEN(in_dev) || IGMP_V2_SEEN(in_dev)) {
1188		spin_lock_bh(&im->lock);
1189		igmp_start_timer(im, IGMP_Initial_Report_Delay);
1190		spin_unlock_bh(&im->lock);
1191		return;
1192	}
1193	/* else, v3 */
1194
1195	im->crcount = in_dev->mr_qrv ? in_dev->mr_qrv :
1196		IGMP_Unsolicited_Report_Count;
1197	igmp_ifc_event(in_dev);
1198#endif
1199}
1200
1201
1202/*
1203 *	Multicast list managers
1204 */
1205
1206
1207/*
1208 *	A socket has joined a multicast group on device dev.
1209 */
1210
1211void ip_mc_inc_group(struct in_device *in_dev, __be32 addr)
1212{
1213	struct ip_mc_list *im;
1214
1215	ASSERT_RTNL();
1216
1217	for_each_pmc_rtnl(in_dev, im) {
1218		if (im->multiaddr == addr) {
1219			im->users++;
1220			ip_mc_add_src(in_dev, &addr, MCAST_EXCLUDE, 0, NULL, 0);
1221			goto out;
1222		}
1223	}
1224
1225	im = kzalloc(sizeof(*im), GFP_KERNEL);
1226	if (!im)
1227		goto out;
1228
1229	im->users = 1;
1230	im->interface = in_dev;
1231	in_dev_hold(in_dev);
1232	im->multiaddr = addr;
1233	/* initial mode is (EX, empty) */
1234	im->sfmode = MCAST_EXCLUDE;
1235	im->sfcount[MCAST_EXCLUDE] = 1;
1236	atomic_set(&im->refcnt, 1);
1237	spin_lock_init(&im->lock);
1238#ifdef CONFIG_IP_MULTICAST
1239	setup_timer(&im->timer, &igmp_timer_expire, (unsigned long)im);
1240	im->unsolicit_count = IGMP_Unsolicited_Report_Count;
1241#endif
1242
1243	im->next_rcu = in_dev->mc_list;
1244	in_dev->mc_count++;
1245	rcu_assign_pointer(in_dev->mc_list, im);
1246
1247#ifdef CONFIG_IP_MULTICAST
1248	igmpv3_del_delrec(in_dev, im->multiaddr);
1249#endif
1250	igmp_group_added(im);
1251	if (!in_dev->dead)
1252		ip_rt_multicast_event(in_dev);
1253out:
1254	return;
1255}
1256EXPORT_SYMBOL(ip_mc_inc_group);
1257
1258/*
1259 *	Resend IGMP JOIN report; used for bonding.
1260 *	Called with rcu_read_lock()
1261 */
/*
 * Send a membership report for every group on @in_dev except
 * IGMP_ALL_HOSTS, using the report type that matches the IGMP version
 * currently seen on the interface. Compiles to an empty function
 * without CONFIG_IP_MULTICAST.
 */
void ip_mc_rejoin_groups(struct in_device *in_dev)
{
#ifdef CONFIG_IP_MULTICAST
	struct ip_mc_list *grp;
	int type;

	for_each_pmc_rcu(in_dev, grp) {
		if (grp->multiaddr != IGMP_ALL_HOSTS) {
			/* a failover is in progress, so the switches
			 * have to be told right away
			 */
			if (IGMP_V1_SEEN(in_dev)) {
				type = IGMP_HOST_MEMBERSHIP_REPORT;
			} else if (IGMP_V2_SEEN(in_dev)) {
				type = IGMPV2_HOST_MEMBERSHIP_REPORT;
			} else {
				type = IGMPV3_HOST_MEMBERSHIP_REPORT;
			}
			igmp_send_report(in_dev, grp, type);
		}
	}
#endif
}
1285EXPORT_SYMBOL(ip_mc_rejoin_groups);
1286
1287/*
1288 *	A socket has left a multicast group on device dev
1289 */
1290
1291void ip_mc_dec_group(struct in_device *in_dev, __be32 addr)
1292{
1293	struct ip_mc_list *i;
1294	struct ip_mc_list __rcu **ip;
1295
1296	ASSERT_RTNL();
1297
1298	for (ip = &in_dev->mc_list;
1299	     (i = rtnl_dereference(*ip)) != NULL;
1300	     ip = &i->next_rcu) {
1301		if (i->multiaddr == addr) {
1302			if (--i->users == 0) {
1303				*ip = i->next_rcu;
1304				in_dev->mc_count--;
1305				igmp_group_dropped(i);
1306				ip_mc_clear_src(i);
1307
1308				if (!in_dev->dead)
1309					ip_rt_multicast_event(in_dev);
1310
1311				ip_ma_put(i);
1312				return;
1313			}
1314			break;
1315		}
1316	}
1317}
1318EXPORT_SYMBOL(ip_mc_dec_group);
1319
1320/* Device changing type */
1321
1322void ip_mc_unmap(struct in_device *in_dev)
1323{
1324	struct ip_mc_list *pmc;
1325
1326	ASSERT_RTNL();
1327
1328	for_each_pmc_rtnl(in_dev, pmc)
1329		igmp_group_dropped(pmc);
1330}
1331
1332void ip_mc_remap(struct in_device *in_dev)
1333{
1334	struct ip_mc_list *pmc;
1335
1336	ASSERT_RTNL();
1337
1338	for_each_pmc_rtnl(in_dev, pmc)
1339		igmp_group_added(pmc);
1340}
1341
1342/* Device going down */
1343
1344void ip_mc_down(struct in_device *in_dev)
1345{
1346	struct ip_mc_list *pmc;
1347
1348	ASSERT_RTNL();
1349
1350	for_each_pmc_rtnl(in_dev, pmc)
1351		igmp_group_dropped(pmc);
1352
1353#ifdef CONFIG_IP_MULTICAST
1354	in_dev->mr_ifc_count = 0;
1355	if (del_timer(&in_dev->mr_ifc_timer))
1356		__in_dev_put(in_dev);
1357	in_dev->mr_gq_running = 0;
1358	if (del_timer(&in_dev->mr_gq_timer))
1359		__in_dev_put(in_dev);
1360	igmpv3_clear_delrec(in_dev);
1361#endif
1362
1363	ip_mc_dec_group(in_dev, IGMP_ALL_HOSTS);
1364}
1365
1366void ip_mc_init_dev(struct in_device *in_dev)
1367{
1368	ASSERT_RTNL();
1369
1370	in_dev->mc_tomb = NULL;
1371#ifdef CONFIG_IP_MULTICAST
1372	in_dev->mr_gq_running = 0;
1373	setup_timer(&in_dev->mr_gq_timer, igmp_gq_timer_expire,
1374			(unsigned long)in_dev);
1375	in_dev->mr_ifc_count = 0;
1376	in_dev->mc_count     = 0;
1377	setup_timer(&in_dev->mr_ifc_timer, igmp_ifc_timer_expire,
1378			(unsigned long)in_dev);
1379	in_dev->mr_qrv = IGMP_Unsolicited_Report_Count;
1380#endif
1381
1382	spin_lock_init(&in_dev->mc_tomb_lock);
1383}
1384
1385/* Device going up */
1386
1387void ip_mc_up(struct in_device *in_dev)
1388{
1389	struct ip_mc_list *pmc;
1390
1391	ASSERT_RTNL();
1392
1393	ip_mc_inc_group(in_dev, IGMP_ALL_HOSTS);
1394
1395	for_each_pmc_rtnl(in_dev, pmc)
1396		igmp_group_added(pmc);
1397}
1398
1399/*
1400 *	Device is about to be destroyed: clean up.
1401 */
1402
1403void ip_mc_destroy_dev(struct in_device *in_dev)
1404{
1405	struct ip_mc_list *i;
1406
1407	ASSERT_RTNL();
1408
1409	/* Deactivate timers */
1410	ip_mc_down(in_dev);
1411
1412	while ((i = rtnl_dereference(in_dev->mc_list)) != NULL) {
1413		in_dev->mc_list = i->next_rcu;
1414		in_dev->mc_count--;
1415
1416		/* We've dropped the groups in ip_mc_down already */
1417		ip_mc_clear_src(i);
1418		ip_ma_put(i);
1419	}
1420}
1421
1422/* RTNL is locked */
1423static struct in_device *ip_mc_find_dev(struct net *net, struct ip_mreqn *imr)
1424{
1425	struct net_device *dev = NULL;
1426	struct in_device *idev = NULL;
1427
1428	if (imr->imr_ifindex) {
1429		idev = inetdev_by_index(net, imr->imr_ifindex);
1430		return idev;
1431	}
1432	if (imr->imr_address.s_addr) {
1433		dev = __ip_dev_find(net, imr->imr_address.s_addr, false);
1434		if (!dev)
1435			return NULL;
1436	}
1437
1438	if (!dev) {
1439		struct rtable *rt = ip_route_output(net,
1440						    imr->imr_multiaddr.s_addr,
1441						    0, 0, 0);
1442		if (!IS_ERR(rt)) {
1443			dev = rt->dst.dev;
1444			ip_rt_put(rt);
1445		}
1446	}
1447	if (dev) {
1448		imr->imr_ifindex = dev->ifindex;
1449		idev = __in_dev_get_rtnl(dev);
1450	}
1451	return idev;
1452}
1453
1454/*
1455 *	Join a socket to a group
1456 */
/* Limit on a socket's group memberships: ip_mc_join_group() fails with
 * -ENOBUFS once the socket's membership count has reached this value.
 */
1457int sysctl_igmp_max_memberships __read_mostly = IP_MAX_MEMBERSHIPS;
/* Limit on a membership's source-filter entries: ip_mc_source() fails
 * with -ENOBUFS when adding a source to a list that already holds this
 * many entries.
 */
1458int sysctl_igmp_max_msf __read_mostly = IP_MAX_MSF;
1459
1460
1461static int ip_mc_del1_src(struct ip_mc_list *pmc, int sfmode,
1462	__be32 *psfsrc)
1463{
1464	struct ip_sf_list *psf, *psf_prev;
1465	int rv = 0;
1466
1467	psf_prev = NULL;
1468	for (psf=pmc->sources; psf; psf=psf->sf_next) {
1469		if (psf->sf_inaddr == *psfsrc)
1470			break;
1471		psf_prev = psf;
1472	}
1473	if (!psf || psf->sf_count[sfmode] == 0) {
1474		/* source filter not found, or count wrong =>  bug */
1475		return -ESRCH;
1476	}
1477	psf->sf_count[sfmode]--;
1478	if (psf->sf_count[sfmode] == 0) {
1479		ip_rt_multicast_event(pmc->interface);
1480	}
1481	if (!psf->sf_count[MCAST_INCLUDE] && !psf->sf_count[MCAST_EXCLUDE]) {
1482#ifdef CONFIG_IP_MULTICAST
1483		struct in_device *in_dev = pmc->interface;
1484#endif
1485
1486		/* no more filters for this source */
1487		if (psf_prev)
1488			psf_prev->sf_next = psf->sf_next;
1489		else
1490			pmc->sources = psf->sf_next;
1491#ifdef CONFIG_IP_MULTICAST
1492		if (psf->sf_oldin &&
1493		    !IGMP_V1_SEEN(in_dev) && !IGMP_V2_SEEN(in_dev)) {
1494			psf->sf_crcount = in_dev->mr_qrv ? in_dev->mr_qrv :
1495				IGMP_Unsolicited_Report_Count;
1496			psf->sf_next = pmc->tomb;
1497			pmc->tomb = psf;
1498			rv = 1;
1499		} else
1500#endif
1501			kfree(psf);
1502	}
1503	return rv;
1504}
1505
/* When CONFIG_IP_MULTICAST is not set, igmp_ifc_event() expands to an
 * empty statement so the callers below need no #ifdef of their own.
 */
1506#ifndef CONFIG_IP_MULTICAST
1507#define igmp_ifc_event(x)	do { } while (0)
1508#endif
1509
1510static int ip_mc_del_src(struct in_device *in_dev, __be32 *pmca, int sfmode,
1511			 int sfcount, __be32 *psfsrc, int delta)
1512{
1513	struct ip_mc_list *pmc;
1514	int	changerec = 0;
1515	int	i, err;
1516
1517	if (!in_dev)
1518		return -ENODEV;
1519	rcu_read_lock();
1520	for_each_pmc_rcu(in_dev, pmc) {
1521		if (*pmca == pmc->multiaddr)
1522			break;
1523	}
1524	if (!pmc) {
1525		/* MCA not found?? bug */
1526		rcu_read_unlock();
1527		return -ESRCH;
1528	}
1529	spin_lock_bh(&pmc->lock);
1530	rcu_read_unlock();
1531#ifdef CONFIG_IP_MULTICAST
1532	sf_markstate(pmc);
1533#endif
1534	if (!delta) {
1535		err = -EINVAL;
1536		if (!pmc->sfcount[sfmode])
1537			goto out_unlock;
1538		pmc->sfcount[sfmode]--;
1539	}
1540	err = 0;
1541	for (i=0; i<sfcount; i++) {
1542		int rv = ip_mc_del1_src(pmc, sfmode, &psfsrc[i]);
1543
1544		changerec |= rv > 0;
1545		if (!err && rv < 0)
1546			err = rv;
1547	}
1548	if (pmc->sfmode == MCAST_EXCLUDE &&
1549	    pmc->sfcount[MCAST_EXCLUDE] == 0 &&
1550	    pmc->sfcount[MCAST_INCLUDE]) {
1551#ifdef CONFIG_IP_MULTICAST
1552		struct ip_sf_list *psf;
1553#endif
1554
1555		/* filter mode change */
1556		pmc->sfmode = MCAST_INCLUDE;
1557#ifdef CONFIG_IP_MULTICAST
1558		pmc->crcount = in_dev->mr_qrv ? in_dev->mr_qrv :
1559			IGMP_Unsolicited_Report_Count;
1560		in_dev->mr_ifc_count = pmc->crcount;
1561		for (psf=pmc->sources; psf; psf = psf->sf_next)
1562			psf->sf_crcount = 0;
1563		igmp_ifc_event(pmc->interface);
1564	} else if (sf_setstate(pmc) || changerec) {
1565		igmp_ifc_event(pmc->interface);
1566#endif
1567	}
1568out_unlock:
1569	spin_unlock_bh(&pmc->lock);
1570	return err;
1571}
1572
1573/*
1574 * Add multicast single-source filter to the interface list
1575 */
1576static int ip_mc_add1_src(struct ip_mc_list *pmc, int sfmode,
1577	__be32 *psfsrc, int delta)
1578{
1579	struct ip_sf_list *psf, *psf_prev;
1580
1581	psf_prev = NULL;
1582	for (psf=pmc->sources; psf; psf=psf->sf_next) {
1583		if (psf->sf_inaddr == *psfsrc)
1584			break;
1585		psf_prev = psf;
1586	}
1587	if (!psf) {
1588		psf = kzalloc(sizeof(*psf), GFP_ATOMIC);
1589		if (!psf)
1590			return -ENOBUFS;
1591		psf->sf_inaddr = *psfsrc;
1592		if (psf_prev) {
1593			psf_prev->sf_next = psf;
1594		} else
1595			pmc->sources = psf;
1596	}
1597	psf->sf_count[sfmode]++;
1598	if (psf->sf_count[sfmode] == 1) {
1599		ip_rt_multicast_event(pmc->interface);
1600	}
1601	return 0;
1602}
1603
1604#ifdef CONFIG_IP_MULTICAST
1605static void sf_markstate(struct ip_mc_list *pmc)
1606{
1607	struct ip_sf_list *psf;
1608	int mca_xcount = pmc->sfcount[MCAST_EXCLUDE];
1609
1610	for (psf=pmc->sources; psf; psf=psf->sf_next)
1611		if (pmc->sfcount[MCAST_EXCLUDE]) {
1612			psf->sf_oldin = mca_xcount ==
1613				psf->sf_count[MCAST_EXCLUDE] &&
1614				!psf->sf_count[MCAST_INCLUDE];
1615		} else
1616			psf->sf_oldin = psf->sf_count[MCAST_INCLUDE] != 0;
1617}
1618
1619static int sf_setstate(struct ip_mc_list *pmc)
1620{
1621	struct ip_sf_list *psf, *dpsf;
1622	int mca_xcount = pmc->sfcount[MCAST_EXCLUDE];
1623	int qrv = pmc->interface->mr_qrv;
1624	int new_in, rv;
1625
1626	rv = 0;
1627	for (psf=pmc->sources; psf; psf=psf->sf_next) {
1628		if (pmc->sfcount[MCAST_EXCLUDE]) {
1629			new_in = mca_xcount == psf->sf_count[MCAST_EXCLUDE] &&
1630				!psf->sf_count[MCAST_INCLUDE];
1631		} else
1632			new_in = psf->sf_count[MCAST_INCLUDE] != 0;
1633		if (new_in) {
1634			if (!psf->sf_oldin) {
1635				struct ip_sf_list *prev = NULL;
1636
1637				for (dpsf=pmc->tomb; dpsf; dpsf=dpsf->sf_next) {
1638					if (dpsf->sf_inaddr == psf->sf_inaddr)
1639						break;
1640					prev = dpsf;
1641				}
1642				if (dpsf) {
1643					if (prev)
1644						prev->sf_next = dpsf->sf_next;
1645					else
1646						pmc->tomb = dpsf->sf_next;
1647					kfree(dpsf);
1648				}
1649				psf->sf_crcount = qrv;
1650				rv++;
1651			}
1652		} else if (psf->sf_oldin) {
1653
1654			psf->sf_crcount = 0;
1655			/*
1656			 * add or update "delete" records if an active filter
1657			 * is now inactive
1658			 */
1659			for (dpsf=pmc->tomb; dpsf; dpsf=dpsf->sf_next)
1660				if (dpsf->sf_inaddr == psf->sf_inaddr)
1661					break;
1662			if (!dpsf) {
1663				dpsf = kmalloc(sizeof(*dpsf), GFP_ATOMIC);
1664				if (!dpsf)
1665					continue;
1666				*dpsf = *psf;
1667				/* pmc->lock held by callers */
1668				dpsf->sf_next = pmc->tomb;
1669				pmc->tomb = dpsf;
1670			}
1671			dpsf->sf_crcount = qrv;
1672			rv++;
1673		}
1674	}
1675	return rv;
1676}
1677#endif
1678
1679/*
1680 * Add multicast source filter list to the interface list
1681 */
1682static int ip_mc_add_src(struct in_device *in_dev, __be32 *pmca, int sfmode,
1683			 int sfcount, __be32 *psfsrc, int delta)
1684{
1685	struct ip_mc_list *pmc;
1686	int	isexclude;
1687	int	i, err;
1688
1689	if (!in_dev)
1690		return -ENODEV;
1691	rcu_read_lock();
1692	for_each_pmc_rcu(in_dev, pmc) {
1693		if (*pmca == pmc->multiaddr)
1694			break;
1695	}
1696	if (!pmc) {
1697		/* MCA not found?? bug */
1698		rcu_read_unlock();
1699		return -ESRCH;
1700	}
1701	spin_lock_bh(&pmc->lock);
1702	rcu_read_unlock();
1703
1704#ifdef CONFIG_IP_MULTICAST
1705	sf_markstate(pmc);
1706#endif
1707	isexclude = pmc->sfmode == MCAST_EXCLUDE;
1708	if (!delta)
1709		pmc->sfcount[sfmode]++;
1710	err = 0;
1711	for (i=0; i<sfcount; i++) {
1712		err = ip_mc_add1_src(pmc, sfmode, &psfsrc[i], delta);
1713		if (err)
1714			break;
1715	}
1716	if (err) {
1717		int j;
1718
1719		pmc->sfcount[sfmode]--;
 
1720		for (j=0; j<i; j++)
1721			(void) ip_mc_del1_src(pmc, sfmode, &psfsrc[j]);
1722	} else if (isexclude != (pmc->sfcount[MCAST_EXCLUDE] != 0)) {
1723#ifdef CONFIG_IP_MULTICAST
1724		struct ip_sf_list *psf;
1725		in_dev = pmc->interface;
1726#endif
1727
1728		/* filter mode change */
1729		if (pmc->sfcount[MCAST_EXCLUDE])
1730			pmc->sfmode = MCAST_EXCLUDE;
1731		else if (pmc->sfcount[MCAST_INCLUDE])
1732			pmc->sfmode = MCAST_INCLUDE;
1733#ifdef CONFIG_IP_MULTICAST
1734		/* else no filters; keep old mode for reports */
1735
1736		pmc->crcount = in_dev->mr_qrv ? in_dev->mr_qrv :
1737			IGMP_Unsolicited_Report_Count;
1738		in_dev->mr_ifc_count = pmc->crcount;
1739		for (psf=pmc->sources; psf; psf = psf->sf_next)
1740			psf->sf_crcount = 0;
1741		igmp_ifc_event(in_dev);
1742	} else if (sf_setstate(pmc)) {
1743		igmp_ifc_event(in_dev);
1744#endif
1745	}
1746	spin_unlock_bh(&pmc->lock);
1747	return err;
1748}
1749
1750static void ip_mc_clear_src(struct ip_mc_list *pmc)
1751{
1752	struct ip_sf_list *psf, *nextpsf;
1753
1754	for (psf=pmc->tomb; psf; psf=nextpsf) {
1755		nextpsf = psf->sf_next;
1756		kfree(psf);
1757	}
1758	pmc->tomb = NULL;
1759	for (psf=pmc->sources; psf; psf=nextpsf) {
1760		nextpsf = psf->sf_next;
1761		kfree(psf);
1762	}
1763	pmc->sources = NULL;
1764	pmc->sfmode = MCAST_EXCLUDE;
1765	pmc->sfcount[MCAST_INCLUDE] = 0;
1766	pmc->sfcount[MCAST_EXCLUDE] = 1;
1767}
1768
1769
1770/*
1771 * Join a multicast group
1772 */
1773int ip_mc_join_group(struct sock *sk , struct ip_mreqn *imr)
1774{
1775	int err;
1776	__be32 addr = imr->imr_multiaddr.s_addr;
1777	struct ip_mc_socklist *iml = NULL, *i;
1778	struct in_device *in_dev;
1779	struct inet_sock *inet = inet_sk(sk);
1780	struct net *net = sock_net(sk);
1781	int ifindex;
1782	int count = 0;
1783
1784	if (!ipv4_is_multicast(addr))
1785		return -EINVAL;
1786
1787	rtnl_lock();
1788
1789	in_dev = ip_mc_find_dev(net, imr);
1790
1791	if (!in_dev) {
1792		iml = NULL;
1793		err = -ENODEV;
1794		goto done;
1795	}
1796
1797	err = -EADDRINUSE;
1798	ifindex = imr->imr_ifindex;
1799	for_each_pmc_rtnl(inet, i) {
1800		if (i->multi.imr_multiaddr.s_addr == addr &&
1801		    i->multi.imr_ifindex == ifindex)
1802			goto done;
1803		count++;
1804	}
1805	err = -ENOBUFS;
1806	if (count >= sysctl_igmp_max_memberships)
1807		goto done;
1808	iml = sock_kmalloc(sk, sizeof(*iml), GFP_KERNEL);
1809	if (iml == NULL)
1810		goto done;
1811
1812	memcpy(&iml->multi, imr, sizeof(*imr));
1813	iml->next_rcu = inet->mc_list;
1814	iml->sflist = NULL;
1815	iml->sfmode = MCAST_EXCLUDE;
1816	rcu_assign_pointer(inet->mc_list, iml);
1817	ip_mc_inc_group(in_dev, addr);
1818	err = 0;
1819done:
1820	rtnl_unlock();
1821	return err;
1822}
1823EXPORT_SYMBOL(ip_mc_join_group);
1824
1825static int ip_mc_leave_src(struct sock *sk, struct ip_mc_socklist *iml,
1826			   struct in_device *in_dev)
1827{
1828	struct ip_sf_socklist *psf = rtnl_dereference(iml->sflist);
1829	int err;
1830
1831	if (psf == NULL) {
1832		/* any-source empty exclude case */
1833		return ip_mc_del_src(in_dev, &iml->multi.imr_multiaddr.s_addr,
1834			iml->sfmode, 0, NULL, 0);
1835	}
1836	err = ip_mc_del_src(in_dev, &iml->multi.imr_multiaddr.s_addr,
1837			iml->sfmode, psf->sl_count, psf->sl_addr, 0);
1838	rcu_assign_pointer(iml->sflist, NULL);
1839	/* decrease mem now to avoid the memleak warning */
1840	atomic_sub(IP_SFLSIZE(psf->sl_max), &sk->sk_omem_alloc);
1841	kfree_rcu(psf, rcu);
1842	return err;
1843}
1844
1845/*
1846 *	Ask a socket to leave a group.
1847 */
1848
1849int ip_mc_leave_group(struct sock *sk, struct ip_mreqn *imr)
1850{
1851	struct inet_sock *inet = inet_sk(sk);
1852	struct ip_mc_socklist *iml;
1853	struct ip_mc_socklist __rcu **imlp;
1854	struct in_device *in_dev;
1855	struct net *net = sock_net(sk);
1856	__be32 group = imr->imr_multiaddr.s_addr;
1857	u32 ifindex;
1858	int ret = -EADDRNOTAVAIL;
1859
1860	rtnl_lock();
1861	in_dev = ip_mc_find_dev(net, imr);
1862	ifindex = imr->imr_ifindex;
1863	for (imlp = &inet->mc_list;
1864	     (iml = rtnl_dereference(*imlp)) != NULL;
1865	     imlp = &iml->next_rcu) {
1866		if (iml->multi.imr_multiaddr.s_addr != group)
1867			continue;
1868		if (ifindex) {
1869			if (iml->multi.imr_ifindex != ifindex)
1870				continue;
1871		} else if (imr->imr_address.s_addr && imr->imr_address.s_addr !=
1872				iml->multi.imr_address.s_addr)
1873			continue;
1874
1875		(void) ip_mc_leave_src(sk, iml, in_dev);
1876
1877		*imlp = iml->next_rcu;
1878
1879		if (in_dev)
1880			ip_mc_dec_group(in_dev, group);
1881		rtnl_unlock();
1882		/* decrease mem now to avoid the memleak warning */
1883		atomic_sub(sizeof(*iml), &sk->sk_omem_alloc);
1884		kfree_rcu(iml, rcu);
1885		return 0;
1886	}
1887	if (!in_dev)
1888		ret = -ENODEV;
1889	rtnl_unlock();
1890	return ret;
1891}
1892
/*
 * Add (@add != 0) or remove (@add == 0) the single source
 * mreqs->imr_sourceaddr to/from the source filter that socket @sk keeps
 * for group mreqs->imr_multiaddr, using filter mode @omode.
 *
 * Returns 0 on success, or:
 *   -EINVAL         the group address is not multicast, the socket has no
 *                   prior join for (group, ifindex), or a filter list
 *                   already exists with a different mode;
 *   -ENODEV         no device matches the request;
 *   -EADDRNOTAVAIL  removing a source that is not in the list (or there
 *                   is no list), or adding one that is already present;
 *   -ENOBUFS        the list already holds sysctl_igmp_max_msf entries or
 *                   a larger list could not be allocated.
 * Removing the last source of an INCLUDE-mode filter is turned into a
 * group leave and returns the result of ip_mc_leave_group().
 */
1893int ip_mc_source(int add, int omode, struct sock *sk, struct
1894	ip_mreq_source *mreqs, int ifindex)
1895{
1896	int err;
1897	struct ip_mreqn imr;
1898	__be32 addr = mreqs->imr_multiaddr;
1899	struct ip_mc_socklist *pmc;
1900	struct in_device *in_dev = NULL;
1901	struct inet_sock *inet = inet_sk(sk);
1902	struct ip_sf_socklist *psl;
1903	struct net *net = sock_net(sk);
1904	int leavegroup = 0;
1905	int i, j, rv;
1906
1907	if (!ipv4_is_multicast(addr))
1908		return -EINVAL;
1909
1910	rtnl_lock();
1911
	/* Build an ip_mreqn so the device lookup (and a possible leave at
	 * the end) can reuse the membership helpers.
	 */
1912	imr.imr_multiaddr.s_addr = mreqs->imr_multiaddr;
1913	imr.imr_address.s_addr = mreqs->imr_interface;
1914	imr.imr_ifindex = ifindex;
1915	in_dev = ip_mc_find_dev(net, &imr);
1916
1917	if (!in_dev) {
1918		err = -ENODEV;
1919		goto done;
1920	}
	/* Default error for the "goto done" exits below that do not set
	 * err themselves.
	 */
1921	err = -EADDRNOTAVAIL;
1922
1923	for_each_pmc_rtnl(inet, pmc) {
1924		if ((pmc->multi.imr_multiaddr.s_addr ==
1925		     imr.imr_multiaddr.s_addr) &&
1926		    (pmc->multi.imr_ifindex == imr.imr_ifindex))
1927			break;
1928	}
1929	if (!pmc) {		/* must have a prior join */
1930		err = -EINVAL;
1931		goto done;
1932	}
1933	/* if a source filter was set, must be the same mode as before */
1934	if (pmc->sflist) {
1935		if (pmc->sfmode != omode) {
1936			err = -EINVAL;
1937			goto done;
1938		}
1939	} else if (pmc->sfmode != omode) {
1940		/* allow mode switches for empty-set filters */
		/* The new mode's reference is added before the old mode's
		 * reference is dropped.
		 */
1941		ip_mc_add_src(in_dev, &mreqs->imr_multiaddr, omode, 0, NULL, 0);
1942		ip_mc_del_src(in_dev, &mreqs->imr_multiaddr, pmc->sfmode, 0,
1943			NULL, 0);
1944		pmc->sfmode = omode;
1945	}
1946
1947	psl = rtnl_dereference(pmc->sflist);
1948	if (!add) {
1949		if (!psl)
1950			goto done;	/* err = -EADDRNOTAVAIL */
		/* rv stays non-zero when the list is empty or has no match */
1951		rv = !0;
1952		for (i=0; i<psl->sl_count; i++) {
1953			rv = memcmp(&psl->sl_addr[i], &mreqs->imr_sourceaddr,
1954				sizeof(__be32));
1955			if (rv == 0)
1956				break;
1957		}
1958		if (rv)		/* source not found */
1959			goto done;	/* err = -EADDRNOTAVAIL */
1960
1961		/* special case - (INCLUDE, empty) == LEAVE_GROUP */
1962		if (psl->sl_count == 1 && omode == MCAST_INCLUDE) {
1963			leavegroup = 1;
1964			goto done;
1965		}
1966
1967		/* update the interface filter */
1968		ip_mc_del_src(in_dev, &mreqs->imr_multiaddr, omode, 1,
1969			&mreqs->imr_sourceaddr, 1);
1970
		/* close the gap left at index i */
1971		for (j=i+1; j<psl->sl_count; j++)
1972			psl->sl_addr[j-1] = psl->sl_addr[j];
1973		psl->sl_count--;
1974		err = 0;
1975		goto done;
1976	}
1977	/* else, add a new source to the filter */
1978
1979	if (psl && psl->sl_count >= sysctl_igmp_max_msf) {
1980		err = -ENOBUFS;
1981		goto done;
1982	}
	/* No list yet, or the list is full: allocate one that is
	 * IP_SFBLOCK entries larger and copy the existing entries over.
	 */
1983	if (!psl || psl->sl_count == psl->sl_max) {
1984		struct ip_sf_socklist *newpsl;
1985		int count = IP_SFBLOCK;
1986
1987		if (psl)
1988			count += psl->sl_max;
1989		newpsl = sock_kmalloc(sk, IP_SFLSIZE(count), GFP_KERNEL);
1990		if (!newpsl) {
1991			err = -ENOBUFS;
1992			goto done;
1993		}
1994		newpsl->sl_max = count;
		/* count - IP_SFBLOCK is the old sl_max (0 without an old
		 * list), which equals the old sl_count on this path.
		 */
1995		newpsl->sl_count = count - IP_SFBLOCK;
1996		if (psl) {
1997			for (i=0; i<psl->sl_count; i++)
1998				newpsl->sl_addr[i] = psl->sl_addr[i];
1999			/* decrease mem now to avoid the memleak warning */
2000			atomic_sub(IP_SFLSIZE(psl->sl_max), &sk->sk_omem_alloc);
2001			kfree_rcu(psl, rcu);
2002		}
2003		rcu_assign_pointer(pmc->sflist, newpsl);
2004		psl = newpsl;
2005	}
2006	rv = 1;	/* > 0 for insert logic below if sl_count is 0 */
2007	for (i=0; i<psl->sl_count; i++) {
2008		rv = memcmp(&psl->sl_addr[i], &mreqs->imr_sourceaddr,
2009			sizeof(__be32));
2010		if (rv == 0)
2011			break;
2012	}
2013	if (rv == 0)		/* address already there is an error */
2014		goto done;
	/* The search above only stops early on an exact match, so here
	 * i == psl->sl_count: the shift loop does not run and the new
	 * source is appended at the end.
	 */
2015	for (j=psl->sl_count-1; j>=i; j--)
2016		psl->sl_addr[j+1] = psl->sl_addr[j];
2017	psl->sl_addr[i] = mreqs->imr_sourceaddr;
2018	psl->sl_count++;
2019	err = 0;
2020	/* update the interface list */
	/* NOTE(review): the return value of ip_mc_add_src() is not checked
	 * here; err stays 0 even if it fails.
	 */
2021	ip_mc_add_src(in_dev, &mreqs->imr_multiaddr, omode, 1,
2022		&mreqs->imr_sourceaddr, 1);
2023done:
2024	rtnl_unlock();
	/* the leave is performed only after RTNL has been released above */
2025	if (leavegroup)
2026		return ip_mc_leave_group(sk, &imr);
2027	return err;
2028}
2029
2030int ip_mc_msfilter(struct sock *sk, struct ip_msfilter *msf, int ifindex)
2031{
2032	int err = 0;
2033	struct ip_mreqn	imr;
2034	__be32 addr = msf->imsf_multiaddr;
2035	struct ip_mc_socklist *pmc;
2036	struct in_device *in_dev;
2037	struct inet_sock *inet = inet_sk(sk);
2038	struct ip_sf_socklist *newpsl, *psl;
2039	struct net *net = sock_net(sk);
2040	int leavegroup = 0;
2041
2042	if (!ipv4_is_multicast(addr))
2043		return -EINVAL;
2044	if (msf->imsf_fmode != MCAST_INCLUDE &&
2045	    msf->imsf_fmode != MCAST_EXCLUDE)
2046		return -EINVAL;
2047
2048	rtnl_lock();
2049
2050	imr.imr_multiaddr.s_addr = msf->imsf_multiaddr;
2051	imr.imr_address.s_addr = msf->imsf_interface;
2052	imr.imr_ifindex = ifindex;
2053	in_dev = ip_mc_find_dev(net, &imr);
2054
2055	if (!in_dev) {
2056		err = -ENODEV;
2057		goto done;
2058	}
2059
2060	/* special case - (INCLUDE, empty) == LEAVE_GROUP */
2061	if (msf->imsf_fmode == MCAST_INCLUDE && msf->imsf_numsrc == 0) {
2062		leavegroup = 1;
2063		goto done;
2064	}
2065
2066	for_each_pmc_rtnl(inet, pmc) {
2067		if (pmc->multi.imr_multiaddr.s_addr == msf->imsf_multiaddr &&
2068		    pmc->multi.imr_ifindex == imr.imr_ifindex)
2069			break;
2070	}
2071	if (!pmc) {		/* must have a prior join */
2072		err = -EINVAL;
2073		goto done;
2074	}
2075	if (msf->imsf_numsrc) {
2076		newpsl = sock_kmalloc(sk, IP_SFLSIZE(msf->imsf_numsrc),
2077							   GFP_KERNEL);
2078		if (!newpsl) {
2079			err = -ENOBUFS;
2080			goto done;
2081		}
2082		newpsl->sl_max = newpsl->sl_count = msf->imsf_numsrc;
2083		memcpy(newpsl->sl_addr, msf->imsf_slist,
2084			msf->imsf_numsrc * sizeof(msf->imsf_slist[0]));
2085		err = ip_mc_add_src(in_dev, &msf->imsf_multiaddr,
2086			msf->imsf_fmode, newpsl->sl_count, newpsl->sl_addr, 0);
2087		if (err) {
2088			sock_kfree_s(sk, newpsl, IP_SFLSIZE(newpsl->sl_max));
2089			goto done;
2090		}
2091	} else {
2092		newpsl = NULL;
2093		(void) ip_mc_add_src(in_dev, &msf->imsf_multiaddr,
2094				     msf->imsf_fmode, 0, NULL, 0);
2095	}
2096	psl = rtnl_dereference(pmc->sflist);
2097	if (psl) {
2098		(void) ip_mc_del_src(in_dev, &msf->imsf_multiaddr, pmc->sfmode,
2099			psl->sl_count, psl->sl_addr, 0);
2100		/* decrease mem now to avoid the memleak warning */
2101		atomic_sub(IP_SFLSIZE(psl->sl_max), &sk->sk_omem_alloc);
2102		kfree_rcu(psl, rcu);
2103	} else
2104		(void) ip_mc_del_src(in_dev, &msf->imsf_multiaddr, pmc->sfmode,
2105			0, NULL, 0);
2106	rcu_assign_pointer(pmc->sflist, newpsl);
2107	pmc->sfmode = msf->imsf_fmode;
2108	err = 0;
2109done:
2110	rtnl_unlock();
2111	if (leavegroup)
2112		err = ip_mc_leave_group(sk, &imr);
2113	return err;
2114}
2115
2116int ip_mc_msfget(struct sock *sk, struct ip_msfilter *msf,
2117	struct ip_msfilter __user *optval, int __user *optlen)
2118{
2119	int err, len, count, copycount;
2120	struct ip_mreqn	imr;
2121	__be32 addr = msf->imsf_multiaddr;
2122	struct ip_mc_socklist *pmc;
2123	struct in_device *in_dev;
2124	struct inet_sock *inet = inet_sk(sk);
2125	struct ip_sf_socklist *psl;
2126	struct net *net = sock_net(sk);
2127
2128	if (!ipv4_is_multicast(addr))
2129		return -EINVAL;
2130
2131	rtnl_lock();
2132
2133	imr.imr_multiaddr.s_addr = msf->imsf_multiaddr;
2134	imr.imr_address.s_addr = msf->imsf_interface;
2135	imr.imr_ifindex = 0;
2136	in_dev = ip_mc_find_dev(net, &imr);
2137
2138	if (!in_dev) {
2139		err = -ENODEV;
2140		goto done;
2141	}
2142	err = -EADDRNOTAVAIL;
2143
2144	for_each_pmc_rtnl(inet, pmc) {
2145		if (pmc->multi.imr_multiaddr.s_addr == msf->imsf_multiaddr &&
2146		    pmc->multi.imr_ifindex == imr.imr_ifindex)
2147			break;
2148	}
2149	if (!pmc)		/* must have a prior join */
2150		goto done;
2151	msf->imsf_fmode = pmc->sfmode;
2152	psl = rtnl_dereference(pmc->sflist);
2153	rtnl_unlock();
2154	if (!psl) {
2155		len = 0;
2156		count = 0;
2157	} else {
2158		count = psl->sl_count;
2159	}
2160	copycount = count < msf->imsf_numsrc ? count : msf->imsf_numsrc;
2161	len = copycount * sizeof(psl->sl_addr[0]);
2162	msf->imsf_numsrc = count;
2163	if (put_user(IP_MSFILTER_SIZE(copycount), optlen) ||
2164	    copy_to_user(optval, msf, IP_MSFILTER_SIZE(0))) {
2165		return -EFAULT;
2166	}
2167	if (len &&
2168	    copy_to_user(&optval->imsf_slist[0], psl->sl_addr, len))
2169		return -EFAULT;
2170	return 0;
2171done:
2172	rtnl_unlock();
2173	return err;
2174}
2175
2176int ip_mc_gsfget(struct sock *sk, struct group_filter *gsf,
2177	struct group_filter __user *optval, int __user *optlen)
2178{
2179	int err, i, count, copycount;
2180	struct sockaddr_in *psin;
2181	__be32 addr;
2182	struct ip_mc_socklist *pmc;
2183	struct inet_sock *inet = inet_sk(sk);
2184	struct ip_sf_socklist *psl;
2185
2186	psin = (struct sockaddr_in *)&gsf->gf_group;
2187	if (psin->sin_family != AF_INET)
2188		return -EINVAL;
2189	addr = psin->sin_addr.s_addr;
2190	if (!ipv4_is_multicast(addr))
2191		return -EINVAL;
2192
2193	rtnl_lock();
2194
2195	err = -EADDRNOTAVAIL;
2196
2197	for_each_pmc_rtnl(inet, pmc) {
2198		if (pmc->multi.imr_multiaddr.s_addr == addr &&
2199		    pmc->multi.imr_ifindex == gsf->gf_interface)
2200			break;
2201	}
2202	if (!pmc)		/* must have a prior join */
2203		goto done;
2204	gsf->gf_fmode = pmc->sfmode;
2205	psl = rtnl_dereference(pmc->sflist);
2206	rtnl_unlock();
2207	count = psl ? psl->sl_count : 0;
2208	copycount = count < gsf->gf_numsrc ? count : gsf->gf_numsrc;
2209	gsf->gf_numsrc = count;
2210	if (put_user(GROUP_FILTER_SIZE(copycount), optlen) ||
2211	    copy_to_user(optval, gsf, GROUP_FILTER_SIZE(0))) {
2212		return -EFAULT;
2213	}
2214	for (i=0; i<copycount; i++) {
2215		struct sockaddr_storage ss;
2216
2217		psin = (struct sockaddr_in *)&ss;
2218		memset(&ss, 0, sizeof(ss));
2219		psin->sin_family = AF_INET;
2220		psin->sin_addr.s_addr = psl->sl_addr[i];
2221		if (copy_to_user(&optval->gf_slist[i], &ss, sizeof(ss)))
2222			return -EFAULT;
2223	}
2224	return 0;
2225done:
2226	rtnl_unlock();
2227	return err;
2228}
2229
2230/*
2231 * check if a multicast source filter allows delivery for a given <src,dst,intf>
2232 */
2233int ip_mc_sf_allow(struct sock *sk, __be32 loc_addr, __be32 rmt_addr, int dif)
2234{
2235	struct inet_sock *inet = inet_sk(sk);
2236	struct ip_mc_socklist *pmc;
2237	struct ip_sf_socklist *psl;
2238	int i;
2239	int ret;
2240
2241	ret = 1;
2242	if (!ipv4_is_multicast(loc_addr))
2243		goto out;
2244
2245	rcu_read_lock();
2246	for_each_pmc_rcu(inet, pmc) {
2247		if (pmc->multi.imr_multiaddr.s_addr == loc_addr &&
2248		    pmc->multi.imr_ifindex == dif)
2249			break;
2250	}
2251	ret = inet->mc_all;
2252	if (!pmc)
2253		goto unlock;
2254	psl = rcu_dereference(pmc->sflist);
2255	ret = (pmc->sfmode == MCAST_EXCLUDE);
2256	if (!psl)
2257		goto unlock;
2258
2259	for (i=0; i<psl->sl_count; i++) {
2260		if (psl->sl_addr[i] == rmt_addr)
2261			break;
2262	}
2263	ret = 0;
2264	if (pmc->sfmode == MCAST_INCLUDE && i >= psl->sl_count)
2265		goto unlock;
2266	if (pmc->sfmode == MCAST_EXCLUDE && i < psl->sl_count)
2267		goto unlock;
2268	ret = 1;
2269unlock:
2270	rcu_read_unlock();
2271out:
2272	return ret;
2273}
2274
2275/*
2276 *	A socket is closing.
2277 */
2278
2279void ip_mc_drop_socket(struct sock *sk)
2280{
2281	struct inet_sock *inet = inet_sk(sk);
2282	struct ip_mc_socklist *iml;
2283	struct net *net = sock_net(sk);
2284
2285	if (inet->mc_list == NULL)
2286		return;
2287
2288	rtnl_lock();
2289	while ((iml = rtnl_dereference(inet->mc_list)) != NULL) {
2290		struct in_device *in_dev;
2291
2292		inet->mc_list = iml->next_rcu;
2293		in_dev = inetdev_by_index(net, iml->multi.imr_ifindex);
2294		(void) ip_mc_leave_src(sk, iml, in_dev);
2295		if (in_dev != NULL)
2296			ip_mc_dec_group(in_dev, iml->multi.imr_multiaddr.s_addr);
2297		/* decrease mem now to avoid the memleak warning */
2298		atomic_sub(sizeof(*iml), &sk->sk_omem_alloc);
2299		kfree_rcu(iml, rcu);
2300	}
2301	rtnl_unlock();
2302}
2303
2304/* called with rcu_read_lock() */
2305int ip_check_mc_rcu(struct in_device *in_dev, __be32 mc_addr, __be32 src_addr, u16 proto)
2306{
2307	struct ip_mc_list *im;
2308	struct ip_sf_list *psf;
2309	int rv = 0;
2310
2311	for_each_pmc_rcu(in_dev, im) {
2312		if (im->multiaddr == mc_addr)
2313			break;
2314	}
2315	if (im && proto == IPPROTO_IGMP) {
2316		rv = 1;
2317	} else if (im) {
2318		if (src_addr) {
2319			for (psf=im->sources; psf; psf=psf->sf_next) {
2320				if (psf->sf_inaddr == src_addr)
2321					break;
2322			}
2323			if (psf)
2324				rv = psf->sf_count[MCAST_INCLUDE] ||
2325					psf->sf_count[MCAST_EXCLUDE] !=
2326					im->sfcount[MCAST_EXCLUDE];
2327			else
2328				rv = im->sfcount[MCAST_EXCLUDE] != 0;
2329		} else
2330			rv = 1; /* unspecified source; tentatively allow */
2331	}
2332	return rv;
2333}
2334
2335#if defined(CONFIG_PROC_FS)
/*
 * Per-open iteration state for the "igmp" proc file: remembers which
 * device, and which of its in_device structures, the group walk is on.
 */
2336struct igmp_mc_iter_state {
	/* NOTE(review): presumably must stay first for seq_open_net()/seq_file_net() - confirm */
2337	struct seq_net_private p;
	/* device the walk is currently positioned on */
2338	struct net_device *dev;
	/* in_device whose mc_list is being walked; NULL when not on a device */
2339	struct in_device *in_dev;
2340};
2341
/* View a seq_file's private pointer as the igmp group iterator state. */
2342#define	igmp_mc_seq_private(seq)	((struct igmp_mc_iter_state *)(seq)->private)
2343
2344static inline struct ip_mc_list *igmp_mc_get_first(struct seq_file *seq)
2345{
2346	struct net *net = seq_file_net(seq);
2347	struct ip_mc_list *im = NULL;
2348	struct igmp_mc_iter_state *state = igmp_mc_seq_private(seq);
2349
2350	state->in_dev = NULL;
2351	for_each_netdev_rcu(net, state->dev) {
2352		struct in_device *in_dev;
2353
2354		in_dev = __in_dev_get_rcu(state->dev);
2355		if (!in_dev)
2356			continue;
2357		im = rcu_dereference(in_dev->mc_list);
2358		if (im) {
2359			state->in_dev = in_dev;
2360			break;
2361		}
2362	}
2363	return im;
2364}
2365
2366static struct ip_mc_list *igmp_mc_get_next(struct seq_file *seq, struct ip_mc_list *im)
2367{
2368	struct igmp_mc_iter_state *state = igmp_mc_seq_private(seq);
2369
2370	im = rcu_dereference(im->next_rcu);
2371	while (!im) {
2372		state->dev = next_net_device_rcu(state->dev);
2373		if (!state->dev) {
2374			state->in_dev = NULL;
2375			break;
2376		}
2377		state->in_dev = __in_dev_get_rcu(state->dev);
2378		if (!state->in_dev)
2379			continue;
2380		im = rcu_dereference(state->in_dev->mc_list);
2381	}
2382	return im;
2383}
2384
2385static struct ip_mc_list *igmp_mc_get_idx(struct seq_file *seq, loff_t pos)
2386{
2387	struct ip_mc_list *im = igmp_mc_get_first(seq);
2388	if (im)
2389		while (pos && (im = igmp_mc_get_next(seq, im)) != NULL)
2390			--pos;
2391	return pos ? NULL : im;
2392}
2393
2394static void *igmp_mc_seq_start(struct seq_file *seq, loff_t *pos)
2395	__acquires(rcu)
2396{
2397	rcu_read_lock();
2398	return *pos ? igmp_mc_get_idx(seq, *pos - 1) : SEQ_START_TOKEN;
2399}
2400
2401static void *igmp_mc_seq_next(struct seq_file *seq, void *v, loff_t *pos)
2402{
2403	struct ip_mc_list *im;
2404	if (v == SEQ_START_TOKEN)
2405		im = igmp_mc_get_first(seq);
2406	else
2407		im = igmp_mc_get_next(seq, v);
2408	++*pos;
2409	return im;
2410}
2411
2412static void igmp_mc_seq_stop(struct seq_file *seq, void *v)
2413	__releases(rcu)
2414{
2415	struct igmp_mc_iter_state *state = igmp_mc_seq_private(seq);
2416
2417	state->in_dev = NULL;
2418	state->dev = NULL;
2419	rcu_read_unlock();
2420}
2421
2422static int igmp_mc_seq_show(struct seq_file *seq, void *v)
2423{
2424	if (v == SEQ_START_TOKEN)
2425		seq_puts(seq,
2426			 "Idx\tDevice    : Count Querier\tGroup    Users Timer\tReporter\n");
2427	else {
2428		struct ip_mc_list *im = (struct ip_mc_list *)v;
2429		struct igmp_mc_iter_state *state = igmp_mc_seq_private(seq);
2430		char   *querier;
2431#ifdef CONFIG_IP_MULTICAST
2432		querier = IGMP_V1_SEEN(state->in_dev) ? "V1" :
2433			  IGMP_V2_SEEN(state->in_dev) ? "V2" :
2434			  "V3";
2435#else
2436		querier = "NONE";
2437#endif
2438
2439		if (rcu_dereference(state->in_dev->mc_list) == im) {
2440			seq_printf(seq, "%d\t%-10s: %5d %7s\n",
2441				   state->dev->ifindex, state->dev->name, state->in_dev->mc_count, querier);
2442		}
2443
2444		seq_printf(seq,
2445			   "\t\t\t\t%08X %5d %d:%08lX\t\t%d\n",
2446			   im->multiaddr, im->users,
2447			   im->tm_running, im->tm_running ?
2448			   jiffies_to_clock_t(im->timer.expires-jiffies) : 0,
2449			   im->reporter);
2450	}
2451	return 0;
2452}
2453
2454static const struct seq_operations igmp_mc_seq_ops = {
2455	.start	=	igmp_mc_seq_start,
2456	.next	=	igmp_mc_seq_next,
2457	.stop	=	igmp_mc_seq_stop,
2458	.show	=	igmp_mc_seq_show,
2459};
2460
2461static int igmp_mc_seq_open(struct inode *inode, struct file *file)
2462{
2463	return seq_open_net(inode, file, &igmp_mc_seq_ops,
2464			sizeof(struct igmp_mc_iter_state));
2465}
2466
2467static const struct file_operations igmp_mc_seq_fops = {
2468	.owner		=	THIS_MODULE,
2469	.open		=	igmp_mc_seq_open,
2470	.read		=	seq_read,
2471	.llseek		=	seq_lseek,
2472	.release	=	seq_release_net,
2473};
2474
/*
 * Per-open iteration state for the "mcfilter" proc file: the device,
 * in_device and group whose source list is currently being walked.
 */
2475struct igmp_mcf_iter_state {
	/* NOTE(review): presumably must stay first for seq_open_net()/seq_file_net() - confirm */
2476	struct seq_net_private p;
	/* device the walk is currently positioned on */
2477	struct net_device *dev;
	/* in_device of that device; NULL when not on a device */
2478	struct in_device *idev;
	/* group being walked; while non-NULL its im->lock is held by the iterator */
2479	struct ip_mc_list *im;
2480};
2481
/* View a seq_file's private pointer as the source-filter iterator state. */
2482#define igmp_mcf_seq_private(seq)	((struct igmp_mcf_iter_state *)(seq)->private)
2483
/*
 * Find the first source-filter entry to report.
 *
 * For each device in the namespace only the head of its mc_list is
 * examined; the first device whose head group has a non-empty source list
 * wins.  On success the group and in_device are recorded in the iterator
 * state and the function returns WITH that group's im->lock still held
 * (released later by igmp_mcf_get_next() or igmp_mcf_seq_stop()).
 * Returns NULL, with no lock held, when nothing is found.
 */
2484static inline struct ip_sf_list *igmp_mcf_get_first(struct seq_file *seq)
2485{
2486	struct net *net = seq_file_net(seq);
2487	struct ip_sf_list *psf = NULL;
2488	struct ip_mc_list *im = NULL;
2489	struct igmp_mcf_iter_state *state = igmp_mcf_seq_private(seq);
2490
2491	state->idev = NULL;
2492	state->im = NULL;
2493	for_each_netdev_rcu(net, state->dev) {
2494		struct in_device *idev;
2495		idev = __in_dev_get_rcu(state->dev);
2496		if (unlikely(idev == NULL))
2497			continue;
2498		im = rcu_dereference(idev->mc_list);
2499		if (likely(im != NULL)) {
2500			spin_lock_bh(&im->lock);
2501			psf = im->sources;
2502			if (likely(psf != NULL)) {
				/* keep im->lock held: the caller reads psf under it */
2503				state->im = im;
2504				state->idev = idev;
2505				break;
2506			}
			/* head group has no sources: drop the lock, try the next device */
2507			spin_unlock_bh(&im->lock);
2508		}
2509	}
2510	return psf;
2511}
2512
/*
 * Advance to the source entry after psf.
 *
 * Entered with state->im->lock held.  When the current group's source
 * list is exhausted the lock is dropped and the walk moves to the next
 * group, then to the head group of following devices, taking the lock of
 * each group it inspects.  Returns the next entry with its group's lock
 * held, or NULL with state->im == NULL and no lock held once all devices
 * have been visited.
 */
2513static struct ip_sf_list *igmp_mcf_get_next(struct seq_file *seq, struct ip_sf_list *psf)
2514{
2515	struct igmp_mcf_iter_state *state = igmp_mcf_seq_private(seq);
2516
2517	psf = psf->sf_next;
2518	while (!psf) {
		/* done with this group: release it before moving on */
2519		spin_unlock_bh(&state->im->lock);
2520		state->im = state->im->next;
2521		while (!state->im) {
2522			state->dev = next_net_device_rcu(state->dev);
2523			if (!state->dev) {
				/* ran out of devices; state->im is NULL, nothing locked */
2524				state->idev = NULL;
2525				goto out;
2526			}
2527			state->idev = __in_dev_get_rcu(state->dev);
2528			if (!state->idev)
2529				continue;
2530			state->im = rcu_dereference(state->idev->mc_list);
2531		}
		/* the inner loop only exits normally with state->im set */
2532		if (!state->im)
2533			break;
2534		spin_lock_bh(&state->im->lock);
2535		psf = state->im->sources;
2536	}
2537out:
2538	return psf;
2539}
2540
2541static struct ip_sf_list *igmp_mcf_get_idx(struct seq_file *seq, loff_t pos)
2542{
2543	struct ip_sf_list *psf = igmp_mcf_get_first(seq);
2544	if (psf)
2545		while (pos && (psf = igmp_mcf_get_next(seq, psf)) != NULL)
2546			--pos;
2547	return pos ? NULL : psf;
2548}
2549
2550static void *igmp_mcf_seq_start(struct seq_file *seq, loff_t *pos)
2551	__acquires(rcu)
2552{
2553	rcu_read_lock();
2554	return *pos ? igmp_mcf_get_idx(seq, *pos - 1) : SEQ_START_TOKEN;
2555}
2556
2557static void *igmp_mcf_seq_next(struct seq_file *seq, void *v, loff_t *pos)
2558{
2559	struct ip_sf_list *psf;
2560	if (v == SEQ_START_TOKEN)
2561		psf = igmp_mcf_get_first(seq);
2562	else
2563		psf = igmp_mcf_get_next(seq, v);
2564	++*pos;
2565	return psf;
2566}
2567
2568static void igmp_mcf_seq_stop(struct seq_file *seq, void *v)
2569	__releases(rcu)
2570{
2571	struct igmp_mcf_iter_state *state = igmp_mcf_seq_private(seq);
2572	if (likely(state->im != NULL)) {
2573		spin_unlock_bh(&state->im->lock);
2574		state->im = NULL;
2575	}
2576	state->idev = NULL;
2577	state->dev = NULL;
2578	rcu_read_unlock();
2579}
2580
2581static int igmp_mcf_seq_show(struct seq_file *seq, void *v)
2582{
2583	struct ip_sf_list *psf = (struct ip_sf_list *)v;
2584	struct igmp_mcf_iter_state *state = igmp_mcf_seq_private(seq);
2585
2586	if (v == SEQ_START_TOKEN) {
2587		seq_printf(seq,
2588			   "%3s %6s "
2589			   "%10s %10s %6s %6s\n", "Idx",
2590			   "Device", "MCA",
2591			   "SRC", "INC", "EXC");
2592	} else {
2593		seq_printf(seq,
2594			   "%3d %6.6s 0x%08x "
2595			   "0x%08x %6lu %6lu\n",
2596			   state->dev->ifindex, state->dev->name,
2597			   ntohl(state->im->multiaddr),
2598			   ntohl(psf->sf_inaddr),
2599			   psf->sf_count[MCAST_INCLUDE],
2600			   psf->sf_count[MCAST_EXCLUDE]);
2601	}
2602	return 0;
2603}
2604
2605static const struct seq_operations igmp_mcf_seq_ops = {
2606	.start	=	igmp_mcf_seq_start,
2607	.next	=	igmp_mcf_seq_next,
2608	.stop	=	igmp_mcf_seq_stop,
2609	.show	=	igmp_mcf_seq_show,
2610};
2611
2612static int igmp_mcf_seq_open(struct inode *inode, struct file *file)
2613{
2614	return seq_open_net(inode, file, &igmp_mcf_seq_ops,
2615			sizeof(struct igmp_mcf_iter_state));
2616}
2617
2618static const struct file_operations igmp_mcf_seq_fops = {
2619	.owner		=	THIS_MODULE,
2620	.open		=	igmp_mcf_seq_open,
2621	.read		=	seq_read,
2622	.llseek		=	seq_lseek,
2623	.release	=	seq_release_net,
2624};
2625
2626static int __net_init igmp_net_init(struct net *net)
2627{
2628	struct proc_dir_entry *pde;
2629
2630	pde = proc_net_fops_create(net, "igmp", S_IRUGO, &igmp_mc_seq_fops);
2631	if (!pde)
2632		goto out_igmp;
2633	pde = proc_net_fops_create(net, "mcfilter", S_IRUGO, &igmp_mcf_seq_fops);
2634	if (!pde)
2635		goto out_mcfilter;
2636	return 0;
2637
2638out_mcfilter:
2639	proc_net_remove(net, "igmp");
2640out_igmp:
2641	return -ENOMEM;
2642}
2643
2644static void __net_exit igmp_net_exit(struct net *net)
2645{
2646	proc_net_remove(net, "mcfilter");
2647	proc_net_remove(net, "igmp");
2648}
2649
2650static struct pernet_operations igmp_net_ops = {
2651	.init = igmp_net_init,
2652	.exit = igmp_net_exit,
2653};
2654
2655int __init igmp_mc_proc_init(void)
2656{
2657	return register_pernet_subsys(&igmp_net_ops);
2658}
2659#endif
v3.5.6
   1/*
   2 *	Linux NET3:	Internet Group Management Protocol  [IGMP]
   3 *
   4 *	This code implements the IGMP protocol as defined in RFC1112. There has
   5 *	been a further revision of this protocol since which is now supported.
   6 *
   7 *	If you have trouble with this module be careful what gcc you have used,
   8 *	the older version didn't come out right using gcc 2.5.8, the newer one
   9 *	seems to fall out with gcc 2.6.2.
  10 *
  11 *	Authors:
  12 *		Alan Cox <alan@lxorguk.ukuu.org.uk>
  13 *
  14 *	This program is free software; you can redistribute it and/or
  15 *	modify it under the terms of the GNU General Public License
  16 *	as published by the Free Software Foundation; either version
  17 *	2 of the License, or (at your option) any later version.
  18 *
  19 *	Fixes:
  20 *
  21 *		Alan Cox	:	Added lots of __inline__ to optimise
  22 *					the memory usage of all the tiny little
  23 *					functions.
  24 *		Alan Cox	:	Dumped the header building experiment.
  25 *		Alan Cox	:	Minor tweaks ready for multicast routing
  26 *					and extended IGMP protocol.
  27 *		Alan Cox	:	Removed a load of inline directives. Gcc 2.5.8
  28 *					writes utterly bogus code otherwise (sigh)
  29 *					fixed IGMP loopback to behave in the manner
  30 *					desired by mrouted, fixed the fact it has been
  31 *					broken since 1.3.6 and cleaned up a few minor
  32 *					points.
  33 *
  34 *		Chih-Jen Chang	:	Tried to revise IGMP to Version 2
  35 *		Tsu-Sheng Tsao		E-mail: chihjenc@scf.usc.edu and tsusheng@scf.usc.edu
  36 *					The enhancements are mainly based on Steve Deering's
  37 * 					ipmulti-3.5 source code.
  38 *		Chih-Jen Chang	:	Added the igmp_get_mrouter_info and
  39 *		Tsu-Sheng Tsao		igmp_set_mrouter_info to keep track of
  40 *					the mrouted version on that device.
  41 *		Chih-Jen Chang	:	Added the max_resp_time parameter to
  42 *		Tsu-Sheng Tsao		igmp_heard_query(). Using this parameter
  43 *					to identify the multicast router version
  44 *					and do what the IGMP version 2 specified.
  45 *		Chih-Jen Chang	:	Added a timer to revert to IGMP V2 router
  46 *		Tsu-Sheng Tsao		if the specified time expired.
  47 *		Alan Cox	:	Stop IGMP from 0.0.0.0 being accepted.
  48 *		Alan Cox	:	Use GFP_ATOMIC in the right places.
  49 *		Christian Daudt :	igmp timer wasn't set for local group
  50 *					memberships but was being deleted,
  51 *					which caused a "del_timer() called
  52 *					from %p with timer not initialized\n"
  53 *					message (960131).
  54 *		Christian Daudt :	removed del_timer from
  55 *					igmp_timer_expire function (960205).
  56 *             Christian Daudt :       igmp_heard_report now only calls
  57 *                                     igmp_timer_expire if tm->running is
  58 *                                     true (960216).
  59 *		Malcolm Beattie :	ttl comparison wrong in igmp_rcv made
  60 *					igmp_heard_query never trigger. Expiry
  61 *					miscalculation fixed in igmp_heard_query
  62 *					and random() made to return unsigned to
  63 *					prevent negative expiry times.
  64 *		Alexey Kuznetsov:	Wrong group leaving behaviour, backport
  65 *					fix from pending 2.1.x patches.
  66 *		Alan Cox:		Forget to enable FDDI support earlier.
  67 *		Alexey Kuznetsov:	Fixed leaving groups on device down.
  68 *		Alexey Kuznetsov:	Accordance to igmp-v2-06 draft.
  69 *		David L Stevens:	IGMPv3 support, with help from
  70 *					Vinay Kulkarni
  71 */
  72
  73#include <linux/module.h>
  74#include <linux/slab.h>
  75#include <asm/uaccess.h>
 
  76#include <linux/types.h>
  77#include <linux/kernel.h>
  78#include <linux/jiffies.h>
  79#include <linux/string.h>
  80#include <linux/socket.h>
  81#include <linux/sockios.h>
  82#include <linux/in.h>
  83#include <linux/inet.h>
  84#include <linux/netdevice.h>
  85#include <linux/skbuff.h>
  86#include <linux/inetdevice.h>
  87#include <linux/igmp.h>
  88#include <linux/if_arp.h>
  89#include <linux/rtnetlink.h>
  90#include <linux/times.h>
  91
  92#include <net/net_namespace.h>
  93#include <net/arp.h>
  94#include <net/ip.h>
  95#include <net/protocol.h>
  96#include <net/route.h>
  97#include <net/sock.h>
  98#include <net/checksum.h>
  99#include <linux/netfilter_ipv4.h>
 100#ifdef CONFIG_IP_MROUTE
 101#include <linux/mroute.h>
 102#endif
 103#ifdef CONFIG_PROC_FS
 104#include <linux/proc_fs.h>
 105#include <linux/seq_file.h>
 106#endif
 107
 108#define IP_MAX_MEMBERSHIPS	20
 109#define IP_MAX_MSF		10
 110
 111#ifdef CONFIG_IP_MULTICAST
 112/* Parameter names and values are taken from igmp-v2-06 draft */
 113
 114#define IGMP_V1_Router_Present_Timeout		(400*HZ)
 115#define IGMP_V2_Router_Present_Timeout		(400*HZ)
 116#define IGMP_Unsolicited_Report_Interval	(10*HZ)
 117#define IGMP_Query_Response_Interval		(10*HZ)
 118#define IGMP_Unsolicited_Report_Count		2
 119
 120
 121#define IGMP_Initial_Report_Delay		(1)
 122
 123/* IGMP_Initial_Report_Delay is not from the IGMP specs!
 124 * The IGMP specs require membership to be reported immediately
 125 * after joining a group, but we delay the first report by a
 126 * small interval. This seems more natural and still does not
 127 * contradict the specs, provided the delay is small enough.
 128 */
 129
 130#define IGMP_V1_SEEN(in_dev) \
 131	(IPV4_DEVCONF_ALL(dev_net(in_dev->dev), FORCE_IGMP_VERSION) == 1 || \
 132	 IN_DEV_CONF_GET((in_dev), FORCE_IGMP_VERSION) == 1 || \
 133	 ((in_dev)->mr_v1_seen && \
 134	  time_before(jiffies, (in_dev)->mr_v1_seen)))
 135#define IGMP_V2_SEEN(in_dev) \
 136	(IPV4_DEVCONF_ALL(dev_net(in_dev->dev), FORCE_IGMP_VERSION) == 2 || \
 137	 IN_DEV_CONF_GET((in_dev), FORCE_IGMP_VERSION) == 2 || \
 138	 ((in_dev)->mr_v2_seen && \
 139	  time_before(jiffies, (in_dev)->mr_v2_seen)))
 140
 141static void igmpv3_add_delrec(struct in_device *in_dev, struct ip_mc_list *im);
 142static void igmpv3_del_delrec(struct in_device *in_dev, __be32 multiaddr);
 143static void igmpv3_clear_delrec(struct in_device *in_dev);
 144static int sf_setstate(struct ip_mc_list *pmc);
 145static void sf_markstate(struct ip_mc_list *pmc);
 146#endif
 147static void ip_mc_clear_src(struct ip_mc_list *pmc);
 148static int ip_mc_add_src(struct in_device *in_dev, __be32 *pmca, int sfmode,
 149			 int sfcount, __be32 *psfsrc, int delta);
 150
 151static void ip_ma_put(struct ip_mc_list *im)
 152{
 153	if (atomic_dec_and_test(&im->refcnt)) {
 154		in_dev_put(im->interface);
 155		kfree_rcu(im, rcu);
 156	}
 157}
 158
/*
 * Walk the mc_list hanging off in_dev, following next_rcu links, with
 * each pointer loaded through rcu_dereference().  pmc is the cursor and
 * is NULL after a full traversal.
 */
 159#define for_each_pmc_rcu(in_dev, pmc)				\
 160	for (pmc = rcu_dereference(in_dev->mc_list);		\
 161	     pmc != NULL;					\
 162	     pmc = rcu_dereference(pmc->next_rcu))
 163
/*
 * Same traversal as for_each_pmc_rcu(), but the pointers are loaded with
 * rtnl_dereference() instead of rcu_dereference().
 */
 164#define for_each_pmc_rtnl(in_dev, pmc)				\
 165	for (pmc = rtnl_dereference(in_dev->mc_list);		\
 166	     pmc != NULL;					\
 167	     pmc = rtnl_dereference(pmc->next_rcu))
 168
 169#ifdef CONFIG_IP_MULTICAST
 170
 171/*
 172 *	Timer management
 173 */
 174
 175static void igmp_stop_timer(struct ip_mc_list *im)
 176{
 177	spin_lock_bh(&im->lock);
 178	if (del_timer(&im->timer))
 179		atomic_dec(&im->refcnt);
 180	im->tm_running = 0;
 181	im->reporter = 0;
 182	im->unsolicit_count = 0;
 183	spin_unlock_bh(&im->lock);
 184}
 185
 186/* It must be called with locked im->lock */
 187static void igmp_start_timer(struct ip_mc_list *im, int max_delay)
 188{
 189	int tv = net_random() % max_delay;
 190
 191	im->tm_running = 1;
 192	if (!mod_timer(&im->timer, jiffies+tv+2))
 193		atomic_inc(&im->refcnt);
 194}
 195
 196static void igmp_gq_start_timer(struct in_device *in_dev)
 197{
 198	int tv = net_random() % in_dev->mr_maxdelay;
 199
 200	in_dev->mr_gq_running = 1;
 201	if (!mod_timer(&in_dev->mr_gq_timer, jiffies+tv+2))
 202		in_dev_hold(in_dev);
 203}
 204
 205static void igmp_ifc_start_timer(struct in_device *in_dev, int delay)
 206{
 207	int tv = net_random() % delay;
 208
 209	if (!mod_timer(&in_dev->mr_ifc_timer, jiffies+tv+2))
 210		in_dev_hold(in_dev);
 211}
 212
 213static void igmp_mod_timer(struct ip_mc_list *im, int max_delay)
 214{
 215	spin_lock_bh(&im->lock);
 216	im->unsolicit_count = 0;
 217	if (del_timer(&im->timer)) {
 218		if ((long)(im->timer.expires-jiffies) < max_delay) {
 219			add_timer(&im->timer);
 220			im->tm_running = 1;
 221			spin_unlock_bh(&im->lock);
 222			return;
 223		}
 224		atomic_dec(&im->refcnt);
 225	}
 226	igmp_start_timer(im, max_delay);
 227	spin_unlock_bh(&im->lock);
 228}
 229
 230
 231/*
 232 *	Send an IGMP report.
 233 */
 234
/*
 * Bytes needed for a report built by igmp_send_report(): the IGMP header
 * plus an IP header carrying 4 bytes of options (the router-alert option).
 */
 235#define IGMP_SIZE (sizeof(struct igmphdr)+sizeof(struct iphdr)+4)
 236
 237
 238static int is_in(struct ip_mc_list *pmc, struct ip_sf_list *psf, int type,
 239	int gdeleted, int sdeleted)
 240{
 241	switch (type) {
 242	case IGMPV3_MODE_IS_INCLUDE:
 243	case IGMPV3_MODE_IS_EXCLUDE:
 244		if (gdeleted || sdeleted)
 245			return 0;
 246		if (!(pmc->gsquery && !psf->sf_gsresp)) {
 247			if (pmc->sfmode == MCAST_INCLUDE)
 248				return 1;
 249			/* don't include if this source is excluded
 250			 * in all filters
 251			 */
 252			if (psf->sf_count[MCAST_INCLUDE])
 253				return type == IGMPV3_MODE_IS_INCLUDE;
 254			return pmc->sfcount[MCAST_EXCLUDE] ==
 255				psf->sf_count[MCAST_EXCLUDE];
 256		}
 257		return 0;
 258	case IGMPV3_CHANGE_TO_INCLUDE:
 259		if (gdeleted || sdeleted)
 260			return 0;
 261		return psf->sf_count[MCAST_INCLUDE] != 0;
 262	case IGMPV3_CHANGE_TO_EXCLUDE:
 263		if (gdeleted || sdeleted)
 264			return 0;
 265		if (pmc->sfcount[MCAST_EXCLUDE] == 0 ||
 266		    psf->sf_count[MCAST_INCLUDE])
 267			return 0;
 268		return pmc->sfcount[MCAST_EXCLUDE] ==
 269			psf->sf_count[MCAST_EXCLUDE];
 270	case IGMPV3_ALLOW_NEW_SOURCES:
 271		if (gdeleted || !psf->sf_crcount)
 272			return 0;
 273		return (pmc->sfmode == MCAST_INCLUDE) ^ sdeleted;
 274	case IGMPV3_BLOCK_OLD_SOURCES:
 275		if (pmc->sfmode == MCAST_INCLUDE)
 276			return gdeleted || (psf->sf_crcount && sdeleted);
 277		return psf->sf_crcount && !gdeleted && !sdeleted;
 278	}
 279	return 0;
 280}
 281
 282static int
 283igmp_scount(struct ip_mc_list *pmc, int type, int gdeleted, int sdeleted)
 284{
 285	struct ip_sf_list *psf;
 286	int scount = 0;
 287
 288	for (psf=pmc->sources; psf; psf=psf->sf_next) {
 289		if (!is_in(pmc, psf, type, gdeleted, sdeleted))
 290			continue;
 291		scount++;
 292	}
 293	return scount;
 294}
 295
/*
 * Size budget of a report skb, kept in the first unsigned int of skb->cb.
 * Written by igmpv3_newpack() and read back through AVAILABLE().
 */
 296#define igmp_skb_size(skb) (*(unsigned int *)((skb)->cb))
 297
 298static struct sk_buff *igmpv3_newpack(struct net_device *dev, int size)
 299{
 300	struct sk_buff *skb;
 301	struct rtable *rt;
 302	struct iphdr *pip;
 303	struct igmpv3_report *pig;
 304	struct net *net = dev_net(dev);
 305	struct flowi4 fl4;
 306	int hlen = LL_RESERVED_SPACE(dev);
 307	int tlen = dev->needed_tailroom;
 308
 309	while (1) {
 310		skb = alloc_skb(size + hlen + tlen,
 311				GFP_ATOMIC | __GFP_NOWARN);
 312		if (skb)
 313			break;
 314		size >>= 1;
 315		if (size < 256)
 316			return NULL;
 317	}
 318	igmp_skb_size(skb) = size;
 319
 320	rt = ip_route_output_ports(net, &fl4, NULL, IGMPV3_ALL_MCR, 0,
 321				   0, 0,
 322				   IPPROTO_IGMP, 0, dev->ifindex);
 323	if (IS_ERR(rt)) {
 324		kfree_skb(skb);
 325		return NULL;
 326	}
 327
 328	skb_dst_set(skb, &rt->dst);
 329	skb->dev = dev;
 330
 331	skb_reserve(skb, hlen);
 332
 333	skb_reset_network_header(skb);
 334	pip = ip_hdr(skb);
 335	skb_put(skb, sizeof(struct iphdr) + 4);
 336
 337	pip->version  = 4;
 338	pip->ihl      = (sizeof(struct iphdr)+4)>>2;
 339	pip->tos      = 0xc0;
 340	pip->frag_off = htons(IP_DF);
 341	pip->ttl      = 1;
 342	pip->daddr    = fl4.daddr;
 343	pip->saddr    = fl4.saddr;
 344	pip->protocol = IPPROTO_IGMP;
 345	pip->tot_len  = 0;	/* filled in later */
 346	ip_select_ident(pip, &rt->dst, NULL);
 347	((u8 *)&pip[1])[0] = IPOPT_RA;
 348	((u8 *)&pip[1])[1] = 4;
 349	((u8 *)&pip[1])[2] = 0;
 350	((u8 *)&pip[1])[3] = 0;
 351
 352	skb->transport_header = skb->network_header + sizeof(struct iphdr) + 4;
 353	skb_put(skb, sizeof(*pig));
 354	pig = igmpv3_report_hdr(skb);
 355	pig->type = IGMPV3_HOST_MEMBERSHIP_REPORT;
 356	pig->resv1 = 0;
 357	pig->csum = 0;
 358	pig->resv2 = 0;
 359	pig->ngrec = 0;
 360	return skb;
 361}
 362
 363static int igmpv3_sendpack(struct sk_buff *skb)
 364{
 365	struct igmphdr *pig = igmp_hdr(skb);
 366	const int igmplen = skb->tail - skb->transport_header;
 367
 368	pig->csum = ip_compute_csum(igmp_hdr(skb), igmplen);
 369
 370	return ip_local_out(skb);
 371}
 372
 373static int grec_size(struct ip_mc_list *pmc, int type, int gdel, int sdel)
 374{
 375	return sizeof(struct igmpv3_grec) + 4*igmp_scount(pmc, type, gdel, sdel);
 376}
 377
 378static struct sk_buff *add_grhead(struct sk_buff *skb, struct ip_mc_list *pmc,
 379	int type, struct igmpv3_grec **ppgr)
 380{
 381	struct net_device *dev = pmc->interface->dev;
 382	struct igmpv3_report *pih;
 383	struct igmpv3_grec *pgr;
 384
 385	if (!skb)
 386		skb = igmpv3_newpack(dev, dev->mtu);
 387	if (!skb)
 388		return NULL;
 389	pgr = (struct igmpv3_grec *)skb_put(skb, sizeof(struct igmpv3_grec));
 390	pgr->grec_type = type;
 391	pgr->grec_auxwords = 0;
 392	pgr->grec_nsrcs = 0;
 393	pgr->grec_mca = pmc->multiaddr;
 394	pih = igmpv3_report_hdr(skb);
 395	pih->ngrec = htons(ntohs(pih->ngrec)+1);
 396	*ppgr = pgr;
 397	return skb;
 398}
 399
/*
 * Room left in a report skb: 0 for a NULL skb; for an skb with a device
 * set, the recorded size budget (igmp_skb_size) minus the bytes already
 * used; otherwise the skb's tailroom.
 */
 400#define AVAILABLE(skb) ((skb) ? ((skb)->dev ? igmp_skb_size(skb) - (skb)->len : \
 401	skb_tailroom(skb)) : 0)
 402
/*
 * Append a group record of the given type for pmc to the report being
 * built in skb, listing every source that is_in() selects.
 *
 * skb may be NULL, in which case a packet is allocated on demand.  When
 * the current packet fills up it is sent with igmpv3_sendpack() and a new
 * one started.  sdeleted selects the pmc->tomb list instead of
 * pmc->sources; gdeleted and sdeleted are also passed on to is_in().
 *
 * Returns the skb currently being filled (possibly a different one than
 * was passed in, possibly NULL).
 */
 403static struct sk_buff *add_grec(struct sk_buff *skb, struct ip_mc_list *pmc,
 404	int type, int gdeleted, int sdeleted)
 405{
 406	struct net_device *dev = pmc->interface->dev;
 407	struct igmpv3_report *pih;
 408	struct igmpv3_grec *pgr = NULL;
 409	struct ip_sf_list *psf, *psf_next, *psf_prev, **psf_list;
 410	int scount, stotal, first, isquery, truncate;
 411
	/* the all-hosts group is never reported */
 412	if (pmc->multiaddr == IGMP_ALL_HOSTS)
 413		return skb;
 414
	/* current-state records are the ones sent in answer to queries */
 415	isquery = type == IGMPV3_MODE_IS_INCLUDE ||
 416		  type == IGMPV3_MODE_IS_EXCLUDE;
	/* exclude-type records are cut short rather than split across packets */
 417	truncate = type == IGMPV3_MODE_IS_EXCLUDE ||
 418		    type == IGMPV3_CHANGE_TO_EXCLUDE;
 419
	/* scount: sources in the current record; stotal: sources emitted overall */
 420	stotal = scount = 0;
 421
 422	psf_list = sdeleted ? &pmc->tomb : &pmc->sources;
 423
 424	if (!*psf_list)
 425		goto empty_source;
 426
 427	pih = skb ? igmpv3_report_hdr(skb) : NULL;
 428
 429	/* EX and TO_EX get a fresh packet, if needed */
 430	if (truncate) {
 431		if (pih && pih->ngrec &&
 432		    AVAILABLE(skb) < grec_size(pmc, type, gdeleted, sdeleted)) {
 433			if (skb)
 434				igmpv3_sendpack(skb);
 435			skb = igmpv3_newpack(dev, dev->mtu);
 436		}
 437	}
	/* first != 0 means the record header has not been written yet */
 438	first = 1;
 439	psf_prev = NULL;
 440	for (psf=*psf_list; psf; psf=psf_next) {
 441		__be32 *psrc;
 442
		/* saved up front because psf may be freed below */
 443		psf_next = psf->sf_next;
 444
 445		if (!is_in(pmc, psf, type, gdeleted, sdeleted)) {
 446			psf_prev = psf;
 447			continue;
 448		}
 449
 450		/* clear marks on query responses */
 451		if (isquery)
 452			psf->sf_gsresp = 0;
 453
		/* need room for one address, plus the record header if still unwritten */
 454		if (AVAILABLE(skb) < sizeof(__be32) +
 455		    first*sizeof(struct igmpv3_grec)) {
 456			if (truncate && !first)
 457				break;	 /* truncate these */
			/* close the record in the full packet, send it, start a new one */
 458			if (pgr)
 459				pgr->grec_nsrcs = htons(scount);
 460			if (skb)
 461				igmpv3_sendpack(skb);
 462			skb = igmpv3_newpack(dev, dev->mtu);
 463			first = 1;
 464			scount = 0;
 465		}
 466		if (first) {
 467			skb = add_grhead(skb, pmc, type, &pgr);
 468			first = 0;
 469		}
 470		if (!skb)
 471			return NULL;
 472		psrc = (__be32 *)skb_put(skb, sizeof(__be32));
 473		*psrc = psf->sf_inaddr;
 474		scount++; stotal++;
		/* allow/block records use up one pending retransmission per source */
 475		if ((type == IGMPV3_ALLOW_NEW_SOURCES ||
 476		     type == IGMPV3_BLOCK_OLD_SOURCES) && psf->sf_crcount) {
 477			psf->sf_crcount--;
			/* a deleted source with nothing left to retransmit is unlinked and freed */
 478			if ((sdeleted || gdeleted) && psf->sf_crcount == 0) {
 479				if (psf_prev)
 480					psf_prev->sf_next = psf->sf_next;
 481				else
 482					*psf_list = psf->sf_next;
 483				kfree(psf);
 484				continue;
 485			}
 486		}
 487		psf_prev = psf;
 488	}
 489
 490empty_source:
	/* nothing was listed: decide whether a header-only record is still needed */
 491	if (!stotal) {
 492		if (type == IGMPV3_ALLOW_NEW_SOURCES ||
 493		    type == IGMPV3_BLOCK_OLD_SOURCES)
 494			return skb;
 495		if (pmc->crcount || isquery) {
 496			/* make sure we have room for group header */
 497			if (skb && AVAILABLE(skb)<sizeof(struct igmpv3_grec)) {
 498				igmpv3_sendpack(skb);
 499				skb = NULL; /* add_grhead will get a new one */
 500			}
 501			skb = add_grhead(skb, pmc, type, &pgr);
 502		}
 503	}
	/* store the source count of the last record written */
 504	if (pgr)
 505		pgr->grec_nsrcs = htons(scount);
 506
 507	if (isquery)
 508		pmc->gsquery = 0;	/* clear query state on report */
 509	return skb;
 510}
 511
 512static int igmpv3_send_report(struct in_device *in_dev, struct ip_mc_list *pmc)
 513{
 514	struct sk_buff *skb = NULL;
 515	int type;
 516
 517	if (!pmc) {
 518		rcu_read_lock();
 519		for_each_pmc_rcu(in_dev, pmc) {
 520			if (pmc->multiaddr == IGMP_ALL_HOSTS)
 521				continue;
 522			spin_lock_bh(&pmc->lock);
 523			if (pmc->sfcount[MCAST_EXCLUDE])
 524				type = IGMPV3_MODE_IS_EXCLUDE;
 525			else
 526				type = IGMPV3_MODE_IS_INCLUDE;
 527			skb = add_grec(skb, pmc, type, 0, 0);
 528			spin_unlock_bh(&pmc->lock);
 529		}
 530		rcu_read_unlock();
 531	} else {
 532		spin_lock_bh(&pmc->lock);
 533		if (pmc->sfcount[MCAST_EXCLUDE])
 534			type = IGMPV3_MODE_IS_EXCLUDE;
 535		else
 536			type = IGMPV3_MODE_IS_INCLUDE;
 537		skb = add_grec(skb, pmc, type, 0, 0);
 538		spin_unlock_bh(&pmc->lock);
 539	}
 540	if (!skb)
 541		return 0;
 542	return igmpv3_sendpack(skb);
 543}
 544
 545/*
 546 * remove zero-count source records from a source filter list
 547 */
 548static void igmpv3_clear_zeros(struct ip_sf_list **ppsf)
 549{
 550	struct ip_sf_list *psf_prev, *psf_next, *psf;
 551
 552	psf_prev = NULL;
 553	for (psf=*ppsf; psf; psf = psf_next) {
 554		psf_next = psf->sf_next;
 555		if (psf->sf_crcount == 0) {
 556			if (psf_prev)
 557				psf_prev->sf_next = psf->sf_next;
 558			else
 559				*ppsf = psf->sf_next;
 560			kfree(psf);
 561		} else
 562			psf_prev = psf;
 563	}
 564}
 565
/*
 * Build and send the pending IGMPv3 change records for in_dev.
 *
 * First pass, under in_dev->mc_tomb_lock: walk the deleted groups on
 * in_dev->mc_tomb, emit their records, and free entries that have nothing
 * left to retransmit.  Second pass, under RCU and each group's lock: emit
 * source-list and filter-mode change records for the live groups.
 * Full packets are sent along the way by add_grec(); whatever is left in
 * the last packet is sent at the end.
 */
 566static void igmpv3_send_cr(struct in_device *in_dev)
 567{
 568	struct ip_mc_list *pmc, *pmc_prev, *pmc_next;
 569	struct sk_buff *skb = NULL;
 570	int type, dtype;
 571
 572	rcu_read_lock();
 573	spin_lock_bh(&in_dev->mc_tomb_lock);
 574
 575	/* deleted MCA's */
 576	pmc_prev = NULL;
 577	for (pmc=in_dev->mc_tomb; pmc; pmc=pmc_next) {
		/* saved up front because pmc may be freed below */
 578		pmc_next = pmc->next;
 579		if (pmc->sfmode == MCAST_INCLUDE) {
			/* block both the live and the already-deleted sources */
 580			type = IGMPV3_BLOCK_OLD_SOURCES;
 581			dtype = IGMPV3_BLOCK_OLD_SOURCES;
 582			skb = add_grec(skb, pmc, type, 1, 0);
 583			skb = add_grec(skb, pmc, dtype, 1, 1);
 584		}
 585		if (pmc->crcount) {
 586			if (pmc->sfmode == MCAST_EXCLUDE) {
 587				type = IGMPV3_CHANGE_TO_INCLUDE;
 588				skb = add_grec(skb, pmc, type, 1, 0);
 589			}
 590			pmc->crcount--;
			/* last retransmission done: purge sources with nothing pending */
 591			if (pmc->crcount == 0) {
 592				igmpv3_clear_zeros(&pmc->tomb);
 593				igmpv3_clear_zeros(&pmc->sources);
 594			}
 595		}
		/* a fully drained tomb entry is unlinked and freed */
 596		if (pmc->crcount == 0 && !pmc->tomb && !pmc->sources) {
 597			if (pmc_prev)
 598				pmc_prev->next = pmc_next;
 599			else
 600				in_dev->mc_tomb = pmc_next;
 601			in_dev_put(pmc->interface);
 602			kfree(pmc);
 603		} else
 604			pmc_prev = pmc;
 605	}
 606	spin_unlock_bh(&in_dev->mc_tomb_lock);
 607
 608	/* change recs */
 609	for_each_pmc_rcu(in_dev, pmc) {
 610		spin_lock_bh(&pmc->lock);
		/* record type for live sources, and the opposite for deleted ones */
 611		if (pmc->sfcount[MCAST_EXCLUDE]) {
 612			type = IGMPV3_BLOCK_OLD_SOURCES;
 613			dtype = IGMPV3_ALLOW_NEW_SOURCES;
 614		} else {
 615			type = IGMPV3_ALLOW_NEW_SOURCES;
 616			dtype = IGMPV3_BLOCK_OLD_SOURCES;
 617		}
 618		skb = add_grec(skb, pmc, type, 0, 0);
 619		skb = add_grec(skb, pmc, dtype, 0, 1);	/* deleted sources */
 620
 621		/* filter mode changes */
 622		if (pmc->crcount) {
 623			if (pmc->sfmode == MCAST_EXCLUDE)
 624				type = IGMPV3_CHANGE_TO_EXCLUDE;
 625			else
 626				type = IGMPV3_CHANGE_TO_INCLUDE;
 627			skb = add_grec(skb, pmc, type, 0, 0);
 628			pmc->crcount--;
 629		}
 630		spin_unlock_bh(&pmc->lock);
 631	}
 632	rcu_read_unlock();
 633
	/* flush whatever is left in the last, partially filled packet */
 634	if (!skb)
 635		return;
 636	(void) igmpv3_sendpack(skb);
 637}
 638
 639static int igmp_send_report(struct in_device *in_dev, struct ip_mc_list *pmc,
 640	int type)
 641{
 642	struct sk_buff *skb;
 643	struct iphdr *iph;
 644	struct igmphdr *ih;
 645	struct rtable *rt;
 646	struct net_device *dev = in_dev->dev;
 647	struct net *net = dev_net(dev);
 648	__be32	group = pmc ? pmc->multiaddr : 0;
 649	struct flowi4 fl4;
 650	__be32	dst;
 651	int hlen, tlen;
 652
 653	if (type == IGMPV3_HOST_MEMBERSHIP_REPORT)
 654		return igmpv3_send_report(in_dev, pmc);
 655	else if (type == IGMP_HOST_LEAVE_MESSAGE)
 656		dst = IGMP_ALL_ROUTER;
 657	else
 658		dst = group;
 659
 660	rt = ip_route_output_ports(net, &fl4, NULL, dst, 0,
 661				   0, 0,
 662				   IPPROTO_IGMP, 0, dev->ifindex);
 663	if (IS_ERR(rt))
 664		return -1;
 665
 666	hlen = LL_RESERVED_SPACE(dev);
 667	tlen = dev->needed_tailroom;
 668	skb = alloc_skb(IGMP_SIZE + hlen + tlen, GFP_ATOMIC);
 669	if (skb == NULL) {
 670		ip_rt_put(rt);
 671		return -1;
 672	}
 673
 674	skb_dst_set(skb, &rt->dst);
 675
 676	skb_reserve(skb, hlen);
 677
 678	skb_reset_network_header(skb);
 679	iph = ip_hdr(skb);
 680	skb_put(skb, sizeof(struct iphdr) + 4);
 681
 682	iph->version  = 4;
 683	iph->ihl      = (sizeof(struct iphdr)+4)>>2;
 684	iph->tos      = 0xc0;
 685	iph->frag_off = htons(IP_DF);
 686	iph->ttl      = 1;
 687	iph->daddr    = dst;
 688	iph->saddr    = fl4.saddr;
 689	iph->protocol = IPPROTO_IGMP;
 690	ip_select_ident(iph, &rt->dst, NULL);
 691	((u8 *)&iph[1])[0] = IPOPT_RA;
 692	((u8 *)&iph[1])[1] = 4;
 693	((u8 *)&iph[1])[2] = 0;
 694	((u8 *)&iph[1])[3] = 0;
 695
 696	ih = (struct igmphdr *)skb_put(skb, sizeof(struct igmphdr));
 697	ih->type = type;
 698	ih->code = 0;
 699	ih->csum = 0;
 700	ih->group = group;
 701	ih->csum = ip_compute_csum((void *)ih, sizeof(struct igmphdr));
 702
 703	return ip_local_out(skb);
 704}
 705
 706static void igmp_gq_timer_expire(unsigned long data)
 707{
 708	struct in_device *in_dev = (struct in_device *)data;
 709
 710	in_dev->mr_gq_running = 0;
 711	igmpv3_send_report(in_dev, NULL);
 712	__in_dev_put(in_dev);
 713}
 714
 715static void igmp_ifc_timer_expire(unsigned long data)
 716{
 717	struct in_device *in_dev = (struct in_device *)data;
 718
 719	igmpv3_send_cr(in_dev);
 720	if (in_dev->mr_ifc_count) {
 721		in_dev->mr_ifc_count--;
 722		igmp_ifc_start_timer(in_dev, IGMP_Unsolicited_Report_Interval);
 723	}
 724	__in_dev_put(in_dev);
 725}
 726
 727static void igmp_ifc_event(struct in_device *in_dev)
 728{
 729	if (IGMP_V1_SEEN(in_dev) || IGMP_V2_SEEN(in_dev))
 730		return;
 731	in_dev->mr_ifc_count = in_dev->mr_qrv ? in_dev->mr_qrv :
 732		IGMP_Unsolicited_Report_Count;
 733	igmp_ifc_start_timer(in_dev, 1);
 734}
 735
 736
 737static void igmp_timer_expire(unsigned long data)
 738{
 739	struct ip_mc_list *im=(struct ip_mc_list *)data;
 740	struct in_device *in_dev = im->interface;
 741
 742	spin_lock(&im->lock);
 743	im->tm_running = 0;
 744
 745	if (im->unsolicit_count) {
 746		im->unsolicit_count--;
 747		igmp_start_timer(im, IGMP_Unsolicited_Report_Interval);
 748	}
 749	im->reporter = 1;
 750	spin_unlock(&im->lock);
 751
 752	if (IGMP_V1_SEEN(in_dev))
 753		igmp_send_report(in_dev, im, IGMP_HOST_MEMBERSHIP_REPORT);
 754	else if (IGMP_V2_SEEN(in_dev))
 755		igmp_send_report(in_dev, im, IGMPV2_HOST_MEMBERSHIP_REPORT);
 756	else
 757		igmp_send_report(in_dev, im, IGMPV3_HOST_MEMBERSHIP_REPORT);
 758
 759	ip_ma_put(im);
 760}
 761
 762/* mark EXCLUDE-mode sources */
 763static int igmp_xmarksources(struct ip_mc_list *pmc, int nsrcs, __be32 *srcs)
 764{
 765	struct ip_sf_list *psf;
 766	int i, scount;
 767
 768	scount = 0;
 769	for (psf=pmc->sources; psf; psf=psf->sf_next) {
 770		if (scount == nsrcs)
 771			break;
 772		for (i=0; i<nsrcs; i++) {
 773			/* skip inactive filters */
 774			if (psf->sf_count[MCAST_INCLUDE] ||
 775			    pmc->sfcount[MCAST_EXCLUDE] !=
 776			    psf->sf_count[MCAST_EXCLUDE])
 777				break;
 778			if (srcs[i] == psf->sf_inaddr) {
 779				scount++;
 780				break;
 781			}
 782		}
 783	}
 784	pmc->gsquery = 0;
 785	if (scount == nsrcs)	/* all sources excluded */
 786		return 0;
 787	return 1;
 788}
 789
 790static int igmp_marksources(struct ip_mc_list *pmc, int nsrcs, __be32 *srcs)
 791{
 792	struct ip_sf_list *psf;
 793	int i, scount;
 794
 795	if (pmc->sfmode == MCAST_EXCLUDE)
 796		return igmp_xmarksources(pmc, nsrcs, srcs);
 797
 798	/* mark INCLUDE-mode sources */
 799	scount = 0;
 800	for (psf=pmc->sources; psf; psf=psf->sf_next) {
 801		if (scount == nsrcs)
 802			break;
 803		for (i=0; i<nsrcs; i++)
 804			if (srcs[i] == psf->sf_inaddr) {
 805				psf->sf_gsresp = 1;
 806				scount++;
 807				break;
 808			}
 809	}
 810	if (!scount) {
 811		pmc->gsquery = 0;
 812		return 0;
 813	}
 814	pmc->gsquery = 1;
 815	return 1;
 816}
 817
 818static void igmp_heard_report(struct in_device *in_dev, __be32 group)
 819{
 820	struct ip_mc_list *im;
 821
 822	/* Timers are only set for non-local groups */
 823
 824	if (group == IGMP_ALL_HOSTS)
 825		return;
 826
 827	rcu_read_lock();
 828	for_each_pmc_rcu(in_dev, im) {
 829		if (im->multiaddr == group) {
 830			igmp_stop_timer(im);
 831			break;
 832		}
 833	}
 834	rcu_read_unlock();
 835}
 836
 837static void igmp_heard_query(struct in_device *in_dev, struct sk_buff *skb,
 838	int len)
 839{
 840	struct igmphdr 		*ih = igmp_hdr(skb);
 841	struct igmpv3_query *ih3 = igmpv3_query_hdr(skb);
 842	struct ip_mc_list	*im;
 843	__be32			group = ih->group;
 844	int			max_delay;
 845	int			mark = 0;
 846
 847
 848	if (len == 8) {
 849		if (ih->code == 0) {
 850			/* Alas, old v1 router presents here. */
 851
 852			max_delay = IGMP_Query_Response_Interval;
 853			in_dev->mr_v1_seen = jiffies +
 854				IGMP_V1_Router_Present_Timeout;
 855			group = 0;
 856		} else {
 857			/* v2 router present */
 858			max_delay = ih->code*(HZ/IGMP_TIMER_SCALE);
 859			in_dev->mr_v2_seen = jiffies +
 860				IGMP_V2_Router_Present_Timeout;
 861		}
 862		/* cancel the interface change timer */
 863		in_dev->mr_ifc_count = 0;
 864		if (del_timer(&in_dev->mr_ifc_timer))
 865			__in_dev_put(in_dev);
 866		/* clear deleted report items */
 867		igmpv3_clear_delrec(in_dev);
 868	} else if (len < 12) {
 869		return;	/* ignore bogus packet; freed by caller */
 870	} else if (IGMP_V1_SEEN(in_dev)) {
 871		/* This is a v3 query with v1 queriers present */
 872		max_delay = IGMP_Query_Response_Interval;
 873		group = 0;
 874	} else if (IGMP_V2_SEEN(in_dev)) {
 875		/* this is a v3 query with v2 queriers present;
 876		 * Interpretation of the max_delay code is problematic here.
 877		 * A real v2 host would use ih_code directly, while v3 has a
 878		 * different encoding. We use the v3 encoding as more likely
 879		 * to be intended in a v3 query.
 880		 */
 881		max_delay = IGMPV3_MRC(ih3->code)*(HZ/IGMP_TIMER_SCALE);
 882		if (!max_delay)
 883			max_delay = 1;	/* can't mod w/ 0 */
 884	} else { /* v3 */
 885		if (!pskb_may_pull(skb, sizeof(struct igmpv3_query)))
 886			return;
 887
 888		ih3 = igmpv3_query_hdr(skb);
 889		if (ih3->nsrcs) {
 890			if (!pskb_may_pull(skb, sizeof(struct igmpv3_query)
 891					   + ntohs(ih3->nsrcs)*sizeof(__be32)))
 892				return;
 893			ih3 = igmpv3_query_hdr(skb);
 894		}
 895
 896		max_delay = IGMPV3_MRC(ih3->code)*(HZ/IGMP_TIMER_SCALE);
 897		if (!max_delay)
 898			max_delay = 1;	/* can't mod w/ 0 */
 899		in_dev->mr_maxdelay = max_delay;
 900		if (ih3->qrv)
 901			in_dev->mr_qrv = ih3->qrv;
 902		if (!group) { /* general query */
 903			if (ih3->nsrcs)
 904				return;	/* no sources allowed */
 905			igmp_gq_start_timer(in_dev);
 906			return;
 907		}
 908		/* mark sources to include, if group & source-specific */
 909		mark = ih3->nsrcs != 0;
 910	}
 911
 912	/*
 913	 * - Start the timers in all of our membership records
 914	 *   that the query applies to for the interface on
 915	 *   which the query arrived excl. those that belong
 916	 *   to a "local" group (224.0.0.X)
 917	 * - For timers already running check if they need to
 918	 *   be reset.
 919	 * - Use the igmp->igmp_code field as the maximum
 920	 *   delay possible
 921	 */
 922	rcu_read_lock();
 923	for_each_pmc_rcu(in_dev, im) {
 924		int changed;
 925
 926		if (group && group != im->multiaddr)
 927			continue;
 928		if (im->multiaddr == IGMP_ALL_HOSTS)
 929			continue;
 930		spin_lock_bh(&im->lock);
 931		if (im->tm_running)
 932			im->gsquery = im->gsquery && mark;
 933		else
 934			im->gsquery = mark;
 935		changed = !im->gsquery ||
 936			igmp_marksources(im, ntohs(ih3->nsrcs), ih3->srcs);
 937		spin_unlock_bh(&im->lock);
 938		if (changed)
 939			igmp_mod_timer(im, max_delay);
 940	}
 941	rcu_read_unlock();
 942}
 943
 944/* called in rcu_read_lock() section */
 945int igmp_rcv(struct sk_buff *skb)
 946{
 947	/* This basically follows the spec line by line -- see RFC1112 */
 948	struct igmphdr *ih;
 949	struct in_device *in_dev = __in_dev_get_rcu(skb->dev);
 950	int len = skb->len;
 951
 952	if (in_dev == NULL)
 953		goto drop;
 954
 955	if (!pskb_may_pull(skb, sizeof(struct igmphdr)))
 956		goto drop;
 957
 958	switch (skb->ip_summed) {
 959	case CHECKSUM_COMPLETE:
 960		if (!csum_fold(skb->csum))
 961			break;
 962		/* fall through */
 963	case CHECKSUM_NONE:
 964		skb->csum = 0;
 965		if (__skb_checksum_complete(skb))
 966			goto drop;
 967	}
 968
 969	ih = igmp_hdr(skb);
 970	switch (ih->type) {
 971	case IGMP_HOST_MEMBERSHIP_QUERY:
 972		igmp_heard_query(in_dev, skb, len);
 973		break;
 974	case IGMP_HOST_MEMBERSHIP_REPORT:
 975	case IGMPV2_HOST_MEMBERSHIP_REPORT:
 976		/* Is it our report looped back? */
 977		if (rt_is_output_route(skb_rtable(skb)))
 978			break;
 979		/* don't rely on MC router hearing unicast reports */
 980		if (skb->pkt_type == PACKET_MULTICAST ||
 981		    skb->pkt_type == PACKET_BROADCAST)
 982			igmp_heard_report(in_dev, ih->group);
 983		break;
 984	case IGMP_PIM:
 985#ifdef CONFIG_IP_PIMSM_V1
 986		return pim_rcv_v1(skb);
 987#endif
 988	case IGMPV3_HOST_MEMBERSHIP_REPORT:
 989	case IGMP_DVMRP:
 990	case IGMP_TRACE:
 991	case IGMP_HOST_LEAVE_MESSAGE:
 992	case IGMP_MTRACE:
 993	case IGMP_MTRACE_RESP:
 994		break;
 995	default:
 996		break;
 997	}
 998
 999drop:
1000	kfree_skb(skb);
1001	return 0;
1002}
1003
1004#endif
1005
1006
1007/*
1008 *	Add a filter to a device
1009 */
1010
1011static void ip_mc_filter_add(struct in_device *in_dev, __be32 addr)
1012{
1013	char buf[MAX_ADDR_LEN];
1014	struct net_device *dev = in_dev->dev;
1015
1016	/* Checking for IFF_MULTICAST here is WRONG-WRONG-WRONG.
1017	   We will get multicast token leakage, when IFF_MULTICAST
1018	   is changed. This check should be done in ndo_set_rx_mode
1019	   routine. Something sort of:
1020	   if (dev->mc_list && dev->flags&IFF_MULTICAST) { do it; }
1021	   --ANK
1022	   */
1023	if (arp_mc_map(addr, buf, dev, 0) == 0)
1024		dev_mc_add(dev, buf);
1025}
1026
1027/*
1028 *	Remove a filter from a device
1029 */
1030
1031static void ip_mc_filter_del(struct in_device *in_dev, __be32 addr)
1032{
1033	char buf[MAX_ADDR_LEN];
1034	struct net_device *dev = in_dev->dev;
1035
1036	if (arp_mc_map(addr, buf, dev, 0) == 0)
1037		dev_mc_del(dev, buf);
1038}
1039
1040#ifdef CONFIG_IP_MULTICAST
1041/*
1042 * deleted ip_mc_list manipulation
1043 */
1044static void igmpv3_add_delrec(struct in_device *in_dev, struct ip_mc_list *im)
1045{
1046	struct ip_mc_list *pmc;
1047
1048	/* this is an "ip_mc_list" for convenience; only the fields below
1049	 * are actually used. In particular, the refcnt and users are not
1050	 * used for management of the delete list. Using the same structure
1051	 * for deleted items allows change reports to use common code with
1052	 * non-deleted or query-response MCA's.
1053	 */
1054	pmc = kzalloc(sizeof(*pmc), GFP_KERNEL);
1055	if (!pmc)
1056		return;
1057	spin_lock_bh(&im->lock);
1058	pmc->interface = im->interface;
1059	in_dev_hold(in_dev);
1060	pmc->multiaddr = im->multiaddr;
1061	pmc->crcount = in_dev->mr_qrv ? in_dev->mr_qrv :
1062		IGMP_Unsolicited_Report_Count;
1063	pmc->sfmode = im->sfmode;
1064	if (pmc->sfmode == MCAST_INCLUDE) {
1065		struct ip_sf_list *psf;
1066
1067		pmc->tomb = im->tomb;
1068		pmc->sources = im->sources;
1069		im->tomb = im->sources = NULL;
1070		for (psf=pmc->sources; psf; psf=psf->sf_next)
1071			psf->sf_crcount = pmc->crcount;
1072	}
1073	spin_unlock_bh(&im->lock);
1074
1075	spin_lock_bh(&in_dev->mc_tomb_lock);
1076	pmc->next = in_dev->mc_tomb;
1077	in_dev->mc_tomb = pmc;
1078	spin_unlock_bh(&in_dev->mc_tomb_lock);
1079}
1080
1081static void igmpv3_del_delrec(struct in_device *in_dev, __be32 multiaddr)
1082{
1083	struct ip_mc_list *pmc, *pmc_prev;
1084	struct ip_sf_list *psf, *psf_next;
1085
1086	spin_lock_bh(&in_dev->mc_tomb_lock);
1087	pmc_prev = NULL;
1088	for (pmc=in_dev->mc_tomb; pmc; pmc=pmc->next) {
1089		if (pmc->multiaddr == multiaddr)
1090			break;
1091		pmc_prev = pmc;
1092	}
1093	if (pmc) {
1094		if (pmc_prev)
1095			pmc_prev->next = pmc->next;
1096		else
1097			in_dev->mc_tomb = pmc->next;
1098	}
1099	spin_unlock_bh(&in_dev->mc_tomb_lock);
1100	if (pmc) {
1101		for (psf=pmc->tomb; psf; psf=psf_next) {
1102			psf_next = psf->sf_next;
1103			kfree(psf);
1104		}
1105		in_dev_put(pmc->interface);
1106		kfree(pmc);
1107	}
1108}
1109
1110static void igmpv3_clear_delrec(struct in_device *in_dev)
1111{
1112	struct ip_mc_list *pmc, *nextpmc;
1113
1114	spin_lock_bh(&in_dev->mc_tomb_lock);
1115	pmc = in_dev->mc_tomb;
1116	in_dev->mc_tomb = NULL;
1117	spin_unlock_bh(&in_dev->mc_tomb_lock);
1118
1119	for (; pmc; pmc = nextpmc) {
1120		nextpmc = pmc->next;
1121		ip_mc_clear_src(pmc);
1122		in_dev_put(pmc->interface);
1123		kfree(pmc);
1124	}
1125	/* clear dead sources, too */
1126	rcu_read_lock();
1127	for_each_pmc_rcu(in_dev, pmc) {
1128		struct ip_sf_list *psf, *psf_next;
1129
1130		spin_lock_bh(&pmc->lock);
1131		psf = pmc->tomb;
1132		pmc->tomb = NULL;
1133		spin_unlock_bh(&pmc->lock);
1134		for (; psf; psf=psf_next) {
1135			psf_next = psf->sf_next;
1136			kfree(psf);
1137		}
1138	}
1139	rcu_read_unlock();
1140}
1141#endif
1142
1143static void igmp_group_dropped(struct ip_mc_list *im)
1144{
1145	struct in_device *in_dev = im->interface;
1146#ifdef CONFIG_IP_MULTICAST
1147	int reporter;
1148#endif
1149
1150	if (im->loaded) {
1151		im->loaded = 0;
1152		ip_mc_filter_del(in_dev, im->multiaddr);
1153	}
1154
1155#ifdef CONFIG_IP_MULTICAST
1156	if (im->multiaddr == IGMP_ALL_HOSTS)
1157		return;
1158
1159	reporter = im->reporter;
1160	igmp_stop_timer(im);
1161
1162	if (!in_dev->dead) {
1163		if (IGMP_V1_SEEN(in_dev))
1164			return;
1165		if (IGMP_V2_SEEN(in_dev)) {
1166			if (reporter)
1167				igmp_send_report(in_dev, im, IGMP_HOST_LEAVE_MESSAGE);
1168			return;
1169		}
1170		/* IGMPv3 */
1171		igmpv3_add_delrec(in_dev, im);
1172
1173		igmp_ifc_event(in_dev);
1174	}
1175#endif
1176}
1177
1178static void igmp_group_added(struct ip_mc_list *im)
1179{
1180	struct in_device *in_dev = im->interface;
1181
1182	if (im->loaded == 0) {
1183		im->loaded = 1;
1184		ip_mc_filter_add(in_dev, im->multiaddr);
1185	}
1186
1187#ifdef CONFIG_IP_MULTICAST
1188	if (im->multiaddr == IGMP_ALL_HOSTS)
1189		return;
1190
1191	if (in_dev->dead)
1192		return;
1193	if (IGMP_V1_SEEN(in_dev) || IGMP_V2_SEEN(in_dev)) {
1194		spin_lock_bh(&im->lock);
1195		igmp_start_timer(im, IGMP_Initial_Report_Delay);
1196		spin_unlock_bh(&im->lock);
1197		return;
1198	}
1199	/* else, v3 */
1200
1201	im->crcount = in_dev->mr_qrv ? in_dev->mr_qrv :
1202		IGMP_Unsolicited_Report_Count;
1203	igmp_ifc_event(in_dev);
1204#endif
1205}
1206
1207
1208/*
1209 *	Multicast list managers
1210 */
1211
1212
1213/*
1214 *	A socket has joined a multicast group on device dev.
1215 */
1216
1217void ip_mc_inc_group(struct in_device *in_dev, __be32 addr)
1218{
1219	struct ip_mc_list *im;
1220
1221	ASSERT_RTNL();
1222
1223	for_each_pmc_rtnl(in_dev, im) {
1224		if (im->multiaddr == addr) {
1225			im->users++;
1226			ip_mc_add_src(in_dev, &addr, MCAST_EXCLUDE, 0, NULL, 0);
1227			goto out;
1228		}
1229	}
1230
1231	im = kzalloc(sizeof(*im), GFP_KERNEL);
1232	if (!im)
1233		goto out;
1234
1235	im->users = 1;
1236	im->interface = in_dev;
1237	in_dev_hold(in_dev);
1238	im->multiaddr = addr;
1239	/* initial mode is (EX, empty) */
1240	im->sfmode = MCAST_EXCLUDE;
1241	im->sfcount[MCAST_EXCLUDE] = 1;
1242	atomic_set(&im->refcnt, 1);
1243	spin_lock_init(&im->lock);
1244#ifdef CONFIG_IP_MULTICAST
1245	setup_timer(&im->timer, &igmp_timer_expire, (unsigned long)im);
1246	im->unsolicit_count = IGMP_Unsolicited_Report_Count;
1247#endif
1248
1249	im->next_rcu = in_dev->mc_list;
1250	in_dev->mc_count++;
1251	rcu_assign_pointer(in_dev->mc_list, im);
1252
1253#ifdef CONFIG_IP_MULTICAST
1254	igmpv3_del_delrec(in_dev, im->multiaddr);
1255#endif
1256	igmp_group_added(im);
1257	if (!in_dev->dead)
1258		ip_rt_multicast_event(in_dev);
1259out:
1260	return;
1261}
1262EXPORT_SYMBOL(ip_mc_inc_group);
1263
/*
 *	Resend IGMP JOIN report; used for bonding.
 *	Called with rcu_read_lock()
 *
 *	One report is sent for every group on @in_dev except IGMP_ALL_HOSTS.
 *	Without CONFIG_IP_MULTICAST this is a no-op.
 */
void ip_mc_rejoin_groups(struct in_device *in_dev)
{
#ifdef CONFIG_IP_MULTICAST
	struct ip_mc_list *grp;
	int type;

	for_each_pmc_rcu(in_dev, grp) {
		if (grp->multiaddr == IGMP_ALL_HOSTS)
			continue;

		/*
		 * A failover is happening and switches must be notified
		 * immediately: send now, in the format matching the querier
		 * version currently seen.
		 */
		type = IGMPV3_HOST_MEMBERSHIP_REPORT;
		if (IGMP_V1_SEEN(in_dev))
			type = IGMP_HOST_MEMBERSHIP_REPORT;
		else if (IGMP_V2_SEEN(in_dev))
			type = IGMPV2_HOST_MEMBERSHIP_REPORT;

		igmp_send_report(in_dev, grp, type);
	}
#endif
}
EXPORT_SYMBOL(ip_mc_rejoin_groups);
1292
1293/*
1294 *	A socket has left a multicast group on device dev
1295 */
1296
1297void ip_mc_dec_group(struct in_device *in_dev, __be32 addr)
1298{
1299	struct ip_mc_list *i;
1300	struct ip_mc_list __rcu **ip;
1301
1302	ASSERT_RTNL();
1303
1304	for (ip = &in_dev->mc_list;
1305	     (i = rtnl_dereference(*ip)) != NULL;
1306	     ip = &i->next_rcu) {
1307		if (i->multiaddr == addr) {
1308			if (--i->users == 0) {
1309				*ip = i->next_rcu;
1310				in_dev->mc_count--;
1311				igmp_group_dropped(i);
1312				ip_mc_clear_src(i);
1313
1314				if (!in_dev->dead)
1315					ip_rt_multicast_event(in_dev);
1316
1317				ip_ma_put(i);
1318				return;
1319			}
1320			break;
1321		}
1322	}
1323}
1324EXPORT_SYMBOL(ip_mc_dec_group);
1325
1326/* Device changing type */
1327
1328void ip_mc_unmap(struct in_device *in_dev)
1329{
1330	struct ip_mc_list *pmc;
1331
1332	ASSERT_RTNL();
1333
1334	for_each_pmc_rtnl(in_dev, pmc)
1335		igmp_group_dropped(pmc);
1336}
1337
1338void ip_mc_remap(struct in_device *in_dev)
1339{
1340	struct ip_mc_list *pmc;
1341
1342	ASSERT_RTNL();
1343
1344	for_each_pmc_rtnl(in_dev, pmc)
1345		igmp_group_added(pmc);
1346}
1347
1348/* Device going down */
1349
1350void ip_mc_down(struct in_device *in_dev)
1351{
1352	struct ip_mc_list *pmc;
1353
1354	ASSERT_RTNL();
1355
1356	for_each_pmc_rtnl(in_dev, pmc)
1357		igmp_group_dropped(pmc);
1358
1359#ifdef CONFIG_IP_MULTICAST
1360	in_dev->mr_ifc_count = 0;
1361	if (del_timer(&in_dev->mr_ifc_timer))
1362		__in_dev_put(in_dev);
1363	in_dev->mr_gq_running = 0;
1364	if (del_timer(&in_dev->mr_gq_timer))
1365		__in_dev_put(in_dev);
1366	igmpv3_clear_delrec(in_dev);
1367#endif
1368
1369	ip_mc_dec_group(in_dev, IGMP_ALL_HOSTS);
1370}
1371
1372void ip_mc_init_dev(struct in_device *in_dev)
1373{
1374	ASSERT_RTNL();
1375
1376	in_dev->mc_tomb = NULL;
1377#ifdef CONFIG_IP_MULTICAST
1378	in_dev->mr_gq_running = 0;
1379	setup_timer(&in_dev->mr_gq_timer, igmp_gq_timer_expire,
1380			(unsigned long)in_dev);
1381	in_dev->mr_ifc_count = 0;
1382	in_dev->mc_count     = 0;
1383	setup_timer(&in_dev->mr_ifc_timer, igmp_ifc_timer_expire,
1384			(unsigned long)in_dev);
1385	in_dev->mr_qrv = IGMP_Unsolicited_Report_Count;
1386#endif
1387
1388	spin_lock_init(&in_dev->mc_tomb_lock);
1389}
1390
1391/* Device going up */
1392
1393void ip_mc_up(struct in_device *in_dev)
1394{
1395	struct ip_mc_list *pmc;
1396
1397	ASSERT_RTNL();
1398
1399	ip_mc_inc_group(in_dev, IGMP_ALL_HOSTS);
1400
1401	for_each_pmc_rtnl(in_dev, pmc)
1402		igmp_group_added(pmc);
1403}
1404
1405/*
1406 *	Device is about to be destroyed: clean up.
1407 */
1408
1409void ip_mc_destroy_dev(struct in_device *in_dev)
1410{
1411	struct ip_mc_list *i;
1412
1413	ASSERT_RTNL();
1414
1415	/* Deactivate timers */
1416	ip_mc_down(in_dev);
1417
1418	while ((i = rtnl_dereference(in_dev->mc_list)) != NULL) {
1419		in_dev->mc_list = i->next_rcu;
1420		in_dev->mc_count--;
1421
1422		/* We've dropped the groups in ip_mc_down already */
1423		ip_mc_clear_src(i);
1424		ip_ma_put(i);
1425	}
1426}
1427
1428/* RTNL is locked */
1429static struct in_device *ip_mc_find_dev(struct net *net, struct ip_mreqn *imr)
1430{
1431	struct net_device *dev = NULL;
1432	struct in_device *idev = NULL;
1433
1434	if (imr->imr_ifindex) {
1435		idev = inetdev_by_index(net, imr->imr_ifindex);
1436		return idev;
1437	}
1438	if (imr->imr_address.s_addr) {
1439		dev = __ip_dev_find(net, imr->imr_address.s_addr, false);
1440		if (!dev)
1441			return NULL;
1442	}
1443
1444	if (!dev) {
1445		struct rtable *rt = ip_route_output(net,
1446						    imr->imr_multiaddr.s_addr,
1447						    0, 0, 0);
1448		if (!IS_ERR(rt)) {
1449			dev = rt->dst.dev;
1450			ip_rt_put(rt);
1451		}
1452	}
1453	if (dev) {
1454		imr->imr_ifindex = dev->ifindex;
1455		idev = __in_dev_get_rtnl(dev);
1456	}
1457	return idev;
1458}
1459
/*
 *	Limits applied when sockets join groups and set source filters:
 *	sysctl_igmp_max_memberships bounds the number of entries on a
 *	socket's membership list (checked in ip_mc_join_group()), and
 *	sysctl_igmp_max_msf bounds the length of a socket's source list
 *	(checked in ip_mc_source()).
 */
int sysctl_igmp_max_memberships __read_mostly = IP_MAX_MEMBERSHIPS;
int sysctl_igmp_max_msf __read_mostly = IP_MAX_MSF;
1465
1466
1467static int ip_mc_del1_src(struct ip_mc_list *pmc, int sfmode,
1468	__be32 *psfsrc)
1469{
1470	struct ip_sf_list *psf, *psf_prev;
1471	int rv = 0;
1472
1473	psf_prev = NULL;
1474	for (psf=pmc->sources; psf; psf=psf->sf_next) {
1475		if (psf->sf_inaddr == *psfsrc)
1476			break;
1477		psf_prev = psf;
1478	}
1479	if (!psf || psf->sf_count[sfmode] == 0) {
1480		/* source filter not found, or count wrong =>  bug */
1481		return -ESRCH;
1482	}
1483	psf->sf_count[sfmode]--;
1484	if (psf->sf_count[sfmode] == 0) {
1485		ip_rt_multicast_event(pmc->interface);
1486	}
1487	if (!psf->sf_count[MCAST_INCLUDE] && !psf->sf_count[MCAST_EXCLUDE]) {
1488#ifdef CONFIG_IP_MULTICAST
1489		struct in_device *in_dev = pmc->interface;
1490#endif
1491
1492		/* no more filters for this source */
1493		if (psf_prev)
1494			psf_prev->sf_next = psf->sf_next;
1495		else
1496			pmc->sources = psf->sf_next;
1497#ifdef CONFIG_IP_MULTICAST
1498		if (psf->sf_oldin &&
1499		    !IGMP_V1_SEEN(in_dev) && !IGMP_V2_SEEN(in_dev)) {
1500			psf->sf_crcount = in_dev->mr_qrv ? in_dev->mr_qrv :
1501				IGMP_Unsolicited_Report_Count;
1502			psf->sf_next = pmc->tomb;
1503			pmc->tomb = psf;
1504			rv = 1;
1505		} else
1506#endif
1507			kfree(psf);
1508	}
1509	return rv;
1510}
1511
/*
 * Without CONFIG_IP_MULTICAST, make igmp_ifc_event() expand to an empty
 * statement for the code that follows.
 * NOTE(review): presumably the real function is not built in that
 * configuration -- confirm against the #ifdef around its definition.
 */
#ifndef CONFIG_IP_MULTICAST
#define igmp_ifc_event(x)	do { } while (0)
#endif
1515
1516static int ip_mc_del_src(struct in_device *in_dev, __be32 *pmca, int sfmode,
1517			 int sfcount, __be32 *psfsrc, int delta)
1518{
1519	struct ip_mc_list *pmc;
1520	int	changerec = 0;
1521	int	i, err;
1522
1523	if (!in_dev)
1524		return -ENODEV;
1525	rcu_read_lock();
1526	for_each_pmc_rcu(in_dev, pmc) {
1527		if (*pmca == pmc->multiaddr)
1528			break;
1529	}
1530	if (!pmc) {
1531		/* MCA not found?? bug */
1532		rcu_read_unlock();
1533		return -ESRCH;
1534	}
1535	spin_lock_bh(&pmc->lock);
1536	rcu_read_unlock();
1537#ifdef CONFIG_IP_MULTICAST
1538	sf_markstate(pmc);
1539#endif
1540	if (!delta) {
1541		err = -EINVAL;
1542		if (!pmc->sfcount[sfmode])
1543			goto out_unlock;
1544		pmc->sfcount[sfmode]--;
1545	}
1546	err = 0;
1547	for (i=0; i<sfcount; i++) {
1548		int rv = ip_mc_del1_src(pmc, sfmode, &psfsrc[i]);
1549
1550		changerec |= rv > 0;
1551		if (!err && rv < 0)
1552			err = rv;
1553	}
1554	if (pmc->sfmode == MCAST_EXCLUDE &&
1555	    pmc->sfcount[MCAST_EXCLUDE] == 0 &&
1556	    pmc->sfcount[MCAST_INCLUDE]) {
1557#ifdef CONFIG_IP_MULTICAST
1558		struct ip_sf_list *psf;
1559#endif
1560
1561		/* filter mode change */
1562		pmc->sfmode = MCAST_INCLUDE;
1563#ifdef CONFIG_IP_MULTICAST
1564		pmc->crcount = in_dev->mr_qrv ? in_dev->mr_qrv :
1565			IGMP_Unsolicited_Report_Count;
1566		in_dev->mr_ifc_count = pmc->crcount;
1567		for (psf=pmc->sources; psf; psf = psf->sf_next)
1568			psf->sf_crcount = 0;
1569		igmp_ifc_event(pmc->interface);
1570	} else if (sf_setstate(pmc) || changerec) {
1571		igmp_ifc_event(pmc->interface);
1572#endif
1573	}
1574out_unlock:
1575	spin_unlock_bh(&pmc->lock);
1576	return err;
1577}
1578
1579/*
1580 * Add multicast single-source filter to the interface list
1581 */
1582static int ip_mc_add1_src(struct ip_mc_list *pmc, int sfmode,
1583	__be32 *psfsrc)
1584{
1585	struct ip_sf_list *psf, *psf_prev;
1586
1587	psf_prev = NULL;
1588	for (psf=pmc->sources; psf; psf=psf->sf_next) {
1589		if (psf->sf_inaddr == *psfsrc)
1590			break;
1591		psf_prev = psf;
1592	}
1593	if (!psf) {
1594		psf = kzalloc(sizeof(*psf), GFP_ATOMIC);
1595		if (!psf)
1596			return -ENOBUFS;
1597		psf->sf_inaddr = *psfsrc;
1598		if (psf_prev) {
1599			psf_prev->sf_next = psf;
1600		} else
1601			pmc->sources = psf;
1602	}
1603	psf->sf_count[sfmode]++;
1604	if (psf->sf_count[sfmode] == 1) {
1605		ip_rt_multicast_event(pmc->interface);
1606	}
1607	return 0;
1608}
1609
1610#ifdef CONFIG_IP_MULTICAST
1611static void sf_markstate(struct ip_mc_list *pmc)
1612{
1613	struct ip_sf_list *psf;
1614	int mca_xcount = pmc->sfcount[MCAST_EXCLUDE];
1615
1616	for (psf=pmc->sources; psf; psf=psf->sf_next)
1617		if (pmc->sfcount[MCAST_EXCLUDE]) {
1618			psf->sf_oldin = mca_xcount ==
1619				psf->sf_count[MCAST_EXCLUDE] &&
1620				!psf->sf_count[MCAST_INCLUDE];
1621		} else
1622			psf->sf_oldin = psf->sf_count[MCAST_INCLUDE] != 0;
1623}
1624
1625static int sf_setstate(struct ip_mc_list *pmc)
1626{
1627	struct ip_sf_list *psf, *dpsf;
1628	int mca_xcount = pmc->sfcount[MCAST_EXCLUDE];
1629	int qrv = pmc->interface->mr_qrv;
1630	int new_in, rv;
1631
1632	rv = 0;
1633	for (psf=pmc->sources; psf; psf=psf->sf_next) {
1634		if (pmc->sfcount[MCAST_EXCLUDE]) {
1635			new_in = mca_xcount == psf->sf_count[MCAST_EXCLUDE] &&
1636				!psf->sf_count[MCAST_INCLUDE];
1637		} else
1638			new_in = psf->sf_count[MCAST_INCLUDE] != 0;
1639		if (new_in) {
1640			if (!psf->sf_oldin) {
1641				struct ip_sf_list *prev = NULL;
1642
1643				for (dpsf=pmc->tomb; dpsf; dpsf=dpsf->sf_next) {
1644					if (dpsf->sf_inaddr == psf->sf_inaddr)
1645						break;
1646					prev = dpsf;
1647				}
1648				if (dpsf) {
1649					if (prev)
1650						prev->sf_next = dpsf->sf_next;
1651					else
1652						pmc->tomb = dpsf->sf_next;
1653					kfree(dpsf);
1654				}
1655				psf->sf_crcount = qrv;
1656				rv++;
1657			}
1658		} else if (psf->sf_oldin) {
1659
1660			psf->sf_crcount = 0;
1661			/*
1662			 * add or update "delete" records if an active filter
1663			 * is now inactive
1664			 */
1665			for (dpsf=pmc->tomb; dpsf; dpsf=dpsf->sf_next)
1666				if (dpsf->sf_inaddr == psf->sf_inaddr)
1667					break;
1668			if (!dpsf) {
1669				dpsf = kmalloc(sizeof(*dpsf), GFP_ATOMIC);
1670				if (!dpsf)
1671					continue;
1672				*dpsf = *psf;
1673				/* pmc->lock held by callers */
1674				dpsf->sf_next = pmc->tomb;
1675				pmc->tomb = dpsf;
1676			}
1677			dpsf->sf_crcount = qrv;
1678			rv++;
1679		}
1680	}
1681	return rv;
1682}
1683#endif
1684
1685/*
1686 * Add multicast source filter list to the interface list
1687 */
1688static int ip_mc_add_src(struct in_device *in_dev, __be32 *pmca, int sfmode,
1689			 int sfcount, __be32 *psfsrc, int delta)
1690{
1691	struct ip_mc_list *pmc;
1692	int	isexclude;
1693	int	i, err;
1694
1695	if (!in_dev)
1696		return -ENODEV;
1697	rcu_read_lock();
1698	for_each_pmc_rcu(in_dev, pmc) {
1699		if (*pmca == pmc->multiaddr)
1700			break;
1701	}
1702	if (!pmc) {
1703		/* MCA not found?? bug */
1704		rcu_read_unlock();
1705		return -ESRCH;
1706	}
1707	spin_lock_bh(&pmc->lock);
1708	rcu_read_unlock();
1709
1710#ifdef CONFIG_IP_MULTICAST
1711	sf_markstate(pmc);
1712#endif
1713	isexclude = pmc->sfmode == MCAST_EXCLUDE;
1714	if (!delta)
1715		pmc->sfcount[sfmode]++;
1716	err = 0;
1717	for (i=0; i<sfcount; i++) {
1718		err = ip_mc_add1_src(pmc, sfmode, &psfsrc[i]);
1719		if (err)
1720			break;
1721	}
1722	if (err) {
1723		int j;
1724
1725		if (!delta)
1726			pmc->sfcount[sfmode]--;
1727		for (j=0; j<i; j++)
1728			(void) ip_mc_del1_src(pmc, sfmode, &psfsrc[j]);
1729	} else if (isexclude != (pmc->sfcount[MCAST_EXCLUDE] != 0)) {
1730#ifdef CONFIG_IP_MULTICAST
1731		struct ip_sf_list *psf;
1732		in_dev = pmc->interface;
1733#endif
1734
1735		/* filter mode change */
1736		if (pmc->sfcount[MCAST_EXCLUDE])
1737			pmc->sfmode = MCAST_EXCLUDE;
1738		else if (pmc->sfcount[MCAST_INCLUDE])
1739			pmc->sfmode = MCAST_INCLUDE;
1740#ifdef CONFIG_IP_MULTICAST
1741		/* else no filters; keep old mode for reports */
1742
1743		pmc->crcount = in_dev->mr_qrv ? in_dev->mr_qrv :
1744			IGMP_Unsolicited_Report_Count;
1745		in_dev->mr_ifc_count = pmc->crcount;
1746		for (psf=pmc->sources; psf; psf = psf->sf_next)
1747			psf->sf_crcount = 0;
1748		igmp_ifc_event(in_dev);
1749	} else if (sf_setstate(pmc)) {
1750		igmp_ifc_event(in_dev);
1751#endif
1752	}
1753	spin_unlock_bh(&pmc->lock);
1754	return err;
1755}
1756
1757static void ip_mc_clear_src(struct ip_mc_list *pmc)
1758{
1759	struct ip_sf_list *psf, *nextpsf;
1760
1761	for (psf=pmc->tomb; psf; psf=nextpsf) {
1762		nextpsf = psf->sf_next;
1763		kfree(psf);
1764	}
1765	pmc->tomb = NULL;
1766	for (psf=pmc->sources; psf; psf=nextpsf) {
1767		nextpsf = psf->sf_next;
1768		kfree(psf);
1769	}
1770	pmc->sources = NULL;
1771	pmc->sfmode = MCAST_EXCLUDE;
1772	pmc->sfcount[MCAST_INCLUDE] = 0;
1773	pmc->sfcount[MCAST_EXCLUDE] = 1;
1774}
1775
1776
1777/*
1778 * Join a multicast group
1779 */
1780int ip_mc_join_group(struct sock *sk , struct ip_mreqn *imr)
1781{
1782	int err;
1783	__be32 addr = imr->imr_multiaddr.s_addr;
1784	struct ip_mc_socklist *iml = NULL, *i;
1785	struct in_device *in_dev;
1786	struct inet_sock *inet = inet_sk(sk);
1787	struct net *net = sock_net(sk);
1788	int ifindex;
1789	int count = 0;
1790
1791	if (!ipv4_is_multicast(addr))
1792		return -EINVAL;
1793
1794	rtnl_lock();
1795
1796	in_dev = ip_mc_find_dev(net, imr);
1797
1798	if (!in_dev) {
1799		iml = NULL;
1800		err = -ENODEV;
1801		goto done;
1802	}
1803
1804	err = -EADDRINUSE;
1805	ifindex = imr->imr_ifindex;
1806	for_each_pmc_rtnl(inet, i) {
1807		if (i->multi.imr_multiaddr.s_addr == addr &&
1808		    i->multi.imr_ifindex == ifindex)
1809			goto done;
1810		count++;
1811	}
1812	err = -ENOBUFS;
1813	if (count >= sysctl_igmp_max_memberships)
1814		goto done;
1815	iml = sock_kmalloc(sk, sizeof(*iml), GFP_KERNEL);
1816	if (iml == NULL)
1817		goto done;
1818
1819	memcpy(&iml->multi, imr, sizeof(*imr));
1820	iml->next_rcu = inet->mc_list;
1821	iml->sflist = NULL;
1822	iml->sfmode = MCAST_EXCLUDE;
1823	rcu_assign_pointer(inet->mc_list, iml);
1824	ip_mc_inc_group(in_dev, addr);
1825	err = 0;
1826done:
1827	rtnl_unlock();
1828	return err;
1829}
1830EXPORT_SYMBOL(ip_mc_join_group);
1831
1832static int ip_mc_leave_src(struct sock *sk, struct ip_mc_socklist *iml,
1833			   struct in_device *in_dev)
1834{
1835	struct ip_sf_socklist *psf = rtnl_dereference(iml->sflist);
1836	int err;
1837
1838	if (psf == NULL) {
1839		/* any-source empty exclude case */
1840		return ip_mc_del_src(in_dev, &iml->multi.imr_multiaddr.s_addr,
1841			iml->sfmode, 0, NULL, 0);
1842	}
1843	err = ip_mc_del_src(in_dev, &iml->multi.imr_multiaddr.s_addr,
1844			iml->sfmode, psf->sl_count, psf->sl_addr, 0);
1845	RCU_INIT_POINTER(iml->sflist, NULL);
1846	/* decrease mem now to avoid the memleak warning */
1847	atomic_sub(IP_SFLSIZE(psf->sl_max), &sk->sk_omem_alloc);
1848	kfree_rcu(psf, rcu);
1849	return err;
1850}
1851
1852/*
1853 *	Ask a socket to leave a group.
1854 */
1855
1856int ip_mc_leave_group(struct sock *sk, struct ip_mreqn *imr)
1857{
1858	struct inet_sock *inet = inet_sk(sk);
1859	struct ip_mc_socklist *iml;
1860	struct ip_mc_socklist __rcu **imlp;
1861	struct in_device *in_dev;
1862	struct net *net = sock_net(sk);
1863	__be32 group = imr->imr_multiaddr.s_addr;
1864	u32 ifindex;
1865	int ret = -EADDRNOTAVAIL;
1866
1867	rtnl_lock();
1868	in_dev = ip_mc_find_dev(net, imr);
1869	ifindex = imr->imr_ifindex;
1870	for (imlp = &inet->mc_list;
1871	     (iml = rtnl_dereference(*imlp)) != NULL;
1872	     imlp = &iml->next_rcu) {
1873		if (iml->multi.imr_multiaddr.s_addr != group)
1874			continue;
1875		if (ifindex) {
1876			if (iml->multi.imr_ifindex != ifindex)
1877				continue;
1878		} else if (imr->imr_address.s_addr && imr->imr_address.s_addr !=
1879				iml->multi.imr_address.s_addr)
1880			continue;
1881
1882		(void) ip_mc_leave_src(sk, iml, in_dev);
1883
1884		*imlp = iml->next_rcu;
1885
1886		if (in_dev)
1887			ip_mc_dec_group(in_dev, group);
1888		rtnl_unlock();
1889		/* decrease mem now to avoid the memleak warning */
1890		atomic_sub(sizeof(*iml), &sk->sk_omem_alloc);
1891		kfree_rcu(iml, rcu);
1892		return 0;
1893	}
1894	if (!in_dev)
1895		ret = -ENODEV;
1896	rtnl_unlock();
1897	return ret;
1898}
1899
1900int ip_mc_source(int add, int omode, struct sock *sk, struct
1901	ip_mreq_source *mreqs, int ifindex)
1902{
1903	int err;
1904	struct ip_mreqn imr;
1905	__be32 addr = mreqs->imr_multiaddr;
1906	struct ip_mc_socklist *pmc;
1907	struct in_device *in_dev = NULL;
1908	struct inet_sock *inet = inet_sk(sk);
1909	struct ip_sf_socklist *psl;
1910	struct net *net = sock_net(sk);
1911	int leavegroup = 0;
1912	int i, j, rv;
1913
1914	if (!ipv4_is_multicast(addr))
1915		return -EINVAL;
1916
1917	rtnl_lock();
1918
1919	imr.imr_multiaddr.s_addr = mreqs->imr_multiaddr;
1920	imr.imr_address.s_addr = mreqs->imr_interface;
1921	imr.imr_ifindex = ifindex;
1922	in_dev = ip_mc_find_dev(net, &imr);
1923
1924	if (!in_dev) {
1925		err = -ENODEV;
1926		goto done;
1927	}
1928	err = -EADDRNOTAVAIL;
1929
1930	for_each_pmc_rtnl(inet, pmc) {
1931		if ((pmc->multi.imr_multiaddr.s_addr ==
1932		     imr.imr_multiaddr.s_addr) &&
1933		    (pmc->multi.imr_ifindex == imr.imr_ifindex))
1934			break;
1935	}
1936	if (!pmc) {		/* must have a prior join */
1937		err = -EINVAL;
1938		goto done;
1939	}
1940	/* if a source filter was set, must be the same mode as before */
1941	if (pmc->sflist) {
1942		if (pmc->sfmode != omode) {
1943			err = -EINVAL;
1944			goto done;
1945		}
1946	} else if (pmc->sfmode != omode) {
1947		/* allow mode switches for empty-set filters */
1948		ip_mc_add_src(in_dev, &mreqs->imr_multiaddr, omode, 0, NULL, 0);
1949		ip_mc_del_src(in_dev, &mreqs->imr_multiaddr, pmc->sfmode, 0,
1950			NULL, 0);
1951		pmc->sfmode = omode;
1952	}
1953
1954	psl = rtnl_dereference(pmc->sflist);
1955	if (!add) {
1956		if (!psl)
1957			goto done;	/* err = -EADDRNOTAVAIL */
1958		rv = !0;
1959		for (i=0; i<psl->sl_count; i++) {
1960			rv = memcmp(&psl->sl_addr[i], &mreqs->imr_sourceaddr,
1961				sizeof(__be32));
1962			if (rv == 0)
1963				break;
1964		}
1965		if (rv)		/* source not found */
1966			goto done;	/* err = -EADDRNOTAVAIL */
1967
1968		/* special case - (INCLUDE, empty) == LEAVE_GROUP */
1969		if (psl->sl_count == 1 && omode == MCAST_INCLUDE) {
1970			leavegroup = 1;
1971			goto done;
1972		}
1973
1974		/* update the interface filter */
1975		ip_mc_del_src(in_dev, &mreqs->imr_multiaddr, omode, 1,
1976			&mreqs->imr_sourceaddr, 1);
1977
1978		for (j=i+1; j<psl->sl_count; j++)
1979			psl->sl_addr[j-1] = psl->sl_addr[j];
1980		psl->sl_count--;
1981		err = 0;
1982		goto done;
1983	}
1984	/* else, add a new source to the filter */
1985
1986	if (psl && psl->sl_count >= sysctl_igmp_max_msf) {
1987		err = -ENOBUFS;
1988		goto done;
1989	}
1990	if (!psl || psl->sl_count == psl->sl_max) {
1991		struct ip_sf_socklist *newpsl;
1992		int count = IP_SFBLOCK;
1993
1994		if (psl)
1995			count += psl->sl_max;
1996		newpsl = sock_kmalloc(sk, IP_SFLSIZE(count), GFP_KERNEL);
1997		if (!newpsl) {
1998			err = -ENOBUFS;
1999			goto done;
2000		}
2001		newpsl->sl_max = count;
2002		newpsl->sl_count = count - IP_SFBLOCK;
2003		if (psl) {
2004			for (i=0; i<psl->sl_count; i++)
2005				newpsl->sl_addr[i] = psl->sl_addr[i];
2006			/* decrease mem now to avoid the memleak warning */
2007			atomic_sub(IP_SFLSIZE(psl->sl_max), &sk->sk_omem_alloc);
2008			kfree_rcu(psl, rcu);
2009		}
2010		rcu_assign_pointer(pmc->sflist, newpsl);
2011		psl = newpsl;
2012	}
2013	rv = 1;	/* > 0 for insert logic below if sl_count is 0 */
2014	for (i=0; i<psl->sl_count; i++) {
2015		rv = memcmp(&psl->sl_addr[i], &mreqs->imr_sourceaddr,
2016			sizeof(__be32));
2017		if (rv == 0)
2018			break;
2019	}
2020	if (rv == 0)		/* address already there is an error */
2021		goto done;
2022	for (j=psl->sl_count-1; j>=i; j--)
2023		psl->sl_addr[j+1] = psl->sl_addr[j];
2024	psl->sl_addr[i] = mreqs->imr_sourceaddr;
2025	psl->sl_count++;
2026	err = 0;
2027	/* update the interface list */
2028	ip_mc_add_src(in_dev, &mreqs->imr_multiaddr, omode, 1,
2029		&mreqs->imr_sourceaddr, 1);
2030done:
2031	rtnl_unlock();
2032	if (leavegroup)
2033		return ip_mc_leave_group(sk, &imr);
2034	return err;
2035}
2036
2037int ip_mc_msfilter(struct sock *sk, struct ip_msfilter *msf, int ifindex)
2038{
2039	int err = 0;
2040	struct ip_mreqn	imr;
2041	__be32 addr = msf->imsf_multiaddr;
2042	struct ip_mc_socklist *pmc;
2043	struct in_device *in_dev;
2044	struct inet_sock *inet = inet_sk(sk);
2045	struct ip_sf_socklist *newpsl, *psl;
2046	struct net *net = sock_net(sk);
2047	int leavegroup = 0;
2048
2049	if (!ipv4_is_multicast(addr))
2050		return -EINVAL;
2051	if (msf->imsf_fmode != MCAST_INCLUDE &&
2052	    msf->imsf_fmode != MCAST_EXCLUDE)
2053		return -EINVAL;
2054
2055	rtnl_lock();
2056
2057	imr.imr_multiaddr.s_addr = msf->imsf_multiaddr;
2058	imr.imr_address.s_addr = msf->imsf_interface;
2059	imr.imr_ifindex = ifindex;
2060	in_dev = ip_mc_find_dev(net, &imr);
2061
2062	if (!in_dev) {
2063		err = -ENODEV;
2064		goto done;
2065	}
2066
2067	/* special case - (INCLUDE, empty) == LEAVE_GROUP */
2068	if (msf->imsf_fmode == MCAST_INCLUDE && msf->imsf_numsrc == 0) {
2069		leavegroup = 1;
2070		goto done;
2071	}
2072
2073	for_each_pmc_rtnl(inet, pmc) {
2074		if (pmc->multi.imr_multiaddr.s_addr == msf->imsf_multiaddr &&
2075		    pmc->multi.imr_ifindex == imr.imr_ifindex)
2076			break;
2077	}
2078	if (!pmc) {		/* must have a prior join */
2079		err = -EINVAL;
2080		goto done;
2081	}
2082	if (msf->imsf_numsrc) {
2083		newpsl = sock_kmalloc(sk, IP_SFLSIZE(msf->imsf_numsrc),
2084							   GFP_KERNEL);
2085		if (!newpsl) {
2086			err = -ENOBUFS;
2087			goto done;
2088		}
2089		newpsl->sl_max = newpsl->sl_count = msf->imsf_numsrc;
2090		memcpy(newpsl->sl_addr, msf->imsf_slist,
2091			msf->imsf_numsrc * sizeof(msf->imsf_slist[0]));
2092		err = ip_mc_add_src(in_dev, &msf->imsf_multiaddr,
2093			msf->imsf_fmode, newpsl->sl_count, newpsl->sl_addr, 0);
2094		if (err) {
2095			sock_kfree_s(sk, newpsl, IP_SFLSIZE(newpsl->sl_max));
2096			goto done;
2097		}
2098	} else {
2099		newpsl = NULL;
2100		(void) ip_mc_add_src(in_dev, &msf->imsf_multiaddr,
2101				     msf->imsf_fmode, 0, NULL, 0);
2102	}
2103	psl = rtnl_dereference(pmc->sflist);
2104	if (psl) {
2105		(void) ip_mc_del_src(in_dev, &msf->imsf_multiaddr, pmc->sfmode,
2106			psl->sl_count, psl->sl_addr, 0);
2107		/* decrease mem now to avoid the memleak warning */
2108		atomic_sub(IP_SFLSIZE(psl->sl_max), &sk->sk_omem_alloc);
2109		kfree_rcu(psl, rcu);
2110	} else
2111		(void) ip_mc_del_src(in_dev, &msf->imsf_multiaddr, pmc->sfmode,
2112			0, NULL, 0);
2113	rcu_assign_pointer(pmc->sflist, newpsl);
2114	pmc->sfmode = msf->imsf_fmode;
2115	err = 0;
2116done:
2117	rtnl_unlock();
2118	if (leavegroup)
2119		err = ip_mc_leave_group(sk, &imr);
2120	return err;
2121}
2122
2123int ip_mc_msfget(struct sock *sk, struct ip_msfilter *msf,
2124	struct ip_msfilter __user *optval, int __user *optlen)
2125{
2126	int err, len, count, copycount;
2127	struct ip_mreqn	imr;
2128	__be32 addr = msf->imsf_multiaddr;
2129	struct ip_mc_socklist *pmc;
2130	struct in_device *in_dev;
2131	struct inet_sock *inet = inet_sk(sk);
2132	struct ip_sf_socklist *psl;
2133	struct net *net = sock_net(sk);
2134
2135	if (!ipv4_is_multicast(addr))
2136		return -EINVAL;
2137
2138	rtnl_lock();
2139
2140	imr.imr_multiaddr.s_addr = msf->imsf_multiaddr;
2141	imr.imr_address.s_addr = msf->imsf_interface;
2142	imr.imr_ifindex = 0;
2143	in_dev = ip_mc_find_dev(net, &imr);
2144
2145	if (!in_dev) {
2146		err = -ENODEV;
2147		goto done;
2148	}
2149	err = -EADDRNOTAVAIL;
2150
2151	for_each_pmc_rtnl(inet, pmc) {
2152		if (pmc->multi.imr_multiaddr.s_addr == msf->imsf_multiaddr &&
2153		    pmc->multi.imr_ifindex == imr.imr_ifindex)
2154			break;
2155	}
2156	if (!pmc)		/* must have a prior join */
2157		goto done;
2158	msf->imsf_fmode = pmc->sfmode;
2159	psl = rtnl_dereference(pmc->sflist);
2160	rtnl_unlock();
2161	if (!psl) {
2162		len = 0;
2163		count = 0;
2164	} else {
2165		count = psl->sl_count;
2166	}
2167	copycount = count < msf->imsf_numsrc ? count : msf->imsf_numsrc;
2168	len = copycount * sizeof(psl->sl_addr[0]);
2169	msf->imsf_numsrc = count;
2170	if (put_user(IP_MSFILTER_SIZE(copycount), optlen) ||
2171	    copy_to_user(optval, msf, IP_MSFILTER_SIZE(0))) {
2172		return -EFAULT;
2173	}
2174	if (len &&
2175	    copy_to_user(&optval->imsf_slist[0], psl->sl_addr, len))
2176		return -EFAULT;
2177	return 0;
2178done:
2179	rtnl_unlock();
2180	return err;
2181}
2182
2183int ip_mc_gsfget(struct sock *sk, struct group_filter *gsf,
2184	struct group_filter __user *optval, int __user *optlen)
2185{
2186	int err, i, count, copycount;
2187	struct sockaddr_in *psin;
2188	__be32 addr;
2189	struct ip_mc_socklist *pmc;
2190	struct inet_sock *inet = inet_sk(sk);
2191	struct ip_sf_socklist *psl;
2192
2193	psin = (struct sockaddr_in *)&gsf->gf_group;
2194	if (psin->sin_family != AF_INET)
2195		return -EINVAL;
2196	addr = psin->sin_addr.s_addr;
2197	if (!ipv4_is_multicast(addr))
2198		return -EINVAL;
2199
2200	rtnl_lock();
2201
2202	err = -EADDRNOTAVAIL;
2203
2204	for_each_pmc_rtnl(inet, pmc) {
2205		if (pmc->multi.imr_multiaddr.s_addr == addr &&
2206		    pmc->multi.imr_ifindex == gsf->gf_interface)
2207			break;
2208	}
2209	if (!pmc)		/* must have a prior join */
2210		goto done;
2211	gsf->gf_fmode = pmc->sfmode;
2212	psl = rtnl_dereference(pmc->sflist);
2213	rtnl_unlock();
2214	count = psl ? psl->sl_count : 0;
2215	copycount = count < gsf->gf_numsrc ? count : gsf->gf_numsrc;
2216	gsf->gf_numsrc = count;
2217	if (put_user(GROUP_FILTER_SIZE(copycount), optlen) ||
2218	    copy_to_user(optval, gsf, GROUP_FILTER_SIZE(0))) {
2219		return -EFAULT;
2220	}
2221	for (i=0; i<copycount; i++) {
2222		struct sockaddr_storage ss;
2223
2224		psin = (struct sockaddr_in *)&ss;
2225		memset(&ss, 0, sizeof(ss));
2226		psin->sin_family = AF_INET;
2227		psin->sin_addr.s_addr = psl->sl_addr[i];
2228		if (copy_to_user(&optval->gf_slist[i], &ss, sizeof(ss)))
2229			return -EFAULT;
2230	}
2231	return 0;
2232done:
2233	rtnl_unlock();
2234	return err;
2235}
2236
2237/*
2238 * check if a multicast source filter allows delivery for a given <src,dst,intf>
2239 */
2240int ip_mc_sf_allow(struct sock *sk, __be32 loc_addr, __be32 rmt_addr, int dif)
2241{
2242	struct inet_sock *inet = inet_sk(sk);
2243	struct ip_mc_socklist *pmc;
2244	struct ip_sf_socklist *psl;
2245	int i;
2246	int ret;
2247
2248	ret = 1;
2249	if (!ipv4_is_multicast(loc_addr))
2250		goto out;
2251
2252	rcu_read_lock();
2253	for_each_pmc_rcu(inet, pmc) {
2254		if (pmc->multi.imr_multiaddr.s_addr == loc_addr &&
2255		    pmc->multi.imr_ifindex == dif)
2256			break;
2257	}
2258	ret = inet->mc_all;
2259	if (!pmc)
2260		goto unlock;
2261	psl = rcu_dereference(pmc->sflist);
2262	ret = (pmc->sfmode == MCAST_EXCLUDE);
2263	if (!psl)
2264		goto unlock;
2265
2266	for (i=0; i<psl->sl_count; i++) {
2267		if (psl->sl_addr[i] == rmt_addr)
2268			break;
2269	}
2270	ret = 0;
2271	if (pmc->sfmode == MCAST_INCLUDE && i >= psl->sl_count)
2272		goto unlock;
2273	if (pmc->sfmode == MCAST_EXCLUDE && i < psl->sl_count)
2274		goto unlock;
2275	ret = 1;
2276unlock:
2277	rcu_read_unlock();
2278out:
2279	return ret;
2280}
2281
2282/*
2283 *	A socket is closing.
2284 */
2285
2286void ip_mc_drop_socket(struct sock *sk)
2287{
2288	struct inet_sock *inet = inet_sk(sk);
2289	struct ip_mc_socklist *iml;
2290	struct net *net = sock_net(sk);
2291
2292	if (inet->mc_list == NULL)
2293		return;
2294
2295	rtnl_lock();
2296	while ((iml = rtnl_dereference(inet->mc_list)) != NULL) {
2297		struct in_device *in_dev;
2298
2299		inet->mc_list = iml->next_rcu;
2300		in_dev = inetdev_by_index(net, iml->multi.imr_ifindex);
2301		(void) ip_mc_leave_src(sk, iml, in_dev);
2302		if (in_dev != NULL)
2303			ip_mc_dec_group(in_dev, iml->multi.imr_multiaddr.s_addr);
2304		/* decrease mem now to avoid the memleak warning */
2305		atomic_sub(sizeof(*iml), &sk->sk_omem_alloc);
2306		kfree_rcu(iml, rcu);
2307	}
2308	rtnl_unlock();
2309}
2310
2311/* called with rcu_read_lock() */
2312int ip_check_mc_rcu(struct in_device *in_dev, __be32 mc_addr, __be32 src_addr, u16 proto)
2313{
2314	struct ip_mc_list *im;
2315	struct ip_sf_list *psf;
2316	int rv = 0;
2317
2318	for_each_pmc_rcu(in_dev, im) {
2319		if (im->multiaddr == mc_addr)
2320			break;
2321	}
2322	if (im && proto == IPPROTO_IGMP) {
2323		rv = 1;
2324	} else if (im) {
2325		if (src_addr) {
2326			for (psf=im->sources; psf; psf=psf->sf_next) {
2327				if (psf->sf_inaddr == src_addr)
2328					break;
2329			}
2330			if (psf)
2331				rv = psf->sf_count[MCAST_INCLUDE] ||
2332					psf->sf_count[MCAST_EXCLUDE] !=
2333					im->sfcount[MCAST_EXCLUDE];
2334			else
2335				rv = im->sfcount[MCAST_EXCLUDE] != 0;
2336		} else
2337			rv = 1; /* unspecified source; tentatively allow */
2338	}
2339	return rv;
2340}
2341
2342#if defined(CONFIG_PROC_FS)
/* Per-open iterator state used by the igmp_mc_seq_* callbacks. */
struct igmp_mc_iter_state {
	struct seq_net_private p;
	struct net_device *dev;		/* device the walk is currently on */
	struct in_device *in_dev;	/* in_device of @dev; NULL when none is selected */
};

/* Fetch the iterator state stored in seq->private. */
#define	igmp_mc_seq_private(seq)	((struct igmp_mc_iter_state *)(seq)->private)
2350
2351static inline struct ip_mc_list *igmp_mc_get_first(struct seq_file *seq)
2352{
2353	struct net *net = seq_file_net(seq);
2354	struct ip_mc_list *im = NULL;
2355	struct igmp_mc_iter_state *state = igmp_mc_seq_private(seq);
2356
2357	state->in_dev = NULL;
2358	for_each_netdev_rcu(net, state->dev) {
2359		struct in_device *in_dev;
2360
2361		in_dev = __in_dev_get_rcu(state->dev);
2362		if (!in_dev)
2363			continue;
2364		im = rcu_dereference(in_dev->mc_list);
2365		if (im) {
2366			state->in_dev = in_dev;
2367			break;
2368		}
2369	}
2370	return im;
2371}
2372
2373static struct ip_mc_list *igmp_mc_get_next(struct seq_file *seq, struct ip_mc_list *im)
2374{
2375	struct igmp_mc_iter_state *state = igmp_mc_seq_private(seq);
2376
2377	im = rcu_dereference(im->next_rcu);
2378	while (!im) {
2379		state->dev = next_net_device_rcu(state->dev);
2380		if (!state->dev) {
2381			state->in_dev = NULL;
2382			break;
2383		}
2384		state->in_dev = __in_dev_get_rcu(state->dev);
2385		if (!state->in_dev)
2386			continue;
2387		im = rcu_dereference(state->in_dev->mc_list);
2388	}
2389	return im;
2390}
2391
2392static struct ip_mc_list *igmp_mc_get_idx(struct seq_file *seq, loff_t pos)
2393{
2394	struct ip_mc_list *im = igmp_mc_get_first(seq);
2395	if (im)
2396		while (pos && (im = igmp_mc_get_next(seq, im)) != NULL)
2397			--pos;
2398	return pos ? NULL : im;
2399}
2400
2401static void *igmp_mc_seq_start(struct seq_file *seq, loff_t *pos)
2402	__acquires(rcu)
2403{
2404	rcu_read_lock();
2405	return *pos ? igmp_mc_get_idx(seq, *pos - 1) : SEQ_START_TOKEN;
2406}
2407
2408static void *igmp_mc_seq_next(struct seq_file *seq, void *v, loff_t *pos)
2409{
2410	struct ip_mc_list *im;
2411	if (v == SEQ_START_TOKEN)
2412		im = igmp_mc_get_first(seq);
2413	else
2414		im = igmp_mc_get_next(seq, v);
2415	++*pos;
2416	return im;
2417}
2418
2419static void igmp_mc_seq_stop(struct seq_file *seq, void *v)
2420	__releases(rcu)
2421{
2422	struct igmp_mc_iter_state *state = igmp_mc_seq_private(seq);
2423
2424	state->in_dev = NULL;
2425	state->dev = NULL;
2426	rcu_read_unlock();
2427}
2428
2429static int igmp_mc_seq_show(struct seq_file *seq, void *v)
2430{
2431	if (v == SEQ_START_TOKEN)
2432		seq_puts(seq,
2433			 "Idx\tDevice    : Count Querier\tGroup    Users Timer\tReporter\n");
2434	else {
2435		struct ip_mc_list *im = (struct ip_mc_list *)v;
2436		struct igmp_mc_iter_state *state = igmp_mc_seq_private(seq);
2437		char   *querier;
2438#ifdef CONFIG_IP_MULTICAST
2439		querier = IGMP_V1_SEEN(state->in_dev) ? "V1" :
2440			  IGMP_V2_SEEN(state->in_dev) ? "V2" :
2441			  "V3";
2442#else
2443		querier = "NONE";
2444#endif
2445
2446		if (rcu_dereference(state->in_dev->mc_list) == im) {
2447			seq_printf(seq, "%d\t%-10s: %5d %7s\n",
2448				   state->dev->ifindex, state->dev->name, state->in_dev->mc_count, querier);
2449		}
2450
2451		seq_printf(seq,
2452			   "\t\t\t\t%08X %5d %d:%08lX\t\t%d\n",
2453			   im->multiaddr, im->users,
2454			   im->tm_running, im->tm_running ?
2455			   jiffies_to_clock_t(im->timer.expires-jiffies) : 0,
2456			   im->reporter);
2457	}
2458	return 0;
2459}
2460
/* seq_file iterator callbacks for the multicast group listing. */
static const struct seq_operations igmp_mc_seq_ops = {
	.start	=	igmp_mc_seq_start,
	.next	=	igmp_mc_seq_next,
	.stop	=	igmp_mc_seq_stop,
	.show	=	igmp_mc_seq_show,
};
2467
2468static int igmp_mc_seq_open(struct inode *inode, struct file *file)
2469{
2470	return seq_open_net(inode, file, &igmp_mc_seq_ops,
2471			sizeof(struct igmp_mc_iter_state));
2472}
2473
/* File operations registered for the "igmp" proc entry (see igmp_net_init). */
static const struct file_operations igmp_mc_seq_fops = {
	.owner		=	THIS_MODULE,
	.open		=	igmp_mc_seq_open,
	.read		=	seq_read,
	.llseek		=	seq_lseek,
	.release	=	seq_release_net,
};
2481
/* Per-open iterator state used by the igmp_mcf_seq_* callbacks. */
struct igmp_mcf_iter_state {
	struct seq_net_private p;
	struct net_device *dev;		/* device the walk is currently on */
	struct in_device *idev;		/* in_device of @dev; NULL when none is selected */
	struct ip_mc_list *im;		/* group whose lock the iterator holds; NULL when none */
};

/* Fetch the iterator state stored in seq->private. */
#define igmp_mcf_seq_private(seq)	((struct igmp_mcf_iter_state *)(seq)->private)
2490
2491static inline struct ip_sf_list *igmp_mcf_get_first(struct seq_file *seq)
2492{
2493	struct net *net = seq_file_net(seq);
2494	struct ip_sf_list *psf = NULL;
2495	struct ip_mc_list *im = NULL;
2496	struct igmp_mcf_iter_state *state = igmp_mcf_seq_private(seq);
2497
2498	state->idev = NULL;
2499	state->im = NULL;
2500	for_each_netdev_rcu(net, state->dev) {
2501		struct in_device *idev;
2502		idev = __in_dev_get_rcu(state->dev);
2503		if (unlikely(idev == NULL))
2504			continue;
2505		im = rcu_dereference(idev->mc_list);
2506		if (likely(im != NULL)) {
2507			spin_lock_bh(&im->lock);
2508			psf = im->sources;
2509			if (likely(psf != NULL)) {
2510				state->im = im;
2511				state->idev = idev;
2512				break;
2513			}
2514			spin_unlock_bh(&im->lock);
2515		}
2516	}
2517	return psf;
2518}
2519
2520static struct ip_sf_list *igmp_mcf_get_next(struct seq_file *seq, struct ip_sf_list *psf)
2521{
2522	struct igmp_mcf_iter_state *state = igmp_mcf_seq_private(seq);
2523
2524	psf = psf->sf_next;
2525	while (!psf) {
2526		spin_unlock_bh(&state->im->lock);
2527		state->im = state->im->next;
2528		while (!state->im) {
2529			state->dev = next_net_device_rcu(state->dev);
2530			if (!state->dev) {
2531				state->idev = NULL;
2532				goto out;
2533			}
2534			state->idev = __in_dev_get_rcu(state->dev);
2535			if (!state->idev)
2536				continue;
2537			state->im = rcu_dereference(state->idev->mc_list);
2538		}
2539		if (!state->im)
2540			break;
2541		spin_lock_bh(&state->im->lock);
2542		psf = state->im->sources;
2543	}
2544out:
2545	return psf;
2546}
2547
2548static struct ip_sf_list *igmp_mcf_get_idx(struct seq_file *seq, loff_t pos)
2549{
2550	struct ip_sf_list *psf = igmp_mcf_get_first(seq);
2551	if (psf)
2552		while (pos && (psf = igmp_mcf_get_next(seq, psf)) != NULL)
2553			--pos;
2554	return pos ? NULL : psf;
2555}
2556
2557static void *igmp_mcf_seq_start(struct seq_file *seq, loff_t *pos)
2558	__acquires(rcu)
2559{
2560	rcu_read_lock();
2561	return *pos ? igmp_mcf_get_idx(seq, *pos - 1) : SEQ_START_TOKEN;
2562}
2563
2564static void *igmp_mcf_seq_next(struct seq_file *seq, void *v, loff_t *pos)
2565{
2566	struct ip_sf_list *psf;
2567	if (v == SEQ_START_TOKEN)
2568		psf = igmp_mcf_get_first(seq);
2569	else
2570		psf = igmp_mcf_get_next(seq, v);
2571	++*pos;
2572	return psf;
2573}
2574
2575static void igmp_mcf_seq_stop(struct seq_file *seq, void *v)
2576	__releases(rcu)
2577{
2578	struct igmp_mcf_iter_state *state = igmp_mcf_seq_private(seq);
2579	if (likely(state->im != NULL)) {
2580		spin_unlock_bh(&state->im->lock);
2581		state->im = NULL;
2582	}
2583	state->idev = NULL;
2584	state->dev = NULL;
2585	rcu_read_unlock();
2586}
2587
2588static int igmp_mcf_seq_show(struct seq_file *seq, void *v)
2589{
2590	struct ip_sf_list *psf = (struct ip_sf_list *)v;
2591	struct igmp_mcf_iter_state *state = igmp_mcf_seq_private(seq);
2592
2593	if (v == SEQ_START_TOKEN) {
2594		seq_printf(seq,
2595			   "%3s %6s "
2596			   "%10s %10s %6s %6s\n", "Idx",
2597			   "Device", "MCA",
2598			   "SRC", "INC", "EXC");
2599	} else {
2600		seq_printf(seq,
2601			   "%3d %6.6s 0x%08x "
2602			   "0x%08x %6lu %6lu\n",
2603			   state->dev->ifindex, state->dev->name,
2604			   ntohl(state->im->multiaddr),
2605			   ntohl(psf->sf_inaddr),
2606			   psf->sf_count[MCAST_INCLUDE],
2607			   psf->sf_count[MCAST_EXCLUDE]);
2608	}
2609	return 0;
2610}
2611
/* seq_file iterator callbacks for the per-group source filter listing. */
static const struct seq_operations igmp_mcf_seq_ops = {
	.start	=	igmp_mcf_seq_start,
	.next	=	igmp_mcf_seq_next,
	.stop	=	igmp_mcf_seq_stop,
	.show	=	igmp_mcf_seq_show,
};
2618
2619static int igmp_mcf_seq_open(struct inode *inode, struct file *file)
2620{
2621	return seq_open_net(inode, file, &igmp_mcf_seq_ops,
2622			sizeof(struct igmp_mcf_iter_state));
2623}
2624
/* File operations registered for the "mcfilter" proc entry (see igmp_net_init). */
static const struct file_operations igmp_mcf_seq_fops = {
	.owner		=	THIS_MODULE,
	.open		=	igmp_mcf_seq_open,
	.read		=	seq_read,
	.llseek		=	seq_lseek,
	.release	=	seq_release_net,
};
2632
2633static int __net_init igmp_net_init(struct net *net)
2634{
2635	struct proc_dir_entry *pde;
2636
2637	pde = proc_net_fops_create(net, "igmp", S_IRUGO, &igmp_mc_seq_fops);
2638	if (!pde)
2639		goto out_igmp;
2640	pde = proc_net_fops_create(net, "mcfilter", S_IRUGO, &igmp_mcf_seq_fops);
2641	if (!pde)
2642		goto out_mcfilter;
2643	return 0;
2644
2645out_mcfilter:
2646	proc_net_remove(net, "igmp");
2647out_igmp:
2648	return -ENOMEM;
2649}
2650
/* Per-namespace teardown: remove both proc entries, in reverse creation order. */
static void __net_exit igmp_net_exit(struct net *net)
{
	proc_net_remove(net, "mcfilter");
	proc_net_remove(net, "igmp");
}
2656
/* Per-namespace hooks that create and remove the IGMP proc entries. */
static struct pernet_operations igmp_net_ops = {
	.init = igmp_net_init,
	.exit = igmp_net_exit,
};
2661
2662int __init igmp_mc_proc_init(void)
2663{
2664	return register_pernet_subsys(&igmp_net_ops);
2665}
2666#endif