br_if.c revision 384912ed194e43c03ad1cdaa09b0b1e488c34d46
1/*
2 *	Userspace interface
3 *	Linux ethernet bridge
4 *
5 *	Authors:
6 *	Lennert Buytenhek		<buytenh@gnu.org>
7 *
8 *	This program is free software; you can redistribute it and/or
9 *	modify it under the terms of the GNU General Public License
10 *	as published by the Free Software Foundation; either version
11 *	2 of the License, or (at your option) any later version.
12 */
13
14#include <linux/kernel.h>
15#include <linux/netdevice.h>
16#include <linux/ethtool.h>
17#include <linux/if_arp.h>
18#include <linux/module.h>
19#include <linux/init.h>
20#include <linux/rtnetlink.h>
21#include <linux/if_ether.h>
22#include <net/sock.h>
23
24#include "br_private.h"
25
26/*
27 * Determine initial path cost based on speed.
28 * using recommendations from 802.1d standard
29 *
30 * Since driver might sleep need to not be holding any locks.
31 */
32static int port_cost(struct net_device *dev)
33{
34	if (dev->ethtool_ops && dev->ethtool_ops->get_settings) {
35		struct ethtool_cmd ecmd = { .cmd = ETHTOOL_GSET, };
36
37		if (!dev->ethtool_ops->get_settings(dev, &ecmd)) {
38			switch(ecmd.speed) {
39			case SPEED_10000:
40				return 2;
41			case SPEED_1000:
42				return 4;
43			case SPEED_100:
44				return 19;
45			case SPEED_10:
46				return 100;
47			}
48		}
49	}
50
51	/* Old silly heuristics based on name */
52	if (!strncmp(dev->name, "lec", 3))
53		return 7;
54
55	if (!strncmp(dev->name, "plip", 4))
56		return 2500;
57
58	return 100;	/* assume old 10Mbps */
59}
60
61
62/*
63 * Check for port carrier transistions.
64 * Called from work queue to allow for calling functions that
65 * might sleep (such as speed check), and to debounce.
66 */
67void br_port_carrier_check(struct net_bridge_port *p)
68{
69	struct net_device *dev = p->dev;
70	struct net_bridge *br = p->br;
71
72	if (netif_carrier_ok(dev))
73		p->path_cost = port_cost(dev);
74
75	if (netif_running(br->dev)) {
76		spin_lock_bh(&br->lock);
77		if (netif_carrier_ok(dev)) {
78			if (p->state == BR_STATE_DISABLED)
79				br_stp_enable_port(p);
80		} else {
81			if (p->state != BR_STATE_DISABLED)
82				br_stp_disable_port(p);
83		}
84		spin_unlock_bh(&br->lock);
85	}
86}
87
88static void release_nbp(struct kobject *kobj)
89{
90	struct net_bridge_port *p
91		= container_of(kobj, struct net_bridge_port, kobj);
92	kfree(p);
93}
94
95static struct kobj_type brport_ktype = {
96#ifdef CONFIG_SYSFS
97	.sysfs_ops = &brport_sysfs_ops,
98#endif
99	.release = release_nbp,
100};
101
102static void destroy_nbp(struct net_bridge_port *p)
103{
104	struct net_device *dev = p->dev;
105
106	p->br = NULL;
107	p->dev = NULL;
108	dev_put(dev);
109
110	kobject_put(&p->kobj);
111}
112
113static void destroy_nbp_rcu(struct rcu_head *head)
114{
115	struct net_bridge_port *p =
116			container_of(head, struct net_bridge_port, rcu);
117	destroy_nbp(p);
118}
119
120/* Delete port(interface) from bridge is done in two steps.
121 * via RCU. First step, marks device as down. That deletes
122 * all the timers and stops new packets from flowing through.
123 *
124 * Final cleanup doesn't occur until after all CPU's finished
125 * processing packets.
126 *
127 * Protected from multiple admin operations by RTNL mutex
128 */
129static void del_nbp(struct net_bridge_port *p)
130{
131	struct net_bridge *br = p->br;
132	struct net_device *dev = p->dev;
133
134	sysfs_remove_link(br->ifobj, dev->name);
135
136	dev_set_promiscuity(dev, -1);
137
138	spin_lock_bh(&br->lock);
139	br_stp_disable_port(p);
140	spin_unlock_bh(&br->lock);
141
142	br_ifinfo_notify(RTM_DELLINK, p);
143
144	br_fdb_delete_by_port(br, p, 1);
145
146	list_del_rcu(&p->list);
147
148	rcu_assign_pointer(dev->br_port, NULL);
149
150	kobject_uevent(&p->kobj, KOBJ_REMOVE);
151	kobject_del(&p->kobj);
152
153	call_rcu(&p->rcu, destroy_nbp_rcu);
154}
155
156/* called with RTNL */
157static void del_br(struct net_bridge *br)
158{
159	struct net_bridge_port *p, *n;
160
161	list_for_each_entry_safe(p, n, &br->port_list, list) {
162		del_nbp(p);
163	}
164
165	del_timer_sync(&br->gc_timer);
166
167	br_sysfs_delbr(br->dev);
168	unregister_netdevice(br->dev);
169}
170
171static struct net_device *new_bridge_dev(struct net *net, const char *name)
172{
173	struct net_bridge *br;
174	struct net_device *dev;
175
176	dev = alloc_netdev(sizeof(struct net_bridge), name,
177			   br_dev_setup);
178
179	if (!dev)
180		return NULL;
181	dev_net_set(dev, net);
182
183	br = netdev_priv(dev);
184	br->dev = dev;
185
186	spin_lock_init(&br->lock);
187	INIT_LIST_HEAD(&br->port_list);
188	spin_lock_init(&br->hash_lock);
189
190	br->bridge_id.prio[0] = 0x80;
191	br->bridge_id.prio[1] = 0x00;
192
193	memcpy(br->group_addr, br_group_address, ETH_ALEN);
194
195	br->feature_mask = dev->features;
196	br->stp_enabled = BR_NO_STP;
197	br->designated_root = br->bridge_id;
198	br->root_path_cost = 0;
199	br->root_port = 0;
200	br->bridge_max_age = br->max_age = 20 * HZ;
201	br->bridge_hello_time = br->hello_time = 2 * HZ;
202	br->bridge_forward_delay = br->forward_delay = 15 * HZ;
203	br->topology_change = 0;
204	br->topology_change_detected = 0;
205	br->ageing_time = 300 * HZ;
206
207	br_netfilter_rtable_init(br);
208
209	INIT_LIST_HEAD(&br->age_list);
210
211	br_stp_timer_init(br);
212
213	return dev;
214}
215
216/* find an available port number */
217static int find_portno(struct net_bridge *br)
218{
219	int index;
220	struct net_bridge_port *p;
221	unsigned long *inuse;
222
223	inuse = kcalloc(BITS_TO_LONGS(BR_MAX_PORTS), sizeof(unsigned long),
224			GFP_KERNEL);
225	if (!inuse)
226		return -ENOMEM;
227
228	set_bit(0, inuse);	/* zero is reserved */
229	list_for_each_entry(p, &br->port_list, list) {
230		set_bit(p->port_no, inuse);
231	}
232	index = find_first_zero_bit(inuse, BR_MAX_PORTS);
233	kfree(inuse);
234
235	return (index >= BR_MAX_PORTS) ? -EXFULL : index;
236}
237
238/* called with RTNL but without bridge lock */
239static struct net_bridge_port *new_nbp(struct net_bridge *br,
240				       struct net_device *dev)
241{
242	int index;
243	struct net_bridge_port *p;
244
245	index = find_portno(br);
246	if (index < 0)
247		return ERR_PTR(index);
248
249	p = kzalloc(sizeof(*p), GFP_KERNEL);
250	if (p == NULL)
251		return ERR_PTR(-ENOMEM);
252
253	p->br = br;
254	dev_hold(dev);
255	p->dev = dev;
256	p->path_cost = port_cost(dev);
257	p->priority = 0x8000 >> BR_PORT_BITS;
258	p->port_no = index;
259	p->flags = 0;
260	br_init_port(p);
261	p->state = BR_STATE_DISABLED;
262	br_stp_port_timer_init(p);
263
264	return p;
265}
266
267static struct device_type br_type = {
268	.name	= "bridge",
269};
270
271int br_add_bridge(struct net *net, const char *name)
272{
273	struct net_device *dev;
274	int ret;
275
276	dev = new_bridge_dev(net, name);
277	if (!dev)
278		return -ENOMEM;
279
280	rtnl_lock();
281	if (strchr(dev->name, '%')) {
282		ret = dev_alloc_name(dev, dev->name);
283		if (ret < 0)
284			goto out_free;
285	}
286
287	SET_NETDEV_DEVTYPE(dev, &br_type);
288
289	ret = register_netdevice(dev);
290	if (ret)
291		goto out_free;
292
293	ret = br_sysfs_addbr(dev);
294	if (ret)
295		unregister_netdevice(dev);
296 out:
297	rtnl_unlock();
298	return ret;
299
300out_free:
301	free_netdev(dev);
302	goto out;
303}
304
305int br_del_bridge(struct net *net, const char *name)
306{
307	struct net_device *dev;
308	int ret = 0;
309
310	rtnl_lock();
311	dev = __dev_get_by_name(net, name);
312	if (dev == NULL)
313		ret =  -ENXIO; 	/* Could not find device */
314
315	else if (!(dev->priv_flags & IFF_EBRIDGE)) {
316		/* Attempt to delete non bridge device! */
317		ret = -EPERM;
318	}
319
320	else if (dev->flags & IFF_UP) {
321		/* Not shutdown yet. */
322		ret = -EBUSY;
323	}
324
325	else
326		del_br(netdev_priv(dev));
327
328	rtnl_unlock();
329	return ret;
330}
331
332/* MTU of the bridge pseudo-device: ETH_DATA_LEN or the minimum of the ports */
333int br_min_mtu(const struct net_bridge *br)
334{
335	const struct net_bridge_port *p;
336	int mtu = 0;
337
338	ASSERT_RTNL();
339
340	if (list_empty(&br->port_list))
341		mtu = ETH_DATA_LEN;
342	else {
343		list_for_each_entry(p, &br->port_list, list) {
344			if (!mtu  || p->dev->mtu < mtu)
345				mtu = p->dev->mtu;
346		}
347	}
348	return mtu;
349}
350
351/*
352 * Recomputes features using slave's features
353 */
354void br_features_recompute(struct net_bridge *br)
355{
356	struct net_bridge_port *p;
357	unsigned long features, mask;
358
359	features = mask = br->feature_mask;
360	if (list_empty(&br->port_list))
361		goto done;
362
363	features &= ~NETIF_F_ONE_FOR_ALL;
364
365	list_for_each_entry(p, &br->port_list, list) {
366		features = netdev_increment_features(features,
367						     p->dev->features, mask);
368	}
369
370done:
371	br->dev->features = netdev_fix_features(features, NULL);
372}
373
374/* called with RTNL */
375int br_add_if(struct net_bridge *br, struct net_device *dev)
376{
377	struct net_bridge_port *p;
378	int err = 0;
379
380	if (dev->flags & IFF_LOOPBACK || dev->type != ARPHRD_ETHER)
381		return -EINVAL;
382
383	if (dev->netdev_ops->ndo_start_xmit == br_dev_xmit)
384		return -ELOOP;
385
386	if (dev->br_port != NULL)
387		return -EBUSY;
388
389	p = new_nbp(br, dev);
390	if (IS_ERR(p))
391		return PTR_ERR(p);
392
393	err = dev_set_promiscuity(dev, 1);
394	if (err)
395		goto put_back;
396
397	err = kobject_init_and_add(&p->kobj, &brport_ktype, &(dev->dev.kobj),
398				   SYSFS_BRIDGE_PORT_ATTR);
399	if (err)
400		goto err0;
401
402	err = br_fdb_insert(br, p, dev->dev_addr);
403	if (err)
404		goto err1;
405
406	err = br_sysfs_addif(p);
407	if (err)
408		goto err2;
409
410	rcu_assign_pointer(dev->br_port, p);
411	dev_disable_lro(dev);
412
413	list_add_rcu(&p->list, &br->port_list);
414
415	spin_lock_bh(&br->lock);
416	br_stp_recalculate_bridge_id(br);
417	br_features_recompute(br);
418
419	if ((dev->flags & IFF_UP) && netif_carrier_ok(dev) &&
420	    (br->dev->flags & IFF_UP))
421		br_stp_enable_port(p);
422	spin_unlock_bh(&br->lock);
423
424	br_ifinfo_notify(RTM_NEWLINK, p);
425
426	dev_set_mtu(br->dev, br_min_mtu(br));
427
428	kobject_uevent(&p->kobj, KOBJ_ADD);
429
430	return 0;
431err2:
432	br_fdb_delete_by_port(br, p, 1);
433err1:
434	kobject_put(&p->kobj);
435err0:
436	dev_set_promiscuity(dev, -1);
437put_back:
438	dev_put(dev);
439	kfree(p);
440	return err;
441}
442
443/* called with RTNL */
444int br_del_if(struct net_bridge *br, struct net_device *dev)
445{
446	struct net_bridge_port *p = dev->br_port;
447
448	if (!p || p->br != br)
449		return -EINVAL;
450
451	del_nbp(p);
452
453	spin_lock_bh(&br->lock);
454	br_stp_recalculate_bridge_id(br);
455	br_features_recompute(br);
456	spin_unlock_bh(&br->lock);
457
458	return 0;
459}
460
461void br_net_exit(struct net *net)
462{
463	struct net_device *dev;
464
465	rtnl_lock();
466restart:
467	for_each_netdev(net, dev) {
468		if (dev->priv_flags & IFF_EBRIDGE) {
469			del_br(netdev_priv(dev));
470			goto restart;
471		}
472	}
473	rtnl_unlock();
474
475}
476