Commit | Line | Data |
---|---|---|
b863ceb7 PM |
1 | /* |
2 | * Copyright (c) 2007 Patrick McHardy <kaber@trash.net> | |
3 | * | |
4 | * This program is free software; you can redistribute it and/or | |
5 | * modify it under the terms of the GNU General Public License as | |
6 | * published by the Free Software Foundation; either version 2 of | |
7 | * the License, or (at your option) any later version. | |
8 | * | |
9 | * The code this is based on carried the following copyright notice: | |
10 | * --- | |
11 | * (C) Copyright 2001-2006 | |
12 | * Alex Zeffertt, Cambridge Broadband Ltd, ajz@cambridgebroadband.com | |
13 | * Re-worked by Ben Greear <greearb@candelatech.com> | |
14 | * --- | |
15 | */ | |
16 | #include <linux/kernel.h> | |
17 | #include <linux/types.h> | |
18 | #include <linux/module.h> | |
19 | #include <linux/init.h> | |
20 | #include <linux/errno.h> | |
21 | #include <linux/slab.h> | |
22 | #include <linux/string.h> | |
82524746 | 23 | #include <linux/rculist.h> |
b863ceb7 PM |
24 | #include <linux/notifier.h> |
25 | #include <linux/netdevice.h> | |
26 | #include <linux/etherdevice.h> | |
27 | #include <linux/ethtool.h> | |
28 | #include <linux/if_arp.h> | |
29 | #include <linux/if_link.h> | |
30 | #include <linux/if_macvlan.h> | |
31 | #include <net/rtnetlink.h> | |
618e1b74 | 32 | #include <net/xfrm.h> |
b863ceb7 PM |
33 | |
34 | #define MACVLAN_HASH_SIZE (1 << BITS_PER_BYTE) | |
35 | ||
36 | struct macvlan_port { | |
37 | struct net_device *dev; | |
38 | struct hlist_head vlan_hash[MACVLAN_HASH_SIZE]; | |
39 | struct list_head vlans; | |
8b37ef0a | 40 | struct rcu_head rcu; |
eb06acdc | 41 | bool passthru; |
d5cd9244 | 42 | int count; |
b863ceb7 PM |
43 | }; |
44 | ||
d5cd9244 EB |
static void macvlan_port_destroy(struct net_device *dev);

/*
 * Accessors for the macvlan_port hung off a lower device.
 *
 * The port pointer is stored in dev->rx_handler_data; the _rcu variant is
 * for readers running under rcu_read_lock(), the plain variant reads the
 * pointer directly.  macvlan_port_exists() tests the IFF_MACVLAN_PORT
 * private flag.
 *
 * The macro argument is parenthesized so that any pointer expression can be
 * passed safely.
 */
#define macvlan_port_get_rcu(dev) \
	((struct macvlan_port *) rcu_dereference((dev)->rx_handler_data))
#define macvlan_port_get(dev) ((struct macvlan_port *) (dev)->rx_handler_data)
#define macvlan_port_exists(dev) ((dev)->priv_flags & IFF_MACVLAN_PORT)
51 | ||
b863ceb7 PM |
52 | static struct macvlan_dev *macvlan_hash_lookup(const struct macvlan_port *port, |
53 | const unsigned char *addr) | |
54 | { | |
55 | struct macvlan_dev *vlan; | |
56 | struct hlist_node *n; | |
57 | ||
58 | hlist_for_each_entry_rcu(vlan, n, &port->vlan_hash[addr[5]], hlist) { | |
ac06713d | 59 | if (!compare_ether_addr_64bits(vlan->dev->dev_addr, addr)) |
b863ceb7 PM |
60 | return vlan; |
61 | } | |
62 | return NULL; | |
63 | } | |
64 | ||
f9ac30f0 EB |
65 | static void macvlan_hash_add(struct macvlan_dev *vlan) |
66 | { | |
67 | struct macvlan_port *port = vlan->port; | |
68 | const unsigned char *addr = vlan->dev->dev_addr; | |
69 | ||
70 | hlist_add_head_rcu(&vlan->hlist, &port->vlan_hash[addr[5]]); | |
71 | } | |
72 | ||
73 | static void macvlan_hash_del(struct macvlan_dev *vlan) | |
74 | { | |
75 | hlist_del_rcu(&vlan->hlist); | |
76 | synchronize_rcu(); | |
77 | } | |
78 | ||
79 | static void macvlan_hash_change_addr(struct macvlan_dev *vlan, | |
80 | const unsigned char *addr) | |
81 | { | |
82 | macvlan_hash_del(vlan); | |
83 | /* Now that we are unhashed it is safe to change the device | |
84 | * address without confusing packet delivery. | |
85 | */ | |
86 | memcpy(vlan->dev->dev_addr, addr, ETH_ALEN); | |
87 | macvlan_hash_add(vlan); | |
88 | } | |
89 | ||
90 | static int macvlan_addr_busy(const struct macvlan_port *port, | |
91 | const unsigned char *addr) | |
92 | { | |
93 | /* Test to see if the specified multicast address is | |
94 | * currently in use by the underlying device or | |
95 | * another macvlan. | |
96 | */ | |
ac06713d | 97 | if (!compare_ether_addr_64bits(port->dev->dev_addr, addr)) |
f9ac30f0 EB |
98 | return 1; |
99 | ||
100 | if (macvlan_hash_lookup(port, addr)) | |
101 | return 1; | |
102 | ||
103 | return 0; | |
104 | } | |
105 | ||
a1e514c5 | 106 | |
fc0663d6 AB |
107 | static int macvlan_broadcast_one(struct sk_buff *skb, |
108 | const struct macvlan_dev *vlan, | |
618e1b74 | 109 | const struct ethhdr *eth, bool local) |
a1e514c5 | 110 | { |
fc0663d6 | 111 | struct net_device *dev = vlan->dev; |
a1e514c5 AB |
112 | if (!skb) |
113 | return NET_RX_DROP; | |
114 | ||
618e1b74 | 115 | if (local) |
fc0663d6 | 116 | return vlan->forward(dev, skb); |
618e1b74 | 117 | |
a1e514c5 AB |
118 | skb->dev = dev; |
119 | if (!compare_ether_addr_64bits(eth->h_dest, | |
120 | dev->broadcast)) | |
121 | skb->pkt_type = PACKET_BROADCAST; | |
122 | else | |
123 | skb->pkt_type = PACKET_MULTICAST; | |
124 | ||
fc0663d6 | 125 | return vlan->receive(skb); |
a1e514c5 AB |
126 | } |
127 | ||
b863ceb7 | 128 | static void macvlan_broadcast(struct sk_buff *skb, |
618e1b74 AB |
129 | const struct macvlan_port *port, |
130 | struct net_device *src, | |
131 | enum macvlan_mode mode) | |
b863ceb7 PM |
132 | { |
133 | const struct ethhdr *eth = eth_hdr(skb); | |
134 | const struct macvlan_dev *vlan; | |
135 | struct hlist_node *n; | |
b863ceb7 PM |
136 | struct sk_buff *nskb; |
137 | unsigned int i; | |
a1e514c5 | 138 | int err; |
b863ceb7 | 139 | |
efbbced3 PM |
140 | if (skb->protocol == htons(ETH_P_PAUSE)) |
141 | return; | |
142 | ||
b863ceb7 PM |
143 | for (i = 0; i < MACVLAN_HASH_SIZE; i++) { |
144 | hlist_for_each_entry_rcu(vlan, n, &port->vlan_hash[i], hlist) { | |
618e1b74 AB |
145 | if (vlan->dev == src || !(vlan->mode & mode)) |
146 | continue; | |
147 | ||
b863ceb7 | 148 | nskb = skb_clone(skb, GFP_ATOMIC); |
fc0663d6 | 149 | err = macvlan_broadcast_one(nskb, vlan, eth, |
618e1b74 | 150 | mode == MACVLAN_MODE_BRIDGE); |
a1e514c5 AB |
151 | macvlan_count_rx(vlan, skb->len + ETH_HLEN, |
152 | err == NET_RX_SUCCESS, 1); | |
b863ceb7 PM |
153 | } |
154 | } | |
155 | } | |
156 | ||
157 | /* called under rcu_read_lock() from netif_receive_skb */ | |
8a4eb573 | 158 | static rx_handler_result_t macvlan_handle_frame(struct sk_buff **pskb) |
b863ceb7 | 159 | { |
ab95bfe0 | 160 | struct macvlan_port *port; |
8a4eb573 | 161 | struct sk_buff *skb = *pskb; |
b863ceb7 | 162 | const struct ethhdr *eth = eth_hdr(skb); |
b863ceb7 | 163 | const struct macvlan_dev *vlan; |
618e1b74 | 164 | const struct macvlan_dev *src; |
b863ceb7 | 165 | struct net_device *dev; |
ba01877f SS |
166 | unsigned int len = 0; |
167 | int ret = NET_RX_DROP; | |
b863ceb7 | 168 | |
a35e2c1b | 169 | port = macvlan_port_get_rcu(skb->dev); |
b863ceb7 | 170 | if (is_multicast_ether_addr(eth->h_dest)) { |
618e1b74 AB |
171 | src = macvlan_hash_lookup(port, eth->h_source); |
172 | if (!src) | |
173 | /* frame comes from an external address */ | |
174 | macvlan_broadcast(skb, port, NULL, | |
175 | MACVLAN_MODE_PRIVATE | | |
176 | MACVLAN_MODE_VEPA | | |
eb06acdc | 177 | MACVLAN_MODE_PASSTHRU| |
618e1b74 AB |
178 | MACVLAN_MODE_BRIDGE); |
179 | else if (src->mode == MACVLAN_MODE_VEPA) | |
180 | /* flood to everyone except source */ | |
181 | macvlan_broadcast(skb, port, src->dev, | |
182 | MACVLAN_MODE_VEPA | | |
183 | MACVLAN_MODE_BRIDGE); | |
184 | else if (src->mode == MACVLAN_MODE_BRIDGE) | |
185 | /* | |
186 | * flood only to VEPA ports, bridge ports | |
187 | * already saw the frame on the way out. | |
188 | */ | |
189 | macvlan_broadcast(skb, port, src->dev, | |
190 | MACVLAN_MODE_VEPA); | |
8a4eb573 | 191 | return RX_HANDLER_PASS; |
b863ceb7 PM |
192 | } |
193 | ||
eb06acdc SS |
194 | if (port->passthru) |
195 | vlan = list_first_entry(&port->vlans, struct macvlan_dev, list); | |
196 | else | |
197 | vlan = macvlan_hash_lookup(port, eth->h_dest); | |
b863ceb7 | 198 | if (vlan == NULL) |
8a4eb573 | 199 | return RX_HANDLER_PASS; |
b863ceb7 PM |
200 | |
201 | dev = vlan->dev; | |
202 | if (unlikely(!(dev->flags & IFF_UP))) { | |
203 | kfree_skb(skb); | |
8a4eb573 | 204 | return RX_HANDLER_CONSUMED; |
b863ceb7 | 205 | } |
a1e514c5 | 206 | len = skb->len + ETH_HLEN; |
b863ceb7 | 207 | skb = skb_share_check(skb, GFP_ATOMIC); |
a1e514c5 | 208 | if (!skb) |
ba01877f | 209 | goto out; |
b863ceb7 PM |
210 | |
211 | skb->dev = dev; | |
212 | skb->pkt_type = PACKET_HOST; | |
213 | ||
ba01877f SS |
214 | ret = vlan->receive(skb); |
215 | ||
216 | out: | |
217 | macvlan_count_rx(vlan, len, ret == NET_RX_SUCCESS, 0); | |
8a4eb573 | 218 | return RX_HANDLER_CONSUMED; |
b863ceb7 PM |
219 | } |
220 | ||
618e1b74 AB |
221 | static int macvlan_queue_xmit(struct sk_buff *skb, struct net_device *dev) |
222 | { | |
223 | const struct macvlan_dev *vlan = netdev_priv(dev); | |
224 | const struct macvlan_port *port = vlan->port; | |
225 | const struct macvlan_dev *dest; | |
12a2856b | 226 | __u8 ip_summed = skb->ip_summed; |
618e1b74 AB |
227 | |
228 | if (vlan->mode == MACVLAN_MODE_BRIDGE) { | |
229 | const struct ethhdr *eth = (void *)skb->data; | |
12a2856b | 230 | skb->ip_summed = CHECKSUM_UNNECESSARY; |
618e1b74 AB |
231 | |
232 | /* send to other bridge ports directly */ | |
233 | if (is_multicast_ether_addr(eth->h_dest)) { | |
234 | macvlan_broadcast(skb, port, dev, MACVLAN_MODE_BRIDGE); | |
235 | goto xmit_world; | |
236 | } | |
237 | ||
238 | dest = macvlan_hash_lookup(port, eth->h_dest); | |
239 | if (dest && dest->mode == MACVLAN_MODE_BRIDGE) { | |
240 | unsigned int length = skb->len + ETH_HLEN; | |
fc0663d6 | 241 | int ret = dest->forward(dest->dev, skb); |
618e1b74 AB |
242 | macvlan_count_rx(dest, length, |
243 | ret == NET_RX_SUCCESS, 0); | |
244 | ||
245 | return NET_XMIT_SUCCESS; | |
246 | } | |
247 | } | |
248 | ||
249 | xmit_world: | |
12a2856b | 250 | skb->ip_summed = ip_summed; |
8a83a00b | 251 | skb_set_dev(skb, vlan->lowerdev); |
618e1b74 AB |
252 | return dev_queue_xmit(skb); |
253 | } | |
254 | ||
fc0663d6 AB |
255 | netdev_tx_t macvlan_start_xmit(struct sk_buff *skb, |
256 | struct net_device *dev) | |
b863ceb7 | 257 | { |
b863ceb7 PM |
258 | unsigned int len = skb->len; |
259 | int ret; | |
8ffab51b | 260 | const struct macvlan_dev *vlan = netdev_priv(dev); |
b863ceb7 | 261 | |
618e1b74 | 262 | ret = macvlan_queue_xmit(skb, dev); |
2d6c9ffc | 263 | if (likely(ret == NET_XMIT_SUCCESS || ret == NET_XMIT_CN)) { |
8ffab51b | 264 | struct macvlan_pcpu_stats *pcpu_stats; |
2c114553 | 265 | |
8ffab51b ED |
266 | pcpu_stats = this_cpu_ptr(vlan->pcpu_stats); |
267 | u64_stats_update_begin(&pcpu_stats->syncp); | |
268 | pcpu_stats->tx_packets++; | |
269 | pcpu_stats->tx_bytes += len; | |
270 | u64_stats_update_end(&pcpu_stats->syncp); | |
271 | } else { | |
272 | this_cpu_inc(vlan->pcpu_stats->tx_dropped); | |
273 | } | |
cbbef5e1 | 274 | return ret; |
b863ceb7 | 275 | } |
fc0663d6 | 276 | EXPORT_SYMBOL_GPL(macvlan_start_xmit); |
b863ceb7 PM |
277 | |
278 | static int macvlan_hard_header(struct sk_buff *skb, struct net_device *dev, | |
3b04ddde SH |
279 | unsigned short type, const void *daddr, |
280 | const void *saddr, unsigned len) | |
b863ceb7 PM |
281 | { |
282 | const struct macvlan_dev *vlan = netdev_priv(dev); | |
283 | struct net_device *lowerdev = vlan->lowerdev; | |
284 | ||
0c4e8581 SH |
285 | return dev_hard_header(skb, lowerdev, type, daddr, |
286 | saddr ? : dev->dev_addr, len); | |
b863ceb7 PM |
287 | } |
288 | ||
3b04ddde SH |
289 | static const struct header_ops macvlan_hard_header_ops = { |
290 | .create = macvlan_hard_header, | |
291 | .rebuild = eth_rebuild_header, | |
292 | .parse = eth_header_parse, | |
3b04ddde SH |
293 | .cache = eth_header_cache, |
294 | .cache_update = eth_header_cache_update, | |
295 | }; | |
296 | ||
b863ceb7 PM |
297 | static int macvlan_open(struct net_device *dev) |
298 | { | |
299 | struct macvlan_dev *vlan = netdev_priv(dev); | |
b863ceb7 PM |
300 | struct net_device *lowerdev = vlan->lowerdev; |
301 | int err; | |
302 | ||
eb06acdc SS |
303 | if (vlan->port->passthru) { |
304 | dev_set_promiscuity(lowerdev, 1); | |
305 | goto hash_add; | |
306 | } | |
307 | ||
f9ac30f0 EB |
308 | err = -EBUSY; |
309 | if (macvlan_addr_busy(vlan->port, dev->dev_addr)) | |
310 | goto out; | |
311 | ||
a748ee24 | 312 | err = dev_uc_add(lowerdev, dev->dev_addr); |
b863ceb7 | 313 | if (err < 0) |
b89fb7da WC |
314 | goto out; |
315 | if (dev->flags & IFF_ALLMULTI) { | |
316 | err = dev_set_allmulti(lowerdev, 1); | |
317 | if (err < 0) | |
318 | goto del_unicast; | |
319 | } | |
eb06acdc SS |
320 | |
321 | hash_add: | |
f9ac30f0 | 322 | macvlan_hash_add(vlan); |
b863ceb7 | 323 | return 0; |
b89fb7da WC |
324 | |
325 | del_unicast: | |
a748ee24 | 326 | dev_uc_del(lowerdev, dev->dev_addr); |
b89fb7da WC |
327 | out: |
328 | return err; | |
b863ceb7 PM |
329 | } |
330 | ||
331 | static int macvlan_stop(struct net_device *dev) | |
332 | { | |
333 | struct macvlan_dev *vlan = netdev_priv(dev); | |
334 | struct net_device *lowerdev = vlan->lowerdev; | |
335 | ||
eb06acdc SS |
336 | if (vlan->port->passthru) { |
337 | dev_set_promiscuity(lowerdev, -1); | |
338 | goto hash_del; | |
339 | } | |
340 | ||
b863ceb7 PM |
341 | dev_mc_unsync(lowerdev, dev); |
342 | if (dev->flags & IFF_ALLMULTI) | |
343 | dev_set_allmulti(lowerdev, -1); | |
344 | ||
a748ee24 | 345 | dev_uc_del(lowerdev, dev->dev_addr); |
b863ceb7 | 346 | |
eb06acdc | 347 | hash_del: |
f9ac30f0 | 348 | macvlan_hash_del(vlan); |
b863ceb7 PM |
349 | return 0; |
350 | } | |
351 | ||
ad5d20a6 PM |
352 | static int macvlan_set_mac_address(struct net_device *dev, void *p) |
353 | { | |
354 | struct macvlan_dev *vlan = netdev_priv(dev); | |
355 | struct net_device *lowerdev = vlan->lowerdev; | |
356 | struct sockaddr *addr = p; | |
357 | int err; | |
358 | ||
359 | if (!is_valid_ether_addr(addr->sa_data)) | |
360 | return -EADDRNOTAVAIL; | |
361 | ||
f9ac30f0 EB |
362 | if (!(dev->flags & IFF_UP)) { |
363 | /* Just copy in the new address */ | |
364 | memcpy(dev->dev_addr, addr->sa_data, ETH_ALEN); | |
365 | } else { | |
366 | /* Rehash and update the device filters */ | |
367 | if (macvlan_addr_busy(vlan->port, addr->sa_data)) | |
368 | return -EBUSY; | |
ad5d20a6 | 369 | |
a748ee24 | 370 | err = dev_uc_add(lowerdev, addr->sa_data); |
ccffad25 | 371 | if (err) |
f9ac30f0 | 372 | return err; |
ad5d20a6 | 373 | |
a748ee24 | 374 | dev_uc_del(lowerdev, dev->dev_addr); |
f9ac30f0 EB |
375 | |
376 | macvlan_hash_change_addr(vlan, addr->sa_data); | |
377 | } | |
ad5d20a6 PM |
378 | return 0; |
379 | } | |
380 | ||
b863ceb7 PM |
381 | static void macvlan_change_rx_flags(struct net_device *dev, int change) |
382 | { | |
383 | struct macvlan_dev *vlan = netdev_priv(dev); | |
384 | struct net_device *lowerdev = vlan->lowerdev; | |
385 | ||
386 | if (change & IFF_ALLMULTI) | |
387 | dev_set_allmulti(lowerdev, dev->flags & IFF_ALLMULTI ? 1 : -1); | |
388 | } | |
389 | ||
390 | static void macvlan_set_multicast_list(struct net_device *dev) | |
391 | { | |
392 | struct macvlan_dev *vlan = netdev_priv(dev); | |
393 | ||
394 | dev_mc_sync(vlan->lowerdev, dev); | |
395 | } | |
396 | ||
397 | static int macvlan_change_mtu(struct net_device *dev, int new_mtu) | |
398 | { | |
399 | struct macvlan_dev *vlan = netdev_priv(dev); | |
400 | ||
401 | if (new_mtu < 68 || vlan->lowerdev->mtu < new_mtu) | |
402 | return -EINVAL; | |
403 | dev->mtu = new_mtu; | |
404 | return 0; | |
405 | } | |
406 | ||
407 | /* | |
408 | * macvlan network devices have devices nesting below it and are a special | |
409 | * "super class" of normal network devices; split their locks off into a | |
410 | * separate class since they always nest. | |
411 | */ | |
412 | static struct lock_class_key macvlan_netdev_xmit_lock_key; | |
cf508b12 | 413 | static struct lock_class_key macvlan_netdev_addr_lock_key; |
b863ceb7 PM |
414 | |
415 | #define MACVLAN_FEATURES \ | |
416 | (NETIF_F_SG | NETIF_F_ALL_CSUM | NETIF_F_HIGHDMA | NETIF_F_FRAGLIST | \ | |
417 | NETIF_F_GSO | NETIF_F_TSO | NETIF_F_UFO | NETIF_F_GSO_ROBUST | \ | |
39187646 | 418 | NETIF_F_TSO_ECN | NETIF_F_TSO6 | NETIF_F_GRO | NETIF_F_RXCSUM) |
b863ceb7 PM |
419 | |
420 | #define MACVLAN_STATE_MASK \ | |
421 | ((1<<__LINK_STATE_NOCARRIER) | (1<<__LINK_STATE_DORMANT)) | |
422 | ||
e8a0464c DM |
423 | static void macvlan_set_lockdep_class_one(struct net_device *dev, |
424 | struct netdev_queue *txq, | |
425 | void *_unused) | |
c773e847 DM |
426 | { |
427 | lockdep_set_class(&txq->_xmit_lock, | |
428 | &macvlan_netdev_xmit_lock_key); | |
429 | } | |
430 | ||
431 | static void macvlan_set_lockdep_class(struct net_device *dev) | |
432 | { | |
cf508b12 DM |
433 | lockdep_set_class(&dev->addr_list_lock, |
434 | &macvlan_netdev_addr_lock_key); | |
e8a0464c | 435 | netdev_for_each_tx_queue(dev, macvlan_set_lockdep_class_one, NULL); |
c773e847 DM |
436 | } |
437 | ||
b863ceb7 PM |
438 | static int macvlan_init(struct net_device *dev) |
439 | { | |
440 | struct macvlan_dev *vlan = netdev_priv(dev); | |
441 | const struct net_device *lowerdev = vlan->lowerdev; | |
442 | ||
443 | dev->state = (dev->state & ~MACVLAN_STATE_MASK) | | |
444 | (lowerdev->state & MACVLAN_STATE_MASK); | |
445 | dev->features = lowerdev->features & MACVLAN_FEATURES; | |
8ffab51b | 446 | dev->features |= NETIF_F_LLTX; |
8c2acc53 | 447 | dev->gso_max_size = lowerdev->gso_max_size; |
b863ceb7 | 448 | dev->iflink = lowerdev->ifindex; |
ef5c8996 | 449 | dev->hard_header_len = lowerdev->hard_header_len; |
b863ceb7 | 450 | |
c773e847 DM |
451 | macvlan_set_lockdep_class(dev); |
452 | ||
8ffab51b ED |
453 | vlan->pcpu_stats = alloc_percpu(struct macvlan_pcpu_stats); |
454 | if (!vlan->pcpu_stats) | |
fccaf710 ED |
455 | return -ENOMEM; |
456 | ||
b863ceb7 PM |
457 | return 0; |
458 | } | |
459 | ||
fccaf710 ED |
460 | static void macvlan_uninit(struct net_device *dev) |
461 | { | |
462 | struct macvlan_dev *vlan = netdev_priv(dev); | |
d5cd9244 | 463 | struct macvlan_port *port = vlan->port; |
fccaf710 | 464 | |
8ffab51b | 465 | free_percpu(vlan->pcpu_stats); |
d5cd9244 EB |
466 | |
467 | port->count -= 1; | |
468 | if (!port->count) | |
469 | macvlan_port_destroy(port->dev); | |
fccaf710 ED |
470 | } |
471 | ||
28172739 ED |
472 | static struct rtnl_link_stats64 *macvlan_dev_get_stats64(struct net_device *dev, |
473 | struct rtnl_link_stats64 *stats) | |
fccaf710 | 474 | { |
fccaf710 ED |
475 | struct macvlan_dev *vlan = netdev_priv(dev); |
476 | ||
8ffab51b ED |
477 | if (vlan->pcpu_stats) { |
478 | struct macvlan_pcpu_stats *p; | |
479 | u64 rx_packets, rx_bytes, rx_multicast, tx_packets, tx_bytes; | |
480 | u32 rx_errors = 0, tx_dropped = 0; | |
bc66154e | 481 | unsigned int start; |
fccaf710 ED |
482 | int i; |
483 | ||
484 | for_each_possible_cpu(i) { | |
8ffab51b | 485 | p = per_cpu_ptr(vlan->pcpu_stats, i); |
bc66154e ED |
486 | do { |
487 | start = u64_stats_fetch_begin_bh(&p->syncp); | |
488 | rx_packets = p->rx_packets; | |
489 | rx_bytes = p->rx_bytes; | |
490 | rx_multicast = p->rx_multicast; | |
8ffab51b ED |
491 | tx_packets = p->tx_packets; |
492 | tx_bytes = p->tx_bytes; | |
bc66154e | 493 | } while (u64_stats_fetch_retry_bh(&p->syncp, start)); |
8ffab51b ED |
494 | |
495 | stats->rx_packets += rx_packets; | |
496 | stats->rx_bytes += rx_bytes; | |
497 | stats->multicast += rx_multicast; | |
498 | stats->tx_packets += tx_packets; | |
499 | stats->tx_bytes += tx_bytes; | |
500 | /* rx_errors & tx_dropped are u32, updated | |
501 | * without syncp protection. | |
502 | */ | |
503 | rx_errors += p->rx_errors; | |
504 | tx_dropped += p->tx_dropped; | |
fccaf710 | 505 | } |
8ffab51b ED |
506 | stats->rx_errors = rx_errors; |
507 | stats->rx_dropped = rx_errors; | |
508 | stats->tx_dropped = tx_dropped; | |
fccaf710 ED |
509 | } |
510 | return stats; | |
511 | } | |
512 | ||
b863ceb7 PM |
513 | static void macvlan_ethtool_get_drvinfo(struct net_device *dev, |
514 | struct ethtool_drvinfo *drvinfo) | |
515 | { | |
516 | snprintf(drvinfo->driver, 32, "macvlan"); | |
517 | snprintf(drvinfo->version, 32, "0.1"); | |
518 | } | |
519 | ||
9edb8bb6 SH |
520 | static int macvlan_ethtool_get_settings(struct net_device *dev, |
521 | struct ethtool_cmd *cmd) | |
522 | { | |
523 | const struct macvlan_dev *vlan = netdev_priv(dev); | |
b1b67dd4 | 524 | return dev_ethtool_get_settings(vlan->lowerdev, cmd); |
9edb8bb6 SH |
525 | } |
526 | ||
b863ceb7 PM |
527 | static const struct ethtool_ops macvlan_ethtool_ops = { |
528 | .get_link = ethtool_op_get_link, | |
9edb8bb6 | 529 | .get_settings = macvlan_ethtool_get_settings, |
b863ceb7 PM |
530 | .get_drvinfo = macvlan_ethtool_get_drvinfo, |
531 | }; | |
532 | ||
54a30c97 SH |
533 | static const struct net_device_ops macvlan_netdev_ops = { |
534 | .ndo_init = macvlan_init, | |
fccaf710 | 535 | .ndo_uninit = macvlan_uninit, |
54a30c97 SH |
536 | .ndo_open = macvlan_open, |
537 | .ndo_stop = macvlan_stop, | |
00829823 | 538 | .ndo_start_xmit = macvlan_start_xmit, |
54a30c97 SH |
539 | .ndo_change_mtu = macvlan_change_mtu, |
540 | .ndo_change_rx_flags = macvlan_change_rx_flags, | |
541 | .ndo_set_mac_address = macvlan_set_mac_address, | |
542 | .ndo_set_multicast_list = macvlan_set_multicast_list, | |
bc66154e | 543 | .ndo_get_stats64 = macvlan_dev_get_stats64, |
54a30c97 SH |
544 | .ndo_validate_addr = eth_validate_addr, |
545 | }; | |
546 | ||
8a35747a | 547 | void macvlan_common_setup(struct net_device *dev) |
b863ceb7 PM |
548 | { |
549 | ether_setup(dev); | |
550 | ||
93f154b5 | 551 | dev->priv_flags &= ~IFF_XMIT_DST_RELEASE; |
54a30c97 | 552 | dev->netdev_ops = &macvlan_netdev_ops; |
b863ceb7 | 553 | dev->destructor = free_netdev; |
3b04ddde | 554 | dev->header_ops = &macvlan_hard_header_ops, |
b863ceb7 | 555 | dev->ethtool_ops = &macvlan_ethtool_ops; |
8a35747a HX |
556 | } |
557 | EXPORT_SYMBOL_GPL(macvlan_common_setup); | |
558 | ||
559 | static void macvlan_setup(struct net_device *dev) | |
560 | { | |
561 | macvlan_common_setup(dev); | |
b863ceb7 PM |
562 | dev->tx_queue_len = 0; |
563 | } | |
564 | ||
565 | static int macvlan_port_create(struct net_device *dev) | |
566 | { | |
567 | struct macvlan_port *port; | |
568 | unsigned int i; | |
ab95bfe0 | 569 | int err; |
b863ceb7 PM |
570 | |
571 | if (dev->type != ARPHRD_ETHER || dev->flags & IFF_LOOPBACK) | |
572 | return -EINVAL; | |
573 | ||
574 | port = kzalloc(sizeof(*port), GFP_KERNEL); | |
575 | if (port == NULL) | |
576 | return -ENOMEM; | |
577 | ||
eb06acdc | 578 | port->passthru = false; |
b863ceb7 PM |
579 | port->dev = dev; |
580 | INIT_LIST_HEAD(&port->vlans); | |
581 | for (i = 0; i < MACVLAN_HASH_SIZE; i++) | |
582 | INIT_HLIST_HEAD(&port->vlan_hash[i]); | |
ab95bfe0 | 583 | |
a35e2c1b JP |
584 | err = netdev_rx_handler_register(dev, macvlan_handle_frame, port); |
585 | if (err) | |
ab95bfe0 | 586 | kfree(port); |
ab95bfe0 | 587 | |
a35e2c1b | 588 | dev->priv_flags |= IFF_MACVLAN_PORT; |
ab95bfe0 | 589 | return err; |
b863ceb7 PM |
590 | } |
591 | ||
8b37ef0a JP |
592 | static void macvlan_port_rcu_free(struct rcu_head *head) |
593 | { | |
594 | struct macvlan_port *port; | |
595 | ||
596 | port = container_of(head, struct macvlan_port, rcu); | |
597 | kfree(port); | |
598 | } | |
599 | ||
b863ceb7 PM |
600 | static void macvlan_port_destroy(struct net_device *dev) |
601 | { | |
a35e2c1b | 602 | struct macvlan_port *port = macvlan_port_get(dev); |
b863ceb7 | 603 | |
a35e2c1b | 604 | dev->priv_flags &= ~IFF_MACVLAN_PORT; |
ab95bfe0 | 605 | netdev_rx_handler_unregister(dev); |
8b37ef0a | 606 | call_rcu(&port->rcu, macvlan_port_rcu_free); |
b863ceb7 PM |
607 | } |
608 | ||
b863ceb7 PM |
609 | static int macvlan_validate(struct nlattr *tb[], struct nlattr *data[]) |
610 | { | |
611 | if (tb[IFLA_ADDRESS]) { | |
612 | if (nla_len(tb[IFLA_ADDRESS]) != ETH_ALEN) | |
613 | return -EINVAL; | |
614 | if (!is_valid_ether_addr(nla_data(tb[IFLA_ADDRESS]))) | |
615 | return -EADDRNOTAVAIL; | |
616 | } | |
27c0b1a8 AB |
617 | |
618 | if (data && data[IFLA_MACVLAN_MODE]) { | |
619 | switch (nla_get_u32(data[IFLA_MACVLAN_MODE])) { | |
620 | case MACVLAN_MODE_PRIVATE: | |
621 | case MACVLAN_MODE_VEPA: | |
622 | case MACVLAN_MODE_BRIDGE: | |
eb06acdc | 623 | case MACVLAN_MODE_PASSTHRU: |
27c0b1a8 AB |
624 | break; |
625 | default: | |
626 | return -EINVAL; | |
627 | } | |
628 | } | |
b863ceb7 PM |
629 | return 0; |
630 | } | |
631 | ||
fc0663d6 AB |
632 | int macvlan_common_newlink(struct net *src_net, struct net_device *dev, |
633 | struct nlattr *tb[], struct nlattr *data[], | |
634 | int (*receive)(struct sk_buff *skb), | |
635 | int (*forward)(struct net_device *dev, | |
636 | struct sk_buff *skb)) | |
b863ceb7 PM |
637 | { |
638 | struct macvlan_dev *vlan = netdev_priv(dev); | |
639 | struct macvlan_port *port; | |
640 | struct net_device *lowerdev; | |
641 | int err; | |
642 | ||
643 | if (!tb[IFLA_LINK]) | |
644 | return -EINVAL; | |
645 | ||
81adee47 | 646 | lowerdev = __dev_get_by_index(src_net, nla_get_u32(tb[IFLA_LINK])); |
b863ceb7 PM |
647 | if (lowerdev == NULL) |
648 | return -ENODEV; | |
649 | ||
b0832a29 EB |
650 | /* When creating macvlans on top of other macvlans - use |
651 | * the real device as the lowerdev. | |
a6ca5f1d | 652 | */ |
b0832a29 EB |
653 | if (lowerdev->rtnl_link_ops == dev->rtnl_link_ops) { |
654 | struct macvlan_dev *lowervlan = netdev_priv(lowerdev); | |
655 | lowerdev = lowervlan->lowerdev; | |
656 | } | |
a6ca5f1d | 657 | |
b863ceb7 PM |
658 | if (!tb[IFLA_MTU]) |
659 | dev->mtu = lowerdev->mtu; | |
660 | else if (dev->mtu > lowerdev->mtu) | |
661 | return -EINVAL; | |
662 | ||
663 | if (!tb[IFLA_ADDRESS]) | |
664 | random_ether_addr(dev->dev_addr); | |
665 | ||
a35e2c1b | 666 | if (!macvlan_port_exists(lowerdev)) { |
b863ceb7 PM |
667 | err = macvlan_port_create(lowerdev); |
668 | if (err < 0) | |
669 | return err; | |
670 | } | |
a35e2c1b | 671 | port = macvlan_port_get(lowerdev); |
b863ceb7 | 672 | |
eb06acdc SS |
673 | /* Only 1 macvlan device can be created in passthru mode */ |
674 | if (port->passthru) | |
675 | return -EINVAL; | |
676 | ||
b863ceb7 PM |
677 | vlan->lowerdev = lowerdev; |
678 | vlan->dev = dev; | |
679 | vlan->port = port; | |
fc0663d6 AB |
680 | vlan->receive = receive; |
681 | vlan->forward = forward; | |
b863ceb7 | 682 | |
27c0b1a8 AB |
683 | vlan->mode = MACVLAN_MODE_VEPA; |
684 | if (data && data[IFLA_MACVLAN_MODE]) | |
685 | vlan->mode = nla_get_u32(data[IFLA_MACVLAN_MODE]); | |
686 | ||
eb06acdc | 687 | if (vlan->mode == MACVLAN_MODE_PASSTHRU) { |
d5cd9244 | 688 | if (port->count) |
eb06acdc SS |
689 | return -EINVAL; |
690 | port->passthru = true; | |
691 | memcpy(dev->dev_addr, lowerdev->dev_addr, ETH_ALEN); | |
692 | } | |
693 | ||
d5cd9244 | 694 | port->count += 1; |
b863ceb7 PM |
695 | err = register_netdevice(dev); |
696 | if (err < 0) | |
f16d3d57 | 697 | goto destroy_port; |
b863ceb7 PM |
698 | |
699 | list_add_tail(&vlan->list, &port->vlans); | |
fc4a7489 | 700 | netif_stacked_transfer_operstate(lowerdev, dev); |
f16d3d57 | 701 | |
b863ceb7 | 702 | return 0; |
f16d3d57 JP |
703 | |
704 | destroy_port: | |
d5cd9244 EB |
705 | port->count -= 1; |
706 | if (!port->count) | |
f16d3d57 JP |
707 | macvlan_port_destroy(lowerdev); |
708 | ||
709 | return err; | |
b863ceb7 | 710 | } |
fc0663d6 | 711 | EXPORT_SYMBOL_GPL(macvlan_common_newlink); |
b863ceb7 | 712 | |
fc0663d6 AB |
713 | static int macvlan_newlink(struct net *src_net, struct net_device *dev, |
714 | struct nlattr *tb[], struct nlattr *data[]) | |
715 | { | |
716 | return macvlan_common_newlink(src_net, dev, tb, data, | |
717 | netif_rx, | |
718 | dev_forward_skb); | |
719 | } | |
720 | ||
721 | void macvlan_dellink(struct net_device *dev, struct list_head *head) | |
b863ceb7 PM |
722 | { |
723 | struct macvlan_dev *vlan = netdev_priv(dev); | |
b863ceb7 PM |
724 | |
725 | list_del(&vlan->list); | |
23289a37 | 726 | unregister_netdevice_queue(dev, head); |
b863ceb7 | 727 | } |
fc0663d6 | 728 | EXPORT_SYMBOL_GPL(macvlan_dellink); |
b863ceb7 | 729 | |
27c0b1a8 AB |
730 | static int macvlan_changelink(struct net_device *dev, |
731 | struct nlattr *tb[], struct nlattr *data[]) | |
732 | { | |
733 | struct macvlan_dev *vlan = netdev_priv(dev); | |
734 | if (data && data[IFLA_MACVLAN_MODE]) | |
735 | vlan->mode = nla_get_u32(data[IFLA_MACVLAN_MODE]); | |
736 | return 0; | |
737 | } | |
738 | ||
739 | static size_t macvlan_get_size(const struct net_device *dev) | |
740 | { | |
741 | return nla_total_size(4); | |
742 | } | |
743 | ||
744 | static int macvlan_fill_info(struct sk_buff *skb, | |
745 | const struct net_device *dev) | |
746 | { | |
747 | struct macvlan_dev *vlan = netdev_priv(dev); | |
748 | ||
749 | NLA_PUT_U32(skb, IFLA_MACVLAN_MODE, vlan->mode); | |
750 | return 0; | |
751 | ||
752 | nla_put_failure: | |
753 | return -EMSGSIZE; | |
754 | } | |
755 | ||
756 | static const struct nla_policy macvlan_policy[IFLA_MACVLAN_MAX + 1] = { | |
757 | [IFLA_MACVLAN_MODE] = { .type = NLA_U32 }, | |
758 | }; | |
759 | ||
fc0663d6 AB |
760 | int macvlan_link_register(struct rtnl_link_ops *ops) |
761 | { | |
762 | /* common fields */ | |
763 | ops->priv_size = sizeof(struct macvlan_dev); | |
fc0663d6 AB |
764 | ops->validate = macvlan_validate; |
765 | ops->maxtype = IFLA_MACVLAN_MAX; | |
766 | ops->policy = macvlan_policy; | |
767 | ops->changelink = macvlan_changelink; | |
768 | ops->get_size = macvlan_get_size; | |
769 | ops->fill_info = macvlan_fill_info; | |
770 | ||
771 | return rtnl_link_register(ops); | |
772 | }; | |
773 | EXPORT_SYMBOL_GPL(macvlan_link_register); | |
774 | ||
775 | static struct rtnl_link_ops macvlan_link_ops = { | |
b863ceb7 | 776 | .kind = "macvlan", |
8a35747a | 777 | .setup = macvlan_setup, |
b863ceb7 PM |
778 | .newlink = macvlan_newlink, |
779 | .dellink = macvlan_dellink, | |
780 | }; | |
781 | ||
782 | static int macvlan_device_event(struct notifier_block *unused, | |
783 | unsigned long event, void *ptr) | |
784 | { | |
785 | struct net_device *dev = ptr; | |
786 | struct macvlan_dev *vlan, *next; | |
787 | struct macvlan_port *port; | |
226bd341 | 788 | LIST_HEAD(list_kill); |
b863ceb7 | 789 | |
a35e2c1b | 790 | if (!macvlan_port_exists(dev)) |
b863ceb7 PM |
791 | return NOTIFY_DONE; |
792 | ||
a35e2c1b JP |
793 | port = macvlan_port_get(dev); |
794 | ||
b863ceb7 PM |
795 | switch (event) { |
796 | case NETDEV_CHANGE: | |
797 | list_for_each_entry(vlan, &port->vlans, list) | |
fc4a7489 PM |
798 | netif_stacked_transfer_operstate(vlan->lowerdev, |
799 | vlan->dev); | |
b863ceb7 PM |
800 | break; |
801 | case NETDEV_FEAT_CHANGE: | |
802 | list_for_each_entry(vlan, &port->vlans, list) { | |
803 | vlan->dev->features = dev->features & MACVLAN_FEATURES; | |
8c2acc53 | 804 | vlan->dev->gso_max_size = dev->gso_max_size; |
b863ceb7 PM |
805 | netdev_features_change(vlan->dev); |
806 | } | |
807 | break; | |
808 | case NETDEV_UNREGISTER: | |
3b27e105 DL |
809 | /* twiddle thumbs on netns device moves */ |
810 | if (dev->reg_state != NETREG_UNREGISTERING) | |
811 | break; | |
812 | ||
b863ceb7 | 813 | list_for_each_entry_safe(vlan, next, &port->vlans, list) |
226bd341 ED |
814 | vlan->dev->rtnl_link_ops->dellink(vlan->dev, &list_kill); |
815 | unregister_netdevice_many(&list_kill); | |
816 | list_del(&list_kill); | |
b863ceb7 | 817 | break; |
1c01fe14 JP |
818 | case NETDEV_PRE_TYPE_CHANGE: |
819 | /* Forbid underlaying device to change its type. */ | |
820 | return NOTIFY_BAD; | |
b863ceb7 PM |
821 | } |
822 | return NOTIFY_DONE; | |
823 | } | |
824 | ||
825 | static struct notifier_block macvlan_notifier_block __read_mostly = { | |
826 | .notifier_call = macvlan_device_event, | |
827 | }; | |
828 | ||
829 | static int __init macvlan_init_module(void) | |
830 | { | |
831 | int err; | |
832 | ||
833 | register_netdevice_notifier(&macvlan_notifier_block); | |
b863ceb7 | 834 | |
fc0663d6 | 835 | err = macvlan_link_register(&macvlan_link_ops); |
b863ceb7 PM |
836 | if (err < 0) |
837 | goto err1; | |
838 | return 0; | |
839 | err1: | |
b863ceb7 PM |
840 | unregister_netdevice_notifier(&macvlan_notifier_block); |
841 | return err; | |
842 | } | |
843 | ||
844 | static void __exit macvlan_cleanup_module(void) | |
845 | { | |
846 | rtnl_link_unregister(&macvlan_link_ops); | |
b863ceb7 PM |
847 | unregister_netdevice_notifier(&macvlan_notifier_block); |
848 | } | |
849 | ||
850 | module_init(macvlan_init_module); | |
851 | module_exit(macvlan_cleanup_module); | |
852 | ||
853 | MODULE_LICENSE("GPL"); | |
854 | MODULE_AUTHOR("Patrick McHardy <kaber@trash.net>"); | |
855 | MODULE_DESCRIPTION("Driver for MAC address based VLANs"); | |
856 | MODULE_ALIAS_RTNL_LINK("macvlan"); |