/*
 * net-sysfs.c - network device class and attributes
 *
 * Copyright (c) 2003 Stephen Hemminger <shemminger@osdl.org>
 *
 *	This program is free software; you can redistribute it and/or
 *	modify it under the terms of the GNU General Public License
 *	as published by the Free Software Foundation; either version
 *	2 of the License, or (at your option) any later version.
 */
12 #include <linux/capability.h>
13 #include <linux/kernel.h>
14 #include <linux/netdevice.h>
15 #include <net/switchdev.h>
16 #include <linux/if_arp.h>
17 #include <linux/slab.h>
18 #include <linux/nsproxy.h>
20 #include <net/net_namespace.h>
21 #include <linux/rtnetlink.h>
22 #include <linux/vmalloc.h>
23 #include <linux/export.h>
24 #include <linux/jiffies.h>
25 #include <linux/pm_runtime.h>
28 #include "net-sysfs.h"
/* printf-style formats shared by the attribute show helpers in this file. */
static const char fmt_hex[] = "%#x\n";
static const char fmt_long_hex[] = "%#lx\n";
static const char fmt_dec[] = "%d\n";
static const char fmt_udec[] = "%u\n";
static const char fmt_ulong[] = "%lu\n";
static const char fmt_u64[] = "%llu\n";
38 static inline int dev_isalive(const struct net_device
*dev
)
40 return dev
->reg_state
<= NETREG_REGISTERED
;
43 /* use same locking rules as GIF* ioctl's */
44 static ssize_t
netdev_show(const struct device
*dev
,
45 struct device_attribute
*attr
, char *buf
,
46 ssize_t (*format
)(const struct net_device
*, char *))
48 struct net_device
*ndev
= to_net_dev(dev
);
49 ssize_t ret
= -EINVAL
;
51 read_lock(&dev_base_lock
);
52 if (dev_isalive(ndev
))
53 ret
= (*format
)(ndev
, buf
);
54 read_unlock(&dev_base_lock
);
/*
 * Generate a show function for a simple net_device field: format_<field>()
 * prints dev->field with @format_string, and <field>_show() routes it
 * through netdev_show().
 */
#define NETDEVICE_SHOW(field, format_string)				\
static ssize_t format_##field(const struct net_device *dev, char *buf)	\
{									\
	return sprintf(buf, format_string, dev->field);			\
}									\
static ssize_t field##_show(struct device *dev,				\
			    struct device_attribute *attr, char *buf)	\
{									\
	return netdev_show(dev, attr, buf, format_##field);		\
}
/* NETDEVICE_SHOW plus a read-only device attribute named after @field. */
#define NETDEVICE_SHOW_RO(field, format_string)				\
NETDEVICE_SHOW(field, format_string);					\
static DEVICE_ATTR_RO(field)

/*
 * NETDEVICE_SHOW plus a read-write device attribute named after @field;
 * in this file each use is paired with a hand-written <field>_store().
 */
#define NETDEVICE_SHOW_RW(field, format_string)				\
NETDEVICE_SHOW(field, format_string);					\
static DEVICE_ATTR_RW(field)
79 /* use same locking and permission rules as SIF* ioctl's */
80 static ssize_t
netdev_store(struct device
*dev
, struct device_attribute
*attr
,
81 const char *buf
, size_t len
,
82 int (*set
)(struct net_device
*, unsigned long))
84 struct net_device
*netdev
= to_net_dev(dev
);
85 struct net
*net
= dev_net(netdev
);
89 if (!ns_capable(net
->user_ns
, CAP_NET_ADMIN
))
92 ret
= kstrtoul(buf
, 0, &new);
97 return restart_syscall();
99 if (dev_isalive(netdev
)) {
100 if ((ret
= (*set
)(netdev
, new)) == 0)
/* Read-only attributes generated directly from net_device fields. */
NETDEVICE_SHOW_RO(dev_id, fmt_hex);
NETDEVICE_SHOW_RO(dev_port, fmt_dec);
NETDEVICE_SHOW_RO(addr_assign_type, fmt_dec);
NETDEVICE_SHOW_RO(addr_len, fmt_dec);
NETDEVICE_SHOW_RO(ifindex, fmt_dec);
NETDEVICE_SHOW_RO(type, fmt_dec);
NETDEVICE_SHOW_RO(link_mode, fmt_dec);
116 static ssize_t
iflink_show(struct device
*dev
, struct device_attribute
*attr
,
119 struct net_device
*ndev
= to_net_dev(dev
);
121 return sprintf(buf
, fmt_dec
, dev_get_iflink(ndev
));
123 static DEVICE_ATTR_RO(iflink
);
125 static ssize_t
format_name_assign_type(const struct net_device
*dev
, char *buf
)
127 return sprintf(buf
, fmt_dec
, dev
->name_assign_type
);
130 static ssize_t
name_assign_type_show(struct device
*dev
,
131 struct device_attribute
*attr
,
134 struct net_device
*ndev
= to_net_dev(dev
);
135 ssize_t ret
= -EINVAL
;
137 if (ndev
->name_assign_type
!= NET_NAME_UNKNOWN
)
138 ret
= netdev_show(dev
, attr
, buf
, format_name_assign_type
);
142 static DEVICE_ATTR_RO(name_assign_type
);
144 /* use same locking rules as GIFHWADDR ioctl's */
145 static ssize_t
address_show(struct device
*dev
, struct device_attribute
*attr
,
148 struct net_device
*ndev
= to_net_dev(dev
);
149 ssize_t ret
= -EINVAL
;
151 read_lock(&dev_base_lock
);
152 if (dev_isalive(ndev
))
153 ret
= sysfs_format_mac(buf
, ndev
->dev_addr
, ndev
->addr_len
);
154 read_unlock(&dev_base_lock
);
157 static DEVICE_ATTR_RO(address
);
159 static ssize_t
broadcast_show(struct device
*dev
,
160 struct device_attribute
*attr
, char *buf
)
162 struct net_device
*ndev
= to_net_dev(dev
);
163 if (dev_isalive(ndev
))
164 return sysfs_format_mac(buf
, ndev
->broadcast
, ndev
->addr_len
);
167 static DEVICE_ATTR_RO(broadcast
);
169 static int change_carrier(struct net_device
*dev
, unsigned long new_carrier
)
171 if (!netif_running(dev
))
173 return dev_change_carrier(dev
, (bool) new_carrier
);
176 static ssize_t
carrier_store(struct device
*dev
, struct device_attribute
*attr
,
177 const char *buf
, size_t len
)
179 return netdev_store(dev
, attr
, buf
, len
, change_carrier
);
182 static ssize_t
carrier_show(struct device
*dev
,
183 struct device_attribute
*attr
, char *buf
)
185 struct net_device
*netdev
= to_net_dev(dev
);
186 if (netif_running(netdev
)) {
187 return sprintf(buf
, fmt_dec
, !!netif_carrier_ok(netdev
));
191 static DEVICE_ATTR_RW(carrier
);
193 static ssize_t
speed_show(struct device
*dev
,
194 struct device_attribute
*attr
, char *buf
)
196 struct net_device
*netdev
= to_net_dev(dev
);
200 return restart_syscall();
202 if (netif_running(netdev
)) {
203 struct ethtool_cmd cmd
;
204 if (!__ethtool_get_settings(netdev
, &cmd
))
205 ret
= sprintf(buf
, fmt_udec
, ethtool_cmd_speed(&cmd
));
210 static DEVICE_ATTR_RO(speed
);
212 static ssize_t
duplex_show(struct device
*dev
,
213 struct device_attribute
*attr
, char *buf
)
215 struct net_device
*netdev
= to_net_dev(dev
);
219 return restart_syscall();
221 if (netif_running(netdev
)) {
222 struct ethtool_cmd cmd
;
223 if (!__ethtool_get_settings(netdev
, &cmd
)) {
225 switch (cmd
.duplex
) {
236 ret
= sprintf(buf
, "%s\n", duplex
);
242 static DEVICE_ATTR_RO(duplex
);
244 static ssize_t
dormant_show(struct device
*dev
,
245 struct device_attribute
*attr
, char *buf
)
247 struct net_device
*netdev
= to_net_dev(dev
);
249 if (netif_running(netdev
))
250 return sprintf(buf
, fmt_dec
, !!netif_dormant(netdev
));
254 static DEVICE_ATTR_RO(dormant
);
256 static const char *const operstates
[] = {
258 "notpresent", /* currently unused */
261 "testing", /* currently unused */
266 static ssize_t
operstate_show(struct device
*dev
,
267 struct device_attribute
*attr
, char *buf
)
269 const struct net_device
*netdev
= to_net_dev(dev
);
270 unsigned char operstate
;
272 read_lock(&dev_base_lock
);
273 operstate
= netdev
->operstate
;
274 if (!netif_running(netdev
))
275 operstate
= IF_OPER_DOWN
;
276 read_unlock(&dev_base_lock
);
278 if (operstate
>= ARRAY_SIZE(operstates
))
279 return -EINVAL
; /* should not happen */
281 return sprintf(buf
, "%s\n", operstates
[operstate
]);
283 static DEVICE_ATTR_RO(operstate
);
285 static ssize_t
carrier_changes_show(struct device
*dev
,
286 struct device_attribute
*attr
,
289 struct net_device
*netdev
= to_net_dev(dev
);
290 return sprintf(buf
, fmt_dec
,
291 atomic_read(&netdev
->carrier_changes
));
293 static DEVICE_ATTR_RO(carrier_changes
);
295 /* read-write attributes */
/* netdev_store() setter: pass the value, cast to int, to dev_set_mtu(). */
static int change_mtu(struct net_device *dev, unsigned long new_mtu)
{
	return dev_set_mtu(dev, (int) new_mtu);
}
302 static ssize_t
mtu_store(struct device
*dev
, struct device_attribute
*attr
,
303 const char *buf
, size_t len
)
305 return netdev_store(dev
, attr
, buf
, len
, change_mtu
);
307 NETDEVICE_SHOW_RW(mtu
, fmt_dec
);
/*
 * netdev_store() setter: pass the value, cast to unsigned int, to
 * dev_change_flags().
 */
static int change_flags(struct net_device *dev, unsigned long new_flags)
{
	return dev_change_flags(dev, (unsigned int) new_flags);
}
314 static ssize_t
flags_store(struct device
*dev
, struct device_attribute
*attr
,
315 const char *buf
, size_t len
)
317 return netdev_store(dev
, attr
, buf
, len
, change_flags
);
319 NETDEVICE_SHOW_RW(flags
, fmt_hex
);
321 static int change_tx_queue_len(struct net_device
*dev
, unsigned long new_len
)
323 dev
->tx_queue_len
= new_len
;
327 static ssize_t
tx_queue_len_store(struct device
*dev
,
328 struct device_attribute
*attr
,
329 const char *buf
, size_t len
)
331 if (!capable(CAP_NET_ADMIN
))
334 return netdev_store(dev
, attr
, buf
, len
, change_tx_queue_len
);
336 NETDEVICE_SHOW_RW(tx_queue_len
, fmt_ulong
);
338 static int change_gro_flush_timeout(struct net_device
*dev
, unsigned long val
)
340 dev
->gro_flush_timeout
= val
;
344 static ssize_t
gro_flush_timeout_store(struct device
*dev
,
345 struct device_attribute
*attr
,
346 const char *buf
, size_t len
)
348 if (!capable(CAP_NET_ADMIN
))
351 return netdev_store(dev
, attr
, buf
, len
, change_gro_flush_timeout
);
353 NETDEVICE_SHOW_RW(gro_flush_timeout
, fmt_ulong
);
355 static ssize_t
ifalias_store(struct device
*dev
, struct device_attribute
*attr
,
356 const char *buf
, size_t len
)
358 struct net_device
*netdev
= to_net_dev(dev
);
359 struct net
*net
= dev_net(netdev
);
363 if (!ns_capable(net
->user_ns
, CAP_NET_ADMIN
))
366 /* ignore trailing newline */
367 if (len
> 0 && buf
[len
- 1] == '\n')
371 return restart_syscall();
372 ret
= dev_set_alias(netdev
, buf
, count
);
375 return ret
< 0 ? ret
: len
;
378 static ssize_t
ifalias_show(struct device
*dev
,
379 struct device_attribute
*attr
, char *buf
)
381 const struct net_device
*netdev
= to_net_dev(dev
);
385 return restart_syscall();
387 ret
= sprintf(buf
, "%s\n", netdev
->ifalias
);
391 static DEVICE_ATTR_RW(ifalias
);
/* netdev_store() setter: pass the value, cast to int, to dev_set_group(). */
static int change_group(struct net_device *dev, unsigned long new_group)
{
	dev_set_group(dev, (int) new_group);
	return 0;
}
399 static ssize_t
group_store(struct device
*dev
, struct device_attribute
*attr
,
400 const char *buf
, size_t len
)
402 return netdev_store(dev
, attr
, buf
, len
, change_group
);
404 NETDEVICE_SHOW(group
, fmt_dec
);
405 static DEVICE_ATTR(netdev_group
, S_IRUGO
| S_IWUSR
, group_show
, group_store
);
407 static int change_proto_down(struct net_device
*dev
, unsigned long proto_down
)
409 return dev_change_proto_down(dev
, (bool) proto_down
);
412 static ssize_t
proto_down_store(struct device
*dev
,
413 struct device_attribute
*attr
,
414 const char *buf
, size_t len
)
416 return netdev_store(dev
, attr
, buf
, len
, change_proto_down
);
418 NETDEVICE_SHOW_RW(proto_down
, fmt_dec
);
420 static ssize_t
phys_port_id_show(struct device
*dev
,
421 struct device_attribute
*attr
, char *buf
)
423 struct net_device
*netdev
= to_net_dev(dev
);
424 ssize_t ret
= -EINVAL
;
427 return restart_syscall();
429 if (dev_isalive(netdev
)) {
430 struct netdev_phys_item_id ppid
;
432 ret
= dev_get_phys_port_id(netdev
, &ppid
);
434 ret
= sprintf(buf
, "%*phN\n", ppid
.id_len
, ppid
.id
);
440 static DEVICE_ATTR_RO(phys_port_id
);
442 static ssize_t
phys_port_name_show(struct device
*dev
,
443 struct device_attribute
*attr
, char *buf
)
445 struct net_device
*netdev
= to_net_dev(dev
);
446 ssize_t ret
= -EINVAL
;
449 return restart_syscall();
451 if (dev_isalive(netdev
)) {
454 ret
= dev_get_phys_port_name(netdev
, name
, sizeof(name
));
456 ret
= sprintf(buf
, "%s\n", name
);
462 static DEVICE_ATTR_RO(phys_port_name
);
464 static ssize_t
phys_switch_id_show(struct device
*dev
,
465 struct device_attribute
*attr
, char *buf
)
467 struct net_device
*netdev
= to_net_dev(dev
);
468 ssize_t ret
= -EINVAL
;
471 return restart_syscall();
473 if (dev_isalive(netdev
)) {
474 struct switchdev_attr attr
= {
475 .id
= SWITCHDEV_ATTR_PORT_PARENT_ID
,
476 .flags
= SWITCHDEV_F_NO_RECURSE
,
479 ret
= switchdev_port_attr_get(netdev
, &attr
);
481 ret
= sprintf(buf
, "%*phN\n", attr
.u
.ppid
.id_len
,
488 static DEVICE_ATTR_RO(phys_switch_id
);
490 static struct attribute
*net_class_attrs
[] = {
491 &dev_attr_netdev_group
.attr
,
493 &dev_attr_dev_id
.attr
,
494 &dev_attr_dev_port
.attr
,
495 &dev_attr_iflink
.attr
,
496 &dev_attr_ifindex
.attr
,
497 &dev_attr_name_assign_type
.attr
,
498 &dev_attr_addr_assign_type
.attr
,
499 &dev_attr_addr_len
.attr
,
500 &dev_attr_link_mode
.attr
,
501 &dev_attr_address
.attr
,
502 &dev_attr_broadcast
.attr
,
503 &dev_attr_speed
.attr
,
504 &dev_attr_duplex
.attr
,
505 &dev_attr_dormant
.attr
,
506 &dev_attr_operstate
.attr
,
507 &dev_attr_carrier_changes
.attr
,
508 &dev_attr_ifalias
.attr
,
509 &dev_attr_carrier
.attr
,
511 &dev_attr_flags
.attr
,
512 &dev_attr_tx_queue_len
.attr
,
513 &dev_attr_gro_flush_timeout
.attr
,
514 &dev_attr_phys_port_id
.attr
,
515 &dev_attr_phys_port_name
.attr
,
516 &dev_attr_phys_switch_id
.attr
,
517 &dev_attr_proto_down
.attr
,
520 ATTRIBUTE_GROUPS(net_class
);
522 /* Show a given an attribute in the statistics group */
523 static ssize_t
netstat_show(const struct device
*d
,
524 struct device_attribute
*attr
, char *buf
,
525 unsigned long offset
)
527 struct net_device
*dev
= to_net_dev(d
);
528 ssize_t ret
= -EINVAL
;
530 WARN_ON(offset
> sizeof(struct rtnl_link_stats64
) ||
531 offset
% sizeof(u64
) != 0);
533 read_lock(&dev_base_lock
);
534 if (dev_isalive(dev
)) {
535 struct rtnl_link_stats64 temp
;
536 const struct rtnl_link_stats64
*stats
= dev_get_stats(dev
, &temp
);
538 ret
= sprintf(buf
, fmt_u64
, *(u64
*)(((u8
*) stats
) + offset
));
540 read_unlock(&dev_base_lock
);
/*
 * Generate a read-only statistics attribute: <name>_show() calls
 * netstat_show() with the offset of @name in struct rtnl_link_stats64.
 */
#define NETSTAT_ENTRY(name)						\
static ssize_t name##_show(struct device *d,				\
			   struct device_attribute *attr, char *buf)	\
{									\
	return netstat_show(d, attr, buf,				\
			    offsetof(struct rtnl_link_stats64, name));	\
}									\
static DEVICE_ATTR_RO(name)
/* One read-only attribute per exported rtnl_link_stats64 counter. */
NETSTAT_ENTRY(rx_packets);
NETSTAT_ENTRY(tx_packets);
NETSTAT_ENTRY(rx_bytes);
NETSTAT_ENTRY(tx_bytes);
NETSTAT_ENTRY(rx_errors);
NETSTAT_ENTRY(tx_errors);
NETSTAT_ENTRY(rx_dropped);
NETSTAT_ENTRY(tx_dropped);
NETSTAT_ENTRY(multicast);
NETSTAT_ENTRY(collisions);
NETSTAT_ENTRY(rx_length_errors);
NETSTAT_ENTRY(rx_over_errors);
NETSTAT_ENTRY(rx_crc_errors);
NETSTAT_ENTRY(rx_frame_errors);
NETSTAT_ENTRY(rx_fifo_errors);
NETSTAT_ENTRY(rx_missed_errors);
NETSTAT_ENTRY(tx_aborted_errors);
NETSTAT_ENTRY(tx_carrier_errors);
NETSTAT_ENTRY(tx_fifo_errors);
NETSTAT_ENTRY(tx_heartbeat_errors);
NETSTAT_ENTRY(tx_window_errors);
NETSTAT_ENTRY(rx_compressed);
NETSTAT_ENTRY(tx_compressed);
578 static struct attribute
*netstat_attrs
[] = {
579 &dev_attr_rx_packets
.attr
,
580 &dev_attr_tx_packets
.attr
,
581 &dev_attr_rx_bytes
.attr
,
582 &dev_attr_tx_bytes
.attr
,
583 &dev_attr_rx_errors
.attr
,
584 &dev_attr_tx_errors
.attr
,
585 &dev_attr_rx_dropped
.attr
,
586 &dev_attr_tx_dropped
.attr
,
587 &dev_attr_multicast
.attr
,
588 &dev_attr_collisions
.attr
,
589 &dev_attr_rx_length_errors
.attr
,
590 &dev_attr_rx_over_errors
.attr
,
591 &dev_attr_rx_crc_errors
.attr
,
592 &dev_attr_rx_frame_errors
.attr
,
593 &dev_attr_rx_fifo_errors
.attr
,
594 &dev_attr_rx_missed_errors
.attr
,
595 &dev_attr_tx_aborted_errors
.attr
,
596 &dev_attr_tx_carrier_errors
.attr
,
597 &dev_attr_tx_fifo_errors
.attr
,
598 &dev_attr_tx_heartbeat_errors
.attr
,
599 &dev_attr_tx_window_errors
.attr
,
600 &dev_attr_rx_compressed
.attr
,
601 &dev_attr_tx_compressed
.attr
,
606 static struct attribute_group netstat_group
= {
607 .name
= "statistics",
608 .attrs
= netstat_attrs
,
611 #if IS_ENABLED(CONFIG_WIRELESS_EXT) || IS_ENABLED(CONFIG_CFG80211)
612 static struct attribute
*wireless_attrs
[] = {
616 static struct attribute_group wireless_group
= {
618 .attrs
= wireless_attrs
,
622 #else /* CONFIG_SYSFS */
623 #define net_class_groups NULL
624 #endif /* CONFIG_SYSFS */
/* Recover the rx_queue_attribute that embeds a struct attribute. */
#define to_rx_queue_attr(_attr) container_of(_attr,		\
    struct rx_queue_attribute, attr)

/* Recover the netdev_rx_queue that embeds a kobject. */
#define to_rx_queue(obj) container_of(obj, struct netdev_rx_queue, kobj)
632 static ssize_t
rx_queue_attr_show(struct kobject
*kobj
, struct attribute
*attr
,
635 struct rx_queue_attribute
*attribute
= to_rx_queue_attr(attr
);
636 struct netdev_rx_queue
*queue
= to_rx_queue(kobj
);
638 if (!attribute
->show
)
641 return attribute
->show(queue
, attribute
, buf
);
644 static ssize_t
rx_queue_attr_store(struct kobject
*kobj
, struct attribute
*attr
,
645 const char *buf
, size_t count
)
647 struct rx_queue_attribute
*attribute
= to_rx_queue_attr(attr
);
648 struct netdev_rx_queue
*queue
= to_rx_queue(kobj
);
650 if (!attribute
->store
)
653 return attribute
->store(queue
, attribute
, buf
, count
);
656 static const struct sysfs_ops rx_queue_sysfs_ops
= {
657 .show
= rx_queue_attr_show
,
658 .store
= rx_queue_attr_store
,
662 static ssize_t
show_rps_map(struct netdev_rx_queue
*queue
,
663 struct rx_queue_attribute
*attribute
, char *buf
)
669 if (!zalloc_cpumask_var(&mask
, GFP_KERNEL
))
673 map
= rcu_dereference(queue
->rps_map
);
675 for (i
= 0; i
< map
->len
; i
++)
676 cpumask_set_cpu(map
->cpus
[i
], mask
);
678 len
= snprintf(buf
, PAGE_SIZE
, "%*pb\n", cpumask_pr_args(mask
));
680 free_cpumask_var(mask
);
682 return len
< PAGE_SIZE
? len
: -EINVAL
;
685 static ssize_t
store_rps_map(struct netdev_rx_queue
*queue
,
686 struct rx_queue_attribute
*attribute
,
687 const char *buf
, size_t len
)
689 struct rps_map
*old_map
, *map
;
692 static DEFINE_SPINLOCK(rps_map_lock
);
694 if (!capable(CAP_NET_ADMIN
))
697 if (!alloc_cpumask_var(&mask
, GFP_KERNEL
))
700 err
= bitmap_parse(buf
, len
, cpumask_bits(mask
), nr_cpumask_bits
);
702 free_cpumask_var(mask
);
706 map
= kzalloc(max_t(unsigned int,
707 RPS_MAP_SIZE(cpumask_weight(mask
)), L1_CACHE_BYTES
),
710 free_cpumask_var(mask
);
715 for_each_cpu_and(cpu
, mask
, cpu_online_mask
)
716 map
->cpus
[i
++] = cpu
;
725 spin_lock(&rps_map_lock
);
726 old_map
= rcu_dereference_protected(queue
->rps_map
,
727 lockdep_is_held(&rps_map_lock
));
728 rcu_assign_pointer(queue
->rps_map
, map
);
729 spin_unlock(&rps_map_lock
);
732 static_key_slow_inc(&rps_needed
);
734 kfree_rcu(old_map
, rcu
);
735 static_key_slow_dec(&rps_needed
);
737 free_cpumask_var(mask
);
741 static ssize_t
show_rps_dev_flow_table_cnt(struct netdev_rx_queue
*queue
,
742 struct rx_queue_attribute
*attr
,
745 struct rps_dev_flow_table
*flow_table
;
746 unsigned long val
= 0;
749 flow_table
= rcu_dereference(queue
->rps_flow_table
);
751 val
= (unsigned long)flow_table
->mask
+ 1;
754 return sprintf(buf
, "%lu\n", val
);
757 static void rps_dev_flow_table_release(struct rcu_head
*rcu
)
759 struct rps_dev_flow_table
*table
= container_of(rcu
,
760 struct rps_dev_flow_table
, rcu
);
764 static ssize_t
store_rps_dev_flow_table_cnt(struct netdev_rx_queue
*queue
,
765 struct rx_queue_attribute
*attr
,
766 const char *buf
, size_t len
)
768 unsigned long mask
, count
;
769 struct rps_dev_flow_table
*table
, *old_table
;
770 static DEFINE_SPINLOCK(rps_dev_flow_lock
);
773 if (!capable(CAP_NET_ADMIN
))
776 rc
= kstrtoul(buf
, 0, &count
);
782 /* mask = roundup_pow_of_two(count) - 1;
783 * without overflows...
785 while ((mask
| (mask
>> 1)) != mask
)
787 /* On 64 bit arches, must check mask fits in table->mask (u32),
788 * and on 32bit arches, must check
789 * RPS_DEV_FLOW_TABLE_SIZE(mask + 1) doesn't overflow.
791 #if BITS_PER_LONG > 32
792 if (mask
> (unsigned long)(u32
)mask
)
795 if (mask
> (ULONG_MAX
- RPS_DEV_FLOW_TABLE_SIZE(1))
796 / sizeof(struct rps_dev_flow
)) {
797 /* Enforce a limit to prevent overflow */
801 table
= vmalloc(RPS_DEV_FLOW_TABLE_SIZE(mask
+ 1));
806 for (count
= 0; count
<= mask
; count
++)
807 table
->flows
[count
].cpu
= RPS_NO_CPU
;
811 spin_lock(&rps_dev_flow_lock
);
812 old_table
= rcu_dereference_protected(queue
->rps_flow_table
,
813 lockdep_is_held(&rps_dev_flow_lock
));
814 rcu_assign_pointer(queue
->rps_flow_table
, table
);
815 spin_unlock(&rps_dev_flow_lock
);
818 call_rcu(&old_table
->rcu
, rps_dev_flow_table_release
);
823 static struct rx_queue_attribute rps_cpus_attribute
=
824 __ATTR(rps_cpus
, S_IRUGO
| S_IWUSR
, show_rps_map
, store_rps_map
);
827 static struct rx_queue_attribute rps_dev_flow_table_cnt_attribute
=
828 __ATTR(rps_flow_cnt
, S_IRUGO
| S_IWUSR
,
829 show_rps_dev_flow_table_cnt
, store_rps_dev_flow_table_cnt
);
830 #endif /* CONFIG_RPS */
832 static struct attribute
*rx_queue_default_attrs
[] = {
834 &rps_cpus_attribute
.attr
,
835 &rps_dev_flow_table_cnt_attribute
.attr
,
840 static void rx_queue_release(struct kobject
*kobj
)
842 struct netdev_rx_queue
*queue
= to_rx_queue(kobj
);
845 struct rps_dev_flow_table
*flow_table
;
848 map
= rcu_dereference_protected(queue
->rps_map
, 1);
850 RCU_INIT_POINTER(queue
->rps_map
, NULL
);
854 flow_table
= rcu_dereference_protected(queue
->rps_flow_table
, 1);
856 RCU_INIT_POINTER(queue
->rps_flow_table
, NULL
);
857 call_rcu(&flow_table
->rcu
, rps_dev_flow_table_release
);
861 memset(kobj
, 0, sizeof(*kobj
));
865 static const void *rx_queue_namespace(struct kobject
*kobj
)
867 struct netdev_rx_queue
*queue
= to_rx_queue(kobj
);
868 struct device
*dev
= &queue
->dev
->dev
;
869 const void *ns
= NULL
;
871 if (dev
->class && dev
->class->ns_type
)
872 ns
= dev
->class->namespace(dev
);
877 static struct kobj_type rx_queue_ktype
= {
878 .sysfs_ops
= &rx_queue_sysfs_ops
,
879 .release
= rx_queue_release
,
880 .default_attrs
= rx_queue_default_attrs
,
881 .namespace = rx_queue_namespace
884 static int rx_queue_add_kobject(struct net_device
*dev
, int index
)
886 struct netdev_rx_queue
*queue
= dev
->_rx
+ index
;
887 struct kobject
*kobj
= &queue
->kobj
;
890 kobj
->kset
= dev
->queues_kset
;
891 error
= kobject_init_and_add(kobj
, &rx_queue_ktype
, NULL
,
896 if (dev
->sysfs_rx_queue_group
) {
897 error
= sysfs_create_group(kobj
, dev
->sysfs_rx_queue_group
);
902 kobject_uevent(kobj
, KOBJ_ADD
);
903 dev_hold(queue
->dev
);
910 #endif /* CONFIG_SYSFS */
913 net_rx_queue_update_kobjects(struct net_device
*dev
, int old_num
, int new_num
)
920 if (!dev
->sysfs_rx_queue_group
)
923 for (i
= old_num
; i
< new_num
; i
++) {
924 error
= rx_queue_add_kobject(dev
, i
);
931 while (--i
>= new_num
) {
932 if (dev
->sysfs_rx_queue_group
)
933 sysfs_remove_group(&dev
->_rx
[i
].kobj
,
934 dev
->sysfs_rx_queue_group
);
935 kobject_put(&dev
->_rx
[i
].kobj
);
946 * netdev_queue sysfs structures and functions.
948 struct netdev_queue_attribute
{
949 struct attribute attr
;
950 ssize_t (*show
)(struct netdev_queue
*queue
,
951 struct netdev_queue_attribute
*attr
, char *buf
);
952 ssize_t (*store
)(struct netdev_queue
*queue
,
953 struct netdev_queue_attribute
*attr
, const char *buf
, size_t len
);
/* Recover the netdev_queue_attribute that embeds a struct attribute. */
#define to_netdev_queue_attr(_attr) container_of(_attr,		\
    struct netdev_queue_attribute, attr)

/* Recover the netdev_queue that embeds a kobject. */
#define to_netdev_queue(obj) container_of(obj, struct netdev_queue, kobj)
960 static ssize_t
netdev_queue_attr_show(struct kobject
*kobj
,
961 struct attribute
*attr
, char *buf
)
963 struct netdev_queue_attribute
*attribute
= to_netdev_queue_attr(attr
);
964 struct netdev_queue
*queue
= to_netdev_queue(kobj
);
966 if (!attribute
->show
)
969 return attribute
->show(queue
, attribute
, buf
);
972 static ssize_t
netdev_queue_attr_store(struct kobject
*kobj
,
973 struct attribute
*attr
,
974 const char *buf
, size_t count
)
976 struct netdev_queue_attribute
*attribute
= to_netdev_queue_attr(attr
);
977 struct netdev_queue
*queue
= to_netdev_queue(kobj
);
979 if (!attribute
->store
)
982 return attribute
->store(queue
, attribute
, buf
, count
);
985 static const struct sysfs_ops netdev_queue_sysfs_ops
= {
986 .show
= netdev_queue_attr_show
,
987 .store
= netdev_queue_attr_store
,
990 static ssize_t
show_trans_timeout(struct netdev_queue
*queue
,
991 struct netdev_queue_attribute
*attribute
,
994 unsigned long trans_timeout
;
996 spin_lock_irq(&queue
->_xmit_lock
);
997 trans_timeout
= queue
->trans_timeout
;
998 spin_unlock_irq(&queue
->_xmit_lock
);
1000 return sprintf(buf
, "%lu", trans_timeout
);
1004 static inline unsigned int get_netdev_queue_index(struct netdev_queue
*queue
)
1006 struct net_device
*dev
= queue
->dev
;
1009 for (i
= 0; i
< dev
->num_tx_queues
; i
++)
1010 if (queue
== &dev
->_tx
[i
])
1013 BUG_ON(i
>= dev
->num_tx_queues
);
1018 static ssize_t
show_tx_maxrate(struct netdev_queue
*queue
,
1019 struct netdev_queue_attribute
*attribute
,
1022 return sprintf(buf
, "%lu\n", queue
->tx_maxrate
);
1025 static ssize_t
set_tx_maxrate(struct netdev_queue
*queue
,
1026 struct netdev_queue_attribute
*attribute
,
1027 const char *buf
, size_t len
)
1029 struct net_device
*dev
= queue
->dev
;
1030 int err
, index
= get_netdev_queue_index(queue
);
1033 err
= kstrtou32(buf
, 10, &rate
);
1037 if (!rtnl_trylock())
1038 return restart_syscall();
1041 if (dev
->netdev_ops
->ndo_set_tx_maxrate
)
1042 err
= dev
->netdev_ops
->ndo_set_tx_maxrate(dev
, index
, rate
);
1046 queue
->tx_maxrate
= rate
;
1052 static struct netdev_queue_attribute queue_tx_maxrate
=
1053 __ATTR(tx_maxrate
, S_IRUGO
| S_IWUSR
,
1054 show_tx_maxrate
, set_tx_maxrate
);
1057 static struct netdev_queue_attribute queue_trans_timeout
=
1058 __ATTR(tx_timeout
, S_IRUGO
, show_trans_timeout
, NULL
);
/*
 * Byte queue limits sysfs structures and functions.
 */

/*
 * Write @value into @buf as unsigned decimal followed by a newline.
 * Returns the number of characters written, as reported by sprintf().
 */
static ssize_t bql_show(char *buf, unsigned int value)
{
	return sprintf(buf, "%u\n", value);
}
1069 static ssize_t
bql_set(const char *buf
, const size_t count
,
1070 unsigned int *pvalue
)
1075 if (!strcmp(buf
, "max") || !strcmp(buf
, "max\n"))
1076 value
= DQL_MAX_LIMIT
;
1078 err
= kstrtouint(buf
, 10, &value
);
1081 if (value
> DQL_MAX_LIMIT
)
1090 static ssize_t
bql_show_hold_time(struct netdev_queue
*queue
,
1091 struct netdev_queue_attribute
*attr
,
1094 struct dql
*dql
= &queue
->dql
;
1096 return sprintf(buf
, "%u\n", jiffies_to_msecs(dql
->slack_hold_time
));
1099 static ssize_t
bql_set_hold_time(struct netdev_queue
*queue
,
1100 struct netdev_queue_attribute
*attribute
,
1101 const char *buf
, size_t len
)
1103 struct dql
*dql
= &queue
->dql
;
1107 err
= kstrtouint(buf
, 10, &value
);
1111 dql
->slack_hold_time
= msecs_to_jiffies(value
);
1116 static struct netdev_queue_attribute bql_hold_time_attribute
=
1117 __ATTR(hold_time
, S_IRUGO
| S_IWUSR
, bql_show_hold_time
,
1120 static ssize_t
bql_show_inflight(struct netdev_queue
*queue
,
1121 struct netdev_queue_attribute
*attr
,
1124 struct dql
*dql
= &queue
->dql
;
1126 return sprintf(buf
, "%u\n", dql
->num_queued
- dql
->num_completed
);
1129 static struct netdev_queue_attribute bql_inflight_attribute
=
1130 __ATTR(inflight
, S_IRUGO
, bql_show_inflight
, NULL
);
1132 #define BQL_ATTR(NAME, FIELD) \
1133 static ssize_t bql_show_ ## NAME(struct netdev_queue *queue, \
1134 struct netdev_queue_attribute *attr, \
1137 return bql_show(buf, queue->dql.FIELD); \
1140 static ssize_t bql_set_ ## NAME(struct netdev_queue *queue, \
1141 struct netdev_queue_attribute *attr, \
1142 const char *buf, size_t len) \
1144 return bql_set(buf, len, &queue->dql.FIELD); \
1147 static struct netdev_queue_attribute bql_ ## NAME ## _attribute = \
1148 __ATTR(NAME, S_IRUGO | S_IWUSR, bql_show_ ## NAME, \
1151 BQL_ATTR(limit
, limit
)
1152 BQL_ATTR(limit_max
, max_limit
)
1153 BQL_ATTR(limit_min
, min_limit
)
1155 static struct attribute
*dql_attrs
[] = {
1156 &bql_limit_attribute
.attr
,
1157 &bql_limit_max_attribute
.attr
,
1158 &bql_limit_min_attribute
.attr
,
1159 &bql_hold_time_attribute
.attr
,
1160 &bql_inflight_attribute
.attr
,
1164 static struct attribute_group dql_group
= {
1165 .name
= "byte_queue_limits",
1168 #endif /* CONFIG_BQL */
1171 static ssize_t
show_xps_map(struct netdev_queue
*queue
,
1172 struct netdev_queue_attribute
*attribute
, char *buf
)
1174 struct net_device
*dev
= queue
->dev
;
1175 struct xps_dev_maps
*dev_maps
;
1177 unsigned long index
;
1180 if (!zalloc_cpumask_var(&mask
, GFP_KERNEL
))
1183 index
= get_netdev_queue_index(queue
);
1186 dev_maps
= rcu_dereference(dev
->xps_maps
);
1188 for_each_possible_cpu(i
) {
1189 struct xps_map
*map
=
1190 rcu_dereference(dev_maps
->cpu_map
[i
]);
1193 for (j
= 0; j
< map
->len
; j
++) {
1194 if (map
->queues
[j
] == index
) {
1195 cpumask_set_cpu(i
, mask
);
1204 len
= snprintf(buf
, PAGE_SIZE
, "%*pb\n", cpumask_pr_args(mask
));
1205 free_cpumask_var(mask
);
1206 return len
< PAGE_SIZE
? len
: -EINVAL
;
1209 static ssize_t
store_xps_map(struct netdev_queue
*queue
,
1210 struct netdev_queue_attribute
*attribute
,
1211 const char *buf
, size_t len
)
1213 struct net_device
*dev
= queue
->dev
;
1214 unsigned long index
;
1218 if (!capable(CAP_NET_ADMIN
))
1221 if (!alloc_cpumask_var(&mask
, GFP_KERNEL
))
1224 index
= get_netdev_queue_index(queue
);
1226 err
= bitmap_parse(buf
, len
, cpumask_bits(mask
), nr_cpumask_bits
);
1228 free_cpumask_var(mask
);
1232 err
= netif_set_xps_queue(dev
, mask
, index
);
1234 free_cpumask_var(mask
);
1239 static struct netdev_queue_attribute xps_cpus_attribute
=
1240 __ATTR(xps_cpus
, S_IRUGO
| S_IWUSR
, show_xps_map
, store_xps_map
);
1241 #endif /* CONFIG_XPS */
1243 static struct attribute
*netdev_queue_default_attrs
[] = {
1244 &queue_trans_timeout
.attr
,
1246 &xps_cpus_attribute
.attr
,
1247 &queue_tx_maxrate
.attr
,
1252 static void netdev_queue_release(struct kobject
*kobj
)
1254 struct netdev_queue
*queue
= to_netdev_queue(kobj
);
1256 memset(kobj
, 0, sizeof(*kobj
));
1257 dev_put(queue
->dev
);
1260 static const void *netdev_queue_namespace(struct kobject
*kobj
)
1262 struct netdev_queue
*queue
= to_netdev_queue(kobj
);
1263 struct device
*dev
= &queue
->dev
->dev
;
1264 const void *ns
= NULL
;
1266 if (dev
->class && dev
->class->ns_type
)
1267 ns
= dev
->class->namespace(dev
);
1272 static struct kobj_type netdev_queue_ktype
= {
1273 .sysfs_ops
= &netdev_queue_sysfs_ops
,
1274 .release
= netdev_queue_release
,
1275 .default_attrs
= netdev_queue_default_attrs
,
1276 .namespace = netdev_queue_namespace
,
1279 static int netdev_queue_add_kobject(struct net_device
*dev
, int index
)
1281 struct netdev_queue
*queue
= dev
->_tx
+ index
;
1282 struct kobject
*kobj
= &queue
->kobj
;
1285 kobj
->kset
= dev
->queues_kset
;
1286 error
= kobject_init_and_add(kobj
, &netdev_queue_ktype
, NULL
,
1292 error
= sysfs_create_group(kobj
, &dql_group
);
1297 kobject_uevent(kobj
, KOBJ_ADD
);
1298 dev_hold(queue
->dev
);
1305 #endif /* CONFIG_SYSFS */
1308 netdev_queue_update_kobjects(struct net_device
*dev
, int old_num
, int new_num
)
1314 for (i
= old_num
; i
< new_num
; i
++) {
1315 error
= netdev_queue_add_kobject(dev
, i
);
1322 while (--i
>= new_num
) {
1323 struct netdev_queue
*queue
= dev
->_tx
+ i
;
1326 sysfs_remove_group(&queue
->kobj
, &dql_group
);
1328 kobject_put(&queue
->kobj
);
1334 #endif /* CONFIG_SYSFS */
1337 static int register_queue_kobjects(struct net_device
*dev
)
1339 int error
= 0, txq
= 0, rxq
= 0, real_rx
= 0, real_tx
= 0;
1342 dev
->queues_kset
= kset_create_and_add("queues",
1343 NULL
, &dev
->dev
.kobj
);
1344 if (!dev
->queues_kset
)
1346 real_rx
= dev
->real_num_rx_queues
;
1348 real_tx
= dev
->real_num_tx_queues
;
1350 error
= net_rx_queue_update_kobjects(dev
, 0, real_rx
);
1355 error
= netdev_queue_update_kobjects(dev
, 0, real_tx
);
1363 netdev_queue_update_kobjects(dev
, txq
, 0);
1364 net_rx_queue_update_kobjects(dev
, rxq
, 0);
1368 static void remove_queue_kobjects(struct net_device
*dev
)
1370 int real_rx
= 0, real_tx
= 0;
1373 real_rx
= dev
->real_num_rx_queues
;
1375 real_tx
= dev
->real_num_tx_queues
;
1377 net_rx_queue_update_kobjects(dev
, real_rx
, 0);
1378 netdev_queue_update_kobjects(dev
, real_tx
, 0);
1380 kset_unregister(dev
->queues_kset
);
1384 static bool net_current_may_mount(void)
1386 struct net
*net
= current
->nsproxy
->net_ns
;
1388 return ns_capable(net
->user_ns
, CAP_SYS_ADMIN
);
1391 static void *net_grab_current_ns(void)
1393 struct net
*ns
= current
->nsproxy
->net_ns
;
1394 #ifdef CONFIG_NET_NS
1396 atomic_inc(&ns
->passive
);
1401 static const void *net_initial_ns(void)
/* Namespace tag for a netlink socket: the socket's network namespace. */
static const void *net_netlink_ns(struct sock *sk)
{
	return sock_net(sk);
}
1411 struct kobj_ns_type_operations net_ns_type_operations
= {
1412 .type
= KOBJ_NS_TYPE_NET
,
1413 .current_may_mount
= net_current_may_mount
,
1414 .grab_current_ns
= net_grab_current_ns
,
1415 .netlink_ns
= net_netlink_ns
,
1416 .initial_ns
= net_initial_ns
,
1417 .drop_ns
= net_drop_ns
,
1419 EXPORT_SYMBOL_GPL(net_ns_type_operations
);
1421 static int netdev_uevent(struct device
*d
, struct kobj_uevent_env
*env
)
1423 struct net_device
*dev
= to_net_dev(d
);
1426 /* pass interface to uevent. */
1427 retval
= add_uevent_var(env
, "INTERFACE=%s", dev
->name
);
1431 /* pass ifindex to uevent.
1432 * ifindex is useful as it won't change (interface name may change)
1433 * and is what RtNetlink uses natively. */
1434 retval
= add_uevent_var(env
, "IFINDEX=%d", dev
->ifindex
);
1441 * netdev_release -- destroy and free a dead device.
1442 * Called when last reference to device kobject is gone.
1444 static void netdev_release(struct device
*d
)
1446 struct net_device
*dev
= to_net_dev(d
);
1448 BUG_ON(dev
->reg_state
!= NETREG_RELEASED
);
1450 kfree(dev
->ifalias
);
1451 netdev_freemem(dev
);
1454 static const void *net_namespace(struct device
*d
)
1456 struct net_device
*dev
;
1457 dev
= container_of(d
, struct net_device
, dev
);
1458 return dev_net(dev
);
1461 static struct class net_class
= {
1463 .dev_release
= netdev_release
,
1464 .dev_groups
= net_class_groups
,
1465 .dev_uevent
= netdev_uevent
,
1466 .ns_type
= &net_ns_type_operations
,
1467 .namespace = net_namespace
,
1470 #ifdef CONFIG_OF_NET
1471 static int of_dev_node_match(struct device
*dev
, const void *data
)
1476 ret
= dev
->parent
->of_node
== data
;
1478 return ret
== 0 ? dev
->of_node
== data
: ret
;
1481 struct net_device
*of_find_net_device_by_node(struct device_node
*np
)
1485 dev
= class_find_device(&net_class
, NULL
, np
, of_dev_node_match
);
1489 return to_net_dev(dev
);
1491 EXPORT_SYMBOL(of_find_net_device_by_node
);
1494 /* Delete sysfs entries but hold kobject reference until after all
1495 * netdev references are gone.
1497 void netdev_unregister_kobject(struct net_device
*ndev
)
1499 struct device
*dev
= &(ndev
->dev
);
1501 kobject_get(&dev
->kobj
);
1503 remove_queue_kobjects(ndev
);
1505 pm_runtime_set_memalloc_noio(dev
, false);
1510 /* Create sysfs entries for network device. */
1511 int netdev_register_kobject(struct net_device
*ndev
)
1513 struct device
*dev
= &(ndev
->dev
);
1514 const struct attribute_group
**groups
= ndev
->sysfs_groups
;
1517 device_initialize(dev
);
1518 dev
->class = &net_class
;
1519 dev
->platform_data
= ndev
;
1520 dev
->groups
= groups
;
1522 dev_set_name(dev
, "%s", ndev
->name
);
1525 /* Allow for a device specific group */
1529 *groups
++ = &netstat_group
;
1531 #if IS_ENABLED(CONFIG_WIRELESS_EXT) || IS_ENABLED(CONFIG_CFG80211)
1532 if (ndev
->ieee80211_ptr
)
1533 *groups
++ = &wireless_group
;
1534 #if IS_ENABLED(CONFIG_WIRELESS_EXT)
1535 else if (ndev
->wireless_handlers
)
1536 *groups
++ = &wireless_group
;
1539 #endif /* CONFIG_SYSFS */
1541 error
= device_add(dev
);
1545 error
= register_queue_kobjects(ndev
);
1551 pm_runtime_set_memalloc_noio(dev
, true);
1556 int netdev_class_create_file_ns(struct class_attribute
*class_attr
,
1559 return class_create_file_ns(&net_class
, class_attr
, ns
);
1561 EXPORT_SYMBOL(netdev_class_create_file_ns
);
1563 void netdev_class_remove_file_ns(struct class_attribute
*class_attr
,
1566 class_remove_file_ns(&net_class
, class_attr
, ns
);
1568 EXPORT_SYMBOL(netdev_class_remove_file_ns
);
1570 int __init
netdev_kobject_init(void)
1572 kobj_ns_type_register(&net_ns_type_operations
);
1573 return class_register(&net_class
);