2 * INET An implementation of the TCP/IP protocol suite for the LINUX
3 * operating system. INET is implemented using the BSD Socket
4 * interface as the means of communication with the user level.
6 * Definitions for the Interfaces handler.
8 * Version: @(#)dev.h 1.0.10 08/12/93
11 * Fred N. van Kempen, <waltje@uWalt.NL.Mugnet.ORG>
12 * Corey Minyard <wf-rch!minyard@relay.EU.net>
13 * Donald J. Becker, <becker@cesdis.gsfc.nasa.gov>
14 * Alan Cox, <alan@lxorguk.ukuu.org.uk>
15 * Bjorn Ekwall. <bj0rn@blox.se>
16 * Pekka Riikonen <priikone@poseidon.pspt.fi>
18 * This program is free software; you can redistribute it and/or
19 * modify it under the terms of the GNU General Public License
20 * as published by the Free Software Foundation; either version
21 * 2 of the License, or (at your option) any later version.
23 * Moved to /usr/include/linux for NET3
25 #ifndef _LINUX_NETDEVICE_H
26 #define _LINUX_NETDEVICE_H
29 #include <linux/if_ether.h>
30 #include <linux/if_packet.h>
31 #include <linux/if_link.h>
34 #include <linux/pm_qos.h>
35 #include <linux/timer.h>
36 #include <linux/delay.h>
37 #include <linux/atomic.h>
38 #include <asm/cache.h>
39 #include <asm/byteorder.h>
41 #include <linux/device.h>
42 #include <linux/percpu.h>
43 #include <linux/rculist.h>
44 #include <linux/dmaengine.h>
45 #include <linux/workqueue.h>
46 #include <linux/dynamic_queue_limits.h>
48 #include <linux/ethtool.h>
49 #include <net/net_namespace.h>
52 #include <net/dcbnl.h>
54 #include <net/netprio_cgroup.h>
56 #include <linux/netdev_features.h>
63 /* source back-compat hooks */
64 #define SET_ETHTOOL_OPS(netdev,ops) \
65 ( (netdev)->ethtool_ops = (ops) )
67 /* hardware address assignment types */
68 #define NET_ADDR_PERM 0 /* address is permanent (default) */
69 #define NET_ADDR_RANDOM 1 /* address is generated randomly */
70 #define NET_ADDR_STOLEN 2 /* address is stolen from other device */
72 /* Backlog congestion levels */
73 #define NET_RX_SUCCESS 0 /* keep 'em coming, baby */
74 #define NET_RX_DROP 1 /* packet dropped */
77 * Transmit return codes: transmit return codes originate from three different
80 * - qdisc return codes
81 * - driver transmit return codes
84 * Drivers are allowed to return any one of those in their hard_start_xmit()
85 * function. Real network devices commonly used with qdiscs should only return
86 * the driver transmit return codes though - when qdiscs are used, the actual
87 * transmission happens asynchronously, so the value is not propagated to
88 * higher layers. Virtual network devices transmit synchronously, in this case
89 * the driver transmit return codes are consumed by dev_queue_xmit(), all
90 * others are propagated to higher layers.
93 /* qdisc ->enqueue() return codes. */
94 #define NET_XMIT_SUCCESS 0x00
95 #define NET_XMIT_DROP 0x01 /* skb dropped */
96 #define NET_XMIT_CN 0x02 /* congestion notification */
97 #define NET_XMIT_POLICED 0x03 /* skb is shot by police */
98 #define NET_XMIT_MASK 0x0f /* qdisc flags in net/sch_generic.h */
100 /* NET_XMIT_CN is special. It does not guarantee that this packet is lost. It
101 * indicates that the device will soon be dropping packets, or already drops
102 * some packets of the same priority; prompting us to send less aggressively. */
103 #define net_xmit_eval(e) ((e) == NET_XMIT_CN ? 0 : (e))
104 #define net_xmit_errno(e) ((e) != NET_XMIT_CN ? -ENOBUFS : 0)
106 /* Driver transmit return codes */
107 #define NETDEV_TX_MASK 0xf0
110 __NETDEV_TX_MIN
= INT_MIN
, /* make sure enum is signed */
111 NETDEV_TX_OK
= 0x00, /* driver took care of packet */
112 NETDEV_TX_BUSY
= 0x10, /* driver tx path was busy*/
113 NETDEV_TX_LOCKED
= 0x20, /* driver tx lock was already taken */
115 typedef enum netdev_tx netdev_tx_t
;
118 * Current order: NETDEV_TX_MASK > NET_XMIT_MASK >= 0 is significant;
119 * hard_start_xmit() return < NET_XMIT_MASK means skb was consumed.
121 static inline bool dev_xmit_complete(int rc
)
124 * Positive cases with an skb consumed by a driver:
125 * - successful transmission (rc == NETDEV_TX_OK)
126 * - error while transmitting (rc < 0)
127 * - error while queueing to a different device (rc & NET_XMIT_MASK)
129 if (likely(rc
< NET_XMIT_MASK
))
137 #define MAX_ADDR_LEN 32 /* Largest hardware address length */
139 /* Initial net device group. All devices belong to group 0 by default. */
140 #define INIT_NETDEV_GROUP 0
144 * Compute the worst case header length according to the protocols
148 #if defined(CONFIG_WLAN) || IS_ENABLED(CONFIG_AX25)
149 # if defined(CONFIG_MAC80211_MESH)
150 # define LL_MAX_HEADER 128
152 # define LL_MAX_HEADER 96
154 #elif IS_ENABLED(CONFIG_TR)
155 # define LL_MAX_HEADER 48
157 # define LL_MAX_HEADER 32
160 #if !IS_ENABLED(CONFIG_NET_IPIP) && !IS_ENABLED(CONFIG_NET_IPGRE) && \
161 !IS_ENABLED(CONFIG_IPV6_SIT) && !IS_ENABLED(CONFIG_IPV6_TUNNEL)
162 #define MAX_HEADER LL_MAX_HEADER
164 #define MAX_HEADER (LL_MAX_HEADER + 48)
168 * Old network device statistics. Fields are native words
169 * (unsigned long) so they can be read and written atomically.
172 struct net_device_stats
{
173 unsigned long rx_packets
;
174 unsigned long tx_packets
;
175 unsigned long rx_bytes
;
176 unsigned long tx_bytes
;
177 unsigned long rx_errors
;
178 unsigned long tx_errors
;
179 unsigned long rx_dropped
;
180 unsigned long tx_dropped
;
181 unsigned long multicast
;
182 unsigned long collisions
;
183 unsigned long rx_length_errors
;
184 unsigned long rx_over_errors
;
185 unsigned long rx_crc_errors
;
186 unsigned long rx_frame_errors
;
187 unsigned long rx_fifo_errors
;
188 unsigned long rx_missed_errors
;
189 unsigned long tx_aborted_errors
;
190 unsigned long tx_carrier_errors
;
191 unsigned long tx_fifo_errors
;
192 unsigned long tx_heartbeat_errors
;
193 unsigned long tx_window_errors
;
194 unsigned long rx_compressed
;
195 unsigned long tx_compressed
;
198 #endif /* __KERNEL__ */
201 /* Media selection options. */
214 #include <linux/cache.h>
215 #include <linux/skbuff.h>
218 #include <linux/jump_label.h>
219 extern struct jump_label_key rps_needed
;
226 struct netdev_hw_addr
{
227 struct list_head list
;
228 unsigned char addr
[MAX_ADDR_LEN
];
230 #define NETDEV_HW_ADDR_T_LAN 1
231 #define NETDEV_HW_ADDR_T_SAN 2
232 #define NETDEV_HW_ADDR_T_SLAVE 3
233 #define NETDEV_HW_ADDR_T_UNICAST 4
234 #define NETDEV_HW_ADDR_T_MULTICAST 5
238 struct rcu_head rcu_head
;
241 struct netdev_hw_addr_list
{
242 struct list_head list
;
246 #define netdev_hw_addr_list_count(l) ((l)->count)
247 #define netdev_hw_addr_list_empty(l) (netdev_hw_addr_list_count(l) == 0)
248 #define netdev_hw_addr_list_for_each(ha, l) \
249 list_for_each_entry(ha, &(l)->list, list)
251 #define netdev_uc_count(dev) netdev_hw_addr_list_count(&(dev)->uc)
252 #define netdev_uc_empty(dev) netdev_hw_addr_list_empty(&(dev)->uc)
253 #define netdev_for_each_uc_addr(ha, dev) \
254 netdev_hw_addr_list_for_each(ha, &(dev)->uc)
256 #define netdev_mc_count(dev) netdev_hw_addr_list_count(&(dev)->mc)
257 #define netdev_mc_empty(dev) netdev_hw_addr_list_empty(&(dev)->mc)
258 #define netdev_for_each_mc_addr(ha, dev) \
259 netdev_hw_addr_list_for_each(ha, &(dev)->mc)
266 /* cached hardware header; allow for machine alignment needs. */
267 #define HH_DATA_MOD 16
268 #define HH_DATA_OFF(__len) \
269 (HH_DATA_MOD - (((__len - 1) & (HH_DATA_MOD - 1)) + 1))
270 #define HH_DATA_ALIGN(__len) \
271 (((__len)+(HH_DATA_MOD-1))&~(HH_DATA_MOD - 1))
272 unsigned long hh_data
[HH_DATA_ALIGN(LL_MAX_HEADER
) / sizeof(long)];
275 /* Reserve HH_DATA_MOD byte aligned hard_header_len, but at least that much.
277 * dev->hard_header_len ? (dev->hard_header_len +
278 * (HH_DATA_MOD - 1)) & ~(HH_DATA_MOD - 1) : 0
280 * We could use other alignment values, but we must maintain the
281 * relationship HH alignment <= LL alignment.
283 #define LL_RESERVED_SPACE(dev) \
284 ((((dev)->hard_header_len+(dev)->needed_headroom)&~(HH_DATA_MOD - 1)) + HH_DATA_MOD)
285 #define LL_RESERVED_SPACE_EXTRA(dev,extra) \
286 ((((dev)->hard_header_len+(dev)->needed_headroom+(extra))&~(HH_DATA_MOD - 1)) + HH_DATA_MOD)
289 int (*create
) (struct sk_buff
*skb
, struct net_device
*dev
,
290 unsigned short type
, const void *daddr
,
291 const void *saddr
, unsigned len
);
292 int (*parse
)(const struct sk_buff
*skb
, unsigned char *haddr
);
293 int (*rebuild
)(struct sk_buff
*skb
);
294 int (*cache
)(const struct neighbour
*neigh
, struct hh_cache
*hh
, __be16 type
);
295 void (*cache_update
)(struct hh_cache
*hh
,
296 const struct net_device
*dev
,
297 const unsigned char *haddr
);
300 /* These flag bits are private to the generic network queueing
301 * layer, they may not be explicitly referenced by any other
305 enum netdev_state_t
{
307 __LINK_STATE_PRESENT
,
308 __LINK_STATE_NOCARRIER
,
309 __LINK_STATE_LINKWATCH_PENDING
,
310 __LINK_STATE_DORMANT
,
315 * This structure holds at boot time configured netdevice settings. They
316 * are then used in the device probing.
318 struct netdev_boot_setup
{
322 #define NETDEV_BOOT_SETUP_MAX 8
324 extern int __init
netdev_boot_setup(char *str
);
327 * Structure for NAPI scheduling similar to tasklet but with weighting
330 /* The poll_list must only be managed by the entity which
331 * changes the state of the NAPI_STATE_SCHED bit. This means
332 * whoever atomically sets that bit can add this napi_struct
333 * to the per-cpu poll_list, and whoever clears that bit
334 * can remove from the list right before clearing the bit.
336 struct list_head poll_list
;
340 int (*poll
)(struct napi_struct
*, int);
341 #ifdef CONFIG_NETPOLL
342 spinlock_t poll_lock
;
346 unsigned int gro_count
;
348 struct net_device
*dev
;
349 struct list_head dev_list
;
350 struct sk_buff
*gro_list
;
355 NAPI_STATE_SCHED
, /* Poll is scheduled */
356 NAPI_STATE_DISABLE
, /* Disable pending */
357 NAPI_STATE_NPSVC
, /* Netpoll - don't dequeue from poll_list */
367 typedef enum gro_result gro_result_t
;
370 * enum rx_handler_result - Possible return values for rx_handlers.
371 * @RX_HANDLER_CONSUMED: skb was consumed by rx_handler, do not process it
373 * @RX_HANDLER_ANOTHER: Do another round in receive path. This is indicated in
374 * case skb->dev was changed by rx_handler.
375 * @RX_HANDLER_EXACT: Force exact delivery, no wildcard.
376 * @RX_HANDLER_PASS: Do nothing, passe the skb as if no rx_handler was called.
378 * rx_handlers are functions called from inside __netif_receive_skb(), to do
379 * special processing of the skb, prior to delivery to protocol handlers.
381 * Currently, a net_device can only have a single rx_handler registered. Trying
382 * to register a second rx_handler will return -EBUSY.
384 * To register a rx_handler on a net_device, use netdev_rx_handler_register().
385 * To unregister a rx_handler on a net_device, use
386 * netdev_rx_handler_unregister().
388 * Upon return, rx_handler is expected to tell __netif_receive_skb() what to
391 * If the rx_handler consumed to skb in some way, it should return
392 * RX_HANDLER_CONSUMED. This is appropriate when the rx_handler arranged for
393 * the skb to be delivered in some other ways.
395 * If the rx_handler changed skb->dev, to divert the skb to another
396 * net_device, it should return RX_HANDLER_ANOTHER. The rx_handler for the
397 * new device will be called if it exists.
399 * If the rx_handler consider the skb should be ignored, it should return
400 * RX_HANDLER_EXACT. The skb will only be delivered to protocol handlers that
401 * are registred on exact device (ptype->dev == skb->dev).
403 * If the rx_handler didn't changed skb->dev, but want the skb to be normally
404 * delivered, it should return RX_HANDLER_PASS.
406 * A device without a registered rx_handler will behave as if rx_handler
407 * returned RX_HANDLER_PASS.
410 enum rx_handler_result
{
416 typedef enum rx_handler_result rx_handler_result_t
;
417 typedef rx_handler_result_t
rx_handler_func_t(struct sk_buff
**pskb
);
419 extern void __napi_schedule(struct napi_struct
*n
);
421 static inline int napi_disable_pending(struct napi_struct
*n
)
423 return test_bit(NAPI_STATE_DISABLE
, &n
->state
);
427 * napi_schedule_prep - check if napi can be scheduled
430 * Test if NAPI routine is already running, and if not mark
431 * it as running. This is used as a condition variable
432 * insure only one NAPI poll instance runs. We also make
433 * sure there is no pending NAPI disable.
435 static inline int napi_schedule_prep(struct napi_struct
*n
)
437 return !napi_disable_pending(n
) &&
438 !test_and_set_bit(NAPI_STATE_SCHED
, &n
->state
);
442 * napi_schedule - schedule NAPI poll
445 * Schedule NAPI poll routine to be called if it is not already
448 static inline void napi_schedule(struct napi_struct
*n
)
450 if (napi_schedule_prep(n
))
454 /* Try to reschedule poll. Called by dev->poll() after napi_complete(). */
455 static inline int napi_reschedule(struct napi_struct
*napi
)
457 if (napi_schedule_prep(napi
)) {
458 __napi_schedule(napi
);
465 * napi_complete - NAPI processing complete
468 * Mark NAPI processing as complete.
470 extern void __napi_complete(struct napi_struct
*n
);
471 extern void napi_complete(struct napi_struct
*n
);
474 * napi_disable - prevent NAPI from scheduling
477 * Stop NAPI from being scheduled on this context.
478 * Waits till any outstanding processing completes.
480 static inline void napi_disable(struct napi_struct
*n
)
482 set_bit(NAPI_STATE_DISABLE
, &n
->state
);
483 while (test_and_set_bit(NAPI_STATE_SCHED
, &n
->state
))
485 clear_bit(NAPI_STATE_DISABLE
, &n
->state
);
489 * napi_enable - enable NAPI scheduling
492 * Resume NAPI from being scheduled on this context.
493 * Must be paired with napi_disable.
495 static inline void napi_enable(struct napi_struct
*n
)
497 BUG_ON(!test_bit(NAPI_STATE_SCHED
, &n
->state
));
498 smp_mb__before_clear_bit();
499 clear_bit(NAPI_STATE_SCHED
, &n
->state
);
504 * napi_synchronize - wait until NAPI is not running
507 * Wait until NAPI is done being scheduled on this context.
508 * Waits till any outstanding processing completes but
509 * does not disable future activations.
511 static inline void napi_synchronize(const struct napi_struct
*n
)
513 while (test_bit(NAPI_STATE_SCHED
, &n
->state
))
517 # define napi_synchronize(n) barrier()
520 enum netdev_queue_state_t
{
521 __QUEUE_STATE_DRV_XOFF
,
522 __QUEUE_STATE_STACK_XOFF
,
523 __QUEUE_STATE_FROZEN
,
524 #define QUEUE_STATE_ANY_XOFF ((1 << __QUEUE_STATE_DRV_XOFF) | \
525 (1 << __QUEUE_STATE_STACK_XOFF))
526 #define QUEUE_STATE_ANY_XOFF_OR_FROZEN (QUEUE_STATE_ANY_XOFF | \
527 (1 << __QUEUE_STATE_FROZEN))
530 * __QUEUE_STATE_DRV_XOFF is used by drivers to stop the transmit queue. The
531 * netif_tx_* functions below are used to manipulate this flag. The
532 * __QUEUE_STATE_STACK_XOFF flag is used by the stack to stop the transmit
533 * queue independently. The netif_xmit_*stopped functions below are called
534 * to check if the queue has been stopped by the driver or stack (either
535 * of the XOFF bits are set in the state). Drivers should not need to call
536 * netif_xmit*stopped functions, they should only be using netif_tx_*.
539 struct netdev_queue
{
543 struct net_device
*dev
;
545 struct Qdisc
*qdisc_sleeping
;
549 #if defined(CONFIG_XPS) && defined(CONFIG_NUMA)
555 spinlock_t _xmit_lock ____cacheline_aligned_in_smp
;
558 * please use this field instead of dev->trans_start
560 unsigned long trans_start
;
563 * Number of TX timeouts for this queue
564 * (/sys/class/net/DEV/Q/trans_timeout)
566 unsigned long trans_timeout
;
573 } ____cacheline_aligned_in_smp
;
575 static inline int netdev_queue_numa_node_read(const struct netdev_queue
*q
)
577 #if defined(CONFIG_XPS) && defined(CONFIG_NUMA)
584 static inline void netdev_queue_numa_node_write(struct netdev_queue
*q
, int node
)
586 #if defined(CONFIG_XPS) && defined(CONFIG_NUMA)
593 * This structure holds an RPS map which can be of variable length. The
594 * map is an array of CPUs.
601 #define RPS_MAP_SIZE(_num) (sizeof(struct rps_map) + (_num * sizeof(u16)))
604 * The rps_dev_flow structure contains the mapping of a flow to a CPU, the
605 * tail pointer for that CPU's input queue at the time of last enqueue, and
606 * a hardware filter index.
608 struct rps_dev_flow
{
611 unsigned int last_qtail
;
613 #define RPS_NO_FILTER 0xffff
616 * The rps_dev_flow_table structure contains a table of flow mappings.
618 struct rps_dev_flow_table
{
621 struct work_struct free_work
;
622 struct rps_dev_flow flows
[0];
624 #define RPS_DEV_FLOW_TABLE_SIZE(_num) (sizeof(struct rps_dev_flow_table) + \
625 (_num * sizeof(struct rps_dev_flow)))
628 * The rps_sock_flow_table contains mappings of flows to the last CPU
629 * on which they were processed by the application (set in recvmsg).
631 struct rps_sock_flow_table
{
635 #define RPS_SOCK_FLOW_TABLE_SIZE(_num) (sizeof(struct rps_sock_flow_table) + \
636 (_num * sizeof(u16)))
638 #define RPS_NO_CPU 0xffff
640 static inline void rps_record_sock_flow(struct rps_sock_flow_table
*table
,
644 unsigned int cpu
, index
= hash
& table
->mask
;
646 /* We only give a hint, preemption can change cpu under us */
647 cpu
= raw_smp_processor_id();
649 if (table
->ents
[index
] != cpu
)
650 table
->ents
[index
] = cpu
;
654 static inline void rps_reset_sock_flow(struct rps_sock_flow_table
*table
,
658 table
->ents
[hash
& table
->mask
] = RPS_NO_CPU
;
661 extern struct rps_sock_flow_table __rcu
*rps_sock_flow_table
;
663 #ifdef CONFIG_RFS_ACCEL
664 extern bool rps_may_expire_flow(struct net_device
*dev
, u16 rxq_index
,
665 u32 flow_id
, u16 filter_id
);
668 /* This structure contains an instance of an RX queue. */
669 struct netdev_rx_queue
{
670 struct rps_map __rcu
*rps_map
;
671 struct rps_dev_flow_table __rcu
*rps_flow_table
;
673 struct net_device
*dev
;
674 } ____cacheline_aligned_in_smp
;
675 #endif /* CONFIG_RPS */
679 * This structure holds an XPS map which can be of variable length. The
680 * map is an array of queues.
684 unsigned int alloc_len
;
688 #define XPS_MAP_SIZE(_num) (sizeof(struct xps_map) + (_num * sizeof(u16)))
689 #define XPS_MIN_MAP_ALLOC ((L1_CACHE_BYTES - sizeof(struct xps_map)) \
693 * This structure holds all XPS maps for device. Maps are indexed by CPU.
695 struct xps_dev_maps
{
697 struct xps_map __rcu
*cpu_map
[0];
699 #define XPS_DEV_MAPS_SIZE (sizeof(struct xps_dev_maps) + \
700 (nr_cpu_ids * sizeof(struct xps_map *)))
701 #endif /* CONFIG_XPS */
703 #define TC_MAX_QUEUE 16
704 #define TC_BITMASK 15
705 /* HW offloaded queuing disciplines txq count and offset maps */
706 struct netdev_tc_txq
{
712 * This structure defines the management hooks for network devices.
713 * The following hooks can be defined; unless noted otherwise, they are
714 * optional and can be filled with a null pointer.
716 * int (*ndo_init)(struct net_device *dev);
717 * This function is called once when network device is registered.
718 * The network device can use this to any late stage initializaton
719 * or semantic validattion. It can fail with an error code which will
720 * be propogated back to register_netdev
722 * void (*ndo_uninit)(struct net_device *dev);
723 * This function is called when device is unregistered or when registration
724 * fails. It is not called if init fails.
726 * int (*ndo_open)(struct net_device *dev);
727 * This function is called when network device transistions to the up
730 * int (*ndo_stop)(struct net_device *dev);
731 * This function is called when network device transistions to the down
734 * netdev_tx_t (*ndo_start_xmit)(struct sk_buff *skb,
735 * struct net_device *dev);
736 * Called when a packet needs to be transmitted.
737 * Must return NETDEV_TX_OK , NETDEV_TX_BUSY.
738 * (can also return NETDEV_TX_LOCKED iff NETIF_F_LLTX)
739 * Required can not be NULL.
741 * u16 (*ndo_select_queue)(struct net_device *dev, struct sk_buff *skb);
742 * Called to decide which queue to when device supports multiple
745 * void (*ndo_change_rx_flags)(struct net_device *dev, int flags);
746 * This function is called to allow device receiver to make
747 * changes to configuration when multicast or promiscious is enabled.
749 * void (*ndo_set_rx_mode)(struct net_device *dev);
750 * This function is called device changes address list filtering.
751 * If driver handles unicast address filtering, it should set
752 * IFF_UNICAST_FLT to its priv_flags.
754 * int (*ndo_set_mac_address)(struct net_device *dev, void *addr);
755 * This function is called when the Media Access Control address
756 * needs to be changed. If this interface is not defined, the
757 * mac address can not be changed.
759 * int (*ndo_validate_addr)(struct net_device *dev);
760 * Test if Media Access Control address is valid for the device.
762 * int (*ndo_do_ioctl)(struct net_device *dev, struct ifreq *ifr, int cmd);
763 * Called when a user request an ioctl which can't be handled by
764 * the generic interface code. If not defined ioctl's return
765 * not supported error code.
767 * int (*ndo_set_config)(struct net_device *dev, struct ifmap *map);
768 * Used to set network devices bus interface parameters. This interface
769 * is retained for legacy reason, new devices should use the bus
770 * interface (PCI) for low level management.
772 * int (*ndo_change_mtu)(struct net_device *dev, int new_mtu);
773 * Called when a user wants to change the Maximum Transfer Unit
774 * of a device. If not defined, any request to change MTU will
775 * will return an error.
777 * void (*ndo_tx_timeout)(struct net_device *dev);
778 * Callback uses when the transmitter has not made any progress
779 * for dev->watchdog ticks.
781 * struct rtnl_link_stats64* (*ndo_get_stats64)(struct net_device *dev,
782 * struct rtnl_link_stats64 *storage);
783 * struct net_device_stats* (*ndo_get_stats)(struct net_device *dev);
784 * Called when a user wants to get the network device usage
785 * statistics. Drivers must do one of the following:
786 * 1. Define @ndo_get_stats64 to fill in a zero-initialised
787 * rtnl_link_stats64 structure passed by the caller.
788 * 2. Define @ndo_get_stats to update a net_device_stats structure
789 * (which should normally be dev->stats) and return a pointer to
790 * it. The structure may be changed asynchronously only if each
791 * field is written atomically.
792 * 3. Update dev->stats asynchronously and atomically, and define
795 * void (*ndo_vlan_rx_add_vid)(struct net_device *dev, unsigned short vid);
796 * If device support VLAN filtering (dev->features & NETIF_F_HW_VLAN_FILTER)
797 * this function is called when a VLAN id is registered.
799 * void (*ndo_vlan_rx_kill_vid)(struct net_device *dev, unsigned short vid);
800 * If device support VLAN filtering (dev->features & NETIF_F_HW_VLAN_FILTER)
801 * this function is called when a VLAN id is unregistered.
803 * void (*ndo_poll_controller)(struct net_device *dev);
805 * SR-IOV management functions.
806 * int (*ndo_set_vf_mac)(struct net_device *dev, int vf, u8* mac);
807 * int (*ndo_set_vf_vlan)(struct net_device *dev, int vf, u16 vlan, u8 qos);
808 * int (*ndo_set_vf_tx_rate)(struct net_device *dev, int vf, int rate);
809 * int (*ndo_set_vf_spoofchk)(struct net_device *dev, int vf, bool setting);
810 * int (*ndo_get_vf_config)(struct net_device *dev,
811 * int vf, struct ifla_vf_info *ivf);
812 * int (*ndo_set_vf_port)(struct net_device *dev, int vf,
813 * struct nlattr *port[]);
814 * int (*ndo_get_vf_port)(struct net_device *dev, int vf, struct sk_buff *skb);
815 * int (*ndo_setup_tc)(struct net_device *dev, u8 tc)
816 * Called to setup 'tc' number of traffic classes in the net device. This
817 * is always called from the stack with the rtnl lock held and netif tx
818 * queues stopped. This allows the netdevice to perform queue management
821 * Fiber Channel over Ethernet (FCoE) offload functions.
822 * int (*ndo_fcoe_enable)(struct net_device *dev);
823 * Called when the FCoE protocol stack wants to start using LLD for FCoE
824 * so the underlying device can perform whatever needed configuration or
825 * initialization to support acceleration of FCoE traffic.
827 * int (*ndo_fcoe_disable)(struct net_device *dev);
828 * Called when the FCoE protocol stack wants to stop using LLD for FCoE
829 * so the underlying device can perform whatever needed clean-ups to
830 * stop supporting acceleration of FCoE traffic.
832 * int (*ndo_fcoe_ddp_setup)(struct net_device *dev, u16 xid,
833 * struct scatterlist *sgl, unsigned int sgc);
834 * Called when the FCoE Initiator wants to initialize an I/O that
835 * is a possible candidate for Direct Data Placement (DDP). The LLD can
836 * perform necessary setup and returns 1 to indicate the device is set up
837 * successfully to perform DDP on this I/O, otherwise this returns 0.
839 * int (*ndo_fcoe_ddp_done)(struct net_device *dev, u16 xid);
840 * Called when the FCoE Initiator/Target is done with the DDPed I/O as
841 * indicated by the FC exchange id 'xid', so the underlying device can
842 * clean up and reuse resources for later DDP requests.
844 * int (*ndo_fcoe_ddp_target)(struct net_device *dev, u16 xid,
845 * struct scatterlist *sgl, unsigned int sgc);
846 * Called when the FCoE Target wants to initialize an I/O that
847 * is a possible candidate for Direct Data Placement (DDP). The LLD can
848 * perform necessary setup and returns 1 to indicate the device is set up
849 * successfully to perform DDP on this I/O, otherwise this returns 0.
851 * int (*ndo_fcoe_get_wwn)(struct net_device *dev, u64 *wwn, int type);
852 * Called when the underlying device wants to override default World Wide
853 * Name (WWN) generation mechanism in FCoE protocol stack to pass its own
854 * World Wide Port Name (WWPN) or World Wide Node Name (WWNN) to the FCoE
855 * protocol stack to use.
858 * int (*ndo_rx_flow_steer)(struct net_device *dev, const struct sk_buff *skb,
859 * u16 rxq_index, u32 flow_id);
860 * Set hardware filter for RFS. rxq_index is the target queue index;
861 * flow_id is a flow ID to be passed to rps_may_expire_flow() later.
862 * Return the filter ID on success, or a negative error code.
864 * Slave management functions (for bridge, bonding, etc). User should
865 * call netdev_set_master() to set dev->master properly.
866 * int (*ndo_add_slave)(struct net_device *dev, struct net_device *slave_dev);
867 * Called to make another netdev an underling.
869 * int (*ndo_del_slave)(struct net_device *dev, struct net_device *slave_dev);
870 * Called to release previously enslaved netdev.
872 * Feature/offload setting functions.
873 * netdev_features_t (*ndo_fix_features)(struct net_device *dev,
874 * netdev_features_t features);
875 * Adjusts the requested feature flags according to device-specific
876 * constraints, and returns the resulting flags. Must not modify
879 * int (*ndo_set_features)(struct net_device *dev, netdev_features_t features);
880 * Called to update device configuration to new features. Passed
881 * feature set might be less than what was returned by ndo_fix_features()).
882 * Must return >0 or -errno if it changed dev->features itself.
885 struct net_device_ops
{
886 int (*ndo_init
)(struct net_device
*dev
);
887 void (*ndo_uninit
)(struct net_device
*dev
);
888 int (*ndo_open
)(struct net_device
*dev
);
889 int (*ndo_stop
)(struct net_device
*dev
);
890 netdev_tx_t (*ndo_start_xmit
) (struct sk_buff
*skb
,
891 struct net_device
*dev
);
892 u16 (*ndo_select_queue
)(struct net_device
*dev
,
893 struct sk_buff
*skb
);
894 void (*ndo_change_rx_flags
)(struct net_device
*dev
,
896 void (*ndo_set_rx_mode
)(struct net_device
*dev
);
897 int (*ndo_set_mac_address
)(struct net_device
*dev
,
899 int (*ndo_validate_addr
)(struct net_device
*dev
);
900 int (*ndo_do_ioctl
)(struct net_device
*dev
,
901 struct ifreq
*ifr
, int cmd
);
902 int (*ndo_set_config
)(struct net_device
*dev
,
904 int (*ndo_change_mtu
)(struct net_device
*dev
,
906 int (*ndo_neigh_setup
)(struct net_device
*dev
,
907 struct neigh_parms
*);
908 void (*ndo_tx_timeout
) (struct net_device
*dev
);
910 struct rtnl_link_stats64
* (*ndo_get_stats64
)(struct net_device
*dev
,
911 struct rtnl_link_stats64
*storage
);
912 struct net_device_stats
* (*ndo_get_stats
)(struct net_device
*dev
);
914 void (*ndo_vlan_rx_add_vid
)(struct net_device
*dev
,
916 void (*ndo_vlan_rx_kill_vid
)(struct net_device
*dev
,
918 #ifdef CONFIG_NET_POLL_CONTROLLER
919 void (*ndo_poll_controller
)(struct net_device
*dev
);
920 int (*ndo_netpoll_setup
)(struct net_device
*dev
,
921 struct netpoll_info
*info
);
922 void (*ndo_netpoll_cleanup
)(struct net_device
*dev
);
924 int (*ndo_set_vf_mac
)(struct net_device
*dev
,
926 int (*ndo_set_vf_vlan
)(struct net_device
*dev
,
927 int queue
, u16 vlan
, u8 qos
);
928 int (*ndo_set_vf_tx_rate
)(struct net_device
*dev
,
930 int (*ndo_set_vf_spoofchk
)(struct net_device
*dev
,
931 int vf
, bool setting
);
932 int (*ndo_get_vf_config
)(struct net_device
*dev
,
934 struct ifla_vf_info
*ivf
);
935 int (*ndo_set_vf_port
)(struct net_device
*dev
,
937 struct nlattr
*port
[]);
938 int (*ndo_get_vf_port
)(struct net_device
*dev
,
939 int vf
, struct sk_buff
*skb
);
940 int (*ndo_setup_tc
)(struct net_device
*dev
, u8 tc
);
941 #if IS_ENABLED(CONFIG_FCOE)
942 int (*ndo_fcoe_enable
)(struct net_device
*dev
);
943 int (*ndo_fcoe_disable
)(struct net_device
*dev
);
944 int (*ndo_fcoe_ddp_setup
)(struct net_device
*dev
,
946 struct scatterlist
*sgl
,
948 int (*ndo_fcoe_ddp_done
)(struct net_device
*dev
,
950 int (*ndo_fcoe_ddp_target
)(struct net_device
*dev
,
952 struct scatterlist
*sgl
,
956 #if IS_ENABLED(CONFIG_LIBFCOE)
957 #define NETDEV_FCOE_WWNN 0
958 #define NETDEV_FCOE_WWPN 1
959 int (*ndo_fcoe_get_wwn
)(struct net_device
*dev
,
963 #ifdef CONFIG_RFS_ACCEL
964 int (*ndo_rx_flow_steer
)(struct net_device
*dev
,
965 const struct sk_buff
*skb
,
969 int (*ndo_add_slave
)(struct net_device
*dev
,
970 struct net_device
*slave_dev
);
971 int (*ndo_del_slave
)(struct net_device
*dev
,
972 struct net_device
*slave_dev
);
973 netdev_features_t (*ndo_fix_features
)(struct net_device
*dev
,
974 netdev_features_t features
);
975 int (*ndo_set_features
)(struct net_device
*dev
,
976 netdev_features_t features
);
977 int (*ndo_neigh_construct
)(struct neighbour
*n
);
978 void (*ndo_neigh_destroy
)(struct neighbour
*n
);
982 * The DEVICE structure.
983 * Actually, this whole structure is a big mistake. It mixes I/O
984 * data with strictly "high-level" data, and it has to know about
985 * almost every data structure used in the INET module.
987 * FIXME: cleanup struct net_device such that network protocol info
994 * This is the first field of the "visible" part of this structure
995 * (i.e. as seen by users in the "Space.c" file). It is the name
1000 struct pm_qos_request pm_qos_req
;
1002 /* device name hash chain */
1003 struct hlist_node name_hlist
;
1008 * I/O specific fields
1009 * FIXME: Merge these and struct ifmap into one
1011 unsigned long mem_end
; /* shared mem end */
1012 unsigned long mem_start
; /* shared mem start */
1013 unsigned long base_addr
; /* device I/O address */
1014 unsigned int irq
; /* device IRQ number */
1017 * Some hardware also needs these fields, but they are not
1018 * part of the usual set specified in Space.c.
1021 unsigned long state
;
1023 struct list_head dev_list
;
1024 struct list_head napi_list
;
1025 struct list_head unreg_list
;
1027 /* currently active device features */
1028 netdev_features_t features
;
1029 /* user-changeable features */
1030 netdev_features_t hw_features
;
1031 /* user-requested features */
1032 netdev_features_t wanted_features
;
1033 /* mask of features inheritable by VLAN devices */
1034 netdev_features_t vlan_features
;
1036 /* Interface index. Unique device identifier */
1040 struct net_device_stats stats
;
1041 atomic_long_t rx_dropped
; /* dropped packets by core network
1042 * Do not use this in drivers.
1045 #ifdef CONFIG_WIRELESS_EXT
1046 /* List of functions to handle Wireless Extensions (instead of ioctl).
1047 * See <net/iw_handler.h> for details. Jean II */
1048 const struct iw_handler_def
* wireless_handlers
;
1049 /* Instance data managed by the core of Wireless Extensions. */
1050 struct iw_public_data
* wireless_data
;
1052 /* Management operations */
1053 const struct net_device_ops
*netdev_ops
;
1054 const struct ethtool_ops
*ethtool_ops
;
1056 /* Hardware header description */
1057 const struct header_ops
*header_ops
;
1059 unsigned int flags
; /* interface flags (a la BSD) */
1060 unsigned int priv_flags
; /* Like 'flags' but invisible to userspace. */
1061 unsigned short gflags
;
1062 unsigned short padded
; /* How much padding added by alloc_netdev() */
1064 unsigned char operstate
; /* RFC2863 operstate */
1065 unsigned char link_mode
; /* mapping policy to operstate */
1067 unsigned char if_port
; /* Selectable AUI, TP,..*/
1068 unsigned char dma
; /* DMA channel */
1070 unsigned int mtu
; /* interface MTU value */
1071 unsigned short type
; /* interface hardware type */
1072 unsigned short hard_header_len
; /* hardware hdr length */
1074 /* extra head- and tailroom the hardware may need, but not in all cases
1075 * can this be guaranteed, especially tailroom. Some cases also use
1076 * LL_MAX_HEADER instead to allocate the skb.
1078 unsigned short needed_headroom
;
1079 unsigned short needed_tailroom
;
1081 /* Interface address info. */
1082 unsigned char perm_addr
[MAX_ADDR_LEN
]; /* permanent hw address */
1083 unsigned char addr_assign_type
; /* hw address assignment type */
1084 unsigned char addr_len
; /* hardware address length */
1085 unsigned char neigh_priv_len
;
1086 unsigned short dev_id
; /* for shared network cards */
1088 spinlock_t addr_list_lock
;
1089 struct netdev_hw_addr_list uc
; /* Unicast mac addresses */
1090 struct netdev_hw_addr_list mc
; /* Multicast mac addresses */
1092 unsigned int promiscuity
;
1093 unsigned int allmulti
;
1096 /* Protocol specific pointers */
1098 #if IS_ENABLED(CONFIG_VLAN_8021Q)
1099 struct vlan_group __rcu
*vlgrp
; /* VLAN group */
1101 #if IS_ENABLED(CONFIG_NET_DSA)
1102 struct dsa_switch_tree
*dsa_ptr
; /* dsa specific data */
1104 void *atalk_ptr
; /* AppleTalk link */
1105 struct in_device __rcu
*ip_ptr
; /* IPv4 specific data */
1106 struct dn_dev __rcu
*dn_ptr
; /* DECnet specific data */
1107 struct inet6_dev __rcu
*ip6_ptr
; /* IPv6 specific data */
1108 void *ec_ptr
; /* Econet specific data */
1109 void *ax25_ptr
; /* AX.25 specific data */
1110 struct wireless_dev
*ieee80211_ptr
; /* IEEE 802.11 specific data,
1111 assign before registering */
1114 * Cache lines mostly used on receive path (including eth_type_trans())
1116 unsigned long last_rx
; /* Time of last Rx
1117 * This should not be set in
1118 * drivers, unless really needed,
1119 * because network stack (bonding)
1120 * use it if/when necessary, to
1121 * avoid dirtying this cache line.
1124 struct net_device
*master
; /* Pointer to master device of a group,
1125 * which this device is member of.
1128 /* Interface address info used in eth_type_trans() */
1129 unsigned char *dev_addr
; /* hw address, (before bcast
1130 because most packets are
1133 struct netdev_hw_addr_list dev_addrs
; /* list of device
1136 unsigned char broadcast
[MAX_ADDR_LEN
]; /* hw bcast add */
1139 struct kset
*queues_kset
;
1143 struct netdev_rx_queue
*_rx
;
1145 /* Number of RX queues allocated at register_netdev() time */
1146 unsigned int num_rx_queues
;
1148 /* Number of RX queues currently active in device */
1149 unsigned int real_num_rx_queues
;
1151 #ifdef CONFIG_RFS_ACCEL
1152 /* CPU reverse-mapping for RX completion interrupts, indexed
1153 * by RX queue number. Assigned by driver. This must only be
1154 * set if the ndo_rx_flow_steer operation is defined. */
1155 struct cpu_rmap
*rx_cpu_rmap
;
1159 rx_handler_func_t __rcu
*rx_handler
;
1160 void __rcu
*rx_handler_data
;
1162 struct netdev_queue __rcu
*ingress_queue
;
1165 * Cache lines mostly used on transmit path
1167 struct netdev_queue
*_tx ____cacheline_aligned_in_smp
;
1169 /* Number of TX queues allocated at alloc_netdev_mq() time */
1170 unsigned int num_tx_queues
;
1172 /* Number of TX queues currently active in device */
1173 unsigned int real_num_tx_queues
;
1175 /* root qdisc from userspace point of view */
1176 struct Qdisc
*qdisc
;
1178 unsigned long tx_queue_len
; /* Max frames per queue allowed */
1179 spinlock_t tx_global_lock
;
1182 struct xps_dev_maps __rcu
*xps_maps
;
1185 /* These may be needed for future network-power-down code. */
1188 * trans_start here is expensive for high speed devices on SMP,
1189 * please use netdev_queue->trans_start instead.
1191 unsigned long trans_start
; /* Time (in jiffies) of last Tx */
1193 int watchdog_timeo
; /* used by dev_watchdog() */
1194 struct timer_list watchdog_timer
;
1196 /* Number of references to this device */
1197 int __percpu
*pcpu_refcnt
;
1199 /* delayed register/unregister */
1200 struct list_head todo_list
;
1201 /* device index hash chain */
1202 struct hlist_node index_hlist
;
1204 struct list_head link_watch_list
;
1206 /* register/unregister state machine */
1207 enum { NETREG_UNINITIALIZED
=0,
1208 NETREG_REGISTERED
, /* completed register_netdevice */
1209 NETREG_UNREGISTERING
, /* called unregister_netdevice */
1210 NETREG_UNREGISTERED
, /* completed unregister todo */
1211 NETREG_RELEASED
, /* called free_netdev */
1212 NETREG_DUMMY
, /* dummy device for NAPI poll */
1215 bool dismantle
; /* device is going do be freed */
1218 RTNL_LINK_INITIALIZED
,
1219 RTNL_LINK_INITIALIZING
,
1220 } rtnl_link_state
:16;
1222 /* Called from unregister, can be used to call free_netdev */
1223 void (*destructor
)(struct net_device
*dev
);
1225 #ifdef CONFIG_NETPOLL
1226 struct netpoll_info
*npinfo
;
1229 #ifdef CONFIG_NET_NS
1230 /* Network namespace this network device is inside */
1234 /* mid-layer private */
1237 struct pcpu_lstats __percpu
*lstats
; /* loopback stats */
1238 struct pcpu_tstats __percpu
*tstats
; /* tunnel stats */
1239 struct pcpu_dstats __percpu
*dstats
; /* dummy stats */
1242 struct garp_port __rcu
*garp_port
;
1244 /* class/net/name entry */
1246 /* space for optional device, statistics, and wireless sysfs groups */
1247 const struct attribute_group
*sysfs_groups
[4];
1249 /* rtnetlink link ops */
1250 const struct rtnl_link_ops
*rtnl_link_ops
;
1252 /* for setting kernel sock attribute on TCP connection setup */
1253 #define GSO_MAX_SIZE 65536
1254 unsigned int gso_max_size
;
1257 /* Data Center Bridging netlink ops */
1258 const struct dcbnl_rtnl_ops
*dcbnl_ops
;
1261 struct netdev_tc_txq tc_to_txq
[TC_MAX_QUEUE
];
1262 u8 prio_tc_map
[TC_BITMASK
+ 1];
1264 #if IS_ENABLED(CONFIG_FCOE)
1265 /* max exchange id for FCoE LRO by ddp */
1266 unsigned int fcoe_ddp_xid
;
1268 #if IS_ENABLED(CONFIG_NETPRIO_CGROUP)
1269 struct netprio_map __rcu
*priomap
;
1271 /* phy device may attach itself for hardware timestamping */
1272 struct phy_device
*phydev
;
1274 /* group the device belongs to */
1277 #define to_net_dev(d) container_of(d, struct net_device, dev)
1279 #define NETDEV_ALIGN 32
1282 int netdev_get_prio_tc_map(const struct net_device
*dev
, u32 prio
)
1284 return dev
->prio_tc_map
[prio
& TC_BITMASK
];
1288 int netdev_set_prio_tc_map(struct net_device
*dev
, u8 prio
, u8 tc
)
1290 if (tc
>= dev
->num_tc
)
1293 dev
->prio_tc_map
[prio
& TC_BITMASK
] = tc
& TC_BITMASK
;
1298 void netdev_reset_tc(struct net_device
*dev
)
1301 memset(dev
->tc_to_txq
, 0, sizeof(dev
->tc_to_txq
));
1302 memset(dev
->prio_tc_map
, 0, sizeof(dev
->prio_tc_map
));
1306 int netdev_set_tc_queue(struct net_device
*dev
, u8 tc
, u16 count
, u16 offset
)
1308 if (tc
>= dev
->num_tc
)
1311 dev
->tc_to_txq
[tc
].count
= count
;
1312 dev
->tc_to_txq
[tc
].offset
= offset
;
1317 int netdev_set_num_tc(struct net_device
*dev
, u8 num_tc
)
1319 if (num_tc
> TC_MAX_QUEUE
)
1322 dev
->num_tc
= num_tc
;
1327 int netdev_get_num_tc(struct net_device
*dev
)
1333 struct netdev_queue
*netdev_get_tx_queue(const struct net_device
*dev
,
1336 return &dev
->_tx
[index
];
1339 static inline void netdev_for_each_tx_queue(struct net_device
*dev
,
1340 void (*f
)(struct net_device
*,
1341 struct netdev_queue
*,
1347 for (i
= 0; i
< dev
->num_tx_queues
; i
++)
1348 f(dev
, &dev
->_tx
[i
], arg
);
1352 * Net namespace inlines
1355 struct net
*dev_net(const struct net_device
*dev
)
1357 return read_pnet(&dev
->nd_net
);
1361 void dev_net_set(struct net_device
*dev
, struct net
*net
)
1363 #ifdef CONFIG_NET_NS
1364 release_net(dev
->nd_net
);
1365 dev
->nd_net
= hold_net(net
);
1369 static inline bool netdev_uses_dsa_tags(struct net_device
*dev
)
1371 #ifdef CONFIG_NET_DSA_TAG_DSA
1372 if (dev
->dsa_ptr
!= NULL
)
1373 return dsa_uses_dsa_tags(dev
->dsa_ptr
);
1379 #ifndef CONFIG_NET_NS
1380 static inline void skb_set_dev(struct sk_buff
*skb
, struct net_device
*dev
)
1384 #else /* CONFIG_NET_NS */
1385 void skb_set_dev(struct sk_buff
*skb
, struct net_device
*dev
);
1388 static inline bool netdev_uses_trailer_tags(struct net_device
*dev
)
1390 #ifdef CONFIG_NET_DSA_TAG_TRAILER
1391 if (dev
->dsa_ptr
!= NULL
)
1392 return dsa_uses_trailer_tags(dev
->dsa_ptr
);
1399 * netdev_priv - access network device private data
1400 * @dev: network device
1402 * Get network device private data
1404 static inline void *netdev_priv(const struct net_device
*dev
)
1406 return (char *)dev
+ ALIGN(sizeof(struct net_device
), NETDEV_ALIGN
);
1409 /* Set the sysfs physical device reference for the network logical device
1410 * if set prior to registration will cause a symlink during initialization.
1412 #define SET_NETDEV_DEV(net, pdev) ((net)->dev.parent = (pdev))
1414 /* Set the sysfs device type for the network logical device to allow
1415 * fin grained indentification of different network device types. For
1416 * example Ethernet, Wirelss LAN, Bluetooth, WiMAX etc.
1418 #define SET_NETDEV_DEVTYPE(net, devtype) ((net)->dev.type = (devtype))
1421 * netif_napi_add - initialize a napi context
1422 * @dev: network device
1423 * @napi: napi context
1424 * @poll: polling function
1425 * @weight: default weight
1427 * netif_napi_add() must be used to initialize a napi context prior to calling
1428 * *any* of the other napi related functions.
1430 void netif_napi_add(struct net_device
*dev
, struct napi_struct
*napi
,
1431 int (*poll
)(struct napi_struct
*, int), int weight
);
1434 * netif_napi_del - remove a napi context
1435 * @napi: napi context
1437 * netif_napi_del() removes a napi context from the network device napi list
1439 void netif_napi_del(struct napi_struct
*napi
);
1441 struct napi_gro_cb
{
1442 /* Virtual address of skb_shinfo(skb)->frags[0].page + offset. */
1445 /* Length of frag0. */
1446 unsigned int frag0_len
;
1448 /* This indicates where we are processing relative to skb->data. */
1451 /* This is non-zero if the packet may be of the same flow. */
1454 /* This is non-zero if the packet cannot be merged with the new skb. */
1457 /* Number of segments aggregated. */
1464 #define NAPI_GRO_CB(skb) ((struct napi_gro_cb *)(skb)->cb)
1466 struct packet_type
{
1467 __be16 type
; /* This is really htons(ether_type). */
1468 struct net_device
*dev
; /* NULL is wildcarded here */
1469 int (*func
) (struct sk_buff
*,
1470 struct net_device
*,
1471 struct packet_type
*,
1472 struct net_device
*);
1473 struct sk_buff
*(*gso_segment
)(struct sk_buff
*skb
,
1474 netdev_features_t features
);
1475 int (*gso_send_check
)(struct sk_buff
*skb
);
1476 struct sk_buff
**(*gro_receive
)(struct sk_buff
**head
,
1477 struct sk_buff
*skb
);
1478 int (*gro_complete
)(struct sk_buff
*skb
);
1479 void *af_packet_priv
;
1480 struct list_head list
;
1483 #include <linux/notifier.h>
1485 /* netdevice notifier chain. Please remember to update the rtnetlink
1486 * notification exclusion list in rtnetlink_event() when adding new
1489 #define NETDEV_UP 0x0001 /* For now you can't veto a device up/down */
1490 #define NETDEV_DOWN 0x0002
1491 #define NETDEV_REBOOT 0x0003 /* Tell a protocol stack a network interface
1492 detected a hardware crash and restarted
1493 - we can use this eg to kick tcp sessions
1495 #define NETDEV_CHANGE 0x0004 /* Notify device state change */
1496 #define NETDEV_REGISTER 0x0005
1497 #define NETDEV_UNREGISTER 0x0006
1498 #define NETDEV_CHANGEMTU 0x0007
1499 #define NETDEV_CHANGEADDR 0x0008
1500 #define NETDEV_GOING_DOWN 0x0009
1501 #define NETDEV_CHANGENAME 0x000A
1502 #define NETDEV_FEAT_CHANGE 0x000B
1503 #define NETDEV_BONDING_FAILOVER 0x000C
1504 #define NETDEV_PRE_UP 0x000D
1505 #define NETDEV_PRE_TYPE_CHANGE 0x000E
1506 #define NETDEV_POST_TYPE_CHANGE 0x000F
1507 #define NETDEV_POST_INIT 0x0010
1508 #define NETDEV_UNREGISTER_BATCH 0x0011
1509 #define NETDEV_RELEASE 0x0012
1510 #define NETDEV_NOTIFY_PEERS 0x0013
1511 #define NETDEV_JOIN 0x0014
1513 extern int register_netdevice_notifier(struct notifier_block
*nb
);
1514 extern int unregister_netdevice_notifier(struct notifier_block
*nb
);
1515 extern int call_netdevice_notifiers(unsigned long val
, struct net_device
*dev
);
1518 extern rwlock_t dev_base_lock
; /* Device list lock */
1521 #define for_each_netdev(net, d) \
1522 list_for_each_entry(d, &(net)->dev_base_head, dev_list)
1523 #define for_each_netdev_reverse(net, d) \
1524 list_for_each_entry_reverse(d, &(net)->dev_base_head, dev_list)
1525 #define for_each_netdev_rcu(net, d) \
1526 list_for_each_entry_rcu(d, &(net)->dev_base_head, dev_list)
1527 #define for_each_netdev_safe(net, d, n) \
1528 list_for_each_entry_safe(d, n, &(net)->dev_base_head, dev_list)
1529 #define for_each_netdev_continue(net, d) \
1530 list_for_each_entry_continue(d, &(net)->dev_base_head, dev_list)
1531 #define for_each_netdev_continue_rcu(net, d) \
1532 list_for_each_entry_continue_rcu(d, &(net)->dev_base_head, dev_list)
1533 #define net_device_entry(lh) list_entry(lh, struct net_device, dev_list)
1535 static inline struct net_device
*next_net_device(struct net_device
*dev
)
1537 struct list_head
*lh
;
1541 lh
= dev
->dev_list
.next
;
1542 return lh
== &net
->dev_base_head
? NULL
: net_device_entry(lh
);
1545 static inline struct net_device
*next_net_device_rcu(struct net_device
*dev
)
1547 struct list_head
*lh
;
1551 lh
= rcu_dereference(list_next_rcu(&dev
->dev_list
));
1552 return lh
== &net
->dev_base_head
? NULL
: net_device_entry(lh
);
1555 static inline struct net_device
*first_net_device(struct net
*net
)
1557 return list_empty(&net
->dev_base_head
) ? NULL
:
1558 net_device_entry(net
->dev_base_head
.next
);
1561 static inline struct net_device
*first_net_device_rcu(struct net
*net
)
1563 struct list_head
*lh
= rcu_dereference(list_next_rcu(&net
->dev_base_head
));
1565 return lh
== &net
->dev_base_head
? NULL
: net_device_entry(lh
);
1568 extern int netdev_boot_setup_check(struct net_device
*dev
);
1569 extern unsigned long netdev_boot_base(const char *prefix
, int unit
);
1570 extern struct net_device
*dev_getbyhwaddr_rcu(struct net
*net
, unsigned short type
,
1571 const char *hwaddr
);
1572 extern struct net_device
*dev_getfirstbyhwtype(struct net
*net
, unsigned short type
);
1573 extern struct net_device
*__dev_getfirstbyhwtype(struct net
*net
, unsigned short type
);
1574 extern void dev_add_pack(struct packet_type
*pt
);
1575 extern void dev_remove_pack(struct packet_type
*pt
);
1576 extern void __dev_remove_pack(struct packet_type
*pt
);
1578 extern struct net_device
*dev_get_by_flags_rcu(struct net
*net
, unsigned short flags
,
1579 unsigned short mask
);
1580 extern struct net_device
*dev_get_by_name(struct net
*net
, const char *name
);
1581 extern struct net_device
*dev_get_by_name_rcu(struct net
*net
, const char *name
);
1582 extern struct net_device
*__dev_get_by_name(struct net
*net
, const char *name
);
1583 extern int dev_alloc_name(struct net_device
*dev
, const char *name
);
1584 extern int dev_open(struct net_device
*dev
);
1585 extern int dev_close(struct net_device
*dev
);
1586 extern void dev_disable_lro(struct net_device
*dev
);
1587 extern int dev_queue_xmit(struct sk_buff
*skb
);
1588 extern int register_netdevice(struct net_device
*dev
);
1589 extern void unregister_netdevice_queue(struct net_device
*dev
,
1590 struct list_head
*head
);
1591 extern void unregister_netdevice_many(struct list_head
*head
);
1592 static inline void unregister_netdevice(struct net_device
*dev
)
1594 unregister_netdevice_queue(dev
, NULL
);
1597 extern int netdev_refcnt_read(const struct net_device
*dev
);
1598 extern void free_netdev(struct net_device
*dev
);
1599 extern void synchronize_net(void);
1600 extern int init_dummy_netdev(struct net_device
*dev
);
1601 extern void netdev_resync_ops(struct net_device
*dev
);
1603 extern struct net_device
*dev_get_by_index(struct net
*net
, int ifindex
);
1604 extern struct net_device
*__dev_get_by_index(struct net
*net
, int ifindex
);
1605 extern struct net_device
*dev_get_by_index_rcu(struct net
*net
, int ifindex
);
1606 extern int dev_restart(struct net_device
*dev
);
1607 #ifdef CONFIG_NETPOLL_TRAP
1608 extern int netpoll_trap(void);
1610 extern int skb_gro_receive(struct sk_buff
**head
,
1611 struct sk_buff
*skb
);
1612 extern void skb_gro_reset_offset(struct sk_buff
*skb
);
1614 static inline unsigned int skb_gro_offset(const struct sk_buff
*skb
)
1616 return NAPI_GRO_CB(skb
)->data_offset
;
1619 static inline unsigned int skb_gro_len(const struct sk_buff
*skb
)
1621 return skb
->len
- NAPI_GRO_CB(skb
)->data_offset
;
1624 static inline void skb_gro_pull(struct sk_buff
*skb
, unsigned int len
)
1626 NAPI_GRO_CB(skb
)->data_offset
+= len
;
1629 static inline void *skb_gro_header_fast(struct sk_buff
*skb
,
1630 unsigned int offset
)
1632 return NAPI_GRO_CB(skb
)->frag0
+ offset
;
1635 static inline int skb_gro_header_hard(struct sk_buff
*skb
, unsigned int hlen
)
1637 return NAPI_GRO_CB(skb
)->frag0_len
< hlen
;
1640 static inline void *skb_gro_header_slow(struct sk_buff
*skb
, unsigned int hlen
,
1641 unsigned int offset
)
1643 if (!pskb_may_pull(skb
, hlen
))
1646 NAPI_GRO_CB(skb
)->frag0
= NULL
;
1647 NAPI_GRO_CB(skb
)->frag0_len
= 0;
1648 return skb
->data
+ offset
;
1651 static inline void *skb_gro_mac_header(struct sk_buff
*skb
)
1653 return NAPI_GRO_CB(skb
)->frag0
?: skb_mac_header(skb
);
1656 static inline void *skb_gro_network_header(struct sk_buff
*skb
)
1658 return (NAPI_GRO_CB(skb
)->frag0
?: skb
->data
) +
1659 skb_network_offset(skb
);
1662 static inline int dev_hard_header(struct sk_buff
*skb
, struct net_device
*dev
,
1663 unsigned short type
,
1664 const void *daddr
, const void *saddr
,
1667 if (!dev
->header_ops
|| !dev
->header_ops
->create
)
1670 return dev
->header_ops
->create(skb
, dev
, type
, daddr
, saddr
, len
);
1673 static inline int dev_parse_header(const struct sk_buff
*skb
,
1674 unsigned char *haddr
)
1676 const struct net_device
*dev
= skb
->dev
;
1678 if (!dev
->header_ops
|| !dev
->header_ops
->parse
)
1680 return dev
->header_ops
->parse(skb
, haddr
);
1683 typedef int gifconf_func_t(struct net_device
* dev
, char __user
* bufptr
, int len
);
1684 extern int register_gifconf(unsigned int family
, gifconf_func_t
* gifconf
);
1685 static inline int unregister_gifconf(unsigned int family
)
1687 return register_gifconf(family
, NULL
);
1691 * Incoming packets are placed on per-cpu queues
1693 struct softnet_data
{
1694 struct Qdisc
*output_queue
;
1695 struct Qdisc
**output_queue_tailp
;
1696 struct list_head poll_list
;
1697 struct sk_buff
*completion_queue
;
1698 struct sk_buff_head process_queue
;
1701 unsigned int processed
;
1702 unsigned int time_squeeze
;
1703 unsigned int cpu_collision
;
1704 unsigned int received_rps
;
1707 struct softnet_data
*rps_ipi_list
;
1709 /* Elements below can be accessed between CPUs for RPS */
1710 struct call_single_data csd ____cacheline_aligned_in_smp
;
1711 struct softnet_data
*rps_ipi_next
;
1713 unsigned int input_queue_head
;
1714 unsigned int input_queue_tail
;
1717 struct sk_buff_head input_pkt_queue
;
1718 struct napi_struct backlog
;
1721 static inline void input_queue_head_incr(struct softnet_data
*sd
)
1724 sd
->input_queue_head
++;
1728 static inline void input_queue_tail_incr_save(struct softnet_data
*sd
,
1729 unsigned int *qtail
)
1732 *qtail
= ++sd
->input_queue_tail
;
1736 DECLARE_PER_CPU_ALIGNED(struct softnet_data
, softnet_data
);
1738 extern void __netif_schedule(struct Qdisc
*q
);
1740 static inline void netif_schedule_queue(struct netdev_queue
*txq
)
1742 if (!(txq
->state
& QUEUE_STATE_ANY_XOFF
))
1743 __netif_schedule(txq
->qdisc
);
1746 static inline void netif_tx_schedule_all(struct net_device
*dev
)
1750 for (i
= 0; i
< dev
->num_tx_queues
; i
++)
1751 netif_schedule_queue(netdev_get_tx_queue(dev
, i
));
1754 static inline void netif_tx_start_queue(struct netdev_queue
*dev_queue
)
1756 clear_bit(__QUEUE_STATE_DRV_XOFF
, &dev_queue
->state
);
1760 * netif_start_queue - allow transmit
1761 * @dev: network device
1763 * Allow upper layers to call the device hard_start_xmit routine.
1765 static inline void netif_start_queue(struct net_device
*dev
)
1767 netif_tx_start_queue(netdev_get_tx_queue(dev
, 0));
1770 static inline void netif_tx_start_all_queues(struct net_device
*dev
)
1774 for (i
= 0; i
< dev
->num_tx_queues
; i
++) {
1775 struct netdev_queue
*txq
= netdev_get_tx_queue(dev
, i
);
1776 netif_tx_start_queue(txq
);
1780 static inline void netif_tx_wake_queue(struct netdev_queue
*dev_queue
)
1782 #ifdef CONFIG_NETPOLL_TRAP
1783 if (netpoll_trap()) {
1784 netif_tx_start_queue(dev_queue
);
1788 if (test_and_clear_bit(__QUEUE_STATE_DRV_XOFF
, &dev_queue
->state
))
1789 __netif_schedule(dev_queue
->qdisc
);
1793 * netif_wake_queue - restart transmit
1794 * @dev: network device
1796 * Allow upper layers to call the device hard_start_xmit routine.
1797 * Used for flow control when transmit resources are available.
1799 static inline void netif_wake_queue(struct net_device
*dev
)
1801 netif_tx_wake_queue(netdev_get_tx_queue(dev
, 0));
1804 static inline void netif_tx_wake_all_queues(struct net_device
*dev
)
1808 for (i
= 0; i
< dev
->num_tx_queues
; i
++) {
1809 struct netdev_queue
*txq
= netdev_get_tx_queue(dev
, i
);
1810 netif_tx_wake_queue(txq
);
1814 static inline void netif_tx_stop_queue(struct netdev_queue
*dev_queue
)
1816 if (WARN_ON(!dev_queue
)) {
1817 pr_info("netif_stop_queue() cannot be called before register_netdev()\n");
1820 set_bit(__QUEUE_STATE_DRV_XOFF
, &dev_queue
->state
);
1824 * netif_stop_queue - stop transmitted packets
1825 * @dev: network device
1827 * Stop upper layers calling the device hard_start_xmit routine.
1828 * Used for flow control when transmit resources are unavailable.
1830 static inline void netif_stop_queue(struct net_device
*dev
)
1832 netif_tx_stop_queue(netdev_get_tx_queue(dev
, 0));
1835 static inline void netif_tx_stop_all_queues(struct net_device
*dev
)
1839 for (i
= 0; i
< dev
->num_tx_queues
; i
++) {
1840 struct netdev_queue
*txq
= netdev_get_tx_queue(dev
, i
);
1841 netif_tx_stop_queue(txq
);
1845 static inline int netif_tx_queue_stopped(const struct netdev_queue
*dev_queue
)
1847 return test_bit(__QUEUE_STATE_DRV_XOFF
, &dev_queue
->state
);
1851 * netif_queue_stopped - test if transmit queue is flowblocked
1852 * @dev: network device
1854 * Test if transmit queue on device is currently unable to send.
1856 static inline int netif_queue_stopped(const struct net_device
*dev
)
1858 return netif_tx_queue_stopped(netdev_get_tx_queue(dev
, 0));
1861 static inline int netif_xmit_stopped(const struct netdev_queue
*dev_queue
)
1863 return dev_queue
->state
& QUEUE_STATE_ANY_XOFF
;
1866 static inline int netif_xmit_frozen_or_stopped(const struct netdev_queue
*dev_queue
)
1868 return dev_queue
->state
& QUEUE_STATE_ANY_XOFF_OR_FROZEN
;
1871 static inline void netdev_tx_sent_queue(struct netdev_queue
*dev_queue
,
1875 dql_queued(&dev_queue
->dql
, bytes
);
1876 if (unlikely(dql_avail(&dev_queue
->dql
) < 0)) {
1877 set_bit(__QUEUE_STATE_STACK_XOFF
, &dev_queue
->state
);
1878 if (unlikely(dql_avail(&dev_queue
->dql
) >= 0))
1879 clear_bit(__QUEUE_STATE_STACK_XOFF
,
1885 static inline void netdev_sent_queue(struct net_device
*dev
, unsigned int bytes
)
1887 netdev_tx_sent_queue(netdev_get_tx_queue(dev
, 0), bytes
);
1890 static inline void netdev_tx_completed_queue(struct netdev_queue
*dev_queue
,
1891 unsigned pkts
, unsigned bytes
)
1894 if (likely(bytes
)) {
1895 dql_completed(&dev_queue
->dql
, bytes
);
1896 if (unlikely(test_bit(__QUEUE_STATE_STACK_XOFF
,
1897 &dev_queue
->state
) &&
1898 dql_avail(&dev_queue
->dql
) >= 0)) {
1899 if (test_and_clear_bit(__QUEUE_STATE_STACK_XOFF
,
1901 netif_schedule_queue(dev_queue
);
1907 static inline void netdev_completed_queue(struct net_device
*dev
,
1908 unsigned pkts
, unsigned bytes
)
1910 netdev_tx_completed_queue(netdev_get_tx_queue(dev
, 0), pkts
, bytes
);
1913 static inline void netdev_tx_reset_queue(struct netdev_queue
*q
)
1920 static inline void netdev_reset_queue(struct net_device
*dev_queue
)
1922 netdev_tx_reset_queue(netdev_get_tx_queue(dev_queue
, 0));
1926 * netif_running - test if up
1927 * @dev: network device
1929 * Test if the device has been brought up.
1931 static inline int netif_running(const struct net_device
*dev
)
1933 return test_bit(__LINK_STATE_START
, &dev
->state
);
1937 * Routines to manage the subqueues on a device. We only need start
1938 * stop, and a check if it's stopped. All other device management is
1939 * done at the overall netdevice level.
1940 * Also test the device if we're multiqueue.
1944 * netif_start_subqueue - allow sending packets on subqueue
1945 * @dev: network device
1946 * @queue_index: sub queue index
1948 * Start individual transmit queue of a device with multiple transmit queues.
1950 static inline void netif_start_subqueue(struct net_device
*dev
, u16 queue_index
)
1952 struct netdev_queue
*txq
= netdev_get_tx_queue(dev
, queue_index
);
1954 netif_tx_start_queue(txq
);
1958 * netif_stop_subqueue - stop sending packets on subqueue
1959 * @dev: network device
1960 * @queue_index: sub queue index
1962 * Stop individual transmit queue of a device with multiple transmit queues.
1964 static inline void netif_stop_subqueue(struct net_device
*dev
, u16 queue_index
)
1966 struct netdev_queue
*txq
= netdev_get_tx_queue(dev
, queue_index
);
1967 #ifdef CONFIG_NETPOLL_TRAP
1971 netif_tx_stop_queue(txq
);
1975 * netif_subqueue_stopped - test status of subqueue
1976 * @dev: network device
1977 * @queue_index: sub queue index
1979 * Check individual transmit queue of a device with multiple transmit queues.
1981 static inline int __netif_subqueue_stopped(const struct net_device
*dev
,
1984 struct netdev_queue
*txq
= netdev_get_tx_queue(dev
, queue_index
);
1986 return netif_tx_queue_stopped(txq
);
1989 static inline int netif_subqueue_stopped(const struct net_device
*dev
,
1990 struct sk_buff
*skb
)
1992 return __netif_subqueue_stopped(dev
, skb_get_queue_mapping(skb
));
1996 * netif_wake_subqueue - allow sending packets on subqueue
1997 * @dev: network device
1998 * @queue_index: sub queue index
2000 * Resume individual transmit queue of a device with multiple transmit queues.
2002 static inline void netif_wake_subqueue(struct net_device
*dev
, u16 queue_index
)
2004 struct netdev_queue
*txq
= netdev_get_tx_queue(dev
, queue_index
);
2005 #ifdef CONFIG_NETPOLL_TRAP
2009 if (test_and_clear_bit(__QUEUE_STATE_DRV_XOFF
, &txq
->state
))
2010 __netif_schedule(txq
->qdisc
);
2014 * Returns a Tx hash for the given packet when dev->real_num_tx_queues is used
2015 * as a distribution range limit for the returned value.
2017 static inline u16
skb_tx_hash(const struct net_device
*dev
,
2018 const struct sk_buff
*skb
)
2020 return __skb_tx_hash(dev
, skb
, dev
->real_num_tx_queues
);
2024 * netif_is_multiqueue - test if device has multiple transmit queues
2025 * @dev: network device
2027 * Check if device has multiple transmit queues
2029 static inline int netif_is_multiqueue(const struct net_device
*dev
)
2031 return dev
->num_tx_queues
> 1;
2034 extern int netif_set_real_num_tx_queues(struct net_device
*dev
,
2038 extern int netif_set_real_num_rx_queues(struct net_device
*dev
,
2041 static inline int netif_set_real_num_rx_queues(struct net_device
*dev
,
2048 static inline int netif_copy_real_num_queues(struct net_device
*to_dev
,
2049 const struct net_device
*from_dev
)
2051 netif_set_real_num_tx_queues(to_dev
, from_dev
->real_num_tx_queues
);
2053 return netif_set_real_num_rx_queues(to_dev
,
2054 from_dev
->real_num_rx_queues
);
2060 /* Use this variant when it is known for sure that it
2061 * is executing from hardware interrupt context or with hardware interrupts
2064 extern void dev_kfree_skb_irq(struct sk_buff
*skb
);
2066 /* Use this variant in places where it could be invoked
2067 * from either hardware interrupt or other context, with hardware interrupts
2068 * either disabled or enabled.
2070 extern void dev_kfree_skb_any(struct sk_buff
*skb
);
2072 extern int netif_rx(struct sk_buff
*skb
);
2073 extern int netif_rx_ni(struct sk_buff
*skb
);
2074 extern int netif_receive_skb(struct sk_buff
*skb
);
2075 extern gro_result_t
dev_gro_receive(struct napi_struct
*napi
,
2076 struct sk_buff
*skb
);
2077 extern gro_result_t
napi_skb_finish(gro_result_t ret
, struct sk_buff
*skb
);
2078 extern gro_result_t
napi_gro_receive(struct napi_struct
*napi
,
2079 struct sk_buff
*skb
);
2080 extern void napi_gro_flush(struct napi_struct
*napi
);
2081 extern struct sk_buff
* napi_get_frags(struct napi_struct
*napi
);
2082 extern gro_result_t
napi_frags_finish(struct napi_struct
*napi
,
2083 struct sk_buff
*skb
,
2085 extern struct sk_buff
* napi_frags_skb(struct napi_struct
*napi
);
2086 extern gro_result_t
napi_gro_frags(struct napi_struct
*napi
);
2088 static inline void napi_free_frags(struct napi_struct
*napi
)
2090 kfree_skb(napi
->skb
);
2094 extern int netdev_rx_handler_register(struct net_device
*dev
,
2095 rx_handler_func_t
*rx_handler
,
2096 void *rx_handler_data
);
2097 extern void netdev_rx_handler_unregister(struct net_device
*dev
);
2099 extern int dev_valid_name(const char *name
);
2100 extern int dev_ioctl(struct net
*net
, unsigned int cmd
, void __user
*);
2101 extern int dev_ethtool(struct net
*net
, struct ifreq
*);
2102 extern unsigned dev_get_flags(const struct net_device
*);
2103 extern int __dev_change_flags(struct net_device
*, unsigned int flags
);
2104 extern int dev_change_flags(struct net_device
*, unsigned);
2105 extern void __dev_notify_flags(struct net_device
*, unsigned int old_flags
);
2106 extern int dev_change_name(struct net_device
*, const char *);
2107 extern int dev_set_alias(struct net_device
*, const char *, size_t);
2108 extern int dev_change_net_namespace(struct net_device
*,
2109 struct net
*, const char *);
2110 extern int dev_set_mtu(struct net_device
*, int);
2111 extern void dev_set_group(struct net_device
*, int);
2112 extern int dev_set_mac_address(struct net_device
*,
2114 extern int dev_hard_start_xmit(struct sk_buff
*skb
,
2115 struct net_device
*dev
,
2116 struct netdev_queue
*txq
);
2117 extern int dev_forward_skb(struct net_device
*dev
,
2118 struct sk_buff
*skb
);
2120 extern int netdev_budget
;
2122 /* Called by rtnetlink.c:rtnl_unlock() */
2123 extern void netdev_run_todo(void);
2126 * dev_put - release reference to device
2127 * @dev: network device
2129 * Release reference to device to allow it to be freed.
2131 static inline void dev_put(struct net_device
*dev
)
2133 irqsafe_cpu_dec(*dev
->pcpu_refcnt
);
2137 * dev_hold - get reference to device
2138 * @dev: network device
2140 * Hold reference to device to keep it from being freed.
2142 static inline void dev_hold(struct net_device
*dev
)
2144 irqsafe_cpu_inc(*dev
->pcpu_refcnt
);
2147 /* Carrier loss detection, dial on demand. The functions netif_carrier_on
2148 * and _off may be called from IRQ context, but it is caller
2149 * who is responsible for serialization of these calls.
2151 * The name carrier is inappropriate, these functions should really be
2152 * called netif_lowerlayer_*() because they represent the state of any
2153 * kind of lower layer not just hardware media.
2156 extern void linkwatch_fire_event(struct net_device
*dev
);
2157 extern void linkwatch_forget_dev(struct net_device
*dev
);
2160 * netif_carrier_ok - test if carrier present
2161 * @dev: network device
2163 * Check if carrier is present on device
2165 static inline int netif_carrier_ok(const struct net_device
*dev
)
2167 return !test_bit(__LINK_STATE_NOCARRIER
, &dev
->state
);
2170 extern unsigned long dev_trans_start(struct net_device
*dev
);
2172 extern void __netdev_watchdog_up(struct net_device
*dev
);
2174 extern void netif_carrier_on(struct net_device
*dev
);
2176 extern void netif_carrier_off(struct net_device
*dev
);
2178 extern void netif_notify_peers(struct net_device
*dev
);
2181 * netif_dormant_on - mark device as dormant.
2182 * @dev: network device
2184 * Mark device as dormant (as per RFC2863).
2186 * The dormant state indicates that the relevant interface is not
2187 * actually in a condition to pass packets (i.e., it is not 'up') but is
2188 * in a "pending" state, waiting for some external event. For "on-
2189 * demand" interfaces, this new state identifies the situation where the
2190 * interface is waiting for events to place it in the up state.
2193 static inline void netif_dormant_on(struct net_device
*dev
)
2195 if (!test_and_set_bit(__LINK_STATE_DORMANT
, &dev
->state
))
2196 linkwatch_fire_event(dev
);
2200 * netif_dormant_off - set device as not dormant.
2201 * @dev: network device
2203 * Device is not in dormant state.
2205 static inline void netif_dormant_off(struct net_device
*dev
)
2207 if (test_and_clear_bit(__LINK_STATE_DORMANT
, &dev
->state
))
2208 linkwatch_fire_event(dev
);
2212 * netif_dormant - test if carrier present
2213 * @dev: network device
2215 * Check if carrier is present on device
2217 static inline int netif_dormant(const struct net_device
*dev
)
2219 return test_bit(__LINK_STATE_DORMANT
, &dev
->state
);
2224 * netif_oper_up - test if device is operational
2225 * @dev: network device
2227 * Check if carrier is operational
2229 static inline int netif_oper_up(const struct net_device
*dev
)
2231 return (dev
->operstate
== IF_OPER_UP
||
2232 dev
->operstate
== IF_OPER_UNKNOWN
/* backward compat */);
2236 * netif_device_present - is device available or removed
2237 * @dev: network device
2239 * Check if device has not been removed from system.
2241 static inline int netif_device_present(struct net_device
*dev
)
2243 return test_bit(__LINK_STATE_PRESENT
, &dev
->state
);
2246 extern void netif_device_detach(struct net_device
*dev
);
2248 extern void netif_device_attach(struct net_device
*dev
);
2251 * Network interface message level settings
2255 NETIF_MSG_DRV
= 0x0001,
2256 NETIF_MSG_PROBE
= 0x0002,
2257 NETIF_MSG_LINK
= 0x0004,
2258 NETIF_MSG_TIMER
= 0x0008,
2259 NETIF_MSG_IFDOWN
= 0x0010,
2260 NETIF_MSG_IFUP
= 0x0020,
2261 NETIF_MSG_RX_ERR
= 0x0040,
2262 NETIF_MSG_TX_ERR
= 0x0080,
2263 NETIF_MSG_TX_QUEUED
= 0x0100,
2264 NETIF_MSG_INTR
= 0x0200,
2265 NETIF_MSG_TX_DONE
= 0x0400,
2266 NETIF_MSG_RX_STATUS
= 0x0800,
2267 NETIF_MSG_PKTDATA
= 0x1000,
2268 NETIF_MSG_HW
= 0x2000,
2269 NETIF_MSG_WOL
= 0x4000,
2272 #define netif_msg_drv(p) ((p)->msg_enable & NETIF_MSG_DRV)
2273 #define netif_msg_probe(p) ((p)->msg_enable & NETIF_MSG_PROBE)
2274 #define netif_msg_link(p) ((p)->msg_enable & NETIF_MSG_LINK)
2275 #define netif_msg_timer(p) ((p)->msg_enable & NETIF_MSG_TIMER)
2276 #define netif_msg_ifdown(p) ((p)->msg_enable & NETIF_MSG_IFDOWN)
2277 #define netif_msg_ifup(p) ((p)->msg_enable & NETIF_MSG_IFUP)
2278 #define netif_msg_rx_err(p) ((p)->msg_enable & NETIF_MSG_RX_ERR)
2279 #define netif_msg_tx_err(p) ((p)->msg_enable & NETIF_MSG_TX_ERR)
2280 #define netif_msg_tx_queued(p) ((p)->msg_enable & NETIF_MSG_TX_QUEUED)
2281 #define netif_msg_intr(p) ((p)->msg_enable & NETIF_MSG_INTR)
2282 #define netif_msg_tx_done(p) ((p)->msg_enable & NETIF_MSG_TX_DONE)
2283 #define netif_msg_rx_status(p) ((p)->msg_enable & NETIF_MSG_RX_STATUS)
2284 #define netif_msg_pktdata(p) ((p)->msg_enable & NETIF_MSG_PKTDATA)
2285 #define netif_msg_hw(p) ((p)->msg_enable & NETIF_MSG_HW)
2286 #define netif_msg_wol(p) ((p)->msg_enable & NETIF_MSG_WOL)
2288 static inline u32
netif_msg_init(int debug_value
, int default_msg_enable_bits
)
2291 if (debug_value
< 0 || debug_value
>= (sizeof(u32
) * 8))
2292 return default_msg_enable_bits
;
2293 if (debug_value
== 0) /* no output */
2295 /* set low N bits */
2296 return (1 << debug_value
) - 1;
2299 static inline void __netif_tx_lock(struct netdev_queue
*txq
, int cpu
)
2301 spin_lock(&txq
->_xmit_lock
);
2302 txq
->xmit_lock_owner
= cpu
;
2305 static inline void __netif_tx_lock_bh(struct netdev_queue
*txq
)
2307 spin_lock_bh(&txq
->_xmit_lock
);
2308 txq
->xmit_lock_owner
= smp_processor_id();
2311 static inline int __netif_tx_trylock(struct netdev_queue
*txq
)
2313 int ok
= spin_trylock(&txq
->_xmit_lock
);
2315 txq
->xmit_lock_owner
= smp_processor_id();
2319 static inline void __netif_tx_unlock(struct netdev_queue
*txq
)
2321 txq
->xmit_lock_owner
= -1;
2322 spin_unlock(&txq
->_xmit_lock
);
2325 static inline void __netif_tx_unlock_bh(struct netdev_queue
*txq
)
2327 txq
->xmit_lock_owner
= -1;
2328 spin_unlock_bh(&txq
->_xmit_lock
);
2331 static inline void txq_trans_update(struct netdev_queue
*txq
)
2333 if (txq
->xmit_lock_owner
!= -1)
2334 txq
->trans_start
= jiffies
;
2338 * netif_tx_lock - grab network device transmit lock
2339 * @dev: network device
2341 * Get network device transmit lock
2343 static inline void netif_tx_lock(struct net_device
*dev
)
2348 spin_lock(&dev
->tx_global_lock
);
2349 cpu
= smp_processor_id();
2350 for (i
= 0; i
< dev
->num_tx_queues
; i
++) {
2351 struct netdev_queue
*txq
= netdev_get_tx_queue(dev
, i
);
2353 /* We are the only thread of execution doing a
2354 * freeze, but we have to grab the _xmit_lock in
2355 * order to synchronize with threads which are in
2356 * the ->hard_start_xmit() handler and already
2357 * checked the frozen bit.
2359 __netif_tx_lock(txq
, cpu
);
2360 set_bit(__QUEUE_STATE_FROZEN
, &txq
->state
);
2361 __netif_tx_unlock(txq
);
2365 static inline void netif_tx_lock_bh(struct net_device
*dev
)
2371 static inline void netif_tx_unlock(struct net_device
*dev
)
2375 for (i
= 0; i
< dev
->num_tx_queues
; i
++) {
2376 struct netdev_queue
*txq
= netdev_get_tx_queue(dev
, i
);
2378 /* No need to grab the _xmit_lock here. If the
2379 * queue is not stopped for another reason, we
2382 clear_bit(__QUEUE_STATE_FROZEN
, &txq
->state
);
2383 netif_schedule_queue(txq
);
2385 spin_unlock(&dev
->tx_global_lock
);
2388 static inline void netif_tx_unlock_bh(struct net_device
*dev
)
2390 netif_tx_unlock(dev
);
2394 #define HARD_TX_LOCK(dev, txq, cpu) { \
2395 if ((dev->features & NETIF_F_LLTX) == 0) { \
2396 __netif_tx_lock(txq, cpu); \
2400 #define HARD_TX_UNLOCK(dev, txq) { \
2401 if ((dev->features & NETIF_F_LLTX) == 0) { \
2402 __netif_tx_unlock(txq); \
2406 static inline void netif_tx_disable(struct net_device
*dev
)
2412 cpu
= smp_processor_id();
2413 for (i
= 0; i
< dev
->num_tx_queues
; i
++) {
2414 struct netdev_queue
*txq
= netdev_get_tx_queue(dev
, i
);
2416 __netif_tx_lock(txq
, cpu
);
2417 netif_tx_stop_queue(txq
);
2418 __netif_tx_unlock(txq
);
2423 static inline void netif_addr_lock(struct net_device
*dev
)
2425 spin_lock(&dev
->addr_list_lock
);
2428 static inline void netif_addr_lock_bh(struct net_device
*dev
)
2430 spin_lock_bh(&dev
->addr_list_lock
);
2433 static inline void netif_addr_unlock(struct net_device
*dev
)
2435 spin_unlock(&dev
->addr_list_lock
);
2438 static inline void netif_addr_unlock_bh(struct net_device
*dev
)
2440 spin_unlock_bh(&dev
->addr_list_lock
);
2444 * dev_addrs walker. Should be used only for read access. Call with
2445 * rcu_read_lock held.
2447 #define for_each_dev_addr(dev, ha) \
2448 list_for_each_entry_rcu(ha, &dev->dev_addrs.list, list)
2450 /* These functions live elsewhere (drivers/net/net_init.c, but related) */
2452 extern void ether_setup(struct net_device
*dev
);
2454 /* Support for loadable net-drivers */
2455 extern struct net_device
*alloc_netdev_mqs(int sizeof_priv
, const char *name
,
2456 void (*setup
)(struct net_device
*),
2457 unsigned int txqs
, unsigned int rxqs
);
2458 #define alloc_netdev(sizeof_priv, name, setup) \
2459 alloc_netdev_mqs(sizeof_priv, name, setup, 1, 1)
2461 #define alloc_netdev_mq(sizeof_priv, name, setup, count) \
2462 alloc_netdev_mqs(sizeof_priv, name, setup, count, count)
2464 extern int register_netdev(struct net_device
*dev
);
2465 extern void unregister_netdev(struct net_device
*dev
);
2467 /* General hardware address lists handling functions */
2468 extern int __hw_addr_add_multiple(struct netdev_hw_addr_list
*to_list
,
2469 struct netdev_hw_addr_list
*from_list
,
2470 int addr_len
, unsigned char addr_type
);
2471 extern void __hw_addr_del_multiple(struct netdev_hw_addr_list
*to_list
,
2472 struct netdev_hw_addr_list
*from_list
,
2473 int addr_len
, unsigned char addr_type
);
2474 extern int __hw_addr_sync(struct netdev_hw_addr_list
*to_list
,
2475 struct netdev_hw_addr_list
*from_list
,
2477 extern void __hw_addr_unsync(struct netdev_hw_addr_list
*to_list
,
2478 struct netdev_hw_addr_list
*from_list
,
2480 extern void __hw_addr_flush(struct netdev_hw_addr_list
*list
);
2481 extern void __hw_addr_init(struct netdev_hw_addr_list
*list
);
2483 /* Functions used for device addresses handling */
2484 extern int dev_addr_add(struct net_device
*dev
, unsigned char *addr
,
2485 unsigned char addr_type
);
2486 extern int dev_addr_del(struct net_device
*dev
, unsigned char *addr
,
2487 unsigned char addr_type
);
2488 extern int dev_addr_add_multiple(struct net_device
*to_dev
,
2489 struct net_device
*from_dev
,
2490 unsigned char addr_type
);
2491 extern int dev_addr_del_multiple(struct net_device
*to_dev
,
2492 struct net_device
*from_dev
,
2493 unsigned char addr_type
);
2494 extern void dev_addr_flush(struct net_device
*dev
);
2495 extern int dev_addr_init(struct net_device
*dev
);
2497 /* Functions used for unicast addresses handling */
2498 extern int dev_uc_add(struct net_device
*dev
, unsigned char *addr
);
2499 extern int dev_uc_del(struct net_device
*dev
, unsigned char *addr
);
2500 extern int dev_uc_sync(struct net_device
*to
, struct net_device
*from
);
2501 extern void dev_uc_unsync(struct net_device
*to
, struct net_device
*from
);
2502 extern void dev_uc_flush(struct net_device
*dev
);
2503 extern void dev_uc_init(struct net_device
*dev
);
2505 /* Functions used for multicast addresses handling */
2506 extern int dev_mc_add(struct net_device
*dev
, unsigned char *addr
);
2507 extern int dev_mc_add_global(struct net_device
*dev
, unsigned char *addr
);
2508 extern int dev_mc_del(struct net_device
*dev
, unsigned char *addr
);
2509 extern int dev_mc_del_global(struct net_device
*dev
, unsigned char *addr
);
2510 extern int dev_mc_sync(struct net_device
*to
, struct net_device
*from
);
2511 extern void dev_mc_unsync(struct net_device
*to
, struct net_device
*from
);
2512 extern void dev_mc_flush(struct net_device
*dev
);
2513 extern void dev_mc_init(struct net_device
*dev
);
2515 /* Functions used for secondary unicast and multicast support */
2516 extern void dev_set_rx_mode(struct net_device
*dev
);
2517 extern void __dev_set_rx_mode(struct net_device
*dev
);
2518 extern int dev_set_promiscuity(struct net_device
*dev
, int inc
);
2519 extern int dev_set_allmulti(struct net_device
*dev
, int inc
);
2520 extern void netdev_state_change(struct net_device
*dev
);
2521 extern int netdev_bonding_change(struct net_device
*dev
,
2522 unsigned long event
);
2523 extern void netdev_features_change(struct net_device
*dev
);
2524 /* Load a device via the kmod */
2525 extern void dev_load(struct net
*net
, const char *name
);
2526 extern void dev_mcast_init(void);
2527 extern struct rtnl_link_stats64
*dev_get_stats(struct net_device
*dev
,
2528 struct rtnl_link_stats64
*storage
);
2530 extern int netdev_max_backlog
;
2531 extern int netdev_tstamp_prequeue
;
2532 extern int weight_p
;
2533 extern int bpf_jit_enable
;
2534 extern int netdev_set_master(struct net_device
*dev
, struct net_device
*master
);
2535 extern int netdev_set_bond_master(struct net_device
*dev
,
2536 struct net_device
*master
);
2537 extern int skb_checksum_help(struct sk_buff
*skb
);
2538 extern struct sk_buff
*skb_gso_segment(struct sk_buff
*skb
,
2539 netdev_features_t features
);
2541 extern void netdev_rx_csum_fault(struct net_device
*dev
);
2543 static inline void netdev_rx_csum_fault(struct net_device
*dev
)
2547 /* rx skb timestamps */
2548 extern void net_enable_timestamp(void);
2549 extern void net_disable_timestamp(void);
2551 #ifdef CONFIG_PROC_FS
2552 extern void *dev_seq_start(struct seq_file
*seq
, loff_t
*pos
);
2553 extern void *dev_seq_next(struct seq_file
*seq
, void *v
, loff_t
*pos
);
2554 extern void dev_seq_stop(struct seq_file
*seq
, void *v
);
2555 extern int dev_seq_open_ops(struct inode
*inode
, struct file
*file
,
2556 const struct seq_operations
*ops
);
2559 extern int netdev_class_create_file(struct class_attribute
*class_attr
);
2560 extern void netdev_class_remove_file(struct class_attribute
*class_attr
);
2562 extern struct kobj_ns_type_operations net_ns_type_operations
;
2564 extern const char *netdev_drivername(const struct net_device
*dev
);
2566 extern void linkwatch_run_queue(void);
2568 static inline netdev_features_t
netdev_get_wanted_features(
2569 struct net_device
*dev
)
2571 return (dev
->features
& ~dev
->hw_features
) | dev
->wanted_features
;
2573 netdev_features_t
netdev_increment_features(netdev_features_t all
,
2574 netdev_features_t one
, netdev_features_t mask
);
2575 int __netdev_update_features(struct net_device
*dev
);
2576 void netdev_update_features(struct net_device
*dev
);
2577 void netdev_change_features(struct net_device
*dev
);
2579 void netif_stacked_transfer_operstate(const struct net_device
*rootdev
,
2580 struct net_device
*dev
);
2582 netdev_features_t
netif_skb_features(struct sk_buff
*skb
);
2584 static inline int net_gso_ok(netdev_features_t features
, int gso_type
)
2586 netdev_features_t feature
= gso_type
<< NETIF_F_GSO_SHIFT
;
2588 /* check flags correspondence */
2589 BUILD_BUG_ON(SKB_GSO_TCPV4
!= (NETIF_F_TSO
>> NETIF_F_GSO_SHIFT
));
2590 BUILD_BUG_ON(SKB_GSO_UDP
!= (NETIF_F_UFO
>> NETIF_F_GSO_SHIFT
));
2591 BUILD_BUG_ON(SKB_GSO_DODGY
!= (NETIF_F_GSO_ROBUST
>> NETIF_F_GSO_SHIFT
));
2592 BUILD_BUG_ON(SKB_GSO_TCP_ECN
!= (NETIF_F_TSO_ECN
>> NETIF_F_GSO_SHIFT
));
2593 BUILD_BUG_ON(SKB_GSO_TCPV6
!= (NETIF_F_TSO6
>> NETIF_F_GSO_SHIFT
));
2594 BUILD_BUG_ON(SKB_GSO_FCOE
!= (NETIF_F_FSO
>> NETIF_F_GSO_SHIFT
));
2596 return (features
& feature
) == feature
;
2599 static inline int skb_gso_ok(struct sk_buff
*skb
, netdev_features_t features
)
2601 return net_gso_ok(features
, skb_shinfo(skb
)->gso_type
) &&
2602 (!skb_has_frag_list(skb
) || (features
& NETIF_F_FRAGLIST
));
2605 static inline int netif_needs_gso(struct sk_buff
*skb
,
2606 netdev_features_t features
)
2608 return skb_is_gso(skb
) && (!skb_gso_ok(skb
, features
) ||
2609 unlikely(skb
->ip_summed
!= CHECKSUM_PARTIAL
));
2612 static inline void netif_set_gso_max_size(struct net_device
*dev
,
2615 dev
->gso_max_size
= size
;
2618 static inline int netif_is_bond_slave(struct net_device
*dev
)
2620 return dev
->flags
& IFF_SLAVE
&& dev
->priv_flags
& IFF_BONDING
;
2623 extern struct pernet_operations __net_initdata loopback_net_ops
;
2625 /* Logging, debugging and troubleshooting/diagnostic helpers. */
2627 /* netdev_printk helpers, similar to dev_printk */
2629 static inline const char *netdev_name(const struct net_device
*dev
)
2631 if (dev
->reg_state
!= NETREG_REGISTERED
)
2632 return "(unregistered net_device)";
2636 extern int __netdev_printk(const char *level
, const struct net_device
*dev
,
2637 struct va_format
*vaf
);
2639 extern __printf(3, 4)
2640 int netdev_printk(const char *level
, const struct net_device
*dev
,
2641 const char *format
, ...);
2642 extern __printf(2, 3)
2643 int netdev_emerg(const struct net_device
*dev
, const char *format
, ...);
2644 extern __printf(2, 3)
2645 int netdev_alert(const struct net_device
*dev
, const char *format
, ...);
2646 extern __printf(2, 3)
2647 int netdev_crit(const struct net_device
*dev
, const char *format
, ...);
2648 extern __printf(2, 3)
2649 int netdev_err(const struct net_device
*dev
, const char *format
, ...);
2650 extern __printf(2, 3)
2651 int netdev_warn(const struct net_device
*dev
, const char *format
, ...);
2652 extern __printf(2, 3)
2653 int netdev_notice(const struct net_device
*dev
, const char *format
, ...);
2654 extern __printf(2, 3)
2655 int netdev_info(const struct net_device
*dev
, const char *format
, ...);
2657 #define MODULE_ALIAS_NETDEV(device) \
2658 MODULE_ALIAS("netdev-" device)
2661 #define netdev_dbg(__dev, format, args...) \
2662 netdev_printk(KERN_DEBUG, __dev, format, ##args)
2663 #elif defined(CONFIG_DYNAMIC_DEBUG)
2664 #define netdev_dbg(__dev, format, args...) \
2666 dynamic_netdev_dbg(__dev, format, ##args); \
2669 #define netdev_dbg(__dev, format, args...) \
2672 netdev_printk(KERN_DEBUG, __dev, format, ##args); \
2677 #if defined(VERBOSE_DEBUG)
2678 #define netdev_vdbg netdev_dbg
2681 #define netdev_vdbg(dev, format, args...) \
2684 netdev_printk(KERN_DEBUG, dev, format, ##args); \
2690 * netdev_WARN() acts like dev_printk(), but with the key difference
2691 * of using a WARN/WARN_ON to get the message out, including the
2692 * file/line information and a backtrace.
2694 #define netdev_WARN(dev, format, args...) \
2695 WARN(1, "netdevice: %s\n" format, netdev_name(dev), ##args);
2697 /* netif printk helpers, similar to netdev_printk */
2699 #define netif_printk(priv, type, level, dev, fmt, args...) \
2701 if (netif_msg_##type(priv)) \
2702 netdev_printk(level, (dev), fmt, ##args); \
2705 #define netif_level(level, priv, type, dev, fmt, args...) \
2707 if (netif_msg_##type(priv)) \
2708 netdev_##level(dev, fmt, ##args); \
2711 #define netif_emerg(priv, type, dev, fmt, args...) \
2712 netif_level(emerg, priv, type, dev, fmt, ##args)
2713 #define netif_alert(priv, type, dev, fmt, args...) \
2714 netif_level(alert, priv, type, dev, fmt, ##args)
2715 #define netif_crit(priv, type, dev, fmt, args...) \
2716 netif_level(crit, priv, type, dev, fmt, ##args)
2717 #define netif_err(priv, type, dev, fmt, args...) \
2718 netif_level(err, priv, type, dev, fmt, ##args)
2719 #define netif_warn(priv, type, dev, fmt, args...) \
2720 netif_level(warn, priv, type, dev, fmt, ##args)
2721 #define netif_notice(priv, type, dev, fmt, args...) \
2722 netif_level(notice, priv, type, dev, fmt, ##args)
2723 #define netif_info(priv, type, dev, fmt, args...) \
2724 netif_level(info, priv, type, dev, fmt, ##args)
2727 #define netif_dbg(priv, type, dev, format, args...) \
2728 netif_printk(priv, type, KERN_DEBUG, dev, format, ##args)
2729 #elif defined(CONFIG_DYNAMIC_DEBUG)
2730 #define netif_dbg(priv, type, netdev, format, args...) \
2732 if (netif_msg_##type(priv)) \
2733 dynamic_netdev_dbg(netdev, format, ##args); \
2736 #define netif_dbg(priv, type, dev, format, args...) \
2739 netif_printk(priv, type, KERN_DEBUG, dev, format, ##args); \
2744 #if defined(VERBOSE_DEBUG)
2745 #define netif_vdbg netif_dbg
2747 #define netif_vdbg(priv, type, dev, format, args...) \
2750 netif_printk(priv, type, KERN_DEBUG, dev, format, ##args); \
2755 #endif /* __KERNEL__ */
2757 #endif /* _LINUX_NETDEVICE_H */