mirror of
https://github.com/AuxXxilium/linux_dsm_epyc7002.git
synced 2025-01-22 19:09:43 +07:00
77162022ab
This adds two new flags NTF_MASTER and NTF_SELF that can now be used to specify where PF_BRIDGE netlink commands should be sent. NTF_MASTER sends the commands to the 'dev->master' device for parsing. Typically this will be the linux net/bridge, or open-vswitch devices. Also without any flags set the command will be handled by the master device as well so that current user space tools continue to work as expected. The NTF_SELF flag will push the PF_BRIDGE commands to the device. In the basic example below the commands are then parsed and programmed in the embedded bridge. Note if both NTF_SELF and NTF_MASTER bits are set then the command will be sent to both 'dev->master' and 'dev' this allows user space to easily keep the embedded bridge and software bridge in sync. There is a slight complication in the case with both flags set when an error occurs. To resolve this the rtnl handler clears the NTF_ flag in the netlink ack to indicate which sets completed successfully. The add/del handlers will abort as soon as any error occurs. To support this new net device ops were added to call into the device and the existing bridging code was refactored to use these. There should be no required changes in user space to support the current bridge behavior. A basic setup with a SR-IOV enabled NIC looks like this, veth0 veth2 | | ------------ | bridge0 | <---- software bridging ------------ / / ethx.y ethx VF PF \ \ <---- propagate FDB entries to HW \ \ -------------------- | Embedded Bridge | <---- hardware offloaded switching -------------------- In this case the embedded bridge must be managed to allow 'veth0' to communicate with 'ethx.y' correctly. At present drivers managing the embedded bridge either send frames onto the network which then get dropped by the switch OR the embedded bridge will flood these frames. With this patch we have a mechanism to manage the embedded bridge correctly from user space. This example is specific to SR-IOV but replacing the VF with another PF or dropping this into the DSA framework generates similar management issues. Examples session using the 'br'[1] tool to add, dump and then delete a mac address with a new "embedded" option and enabled ixgbe driver: # br fdb add 22:35:19:ac:60:59 dev eth3 # br fdb port mac addr flags veth0 22:35:19:ac:60:58 static veth0 9a:5f:81:f7:f6:ec local eth3 00:1b:21:55:23:59 local eth3 22:35:19:ac:60:59 static veth0 22:35:19:ac:60:57 static #br fdb add 22:35:19:ac:60:59 embedded dev eth3 #br fdb port mac addr flags veth0 22:35:19:ac:60:58 static veth0 9a:5f:81:f7:f6:ec local eth3 00:1b:21:55:23:59 local eth3 22:35:19:ac:60:59 static veth0 22:35:19:ac:60:57 static eth3 22:35:19:ac:60:59 local embedded #br fdb del 22:35:19:ac:60:59 embedded dev eth3 I added a couple lines to 'br' to set the flags correctly is all. It is my opinion that the merit of this patch is now embedded and SW bridges can both be modeled correctly in user space using very nearly the same message passing. [1] 'br' tool was published as an RFC here and will be renamed 'bridge' http://patchwork.ozlabs.org/patch/117664/ Thanks to Jamal Hadi Salim, Stephen Hemminger and Ben Hutchings for valuable feedback, suggestions, and review. v2: fixed api descriptions and error case with both NTF_SELF and NTF_MASTER set plus updated patch description. Signed-off-by: John Fastabend <john.r.fastabend@intel.com> Signed-off-by: David S. Miller <davem@davemloft.net>
812 lines
21 KiB
C
812 lines
21 KiB
C
#ifndef __LINUX_RTNETLINK_H
|
|
#define __LINUX_RTNETLINK_H
|
|
|
|
#include <linux/types.h>
|
|
#include <linux/netlink.h>
|
|
#include <linux/if_link.h>
|
|
#include <linux/if_addr.h>
|
|
#include <linux/neighbour.h>
|
|
|
|
/* rtnetlink families. Values up to 127 are reserved for real address
|
|
* families, values above 128 may be used arbitrarily.
|
|
*/
|
|
#define RTNL_FAMILY_IPMR 128
|
|
#define RTNL_FAMILY_IP6MR 129
|
|
#define RTNL_FAMILY_MAX 129
|
|
|
|
/****
|
|
* Routing/neighbour discovery messages.
|
|
****/
|
|
|
|
/* Types of messages */
|
|
|
|
enum {
|
|
RTM_BASE = 16,
|
|
#define RTM_BASE RTM_BASE
|
|
|
|
RTM_NEWLINK = 16,
|
|
#define RTM_NEWLINK RTM_NEWLINK
|
|
RTM_DELLINK,
|
|
#define RTM_DELLINK RTM_DELLINK
|
|
RTM_GETLINK,
|
|
#define RTM_GETLINK RTM_GETLINK
|
|
RTM_SETLINK,
|
|
#define RTM_SETLINK RTM_SETLINK
|
|
|
|
RTM_NEWADDR = 20,
|
|
#define RTM_NEWADDR RTM_NEWADDR
|
|
RTM_DELADDR,
|
|
#define RTM_DELADDR RTM_DELADDR
|
|
RTM_GETADDR,
|
|
#define RTM_GETADDR RTM_GETADDR
|
|
|
|
RTM_NEWROUTE = 24,
|
|
#define RTM_NEWROUTE RTM_NEWROUTE
|
|
RTM_DELROUTE,
|
|
#define RTM_DELROUTE RTM_DELROUTE
|
|
RTM_GETROUTE,
|
|
#define RTM_GETROUTE RTM_GETROUTE
|
|
|
|
RTM_NEWNEIGH = 28,
|
|
#define RTM_NEWNEIGH RTM_NEWNEIGH
|
|
RTM_DELNEIGH,
|
|
#define RTM_DELNEIGH RTM_DELNEIGH
|
|
RTM_GETNEIGH,
|
|
#define RTM_GETNEIGH RTM_GETNEIGH
|
|
|
|
RTM_NEWRULE = 32,
|
|
#define RTM_NEWRULE RTM_NEWRULE
|
|
RTM_DELRULE,
|
|
#define RTM_DELRULE RTM_DELRULE
|
|
RTM_GETRULE,
|
|
#define RTM_GETRULE RTM_GETRULE
|
|
|
|
RTM_NEWQDISC = 36,
|
|
#define RTM_NEWQDISC RTM_NEWQDISC
|
|
RTM_DELQDISC,
|
|
#define RTM_DELQDISC RTM_DELQDISC
|
|
RTM_GETQDISC,
|
|
#define RTM_GETQDISC RTM_GETQDISC
|
|
|
|
RTM_NEWTCLASS = 40,
|
|
#define RTM_NEWTCLASS RTM_NEWTCLASS
|
|
RTM_DELTCLASS,
|
|
#define RTM_DELTCLASS RTM_DELTCLASS
|
|
RTM_GETTCLASS,
|
|
#define RTM_GETTCLASS RTM_GETTCLASS
|
|
|
|
RTM_NEWTFILTER = 44,
|
|
#define RTM_NEWTFILTER RTM_NEWTFILTER
|
|
RTM_DELTFILTER,
|
|
#define RTM_DELTFILTER RTM_DELTFILTER
|
|
RTM_GETTFILTER,
|
|
#define RTM_GETTFILTER RTM_GETTFILTER
|
|
|
|
RTM_NEWACTION = 48,
|
|
#define RTM_NEWACTION RTM_NEWACTION
|
|
RTM_DELACTION,
|
|
#define RTM_DELACTION RTM_DELACTION
|
|
RTM_GETACTION,
|
|
#define RTM_GETACTION RTM_GETACTION
|
|
|
|
RTM_NEWPREFIX = 52,
|
|
#define RTM_NEWPREFIX RTM_NEWPREFIX
|
|
|
|
RTM_GETMULTICAST = 58,
|
|
#define RTM_GETMULTICAST RTM_GETMULTICAST
|
|
|
|
RTM_GETANYCAST = 62,
|
|
#define RTM_GETANYCAST RTM_GETANYCAST
|
|
|
|
RTM_NEWNEIGHTBL = 64,
|
|
#define RTM_NEWNEIGHTBL RTM_NEWNEIGHTBL
|
|
RTM_GETNEIGHTBL = 66,
|
|
#define RTM_GETNEIGHTBL RTM_GETNEIGHTBL
|
|
RTM_SETNEIGHTBL,
|
|
#define RTM_SETNEIGHTBL RTM_SETNEIGHTBL
|
|
|
|
RTM_NEWNDUSEROPT = 68,
|
|
#define RTM_NEWNDUSEROPT RTM_NEWNDUSEROPT
|
|
|
|
RTM_NEWADDRLABEL = 72,
|
|
#define RTM_NEWADDRLABEL RTM_NEWADDRLABEL
|
|
RTM_DELADDRLABEL,
|
|
#define RTM_DELADDRLABEL RTM_DELADDRLABEL
|
|
RTM_GETADDRLABEL,
|
|
#define RTM_GETADDRLABEL RTM_GETADDRLABEL
|
|
|
|
RTM_GETDCB = 78,
|
|
#define RTM_GETDCB RTM_GETDCB
|
|
RTM_SETDCB,
|
|
#define RTM_SETDCB RTM_SETDCB
|
|
|
|
__RTM_MAX,
|
|
#define RTM_MAX (((__RTM_MAX + 3) & ~3) - 1)
|
|
};
|
|
|
|
#define RTM_NR_MSGTYPES (RTM_MAX + 1 - RTM_BASE)
|
|
#define RTM_NR_FAMILIES (RTM_NR_MSGTYPES >> 2)
|
|
#define RTM_FAM(cmd) (((cmd) - RTM_BASE) >> 2)
|
|
|
|
/*
|
|
Generic structure for encapsulation of optional route information.
|
|
It is reminiscent of sockaddr, but with sa_family replaced
|
|
with attribute type.
|
|
*/
|
|
|
|
struct rtattr {
|
|
unsigned short rta_len;
|
|
unsigned short rta_type;
|
|
};
|
|
|
|
/* Macros to handle rtattributes */
|
|
|
|
#define RTA_ALIGNTO 4
|
|
#define RTA_ALIGN(len) ( ((len)+RTA_ALIGNTO-1) & ~(RTA_ALIGNTO-1) )
|
|
#define RTA_OK(rta,len) ((len) >= (int)sizeof(struct rtattr) && \
|
|
(rta)->rta_len >= sizeof(struct rtattr) && \
|
|
(rta)->rta_len <= (len))
|
|
#define RTA_NEXT(rta,attrlen) ((attrlen) -= RTA_ALIGN((rta)->rta_len), \
|
|
(struct rtattr*)(((char*)(rta)) + RTA_ALIGN((rta)->rta_len)))
|
|
#define RTA_LENGTH(len) (RTA_ALIGN(sizeof(struct rtattr)) + (len))
|
|
#define RTA_SPACE(len) RTA_ALIGN(RTA_LENGTH(len))
|
|
#define RTA_DATA(rta) ((void*)(((char*)(rta)) + RTA_LENGTH(0)))
|
|
#define RTA_PAYLOAD(rta) ((int)((rta)->rta_len) - RTA_LENGTH(0))
|
|
|
|
|
|
|
|
|
|
/******************************************************************************
|
|
* Definitions used in routing table administration.
|
|
****/
|
|
|
|
struct rtmsg {
|
|
unsigned char rtm_family;
|
|
unsigned char rtm_dst_len;
|
|
unsigned char rtm_src_len;
|
|
unsigned char rtm_tos;
|
|
|
|
unsigned char rtm_table; /* Routing table id */
|
|
unsigned char rtm_protocol; /* Routing protocol; see below */
|
|
unsigned char rtm_scope; /* See below */
|
|
unsigned char rtm_type; /* See below */
|
|
|
|
unsigned rtm_flags;
|
|
};
|
|
|
|
/* rtm_type */
|
|
|
|
enum {
|
|
RTN_UNSPEC,
|
|
RTN_UNICAST, /* Gateway or direct route */
|
|
RTN_LOCAL, /* Accept locally */
|
|
RTN_BROADCAST, /* Accept locally as broadcast,
|
|
send as broadcast */
|
|
RTN_ANYCAST, /* Accept locally as broadcast,
|
|
but send as unicast */
|
|
RTN_MULTICAST, /* Multicast route */
|
|
RTN_BLACKHOLE, /* Drop */
|
|
RTN_UNREACHABLE, /* Destination is unreachable */
|
|
RTN_PROHIBIT, /* Administratively prohibited */
|
|
RTN_THROW, /* Not in this table */
|
|
RTN_NAT, /* Translate this address */
|
|
RTN_XRESOLVE, /* Use external resolver */
|
|
__RTN_MAX
|
|
};
|
|
|
|
#define RTN_MAX (__RTN_MAX - 1)
|
|
|
|
|
|
/* rtm_protocol */
|
|
|
|
#define RTPROT_UNSPEC 0
|
|
#define RTPROT_REDIRECT 1 /* Route installed by ICMP redirects;
|
|
not used by current IPv4 */
|
|
#define RTPROT_KERNEL 2 /* Route installed by kernel */
|
|
#define RTPROT_BOOT 3 /* Route installed during boot */
|
|
#define RTPROT_STATIC 4 /* Route installed by administrator */
|
|
|
|
/* Values of protocol >= RTPROT_STATIC are not interpreted by kernel;
|
|
they are just passed from user and back as is.
|
|
It will be used by hypothetical multiple routing daemons.
|
|
Note that protocol values should be standardized in order to
|
|
avoid conflicts.
|
|
*/
|
|
|
|
#define RTPROT_GATED 8 /* Apparently, GateD */
|
|
#define RTPROT_RA 9 /* RDISC/ND router advertisements */
|
|
#define RTPROT_MRT 10 /* Merit MRT */
|
|
#define RTPROT_ZEBRA 11 /* Zebra */
|
|
#define RTPROT_BIRD 12 /* BIRD */
|
|
#define RTPROT_DNROUTED 13 /* DECnet routing daemon */
|
|
#define RTPROT_XORP 14 /* XORP */
|
|
#define RTPROT_NTK 15 /* Netsukuku */
|
|
#define RTPROT_DHCP 16 /* DHCP client */
|
|
|
|
/* rtm_scope
|
|
|
|
Really it is not scope, but sort of distance to the destination.
|
|
NOWHERE are reserved for not existing destinations, HOST is our
|
|
local addresses, LINK are destinations, located on directly attached
|
|
link and UNIVERSE is everywhere in the Universe.
|
|
|
|
Intermediate values are also possible f.e. interior routes
|
|
could be assigned a value between UNIVERSE and LINK.
|
|
*/
|
|
|
|
enum rt_scope_t {
|
|
RT_SCOPE_UNIVERSE=0,
|
|
/* User defined values */
|
|
RT_SCOPE_SITE=200,
|
|
RT_SCOPE_LINK=253,
|
|
RT_SCOPE_HOST=254,
|
|
RT_SCOPE_NOWHERE=255
|
|
};
|
|
|
|
/* rtm_flags */
|
|
|
|
#define RTM_F_NOTIFY 0x100 /* Notify user of route change */
|
|
#define RTM_F_CLONED 0x200 /* This route is cloned */
|
|
#define RTM_F_EQUALIZE 0x400 /* Multipath equalizer: NI */
|
|
#define RTM_F_PREFIX 0x800 /* Prefix addresses */
|
|
|
|
/* Reserved table identifiers */
|
|
|
|
enum rt_class_t {
|
|
RT_TABLE_UNSPEC=0,
|
|
/* User defined values */
|
|
RT_TABLE_COMPAT=252,
|
|
RT_TABLE_DEFAULT=253,
|
|
RT_TABLE_MAIN=254,
|
|
RT_TABLE_LOCAL=255,
|
|
RT_TABLE_MAX=0xFFFFFFFF
|
|
};
|
|
|
|
|
|
/* Routing message attributes */
|
|
|
|
enum rtattr_type_t {
|
|
RTA_UNSPEC,
|
|
RTA_DST,
|
|
RTA_SRC,
|
|
RTA_IIF,
|
|
RTA_OIF,
|
|
RTA_GATEWAY,
|
|
RTA_PRIORITY,
|
|
RTA_PREFSRC,
|
|
RTA_METRICS,
|
|
RTA_MULTIPATH,
|
|
RTA_PROTOINFO, /* no longer used */
|
|
RTA_FLOW,
|
|
RTA_CACHEINFO,
|
|
RTA_SESSION, /* no longer used */
|
|
RTA_MP_ALGO, /* no longer used */
|
|
RTA_TABLE,
|
|
RTA_MARK,
|
|
__RTA_MAX
|
|
};
|
|
|
|
#define RTA_MAX (__RTA_MAX - 1)
|
|
|
|
#define RTM_RTA(r) ((struct rtattr*)(((char*)(r)) + NLMSG_ALIGN(sizeof(struct rtmsg))))
|
|
#define RTM_PAYLOAD(n) NLMSG_PAYLOAD(n,sizeof(struct rtmsg))
|
|
|
|
/* RTM_MULTIPATH --- array of struct rtnexthop.
|
|
*
|
|
* "struct rtnexthop" describes all necessary nexthop information,
|
|
* i.e. parameters of path to a destination via this nexthop.
|
|
*
|
|
* At the moment it is impossible to set different prefsrc, mtu, window
|
|
* and rtt for different paths from multipath.
|
|
*/
|
|
|
|
struct rtnexthop {
|
|
unsigned short rtnh_len;
|
|
unsigned char rtnh_flags;
|
|
unsigned char rtnh_hops;
|
|
int rtnh_ifindex;
|
|
};
|
|
|
|
/* rtnh_flags */
|
|
|
|
#define RTNH_F_DEAD 1 /* Nexthop is dead (used by multipath) */
|
|
#define RTNH_F_PERVASIVE 2 /* Do recursive gateway lookup */
|
|
#define RTNH_F_ONLINK 4 /* Gateway is forced on link */
|
|
|
|
/* Macros to handle hexthops */
|
|
|
|
#define RTNH_ALIGNTO 4
|
|
#define RTNH_ALIGN(len) ( ((len)+RTNH_ALIGNTO-1) & ~(RTNH_ALIGNTO-1) )
|
|
#define RTNH_OK(rtnh,len) ((rtnh)->rtnh_len >= sizeof(struct rtnexthop) && \
|
|
((int)(rtnh)->rtnh_len) <= (len))
|
|
#define RTNH_NEXT(rtnh) ((struct rtnexthop*)(((char*)(rtnh)) + RTNH_ALIGN((rtnh)->rtnh_len)))
|
|
#define RTNH_LENGTH(len) (RTNH_ALIGN(sizeof(struct rtnexthop)) + (len))
|
|
#define RTNH_SPACE(len) RTNH_ALIGN(RTNH_LENGTH(len))
|
|
#define RTNH_DATA(rtnh) ((struct rtattr*)(((char*)(rtnh)) + RTNH_LENGTH(0)))
|
|
|
|
/* RTM_CACHEINFO */
|
|
|
|
struct rta_cacheinfo {
|
|
__u32 rta_clntref;
|
|
__u32 rta_lastuse;
|
|
__s32 rta_expires;
|
|
__u32 rta_error;
|
|
__u32 rta_used;
|
|
|
|
#define RTNETLINK_HAVE_PEERINFO 1
|
|
__u32 rta_id;
|
|
__u32 rta_ts;
|
|
__u32 rta_tsage;
|
|
};
|
|
|
|
/* RTM_METRICS --- array of struct rtattr with types of RTAX_* */
|
|
|
|
enum {
|
|
RTAX_UNSPEC,
|
|
#define RTAX_UNSPEC RTAX_UNSPEC
|
|
RTAX_LOCK,
|
|
#define RTAX_LOCK RTAX_LOCK
|
|
RTAX_MTU,
|
|
#define RTAX_MTU RTAX_MTU
|
|
RTAX_WINDOW,
|
|
#define RTAX_WINDOW RTAX_WINDOW
|
|
RTAX_RTT,
|
|
#define RTAX_RTT RTAX_RTT
|
|
RTAX_RTTVAR,
|
|
#define RTAX_RTTVAR RTAX_RTTVAR
|
|
RTAX_SSTHRESH,
|
|
#define RTAX_SSTHRESH RTAX_SSTHRESH
|
|
RTAX_CWND,
|
|
#define RTAX_CWND RTAX_CWND
|
|
RTAX_ADVMSS,
|
|
#define RTAX_ADVMSS RTAX_ADVMSS
|
|
RTAX_REORDERING,
|
|
#define RTAX_REORDERING RTAX_REORDERING
|
|
RTAX_HOPLIMIT,
|
|
#define RTAX_HOPLIMIT RTAX_HOPLIMIT
|
|
RTAX_INITCWND,
|
|
#define RTAX_INITCWND RTAX_INITCWND
|
|
RTAX_FEATURES,
|
|
#define RTAX_FEATURES RTAX_FEATURES
|
|
RTAX_RTO_MIN,
|
|
#define RTAX_RTO_MIN RTAX_RTO_MIN
|
|
RTAX_INITRWND,
|
|
#define RTAX_INITRWND RTAX_INITRWND
|
|
__RTAX_MAX
|
|
};
|
|
|
|
#define RTAX_MAX (__RTAX_MAX - 1)
|
|
|
|
#define RTAX_FEATURE_ECN 0x00000001
|
|
#define RTAX_FEATURE_SACK 0x00000002
|
|
#define RTAX_FEATURE_TIMESTAMP 0x00000004
|
|
#define RTAX_FEATURE_ALLFRAG 0x00000008
|
|
|
|
struct rta_session {
|
|
__u8 proto;
|
|
__u8 pad1;
|
|
__u16 pad2;
|
|
|
|
union {
|
|
struct {
|
|
__u16 sport;
|
|
__u16 dport;
|
|
} ports;
|
|
|
|
struct {
|
|
__u8 type;
|
|
__u8 code;
|
|
__u16 ident;
|
|
} icmpt;
|
|
|
|
__u32 spi;
|
|
} u;
|
|
};
|
|
|
|
/****
|
|
* General form of address family dependent message.
|
|
****/
|
|
|
|
struct rtgenmsg {
|
|
unsigned char rtgen_family;
|
|
};
|
|
|
|
/*****************************************************************
|
|
* Link layer specific messages.
|
|
****/
|
|
|
|
/* struct ifinfomsg
|
|
* passes link level specific information, not dependent
|
|
* on network protocol.
|
|
*/
|
|
|
|
struct ifinfomsg {
|
|
unsigned char ifi_family;
|
|
unsigned char __ifi_pad;
|
|
unsigned short ifi_type; /* ARPHRD_* */
|
|
int ifi_index; /* Link index */
|
|
unsigned ifi_flags; /* IFF_* flags */
|
|
unsigned ifi_change; /* IFF_* change mask */
|
|
};
|
|
|
|
/********************************************************************
|
|
* prefix information
|
|
****/
|
|
|
|
struct prefixmsg {
|
|
unsigned char prefix_family;
|
|
unsigned char prefix_pad1;
|
|
unsigned short prefix_pad2;
|
|
int prefix_ifindex;
|
|
unsigned char prefix_type;
|
|
unsigned char prefix_len;
|
|
unsigned char prefix_flags;
|
|
unsigned char prefix_pad3;
|
|
};
|
|
|
|
enum
|
|
{
|
|
PREFIX_UNSPEC,
|
|
PREFIX_ADDRESS,
|
|
PREFIX_CACHEINFO,
|
|
__PREFIX_MAX
|
|
};
|
|
|
|
#define PREFIX_MAX (__PREFIX_MAX - 1)
|
|
|
|
struct prefix_cacheinfo {
|
|
__u32 preferred_time;
|
|
__u32 valid_time;
|
|
};
|
|
|
|
|
|
/*****************************************************************
|
|
* Traffic control messages.
|
|
****/
|
|
|
|
struct tcmsg {
|
|
unsigned char tcm_family;
|
|
unsigned char tcm__pad1;
|
|
unsigned short tcm__pad2;
|
|
int tcm_ifindex;
|
|
__u32 tcm_handle;
|
|
__u32 tcm_parent;
|
|
__u32 tcm_info;
|
|
};
|
|
|
|
enum {
|
|
TCA_UNSPEC,
|
|
TCA_KIND,
|
|
TCA_OPTIONS,
|
|
TCA_STATS,
|
|
TCA_XSTATS,
|
|
TCA_RATE,
|
|
TCA_FCNT,
|
|
TCA_STATS2,
|
|
TCA_STAB,
|
|
__TCA_MAX
|
|
};
|
|
|
|
#define TCA_MAX (__TCA_MAX - 1)
|
|
|
|
#define TCA_RTA(r) ((struct rtattr*)(((char*)(r)) + NLMSG_ALIGN(sizeof(struct tcmsg))))
|
|
#define TCA_PAYLOAD(n) NLMSG_PAYLOAD(n,sizeof(struct tcmsg))
|
|
|
|
/********************************************************************
|
|
* Neighbor Discovery userland options
|
|
****/
|
|
|
|
struct nduseroptmsg {
|
|
unsigned char nduseropt_family;
|
|
unsigned char nduseropt_pad1;
|
|
unsigned short nduseropt_opts_len; /* Total length of options */
|
|
int nduseropt_ifindex;
|
|
__u8 nduseropt_icmp_type;
|
|
__u8 nduseropt_icmp_code;
|
|
unsigned short nduseropt_pad2;
|
|
unsigned int nduseropt_pad3;
|
|
/* Followed by one or more ND options */
|
|
};
|
|
|
|
enum {
|
|
NDUSEROPT_UNSPEC,
|
|
NDUSEROPT_SRCADDR,
|
|
__NDUSEROPT_MAX
|
|
};
|
|
|
|
#define NDUSEROPT_MAX (__NDUSEROPT_MAX - 1)
|
|
|
|
#ifndef __KERNEL__
|
|
/* RTnetlink multicast groups - backwards compatibility for userspace */
|
|
#define RTMGRP_LINK 1
|
|
#define RTMGRP_NOTIFY 2
|
|
#define RTMGRP_NEIGH 4
|
|
#define RTMGRP_TC 8
|
|
|
|
#define RTMGRP_IPV4_IFADDR 0x10
|
|
#define RTMGRP_IPV4_MROUTE 0x20
|
|
#define RTMGRP_IPV4_ROUTE 0x40
|
|
#define RTMGRP_IPV4_RULE 0x80
|
|
|
|
#define RTMGRP_IPV6_IFADDR 0x100
|
|
#define RTMGRP_IPV6_MROUTE 0x200
|
|
#define RTMGRP_IPV6_ROUTE 0x400
|
|
#define RTMGRP_IPV6_IFINFO 0x800
|
|
|
|
#define RTMGRP_DECnet_IFADDR 0x1000
|
|
#define RTMGRP_DECnet_ROUTE 0x4000
|
|
|
|
#define RTMGRP_IPV6_PREFIX 0x20000
|
|
#endif
|
|
|
|
/* RTnetlink multicast groups */
|
|
enum rtnetlink_groups {
|
|
RTNLGRP_NONE,
|
|
#define RTNLGRP_NONE RTNLGRP_NONE
|
|
RTNLGRP_LINK,
|
|
#define RTNLGRP_LINK RTNLGRP_LINK
|
|
RTNLGRP_NOTIFY,
|
|
#define RTNLGRP_NOTIFY RTNLGRP_NOTIFY
|
|
RTNLGRP_NEIGH,
|
|
#define RTNLGRP_NEIGH RTNLGRP_NEIGH
|
|
RTNLGRP_TC,
|
|
#define RTNLGRP_TC RTNLGRP_TC
|
|
RTNLGRP_IPV4_IFADDR,
|
|
#define RTNLGRP_IPV4_IFADDR RTNLGRP_IPV4_IFADDR
|
|
RTNLGRP_IPV4_MROUTE,
|
|
#define RTNLGRP_IPV4_MROUTE RTNLGRP_IPV4_MROUTE
|
|
RTNLGRP_IPV4_ROUTE,
|
|
#define RTNLGRP_IPV4_ROUTE RTNLGRP_IPV4_ROUTE
|
|
RTNLGRP_IPV4_RULE,
|
|
#define RTNLGRP_IPV4_RULE RTNLGRP_IPV4_RULE
|
|
RTNLGRP_IPV6_IFADDR,
|
|
#define RTNLGRP_IPV6_IFADDR RTNLGRP_IPV6_IFADDR
|
|
RTNLGRP_IPV6_MROUTE,
|
|
#define RTNLGRP_IPV6_MROUTE RTNLGRP_IPV6_MROUTE
|
|
RTNLGRP_IPV6_ROUTE,
|
|
#define RTNLGRP_IPV6_ROUTE RTNLGRP_IPV6_ROUTE
|
|
RTNLGRP_IPV6_IFINFO,
|
|
#define RTNLGRP_IPV6_IFINFO RTNLGRP_IPV6_IFINFO
|
|
RTNLGRP_DECnet_IFADDR,
|
|
#define RTNLGRP_DECnet_IFADDR RTNLGRP_DECnet_IFADDR
|
|
RTNLGRP_NOP2,
|
|
RTNLGRP_DECnet_ROUTE,
|
|
#define RTNLGRP_DECnet_ROUTE RTNLGRP_DECnet_ROUTE
|
|
RTNLGRP_DECnet_RULE,
|
|
#define RTNLGRP_DECnet_RULE RTNLGRP_DECnet_RULE
|
|
RTNLGRP_NOP4,
|
|
RTNLGRP_IPV6_PREFIX,
|
|
#define RTNLGRP_IPV6_PREFIX RTNLGRP_IPV6_PREFIX
|
|
RTNLGRP_IPV6_RULE,
|
|
#define RTNLGRP_IPV6_RULE RTNLGRP_IPV6_RULE
|
|
RTNLGRP_ND_USEROPT,
|
|
#define RTNLGRP_ND_USEROPT RTNLGRP_ND_USEROPT
|
|
RTNLGRP_PHONET_IFADDR,
|
|
#define RTNLGRP_PHONET_IFADDR RTNLGRP_PHONET_IFADDR
|
|
RTNLGRP_PHONET_ROUTE,
|
|
#define RTNLGRP_PHONET_ROUTE RTNLGRP_PHONET_ROUTE
|
|
RTNLGRP_DCB,
|
|
#define RTNLGRP_DCB RTNLGRP_DCB
|
|
__RTNLGRP_MAX
|
|
};
|
|
#define RTNLGRP_MAX (__RTNLGRP_MAX - 1)
|
|
|
|
/* TC action piece */
|
|
struct tcamsg {
|
|
unsigned char tca_family;
|
|
unsigned char tca__pad1;
|
|
unsigned short tca__pad2;
|
|
};
|
|
#define TA_RTA(r) ((struct rtattr*)(((char*)(r)) + NLMSG_ALIGN(sizeof(struct tcamsg))))
|
|
#define TA_PAYLOAD(n) NLMSG_PAYLOAD(n,sizeof(struct tcamsg))
|
|
#define TCA_ACT_TAB 1 /* attr type must be >=1 */
|
|
#define TCAA_MAX 1
|
|
|
|
/* New extended info filters for IFLA_EXT_MASK */
|
|
#define RTEXT_FILTER_VF (1 << 0)
|
|
|
|
/* End of information exported to user level */
|
|
|
|
#ifdef __KERNEL__
|
|
|
|
#include <linux/mutex.h>
|
|
#include <linux/netdevice.h>
|
|
|
|
static __inline__ int rtattr_strcmp(const struct rtattr *rta, const char *str)
|
|
{
|
|
int len = strlen(str) + 1;
|
|
return len > rta->rta_len || memcmp(RTA_DATA(rta), str, len);
|
|
}
|
|
|
|
extern int rtnetlink_send(struct sk_buff *skb, struct net *net, u32 pid, u32 group, int echo);
|
|
extern int rtnl_unicast(struct sk_buff *skb, struct net *net, u32 pid);
|
|
extern void rtnl_notify(struct sk_buff *skb, struct net *net, u32 pid,
|
|
u32 group, struct nlmsghdr *nlh, gfp_t flags);
|
|
extern void rtnl_set_sk_err(struct net *net, u32 group, int error);
|
|
extern int rtnetlink_put_metrics(struct sk_buff *skb, u32 *metrics);
|
|
extern int rtnl_put_cacheinfo(struct sk_buff *skb, struct dst_entry *dst,
|
|
u32 id, u32 ts, u32 tsage, long expires,
|
|
u32 error);
|
|
|
|
extern void __rta_fill(struct sk_buff *skb, int attrtype, int attrlen, const void *data);
|
|
|
|
#define RTA_PUT(skb, attrtype, attrlen, data) \
|
|
({ if (unlikely(skb_tailroom(skb) < (int)RTA_SPACE(attrlen))) \
|
|
goto rtattr_failure; \
|
|
__rta_fill(skb, attrtype, attrlen, data); })
|
|
|
|
#define RTA_APPEND(skb, attrlen, data) \
|
|
({ if (unlikely(skb_tailroom(skb) < (int)(attrlen))) \
|
|
goto rtattr_failure; \
|
|
memcpy(skb_put(skb, attrlen), data, attrlen); })
|
|
|
|
#define RTA_PUT_NOHDR(skb, attrlen, data) \
|
|
({ RTA_APPEND(skb, RTA_ALIGN(attrlen), data); \
|
|
memset(skb_tail_pointer(skb) - (RTA_ALIGN(attrlen) - attrlen), 0, \
|
|
RTA_ALIGN(attrlen) - attrlen); })
|
|
|
|
#define RTA_PUT_U8(skb, attrtype, value) \
|
|
({ u8 _tmp = (value); \
|
|
RTA_PUT(skb, attrtype, sizeof(u8), &_tmp); })
|
|
|
|
#define RTA_PUT_U16(skb, attrtype, value) \
|
|
({ u16 _tmp = (value); \
|
|
RTA_PUT(skb, attrtype, sizeof(u16), &_tmp); })
|
|
|
|
#define RTA_PUT_U32(skb, attrtype, value) \
|
|
({ u32 _tmp = (value); \
|
|
RTA_PUT(skb, attrtype, sizeof(u32), &_tmp); })
|
|
|
|
#define RTA_PUT_U64(skb, attrtype, value) \
|
|
({ u64 _tmp = (value); \
|
|
RTA_PUT(skb, attrtype, sizeof(u64), &_tmp); })
|
|
|
|
#define RTA_PUT_SECS(skb, attrtype, value) \
|
|
RTA_PUT_U64(skb, attrtype, (value) / HZ)
|
|
|
|
#define RTA_PUT_MSECS(skb, attrtype, value) \
|
|
RTA_PUT_U64(skb, attrtype, jiffies_to_msecs(value))
|
|
|
|
#define RTA_PUT_STRING(skb, attrtype, value) \
|
|
RTA_PUT(skb, attrtype, strlen(value) + 1, value)
|
|
|
|
#define RTA_PUT_FLAG(skb, attrtype) \
|
|
RTA_PUT(skb, attrtype, 0, NULL);
|
|
|
|
#define RTA_NEST(skb, type) \
|
|
({ struct rtattr *__start = (struct rtattr *)skb_tail_pointer(skb); \
|
|
RTA_PUT(skb, type, 0, NULL); \
|
|
__start; })
|
|
|
|
#define RTA_NEST_END(skb, start) \
|
|
({ (start)->rta_len = skb_tail_pointer(skb) - (unsigned char *)(start); \
|
|
(skb)->len; })
|
|
|
|
#define RTA_NEST_COMPAT(skb, type, attrlen, data) \
|
|
({ struct rtattr *__start = (struct rtattr *)skb_tail_pointer(skb); \
|
|
RTA_PUT(skb, type, attrlen, data); \
|
|
RTA_NEST(skb, type); \
|
|
__start; })
|
|
|
|
#define RTA_NEST_COMPAT_END(skb, start) \
|
|
({ struct rtattr *__nest = (void *)(start) + NLMSG_ALIGN((start)->rta_len); \
|
|
(start)->rta_len = skb_tail_pointer(skb) - (unsigned char *)(start); \
|
|
RTA_NEST_END(skb, __nest); \
|
|
(skb)->len; })
|
|
|
|
#define RTA_NEST_CANCEL(skb, start) \
|
|
({ if (start) \
|
|
skb_trim(skb, (unsigned char *) (start) - (skb)->data); \
|
|
-1; })
|
|
|
|
#define RTA_GET_U8(rta) \
|
|
({ if (!rta || RTA_PAYLOAD(rta) < sizeof(u8)) \
|
|
goto rtattr_failure; \
|
|
*(u8 *) RTA_DATA(rta); })
|
|
|
|
#define RTA_GET_U16(rta) \
|
|
({ if (!rta || RTA_PAYLOAD(rta) < sizeof(u16)) \
|
|
goto rtattr_failure; \
|
|
*(u16 *) RTA_DATA(rta); })
|
|
|
|
#define RTA_GET_U32(rta) \
|
|
({ if (!rta || RTA_PAYLOAD(rta) < sizeof(u32)) \
|
|
goto rtattr_failure; \
|
|
*(u32 *) RTA_DATA(rta); })
|
|
|
|
#define RTA_GET_U64(rta) \
|
|
({ u64 _tmp; \
|
|
if (!rta || RTA_PAYLOAD(rta) < sizeof(u64)) \
|
|
goto rtattr_failure; \
|
|
memcpy(&_tmp, RTA_DATA(rta), sizeof(_tmp)); \
|
|
_tmp; })
|
|
|
|
#define RTA_GET_FLAG(rta) (!!(rta))
|
|
|
|
#define RTA_GET_SECS(rta) ((unsigned long) RTA_GET_U64(rta) * HZ)
|
|
#define RTA_GET_MSECS(rta) (msecs_to_jiffies((unsigned long) RTA_GET_U64(rta)))
|
|
|
|
static inline struct rtattr *
|
|
__rta_reserve(struct sk_buff *skb, int attrtype, int attrlen)
|
|
{
|
|
struct rtattr *rta;
|
|
int size = RTA_LENGTH(attrlen);
|
|
|
|
rta = (struct rtattr*)skb_put(skb, RTA_ALIGN(size));
|
|
rta->rta_type = attrtype;
|
|
rta->rta_len = size;
|
|
memset(RTA_DATA(rta) + attrlen, 0, RTA_ALIGN(size) - size);
|
|
return rta;
|
|
}
|
|
|
|
#define __RTA_PUT(skb, attrtype, attrlen) \
|
|
({ if (unlikely(skb_tailroom(skb) < (int)RTA_SPACE(attrlen))) \
|
|
goto rtattr_failure; \
|
|
__rta_reserve(skb, attrtype, attrlen); })
|
|
|
|
extern void rtmsg_ifinfo(int type, struct net_device *dev, unsigned change);
|
|
|
|
/* RTNL is used as a global lock for all changes to network configuration */
|
|
extern void rtnl_lock(void);
|
|
extern void rtnl_unlock(void);
|
|
extern int rtnl_trylock(void);
|
|
extern int rtnl_is_locked(void);
|
|
#ifdef CONFIG_PROVE_LOCKING
|
|
extern int lockdep_rtnl_is_held(void);
|
|
#endif /* #ifdef CONFIG_PROVE_LOCKING */
|
|
|
|
/**
|
|
* rcu_dereference_rtnl - rcu_dereference with debug checking
|
|
* @p: The pointer to read, prior to dereferencing
|
|
*
|
|
* Do an rcu_dereference(p), but check caller either holds rcu_read_lock()
|
|
* or RTNL. Note : Please prefer rtnl_dereference() or rcu_dereference()
|
|
*/
|
|
#define rcu_dereference_rtnl(p) \
|
|
rcu_dereference_check(p, lockdep_rtnl_is_held())
|
|
|
|
/**
|
|
* rtnl_dereference - fetch RCU pointer when updates are prevented by RTNL
|
|
* @p: The pointer to read, prior to dereferencing
|
|
*
|
|
* Return the value of the specified RCU-protected pointer, but omit
|
|
* both the smp_read_barrier_depends() and the ACCESS_ONCE(), because
|
|
* caller holds RTNL.
|
|
*/
|
|
#define rtnl_dereference(p) \
|
|
rcu_dereference_protected(p, lockdep_rtnl_is_held())
|
|
|
|
static inline struct netdev_queue *dev_ingress_queue(struct net_device *dev)
|
|
{
|
|
return rtnl_dereference(dev->ingress_queue);
|
|
}
|
|
|
|
extern struct netdev_queue *dev_ingress_queue_create(struct net_device *dev);
|
|
|
|
extern void rtnetlink_init(void);
|
|
extern void __rtnl_unlock(void);
|
|
|
|
#define ASSERT_RTNL() do { \
|
|
if (unlikely(!rtnl_is_locked())) { \
|
|
printk(KERN_ERR "RTNL: assertion failed at %s (%d)\n", \
|
|
__FILE__, __LINE__); \
|
|
dump_stack(); \
|
|
} \
|
|
} while(0)
|
|
|
|
static inline u32 rtm_get_table(struct rtattr **rta, u8 table)
|
|
{
|
|
return RTA_GET_U32(rta[RTA_TABLE-1]);
|
|
rtattr_failure:
|
|
return table;
|
|
}
|
|
|
|
extern int ndo_dflt_fdb_dump(struct sk_buff *skb,
|
|
struct netlink_callback *cb,
|
|
struct net_device *dev,
|
|
int idx);
|
|
#endif /* __KERNEL__ */
|
|
|
|
|
|
#endif /* __LINUX_RTNETLINK_H */
|