Skip site navigation (1)Skip section navigation (2)
Date:      Fri, 9 Oct 2020 12:06:43 +0000 (UTC)
From:      Richard Scheffenegger <rscheff@FreeBSD.org>
To:        src-committers@freebsd.org, svn-src-all@freebsd.org, svn-src-head@freebsd.org
Subject:   svn commit: r366569 - in head/sys: net netinet netinet6
Message-ID:  <202010091206.099C6hPe025004@repo.freebsd.org>

next in thread | raw e-mail | index | archive | help
Author: rscheff
Date: Fri Oct  9 12:06:43 2020
New Revision: 366569
URL: https://svnweb.freebsd.org/changeset/base/366569

Log:
  Add IP(V6)_VLAN_PCP to set 802.1 priority per-flow.
  
  This adds a new IP_PROTO / IPV6_PROTO setsockopt (getsockopt)
  option IP(V6)_VLAN_PCP, which can be set to -1 (interface
  default), or explicitly to any priority between 0 and 7.
  
  Note that for untagged traffic, explicitly adding a
  priority will insert a special 801.1Q vlan header with
  vlan ID = 0 to carry the priority setting
  
  Reviewed by:	gallatin, rrs
  MFC after:	2 weeks
  Sponsored by:	NetApp, Inc.
  Differential Revision:	https://reviews.freebsd.org/D26409

Modified:
  head/sys/net/if_ethersubr.c
  head/sys/netinet/in.h
  head/sys/netinet/in_pcb.h
  head/sys/netinet/ip_output.c
  head/sys/netinet6/in6.h
  head/sys/netinet6/ip6_output.c

Modified: head/sys/net/if_ethersubr.c
==============================================================================
--- head/sys/net/if_ethersubr.c	Fri Oct  9 11:24:19 2020	(r366568)
+++ head/sys/net/if_ethersubr.c	Fri Oct  9 12:06:43 2020	(r366569)
@@ -1388,6 +1388,13 @@ ether_8021q_frame(struct mbuf **mp, struct ifnet *ife,
 	}
 
 	/*
+	 * If PCP is set in mbuf, use it
+	 */
+	if ((*mp)->m_flags & M_VLANTAG) {
+		pcp = EVL_PRIOFTAG((*mp)->m_pkthdr.ether_vtag);
+	}
+
+	/*
 	 * If underlying interface can do VLAN tag insertion itself,
 	 * just pass the packet along. However, we need some way to
 	 * tell the interface where the packet came from so that it

Modified: head/sys/netinet/in.h
==============================================================================
--- head/sys/netinet/in.h	Fri Oct  9 11:24:19 2020	(r366568)
+++ head/sys/netinet/in.h	Fri Oct  9 12:06:43 2020	(r366569)
@@ -483,6 +483,10 @@ __END_DECLS
 /* The following option is private; do not use it from user applications. */
 #define	IP_MSFILTER			74   /* set/get filter list */
 
+/* The following option deals with the 802.1Q Ethernet Priority Code Point */
+#define	IP_VLAN_PCP		75   /* int; set/get PCP used for packet, */
+				     /*      -1 use interface default */
+
 /* Protocol Independent Multicast API [RFC3678] */
 #define	MCAST_JOIN_GROUP		80   /* join an any-source group */
 #define	MCAST_LEAVE_GROUP		81   /* leave all sources for group */

Modified: head/sys/netinet/in_pcb.h
==============================================================================
--- head/sys/netinet/in_pcb.h	Fri Oct  9 11:24:19 2020	(r366568)
+++ head/sys/netinet/in_pcb.h	Fri Oct  9 12:06:43 2020	(r366569)
@@ -748,6 +748,13 @@ int	inp_so_options(const struct inpcb *inp);
 #define INP_SUPPORTS_MBUFQ	0x00004000 /* Supports the mbuf queue method of LRO */
 #define INP_MBUF_QUEUE_READY	0x00008000 /* The transport is pacing, inputs can be queued */
 #define INP_DONT_SACK_QUEUE	0x00010000 /* If a sack arrives do not wake me */
+#define INP_2PCP_SET		0x00020000 /* If the Eth PCP should be set explicitly */
+#define INP_2PCP_BIT0		0x00040000 /* Eth PCP Bit 0 */
+#define INP_2PCP_BIT1		0x00080000 /* Eth PCP Bit 1 */
+#define INP_2PCP_BIT2		0x00100000 /* Eth PCP Bit 2 */
+#define INP_2PCP_BASE	INP_2PCP_BIT0
+#define INP_2PCP_MASK	(INP_2PCP_BIT0 | INP_2PCP_BIT1 | INP_2PCP_BIT2)
+#define INP_2PCP_SHIFT		18         /* shift PCP field in/out of inp_flags2 */
 /*
  * Flags passed to in_pcblookup*() functions.
  */

Modified: head/sys/netinet/ip_output.c
==============================================================================
--- head/sys/netinet/ip_output.c	Fri Oct  9 11:24:19 2020	(r366568)
+++ head/sys/netinet/ip_output.c	Fri Oct  9 12:06:43 2020	(r366569)
@@ -62,7 +62,9 @@ __FBSDID("$FreeBSD$");
 
 #include <net/if.h>
 #include <net/if_var.h>
+#include <net/if_vlan_var.h>
 #include <net/if_llatbl.h>
+#include <net/ethernet.h>
 #include <net/netisr.h>
 #include <net/pfil.h>
 #include <net/route.h>
@@ -324,6 +326,7 @@ ip_output(struct mbuf *m, struct mbuf *opt, struct rou
 	int hlen = sizeof (struct ip);
 	int mtu = 0;
 	int error = 0;
+	int vlan_pcp = -1;
 	struct sockaddr_in *dst, sin;
 	const struct sockaddr_in *gw;
 	struct in_ifaddr *ia = NULL;
@@ -345,6 +348,9 @@ ip_output(struct mbuf *m, struct mbuf *opt, struct rou
 			m->m_pkthdr.flowid = inp->inp_flowid;
 			M_HASHTYPE_SET(m, inp->inp_flowtype);
 		}
+		if ((inp->inp_flags2 & INP_2PCP_SET) != 0)
+			vlan_pcp = (inp->inp_flags2 & INP_2PCP_MASK) >>
+			    INP_2PCP_SHIFT;
 #ifdef NUMA
 		m->m_pkthdr.numa_domain = inp->inp_numa_domain;
 #endif
@@ -717,6 +723,9 @@ sendit:
 		}
 	}
 
+	if (vlan_pcp > -1)
+		EVL_APPLY_PRI(m, vlan_pcp);
+
 	/* IN_LOOPBACK must not appear on the wire - RFC1122. */
 	if (IN_LOOPBACK(ntohl(ip->ip_dst.s_addr)) ||
 	    IN_LOOPBACK(ntohl(ip->ip_src.s_addr))) {
@@ -1210,6 +1219,7 @@ ip_ctloutput(struct socket *so, struct sockopt *sopt)
 #ifdef	RSS
 		case IP_RECVRSSBUCKETID:
 #endif
+		case IP_VLAN_PCP:
 			error = sooptcopyin(sopt, &optval, sizeof optval,
 					    sizeof optval);
 			if (error)
@@ -1305,6 +1315,28 @@ ip_ctloutput(struct socket *so, struct sockopt *sopt)
 				OPTSET2(INP_RECVRSSBUCKETID, optval);
 				break;
 #endif
+			case IP_VLAN_PCP:
+				if ((optval >= -1) && (optval <=
+				    (INP_2PCP_MASK >> INP_2PCP_SHIFT))) {
+					if (optval == -1) {
+						INP_WLOCK(inp);
+						inp->inp_flags2 &=
+						    ~(INP_2PCP_SET |
+						      INP_2PCP_MASK);
+						INP_WUNLOCK(inp);
+					} else {
+						INP_WLOCK(inp);
+						inp->inp_flags2 |=
+						    INP_2PCP_SET;
+						inp->inp_flags2 &=
+						    ~INP_2PCP_MASK;
+						inp->inp_flags2 |=
+						    optval << INP_2PCP_SHIFT;
+						INP_WUNLOCK(inp);
+					}
+				} else
+					error = EINVAL;
+				break;
 			}
 			break;
 #undef OPTSET
@@ -1425,6 +1457,7 @@ ip_ctloutput(struct socket *so, struct sockopt *sopt)
 		case IP_RSSBUCKETID:
 		case IP_RECVRSSBUCKETID:
 #endif
+		case IP_VLAN_PCP:
 			switch (sopt->sopt_name) {
 			case IP_TOS:
 				optval = inp->inp_ip_tos;
@@ -1511,6 +1544,14 @@ ip_ctloutput(struct socket *so, struct sockopt *sopt)
 #endif
 			case IP_BINDMULTI:
 				optval = OPTBIT2(INP_BINDMULTI);
+				break;
+			case IP_VLAN_PCP:
+				if (OPTBIT2(INP_2PCP_SET)) {
+					optval = (inp->inp_flags2 &
+					    INP_2PCP_MASK) >> INP_2PCP_SHIFT;
+				} else {
+					optval = -1;
+				}
 				break;
 			}
 			error = sooptcopyout(sopt, &optval, sizeof optval);

Modified: head/sys/netinet6/in6.h
==============================================================================
--- head/sys/netinet6/in6.h	Fri Oct  9 11:24:19 2020	(r366568)
+++ head/sys/netinet6/in6.h	Fri Oct  9 12:06:43 2020	(r366569)
@@ -511,6 +511,10 @@ struct route_in6 {
 				    * set/get multicast source filter list.
 				    */
 
+/* The following option deals with the 802.1Q Ethernet Priority Code Point */
+#define	IPV6_VLAN_PCP		75  /* int; set/get PCP used for packet, */
+				    /*      -1 use interface default */
+
 /* to define items, should talk with KAME guys first, for *BSD compatibility */
 
 #define IPV6_RTHDR_LOOSE     0 /* this hop need not be a neighbor. XXX old spec */

Modified: head/sys/netinet6/ip6_output.c
==============================================================================
--- head/sys/netinet6/ip6_output.c	Fri Oct  9 11:24:19 2020	(r366568)
+++ head/sys/netinet6/ip6_output.c	Fri Oct  9 12:06:43 2020	(r366569)
@@ -92,7 +92,9 @@ __FBSDID("$FreeBSD$");
 
 #include <net/if.h>
 #include <net/if_var.h>
+#include <net/if_vlan_var.h>
 #include <net/if_llatbl.h>
+#include <net/ethernet.h>
 #include <net/netisr.h>
 #include <net/route.h>
 #include <net/route/nhop.h>
@@ -436,6 +438,7 @@ ip6_output(struct mbuf *m0, struct ip6_pktopts *opt,
 	u_char *nexthdrp;
 	int tlen, len;
 	int error = 0;
+	int vlan_pcp = -1;
 	struct in6_ifaddr *ia = NULL;
 	u_long mtu;
 	int alwaysfrag, dontfrag;
@@ -460,6 +463,9 @@ ip6_output(struct mbuf *m0, struct ip6_pktopts *opt,
 			m->m_pkthdr.flowid = inp->inp_flowid;
 			M_HASHTYPE_SET(m, inp->inp_flowtype);
 		}
+		if ((inp->inp_flags2 & INP_2PCP_SET) != 0)
+			vlan_pcp = (inp->inp_flags2 & INP_2PCP_MASK) >>
+			    INP_2PCP_SHIFT;
 #ifdef NUMA
 		m->m_pkthdr.numa_domain = inp->inp_numa_domain;
 #endif
@@ -1098,6 +1104,8 @@ nonh6lookup:
 	}
 
 passout:
+	if (vlan_pcp > -1)
+		EVL_APPLY_PRI(m, vlan_pcp);
 	/*
 	 * Send the packet to the outgoing interface.
 	 * If necessary, do IPv6 fragmentation before sending.
@@ -1265,6 +1273,8 @@ sendorfree:
 				counter_u64_add(ia->ia_ifa.ifa_obytes,
 				    m->m_pkthdr.len);
 			}
+			if (vlan_pcp > -1)
+				EVL_APPLY_PRI(m, vlan_pcp);
 			error = ip6_output_send(inp, ifp, origifp, m, dst, ro,
 			    true);
 		} else
@@ -1752,6 +1762,7 @@ ip6_ctloutput(struct socket *so, struct sockopt *sopt)
 #ifdef	RSS
 			case IPV6_RSS_LISTEN_BUCKET:
 #endif
+			case IPV6_VLAN_PCP:
 				if (optname == IPV6_BINDANY && td != NULL) {
 					error = priv_check(td,
 					    PRIV_NETINET_BINDANY);
@@ -1945,6 +1956,29 @@ do {									\
 					}
 					break;
 #endif
+				case IPV6_VLAN_PCP:
+					if ((optval >= -1) && (optval <=
+					    (INP_2PCP_MASK >> INP_2PCP_SHIFT))) {
+						if (optval == -1) {
+							INP_WLOCK(inp);
+							inp->inp_flags2 &=
+							    ~(INP_2PCP_SET |
+							    INP_2PCP_MASK);
+							INP_WUNLOCK(inp);
+						} else {
+							INP_WLOCK(inp);
+							inp->inp_flags2 |=
+							    INP_2PCP_SET;
+							inp->inp_flags2 &=
+							    ~INP_2PCP_MASK;
+							inp->inp_flags2 |=
+							    optval <<
+							    INP_2PCP_SHIFT;
+							INP_WUNLOCK(inp);
+						}
+					} else
+						error = EINVAL;
+					break;
 				}
 				break;
 
@@ -2168,6 +2202,7 @@ do {									\
 			case IPV6_RECVRSSBUCKETID:
 #endif
 			case IPV6_BINDMULTI:
+			case IPV6_VLAN_PCP:
 				switch (optname) {
 				case IPV6_RECVHOPOPTS:
 					optval = OPTBIT(IN6P_HOPOPTS);
@@ -2264,7 +2299,18 @@ do {									\
 				case IPV6_BINDMULTI:
 					optval = OPTBIT2(INP_BINDMULTI);
 					break;
+
+				case IPV6_VLAN_PCP:
+					if (OPTBIT2(INP_2PCP_SET)) {
+						optval = (inp->inp_flags2 &
+							    INP_2PCP_MASK) >>
+							    INP_2PCP_SHIFT;
+					} else {
+						optval = -1;
+					}
+					break;
 				}
+
 				if (error)
 					break;
 				error = sooptcopyout(sopt, &optval,



Want to link to this message? Use this URL: <https://mail-archive.FreeBSD.org/cgi/mid.cgi?202010091206.099C6hPe025004>