linma / rpms / iproute

Forked from rpms/iproute 4 years ago
Clone

Blame SOURCES/0043-tc-f_flower-add-geneve-option-match-support-to-flowe.patch

930fb9
From 9dd748cd49d15b7e90a7a65de53d431a2c515c86 Mon Sep 17 00:00:00 2001
930fb9
From: Phil Sutter <psutter@redhat.com>
930fb9
Date: Thu, 31 Jan 2019 17:13:07 +0100
930fb9
Subject: [PATCH] tc: f_flower: add geneve option match support to flower
930fb9
930fb9
Bugzilla: https://bugzilla.redhat.com/show_bug.cgi?id=1654761
930fb9
Upstream Status: iproute2.git commit 56155d4df86d4
930fb9
930fb9
commit 56155d4df86d489c4207444c8a90ce4e0e22e49f
930fb9
Author: Pieter Jansen van Vuuren <pieter.jansenvanvuuren@netronome.com>
930fb9
Date:   Fri Sep 28 16:03:39 2018 +0200
930fb9
930fb9
    tc: f_flower: add geneve option match support to flower
930fb9
930fb9
    Allow matching on options in Geneve tunnel headers.
930fb9
930fb9
    The options can be described in the form
930fb9
    CLASS:TYPE:DATA/CLASS_MASK:TYPE_MASK:DATA_MASK, where CLASS is
930fb9
    represented as a 16bit hexadecimal value, TYPE as an 8bit
930fb9
    hexadecimal value and DATA as a variable length hexadecimal value.
930fb9
930fb9
    e.g.
930fb9
     # ip link add name geneve0 type geneve dstport 0 external
930fb9
     # tc qdisc add dev geneve0 ingress
930fb9
     # tc filter add dev geneve0 protocol ip parent ffff: \
930fb9
         flower \
930fb9
           enc_src_ip 10.0.99.192 \
930fb9
           enc_dst_ip 10.0.99.193 \
930fb9
           enc_key_id 11 \
930fb9
           geneve_opts 0102:80:1122334421314151/ffff:ff:ffffffffffffffff \
930fb9
           ip_proto udp \
930fb9
           action mirred egress redirect dev eth1
930fb9
930fb9
    Signed-off-by: Pieter Jansen van Vuuren <pieter.jansenvanvuuren@netronome.com>
930fb9
    Signed-off-by: Simon Horman <simon.horman@netronome.com>
930fb9
    Signed-off-by: David Ahern <dsahern@gmail.com>
930fb9
---
930fb9
 man/man8/tc-flower.8 |  13 ++-
930fb9
 tc/f_flower.c        | 282 +++++++++++++++++++++++++++++++++++++++++++++++++++
930fb9
 2 files changed, 294 insertions(+), 1 deletion(-)
930fb9
930fb9
diff --git a/man/man8/tc-flower.8 b/man/man8/tc-flower.8
930fb9
index f917f24..276b527 100644
930fb9
--- a/man/man8/tc-flower.8
930fb9
+++ b/man/man8/tc-flower.8
930fb9
@@ -74,6 +74,8 @@ flower \- flow based traffic control filter
930fb9
 .IR TOS " | "
930fb9
 .B enc_ttl
930fb9
 .IR TTL " | "
930fb9
+.B geneve_opts
930fb9
+.IR OPTIONS " | "
930fb9
 .BR ip_flags
930fb9
 .IR IP_FLAGS
930fb9
 .SH DESCRIPTION
930fb9
@@ -260,6 +262,8 @@ bits is assumed.
930fb9
 .BI enc_tos " NUMBER"
930fb9
 .TQ
930fb9
 .BI enc_ttl " NUMBER"
930fb9
+.TQ
930fb9
+.BI geneve_opts " OPTIONS"
930fb9
 Match on IP tunnel metadata. Key id
930fb9
 .I NUMBER
930fb9
 is a 32 bit tunnel key id (e.g. VNI for VXLAN tunnel).
930fb9
@@ -272,7 +276,14 @@ is a 16 bit UDP dst port. Tos
930fb9
 .I NUMBER
930fb9
 is an 8 bit tos (dscp+ecn) value, ttl
930fb9
 .I NUMBER
930fb9
-is an 8 bit time-to-live value.
930fb9
+is an 8 bit time-to-live value. geneve_opts
930fb9
+.I OPTIONS
930fb9
+must be a valid list of comma-separated geneve options where each option
930fb9
+consists of a key optionally followed by a slash and corresponding mask. If
930fb9
+the masks is missing, \fBtc\fR assumes a full-length match. The options can
930fb9
+be described in the form CLASS:TYPE:DATA/CLASS_MASK:TYPE_MASK:DATA_MASK,
930fb9
+where CLASS is represented as a 16bit hexadecimal value, TYPE as an 8bit
930fb9
+hexadecimal value and DATA as a variable length hexadecimal value.
930fb9
 .TP
930fb9
 .BI ip_flags " IP_FLAGS"
930fb9
 .I IP_FLAGS
930fb9
diff --git a/tc/f_flower.c b/tc/f_flower.c
930fb9
index cd102f2..43102c8 100644
930fb9
--- a/tc/f_flower.c
930fb9
+++ b/tc/f_flower.c
930fb9
@@ -76,6 +76,7 @@ static void explain(void)
930fb9
 		"                       enc_key_id [ KEY-ID ] |\n"
930fb9
 		"                       enc_tos MASKED-IP_TOS |\n"
930fb9
 		"                       enc_ttl MASKED-IP_TTL |\n"
930fb9
+		"                       geneve_opts MASKED-OPTIONS |\n"
930fb9
 		"                       ip_flags IP-FLAGS | \n"
930fb9
 		"                       enc_dst_port [ port_number ] }\n"
930fb9
 		"       FILTERID := X:Y:Z\n"
930fb9
@@ -580,6 +581,179 @@ static int flower_parse_enc_port(char *str, int type, struct nlmsghdr *n)
930fb9
 	return 0;
930fb9
 }
930fb9
 
930fb9
+static int flower_parse_geneve_opts(char *str, struct nlmsghdr *n)
930fb9
+{
930fb9
+	struct rtattr *nest;
930fb9
+	char *token;
930fb9
+	int i, err;
930fb9
+
930fb9
+	nest = addattr_nest(n, MAX_MSG, TCA_FLOWER_KEY_ENC_OPTS_GENEVE);
930fb9
+
930fb9
+	i = 1;
930fb9
+	token = strsep(&str, ":");
930fb9
+	while (token) {
930fb9
+		switch (i) {
930fb9
+		case TCA_FLOWER_KEY_ENC_OPT_GENEVE_CLASS:
930fb9
+		{
930fb9
+			__be16 opt_class;
930fb9
+
930fb9
+			if (!strlen(token))
930fb9
+				break;
930fb9
+			err = get_be16(&opt_class, token, 16);
930fb9
+			if (err)
930fb9
+				return err;
930fb9
+
930fb9
+			addattr16(n, MAX_MSG, i, opt_class);
930fb9
+			break;
930fb9
+		}
930fb9
+		case TCA_FLOWER_KEY_ENC_OPT_GENEVE_TYPE:
930fb9
+		{
930fb9
+			__u8 opt_type;
930fb9
+
930fb9
+			if (!strlen(token))
930fb9
+				break;
930fb9
+			err = get_u8(&opt_type, token, 16);
930fb9
+			if (err)
930fb9
+				return err;
930fb9
+
930fb9
+			addattr8(n, MAX_MSG, i, opt_type);
930fb9
+			break;
930fb9
+		}
930fb9
+		case TCA_FLOWER_KEY_ENC_OPT_GENEVE_DATA:
930fb9
+		{
930fb9
+			size_t token_len = strlen(token);
930fb9
+			__u8 *opts;
930fb9
+
930fb9
+			if (!token_len)
930fb9
+				break;
930fb9
+			opts = malloc(token_len / 2);
930fb9
+			if (!opts)
930fb9
+				return -1;
930fb9
+			if (hex2mem(token, opts, token_len / 2) < 0) {
930fb9
+				free(opts);
930fb9
+				return -1;
930fb9
+			}
930fb9
+			addattr_l(n, MAX_MSG, i, opts, token_len / 2);
930fb9
+			free(opts);
930fb9
+
930fb9
+			break;
930fb9
+		}
930fb9
+		default:
930fb9
+			fprintf(stderr, "Unknown \"geneve_opts\" type\n");
930fb9
+			return -1;
930fb9
+		}
930fb9
+
930fb9
+		token = strsep(&str, ":");
930fb9
+		i++;
930fb9
+	}
930fb9
+	addattr_nest_end(n, nest);
930fb9
+
930fb9
+	return 0;
930fb9
+}
930fb9
+
930fb9
+static int flower_parse_enc_opt_part(char *str, struct nlmsghdr *n)
930fb9
+{
930fb9
+	char *token;
930fb9
+	int err;
930fb9
+
930fb9
+	token = strsep(&str, ",");
930fb9
+	while (token) {
930fb9
+		err = flower_parse_geneve_opts(token, n);
930fb9
+		if (err)
930fb9
+			return err;
930fb9
+
930fb9
+		token = strsep(&str, ",");
930fb9
+	}
930fb9
+
930fb9
+	return 0;
930fb9
+}
930fb9
+
930fb9
+static int flower_check_enc_opt_key(char *key)
930fb9
+{
930fb9
+	int key_len, col_cnt = 0;
930fb9
+
930fb9
+	key_len = strlen(key);
930fb9
+	while ((key = strchr(key, ':'))) {
930fb9
+		if (strlen(key) == key_len)
930fb9
+			return -1;
930fb9
+
930fb9
+		key_len = strlen(key) - 1;
930fb9
+		col_cnt++;
930fb9
+		key++;
930fb9
+	}
930fb9
+
930fb9
+	if (col_cnt != 2 || !key_len)
930fb9
+		return -1;
930fb9
+
930fb9
+	return 0;
930fb9
+}
930fb9
+
930fb9
+static int flower_parse_enc_opts(char *str, struct nlmsghdr *n)
930fb9
+{
930fb9
+	char key[XATTR_SIZE_MAX], mask[XATTR_SIZE_MAX];
930fb9
+	int data_len, key_len, mask_len, err;
930fb9
+	char *token, *slash;
930fb9
+	struct rtattr *nest;
930fb9
+
930fb9
+	key_len = 0;
930fb9
+	mask_len = 0;
930fb9
+	token = strsep(&str, ",");
930fb9
+	while (token) {
930fb9
+		slash = strchr(token, '/');
930fb9
+		if (slash)
930fb9
+			*slash = '\0';
930fb9
+
930fb9
+		if ((key_len + strlen(token) > XATTR_SIZE_MAX) ||
930fb9
+		    flower_check_enc_opt_key(token))
930fb9
+			return -1;
930fb9
+
930fb9
+		strcpy(&key[key_len], token);
930fb9
+		key_len += strlen(token) + 1;
930fb9
+		key[key_len - 1] = ',';
930fb9
+
930fb9
+		if (!slash) {
930fb9
+			/* Pad out mask when not provided */
930fb9
+			if (mask_len + strlen(token) > XATTR_SIZE_MAX)
930fb9
+				return -1;
930fb9
+
930fb9
+			data_len = strlen(rindex(token, ':'));
930fb9
+			sprintf(&mask[mask_len], "ffff:ff:");
930fb9
+			mask_len += 8;
930fb9
+			memset(&mask[mask_len], 'f', data_len - 1);
930fb9
+			mask_len += data_len;
930fb9
+			mask[mask_len - 1] = ',';
930fb9
+			token = strsep(&str, ",");
930fb9
+			continue;
930fb9
+		}
930fb9
+
930fb9
+		if (mask_len + strlen(slash + 1) > XATTR_SIZE_MAX)
930fb9
+			return -1;
930fb9
+
930fb9
+		strcpy(&mask[mask_len], slash + 1);
930fb9
+		mask_len += strlen(slash + 1) + 1;
930fb9
+		mask[mask_len - 1] = ',';
930fb9
+
930fb9
+		*slash = '/';
930fb9
+		token = strsep(&str, ",");
930fb9
+	}
930fb9
+	key[key_len - 1] = '\0';
930fb9
+	mask[mask_len - 1] = '\0';
930fb9
+
930fb9
+	nest = addattr_nest(n, MAX_MSG, TCA_FLOWER_KEY_ENC_OPTS);
930fb9
+	err = flower_parse_enc_opt_part(key, n);
930fb9
+	if (err)
930fb9
+		return err;
930fb9
+	addattr_nest_end(n, nest);
930fb9
+
930fb9
+	nest = addattr_nest(n, MAX_MSG, TCA_FLOWER_KEY_ENC_OPTS_MASK);
930fb9
+	err = flower_parse_enc_opt_part(mask, n);
930fb9
+	if (err)
930fb9
+		return err;
930fb9
+	addattr_nest_end(n, nest);
930fb9
+
930fb9
+	return 0;
930fb9
+}
930fb9
+
930fb9
 static int flower_parse_opt(struct filter_util *qu, char *handle,
930fb9
 			    int argc, char **argv, struct nlmsghdr *n)
930fb9
 {
930fb9
@@ -994,6 +1168,13 @@ static int flower_parse_opt(struct filter_util *qu, char *handle,
930fb9
 				fprintf(stderr, "Illegal \"enc_ttl\"\n");
930fb9
 				return -1;
930fb9
 			}
930fb9
+		} else if (matches(*argv, "geneve_opts") == 0) {
930fb9
+			NEXT_ARG();
930fb9
+			ret = flower_parse_enc_opts(*argv, n);
930fb9
+			if (ret < 0) {
930fb9
+				fprintf(stderr, "Illegal \"geneve_opts\"\n");
930fb9
+				return -1;
930fb9
+			}
930fb9
 		} else if (matches(*argv, "action") == 0) {
930fb9
 			NEXT_ARG();
930fb9
 			ret = parse_action(&argc, &argv, TCA_FLOWER_ACT, n);
930fb9
@@ -1291,6 +1472,105 @@ static void flower_print_key_id(const char *name, struct rtattr *attr)
930fb9
 	print_uint(PRINT_ANY, name, namefrm, rta_getattr_be32(attr));
930fb9
 }
930fb9
 
930fb9
+static void flower_print_geneve_opts(const char *name, struct rtattr *attr,
930fb9
+				     char *strbuf)
930fb9
+{
930fb9
+	struct rtattr *tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_MAX + 1];
930fb9
+	int ii, data_len, offset = 0, slen = 0;
930fb9
+	struct rtattr *i = RTA_DATA(attr);
930fb9
+	int rem = RTA_PAYLOAD(attr);
930fb9
+	__u8 type, data_r[rem];
930fb9
+	char data[rem * 2 + 1];
930fb9
+	__u16 class;
930fb9
+
930fb9
+	open_json_array(PRINT_JSON, name);
930fb9
+	while (rem) {
930fb9
+		parse_rtattr(tb, TCA_FLOWER_KEY_ENC_OPT_GENEVE_MAX, i, rem);
930fb9
+		class = rta_getattr_be16(tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_CLASS]);
930fb9
+		type = rta_getattr_u8(tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_TYPE]);
930fb9
+		data_len = RTA_PAYLOAD(tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_DATA]);
930fb9
+		hexstring_n2a(RTA_DATA(tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_DATA]),
930fb9
+			      data_len, data, sizeof(data));
930fb9
+		hex2mem(data, data_r, data_len);
930fb9
+		offset += data_len + 20;
930fb9
+		rem -= data_len + 20;
930fb9
+		i = RTA_DATA(attr) + offset;
930fb9
+
930fb9
+		open_json_object(NULL);
930fb9
+		print_uint(PRINT_JSON, "class", NULL, class);
930fb9
+		print_uint(PRINT_JSON, "type", NULL, type);
930fb9
+		open_json_array(PRINT_JSON, "data");
930fb9
+		for (ii = 0; ii < data_len; ii++)
930fb9
+			print_uint(PRINT_JSON, NULL, NULL, data_r[ii]);
930fb9
+		close_json_array(PRINT_JSON, "data");
930fb9
+		close_json_object();
930fb9
+
930fb9
+		slen += sprintf(strbuf + slen, "%04x:%02x:%s",
930fb9
+				class, type, data);
930fb9
+		if (rem)
930fb9
+			slen += sprintf(strbuf + slen, ",");
930fb9
+	}
930fb9
+	close_json_array(PRINT_JSON, name);
930fb9
+}
930fb9
+
930fb9
+static void flower_print_geneve_parts(const char *name, struct rtattr *attr,
930fb9
+				      char *key, char *mask)
930fb9
+{
930fb9
+	char *namefrm = "\n  geneve_opt %s";
930fb9
+	char *key_token, *mask_token, *out;
930fb9
+	int len;
930fb9
+
930fb9
+	out = malloc(RTA_PAYLOAD(attr) * 4 + 3);
930fb9
+	if (!out)
930fb9
+		return;
930fb9
+
930fb9
+	len = 0;
930fb9
+	key_token = strsep(&key, ",");
930fb9
+	mask_token = strsep(&mask, ",");
930fb9
+	while (key_token) {
930fb9
+		len += sprintf(&out[len], "%s/%s,", key_token, mask_token);
930fb9
+		mask_token = strsep(&mask, ",");
930fb9
+		key_token = strsep(&key, ",");
930fb9
+	}
930fb9
+
930fb9
+	out[len - 1] = '\0';
930fb9
+	print_string(PRINT_FP, name, namefrm, out);
930fb9
+	free(out);
930fb9
+}
930fb9
+
930fb9
+static void flower_print_enc_opts(const char *name, struct rtattr *attr,
930fb9
+				  struct rtattr *mask_attr)
930fb9
+{
930fb9
+	struct rtattr *key_tb[TCA_FLOWER_KEY_ENC_OPTS_MAX + 1];
930fb9
+	struct rtattr *msk_tb[TCA_FLOWER_KEY_ENC_OPTS_MAX + 1];
930fb9
+	char *key, *msk;
930fb9
+
930fb9
+	if (!attr)
930fb9
+		return;
930fb9
+
930fb9
+	key = malloc(RTA_PAYLOAD(attr) * 2 + 1);
930fb9
+	if (!key)
930fb9
+		return;
930fb9
+
930fb9
+	msk = malloc(RTA_PAYLOAD(attr) * 2 + 1);
930fb9
+	if (!msk)
930fb9
+		goto err_key_free;
930fb9
+
930fb9
+	parse_rtattr_nested(key_tb, TCA_FLOWER_KEY_ENC_OPTS_MAX, attr);
930fb9
+	flower_print_geneve_opts("geneve_opt_key",
930fb9
+				 key_tb[TCA_FLOWER_KEY_ENC_OPTS_GENEVE], key);
930fb9
+
930fb9
+	parse_rtattr_nested(msk_tb, TCA_FLOWER_KEY_ENC_OPTS_MAX, mask_attr);
930fb9
+	flower_print_geneve_opts("geneve_opt_mask",
930fb9
+				 msk_tb[TCA_FLOWER_KEY_ENC_OPTS_GENEVE], msk);
930fb9
+
930fb9
+	flower_print_geneve_parts(name, attr, key, msk);
930fb9
+
930fb9
+	free(msk);
930fb9
+err_key_free:
930fb9
+	free(key);
930fb9
+}
930fb9
+
930fb9
 static void flower_print_masked_u8(const char *name, struct rtattr *attr,
930fb9
 				   struct rtattr *mask_attr,
930fb9
 				   const char *(*value_to_str)(__u8 value))
930fb9
@@ -1489,6 +1769,8 @@ static int flower_print_opt(struct filter_util *qu, FILE *f,
930fb9
 			    tb[TCA_FLOWER_KEY_ENC_IP_TOS_MASK]);
930fb9
 	flower_print_ip_attr("enc_ttl", tb[TCA_FLOWER_KEY_ENC_IP_TTL],
930fb9
 			    tb[TCA_FLOWER_KEY_ENC_IP_TTL_MASK]);
930fb9
+	flower_print_enc_opts("enc_opt", tb[TCA_FLOWER_KEY_ENC_OPTS],
930fb9
+			      tb[TCA_FLOWER_KEY_ENC_OPTS_MASK]);
930fb9
 
930fb9
 	flower_print_matching_flags("ip_flags", FLOWER_IP_FLAGS,
930fb9
 				    tb[TCA_FLOWER_KEY_FLAGS],
930fb9
-- 
930fb9
1.8.3.1
930fb9