linma / rpms / iproute

Forked from rpms/iproute 4 years ago
Clone

Blame SOURCES/0043-tc-f_flower-add-geneve-option-match-support-to-flowe.patch

7e752c
From 9dd748cd49d15b7e90a7a65de53d431a2c515c86 Mon Sep 17 00:00:00 2001
7e752c
From: Phil Sutter <psutter@redhat.com>
7e752c
Date: Thu, 31 Jan 2019 17:13:07 +0100
7e752c
Subject: [PATCH] tc: f_flower: add geneve option match support to flower
7e752c
7e752c
Bugzilla: https://bugzilla.redhat.com/show_bug.cgi?id=1654761
7e752c
Upstream Status: iproute2.git commit 56155d4df86d4
7e752c
7e752c
commit 56155d4df86d489c4207444c8a90ce4e0e22e49f
7e752c
Author: Pieter Jansen van Vuuren <pieter.jansenvanvuuren@netronome.com>
7e752c
Date:   Fri Sep 28 16:03:39 2018 +0200
7e752c
7e752c
    tc: f_flower: add geneve option match support to flower
7e752c
7e752c
    Allow matching on options in Geneve tunnel headers.
7e752c
7e752c
    The options can be described in the form
7e752c
    CLASS:TYPE:DATA/CLASS_MASK:TYPE_MASK:DATA_MASK, where CLASS is
7e752c
    represented as a 16bit hexadecimal value, TYPE as an 8bit
7e752c
    hexadecimal value and DATA as a variable length hexadecimal value.
7e752c
7e752c
    e.g.
7e752c
     # ip link add name geneve0 type geneve dstport 0 external
7e752c
     # tc qdisc add dev geneve0 ingress
7e752c
     # tc filter add dev geneve0 protocol ip parent ffff: \
7e752c
         flower \
7e752c
           enc_src_ip 10.0.99.192 \
7e752c
           enc_dst_ip 10.0.99.193 \
7e752c
           enc_key_id 11 \
7e752c
           geneve_opts 0102:80:1122334421314151/ffff:ff:ffffffffffffffff \
7e752c
           ip_proto udp \
7e752c
           action mirred egress redirect dev eth1
7e752c
7e752c
    Signed-off-by: Pieter Jansen van Vuuren <pieter.jansenvanvuuren@netronome.com>
7e752c
    Signed-off-by: Simon Horman <simon.horman@netronome.com>
7e752c
    Signed-off-by: David Ahern <dsahern@gmail.com>
7e752c
---
7e752c
 man/man8/tc-flower.8 |  13 ++-
7e752c
 tc/f_flower.c        | 282 +++++++++++++++++++++++++++++++++++++++++++++++++++
7e752c
 2 files changed, 294 insertions(+), 1 deletion(-)
7e752c
7e752c
diff --git a/man/man8/tc-flower.8 b/man/man8/tc-flower.8
7e752c
index f917f24..276b527 100644
7e752c
--- a/man/man8/tc-flower.8
7e752c
+++ b/man/man8/tc-flower.8
7e752c
@@ -74,6 +74,8 @@ flower \- flow based traffic control filter
7e752c
 .IR TOS " | "
7e752c
 .B enc_ttl
7e752c
 .IR TTL " | "
7e752c
+.B geneve_opts
7e752c
+.IR OPTIONS " | "
7e752c
 .BR ip_flags
7e752c
 .IR IP_FLAGS
7e752c
 .SH DESCRIPTION
7e752c
@@ -260,6 +262,8 @@ bits is assumed.
7e752c
 .BI enc_tos " NUMBER"
7e752c
 .TQ
7e752c
 .BI enc_ttl " NUMBER"
7e752c
+.TQ
7e752c
+.BI geneve_opts " OPTIONS"
7e752c
 Match on IP tunnel metadata. Key id
7e752c
 .I NUMBER
7e752c
 is a 32 bit tunnel key id (e.g. VNI for VXLAN tunnel).
7e752c
@@ -272,7 +276,14 @@ is a 16 bit UDP dst port. Tos
7e752c
 .I NUMBER
7e752c
 is an 8 bit tos (dscp+ecn) value, ttl
7e752c
 .I NUMBER
7e752c
-is an 8 bit time-to-live value.
7e752c
+is an 8 bit time-to-live value. geneve_opts
7e752c
+.I OPTIONS
7e752c
+must be a valid list of comma-separated geneve options where each option
7e752c
+consists of a key optionally followed by a slash and corresponding mask. If
7e752c
+the masks is missing, \fBtc\fR assumes a full-length match. The options can
7e752c
+be described in the form CLASS:TYPE:DATA/CLASS_MASK:TYPE_MASK:DATA_MASK,
7e752c
+where CLASS is represented as a 16bit hexadecimal value, TYPE as an 8bit
7e752c
+hexadecimal value and DATA as a variable length hexadecimal value.
7e752c
 .TP
7e752c
 .BI ip_flags " IP_FLAGS"
7e752c
 .I IP_FLAGS
7e752c
diff --git a/tc/f_flower.c b/tc/f_flower.c
7e752c
index cd102f2..43102c8 100644
7e752c
--- a/tc/f_flower.c
7e752c
+++ b/tc/f_flower.c
7e752c
@@ -76,6 +76,7 @@ static void explain(void)
7e752c
 		"                       enc_key_id [ KEY-ID ] |\n"
7e752c
 		"                       enc_tos MASKED-IP_TOS |\n"
7e752c
 		"                       enc_ttl MASKED-IP_TTL |\n"
7e752c
+		"                       geneve_opts MASKED-OPTIONS |\n"
7e752c
 		"                       ip_flags IP-FLAGS | \n"
7e752c
 		"                       enc_dst_port [ port_number ] }\n"
7e752c
 		"       FILTERID := X:Y:Z\n"
7e752c
@@ -580,6 +581,179 @@ static int flower_parse_enc_port(char *str, int type, struct nlmsghdr *n)
7e752c
 	return 0;
7e752c
 }
7e752c
 
7e752c
+static int flower_parse_geneve_opts(char *str, struct nlmsghdr *n)
7e752c
+{
7e752c
+	struct rtattr *nest;
7e752c
+	char *token;
7e752c
+	int i, err;
7e752c
+
7e752c
+	nest = addattr_nest(n, MAX_MSG, TCA_FLOWER_KEY_ENC_OPTS_GENEVE);
7e752c
+
7e752c
+	i = 1;
7e752c
+	token = strsep(&str, ":");
7e752c
+	while (token) {
7e752c
+		switch (i) {
7e752c
+		case TCA_FLOWER_KEY_ENC_OPT_GENEVE_CLASS:
7e752c
+		{
7e752c
+			__be16 opt_class;
7e752c
+
7e752c
+			if (!strlen(token))
7e752c
+				break;
7e752c
+			err = get_be16(&opt_class, token, 16);
7e752c
+			if (err)
7e752c
+				return err;
7e752c
+
7e752c
+			addattr16(n, MAX_MSG, i, opt_class);
7e752c
+			break;
7e752c
+		}
7e752c
+		case TCA_FLOWER_KEY_ENC_OPT_GENEVE_TYPE:
7e752c
+		{
7e752c
+			__u8 opt_type;
7e752c
+
7e752c
+			if (!strlen(token))
7e752c
+				break;
7e752c
+			err = get_u8(&opt_type, token, 16);
7e752c
+			if (err)
7e752c
+				return err;
7e752c
+
7e752c
+			addattr8(n, MAX_MSG, i, opt_type);
7e752c
+			break;
7e752c
+		}
7e752c
+		case TCA_FLOWER_KEY_ENC_OPT_GENEVE_DATA:
7e752c
+		{
7e752c
+			size_t token_len = strlen(token);
7e752c
+			__u8 *opts;
7e752c
+
7e752c
+			if (!token_len)
7e752c
+				break;
7e752c
+			opts = malloc(token_len / 2);
7e752c
+			if (!opts)
7e752c
+				return -1;
7e752c
+			if (hex2mem(token, opts, token_len / 2) < 0) {
7e752c
+				free(opts);
7e752c
+				return -1;
7e752c
+			}
7e752c
+			addattr_l(n, MAX_MSG, i, opts, token_len / 2);
7e752c
+			free(opts);
7e752c
+
7e752c
+			break;
7e752c
+		}
7e752c
+		default:
7e752c
+			fprintf(stderr, "Unknown \"geneve_opts\" type\n");
7e752c
+			return -1;
7e752c
+		}
7e752c
+
7e752c
+		token = strsep(&str, ":");
7e752c
+		i++;
7e752c
+	}
7e752c
+	addattr_nest_end(n, nest);
7e752c
+
7e752c
+	return 0;
7e752c
+}
7e752c
+
7e752c
+static int flower_parse_enc_opt_part(char *str, struct nlmsghdr *n)
7e752c
+{
7e752c
+	char *token;
7e752c
+	int err;
7e752c
+
7e752c
+	token = strsep(&str, ",");
7e752c
+	while (token) {
7e752c
+		err = flower_parse_geneve_opts(token, n);
7e752c
+		if (err)
7e752c
+			return err;
7e752c
+
7e752c
+		token = strsep(&str, ",");
7e752c
+	}
7e752c
+
7e752c
+	return 0;
7e752c
+}
7e752c
+
7e752c
+static int flower_check_enc_opt_key(char *key)
7e752c
+{
7e752c
+	int key_len, col_cnt = 0;
7e752c
+
7e752c
+	key_len = strlen(key);
7e752c
+	while ((key = strchr(key, ':'))) {
7e752c
+		if (strlen(key) == key_len)
7e752c
+			return -1;
7e752c
+
7e752c
+		key_len = strlen(key) - 1;
7e752c
+		col_cnt++;
7e752c
+		key++;
7e752c
+	}
7e752c
+
7e752c
+	if (col_cnt != 2 || !key_len)
7e752c
+		return -1;
7e752c
+
7e752c
+	return 0;
7e752c
+}
7e752c
+
7e752c
+static int flower_parse_enc_opts(char *str, struct nlmsghdr *n)
7e752c
+{
7e752c
+	char key[XATTR_SIZE_MAX], mask[XATTR_SIZE_MAX];
7e752c
+	int data_len, key_len, mask_len, err;
7e752c
+	char *token, *slash;
7e752c
+	struct rtattr *nest;
7e752c
+
7e752c
+	key_len = 0;
7e752c
+	mask_len = 0;
7e752c
+	token = strsep(&str, ",");
7e752c
+	while (token) {
7e752c
+		slash = strchr(token, '/');
7e752c
+		if (slash)
7e752c
+			*slash = '\0';
7e752c
+
7e752c
+		if ((key_len + strlen(token) > XATTR_SIZE_MAX) ||
7e752c
+		    flower_check_enc_opt_key(token))
7e752c
+			return -1;
7e752c
+
7e752c
+		strcpy(&key[key_len], token);
7e752c
+		key_len += strlen(token) + 1;
7e752c
+		key[key_len - 1] = ',';
7e752c
+
7e752c
+		if (!slash) {
7e752c
+			/* Pad out mask when not provided */
7e752c
+			if (mask_len + strlen(token) > XATTR_SIZE_MAX)
7e752c
+				return -1;
7e752c
+
7e752c
+			data_len = strlen(rindex(token, ':'));
7e752c
+			sprintf(&mask[mask_len], "ffff:ff:");
7e752c
+			mask_len += 8;
7e752c
+			memset(&mask[mask_len], 'f', data_len - 1);
7e752c
+			mask_len += data_len;
7e752c
+			mask[mask_len - 1] = ',';
7e752c
+			token = strsep(&str, ",");
7e752c
+			continue;
7e752c
+		}
7e752c
+
7e752c
+		if (mask_len + strlen(slash + 1) > XATTR_SIZE_MAX)
7e752c
+			return -1;
7e752c
+
7e752c
+		strcpy(&mask[mask_len], slash + 1);
7e752c
+		mask_len += strlen(slash + 1) + 1;
7e752c
+		mask[mask_len - 1] = ',';
7e752c
+
7e752c
+		*slash = '/';
7e752c
+		token = strsep(&str, ",");
7e752c
+	}
7e752c
+	key[key_len - 1] = '\0';
7e752c
+	mask[mask_len - 1] = '\0';
7e752c
+
7e752c
+	nest = addattr_nest(n, MAX_MSG, TCA_FLOWER_KEY_ENC_OPTS);
7e752c
+	err = flower_parse_enc_opt_part(key, n);
7e752c
+	if (err)
7e752c
+		return err;
7e752c
+	addattr_nest_end(n, nest);
7e752c
+
7e752c
+	nest = addattr_nest(n, MAX_MSG, TCA_FLOWER_KEY_ENC_OPTS_MASK);
7e752c
+	err = flower_parse_enc_opt_part(mask, n);
7e752c
+	if (err)
7e752c
+		return err;
7e752c
+	addattr_nest_end(n, nest);
7e752c
+
7e752c
+	return 0;
7e752c
+}
7e752c
+
7e752c
 static int flower_parse_opt(struct filter_util *qu, char *handle,
7e752c
 			    int argc, char **argv, struct nlmsghdr *n)
7e752c
 {
7e752c
@@ -994,6 +1168,13 @@ static int flower_parse_opt(struct filter_util *qu, char *handle,
7e752c
 				fprintf(stderr, "Illegal \"enc_ttl\"\n");
7e752c
 				return -1;
7e752c
 			}
7e752c
+		} else if (matches(*argv, "geneve_opts") == 0) {
7e752c
+			NEXT_ARG();
7e752c
+			ret = flower_parse_enc_opts(*argv, n);
7e752c
+			if (ret < 0) {
7e752c
+				fprintf(stderr, "Illegal \"geneve_opts\"\n");
7e752c
+				return -1;
7e752c
+			}
7e752c
 		} else if (matches(*argv, "action") == 0) {
7e752c
 			NEXT_ARG();
7e752c
 			ret = parse_action(&argc, &argv, TCA_FLOWER_ACT, n);
7e752c
@@ -1291,6 +1472,105 @@ static void flower_print_key_id(const char *name, struct rtattr *attr)
7e752c
 	print_uint(PRINT_ANY, name, namefrm, rta_getattr_be32(attr));
7e752c
 }
7e752c
 
7e752c
+static void flower_print_geneve_opts(const char *name, struct rtattr *attr,
7e752c
+				     char *strbuf)
7e752c
+{
7e752c
+	struct rtattr *tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_MAX + 1];
7e752c
+	int ii, data_len, offset = 0, slen = 0;
7e752c
+	struct rtattr *i = RTA_DATA(attr);
7e752c
+	int rem = RTA_PAYLOAD(attr);
7e752c
+	__u8 type, data_r[rem];
7e752c
+	char data[rem * 2 + 1];
7e752c
+	__u16 class;
7e752c
+
7e752c
+	open_json_array(PRINT_JSON, name);
7e752c
+	while (rem) {
7e752c
+		parse_rtattr(tb, TCA_FLOWER_KEY_ENC_OPT_GENEVE_MAX, i, rem);
7e752c
+		class = rta_getattr_be16(tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_CLASS]);
7e752c
+		type = rta_getattr_u8(tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_TYPE]);
7e752c
+		data_len = RTA_PAYLOAD(tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_DATA]);
7e752c
+		hexstring_n2a(RTA_DATA(tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_DATA]),
7e752c
+			      data_len, data, sizeof(data));
7e752c
+		hex2mem(data, data_r, data_len);
7e752c
+		offset += data_len + 20;
7e752c
+		rem -= data_len + 20;
7e752c
+		i = RTA_DATA(attr) + offset;
7e752c
+
7e752c
+		open_json_object(NULL);
7e752c
+		print_uint(PRINT_JSON, "class", NULL, class);
7e752c
+		print_uint(PRINT_JSON, "type", NULL, type);
7e752c
+		open_json_array(PRINT_JSON, "data");
7e752c
+		for (ii = 0; ii < data_len; ii++)
7e752c
+			print_uint(PRINT_JSON, NULL, NULL, data_r[ii]);
7e752c
+		close_json_array(PRINT_JSON, "data");
7e752c
+		close_json_object();
7e752c
+
7e752c
+		slen += sprintf(strbuf + slen, "%04x:%02x:%s",
7e752c
+				class, type, data);
7e752c
+		if (rem)
7e752c
+			slen += sprintf(strbuf + slen, ",");
7e752c
+	}
7e752c
+	close_json_array(PRINT_JSON, name);
7e752c
+}
7e752c
+
7e752c
+static void flower_print_geneve_parts(const char *name, struct rtattr *attr,
7e752c
+				      char *key, char *mask)
7e752c
+{
7e752c
+	char *namefrm = "\n  geneve_opt %s";
7e752c
+	char *key_token, *mask_token, *out;
7e752c
+	int len;
7e752c
+
7e752c
+	out = malloc(RTA_PAYLOAD(attr) * 4 + 3);
7e752c
+	if (!out)
7e752c
+		return;
7e752c
+
7e752c
+	len = 0;
7e752c
+	key_token = strsep(&key, ",");
7e752c
+	mask_token = strsep(&mask, ",");
7e752c
+	while (key_token) {
7e752c
+		len += sprintf(&out[len], "%s/%s,", key_token, mask_token);
7e752c
+		mask_token = strsep(&mask, ",");
7e752c
+		key_token = strsep(&key, ",");
7e752c
+	}
7e752c
+
7e752c
+	out[len - 1] = '\0';
7e752c
+	print_string(PRINT_FP, name, namefrm, out);
7e752c
+	free(out);
7e752c
+}
7e752c
+
7e752c
+static void flower_print_enc_opts(const char *name, struct rtattr *attr,
7e752c
+				  struct rtattr *mask_attr)
7e752c
+{
7e752c
+	struct rtattr *key_tb[TCA_FLOWER_KEY_ENC_OPTS_MAX + 1];
7e752c
+	struct rtattr *msk_tb[TCA_FLOWER_KEY_ENC_OPTS_MAX + 1];
7e752c
+	char *key, *msk;
7e752c
+
7e752c
+	if (!attr)
7e752c
+		return;
7e752c
+
7e752c
+	key = malloc(RTA_PAYLOAD(attr) * 2 + 1);
7e752c
+	if (!key)
7e752c
+		return;
7e752c
+
7e752c
+	msk = malloc(RTA_PAYLOAD(attr) * 2 + 1);
7e752c
+	if (!msk)
7e752c
+		goto err_key_free;
7e752c
+
7e752c
+	parse_rtattr_nested(key_tb, TCA_FLOWER_KEY_ENC_OPTS_MAX, attr);
7e752c
+	flower_print_geneve_opts("geneve_opt_key",
7e752c
+				 key_tb[TCA_FLOWER_KEY_ENC_OPTS_GENEVE], key);
7e752c
+
7e752c
+	parse_rtattr_nested(msk_tb, TCA_FLOWER_KEY_ENC_OPTS_MAX, mask_attr);
7e752c
+	flower_print_geneve_opts("geneve_opt_mask",
7e752c
+				 msk_tb[TCA_FLOWER_KEY_ENC_OPTS_GENEVE], msk);
7e752c
+
7e752c
+	flower_print_geneve_parts(name, attr, key, msk);
7e752c
+
7e752c
+	free(msk);
7e752c
+err_key_free:
7e752c
+	free(key);
7e752c
+}
7e752c
+
7e752c
 static void flower_print_masked_u8(const char *name, struct rtattr *attr,
7e752c
 				   struct rtattr *mask_attr,
7e752c
 				   const char *(*value_to_str)(__u8 value))
7e752c
@@ -1489,6 +1769,8 @@ static int flower_print_opt(struct filter_util *qu, FILE *f,
7e752c
 			    tb[TCA_FLOWER_KEY_ENC_IP_TOS_MASK]);
7e752c
 	flower_print_ip_attr("enc_ttl", tb[TCA_FLOWER_KEY_ENC_IP_TTL],
7e752c
 			    tb[TCA_FLOWER_KEY_ENC_IP_TTL_MASK]);
7e752c
+	flower_print_enc_opts("enc_opt", tb[TCA_FLOWER_KEY_ENC_OPTS],
7e752c
+			      tb[TCA_FLOWER_KEY_ENC_OPTS_MASK]);
7e752c
 
7e752c
 	flower_print_matching_flags("ip_flags", FLOWER_IP_FLAGS,
7e752c
 				    tb[TCA_FLOWER_KEY_FLAGS],
7e752c
-- 
7e752c
1.8.3.1
7e752c