linma / rpms / iproute

Forked from rpms/iproute 4 years ago
Clone

Blame SOURCES/0039-ss-add-AF_VSOCK-support.patch

be97f7
From fe898bd10be2bc527f81421f06afff77e8ba42eb Mon Sep 17 00:00:00 2001
be97f7
From: Stefano Brivio <sbrivio@redhat.com>
be97f7
Date: Sun, 22 Oct 2017 21:44:27 +0200
be97f7
Subject: [PATCH] ss: add AF_VSOCK support
be97f7
be97f7
Bugzilla: https://bugzilla.redhat.com/show_bug.cgi?id=1472759
be97f7
Upstream Status: iproute2.git commit c759116a0b2b
be97f7
be97f7
commit c759116a0b2b6da8df9687b0a40ac69050132c77
be97f7
Author: Stefan Hajnoczi <stefanha@redhat.com>
be97f7
Date:   Fri Oct 6 11:48:41 2017 -0400
be97f7
be97f7
    ss: add AF_VSOCK support
be97f7
be97f7
    The AF_VSOCK address family is a host<->guest communications channel
be97f7
    supported by VMware, KVM, and Hyper-V.  Initial VMware support was
be97f7
    released in Linux 3.9 in 2013 and transports for other hypervisors were
be97f7
    added later.
be97f7
be97f7
    AF_VSOCK addresses are <u32 cid, u32 port> tuples.  The 32-bit cid
be97f7
    integer is comparable to an IP address.  AF_VSOCK ports work like
be97f7
    TCP/UDP ports.
be97f7
be97f7
    Both SOCK_STREAM and SOCK_DGRAM socket types are available.
be97f7
be97f7
    This patch adds AF_VSOCK support to ss(8) so that sockets can be
be97f7
    observed.
be97f7
be97f7
    Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
be97f7
be97f7
Signed-off-by: Stefano Brivio <sbrivio@redhat.com>
be97f7
---
be97f7
 man/man8/ss.8 |   8 ++-
be97f7
 misc/ss.c     | 184 +++++++++++++++++++++++++++++++++++++++++++++++++++++++++-
be97f7
 2 files changed, 188 insertions(+), 4 deletions(-)
be97f7
be97f7
diff --git a/man/man8/ss.8 b/man/man8/ss.8
be97f7
index 81de69d..4323eee 100644
be97f7
--- a/man/man8/ss.8
be97f7
+++ b/man/man8/ss.8
be97f7
@@ -125,14 +125,18 @@ Display Unix domain sockets (alias for -f unix).
be97f7
 .B \-S, \-\-sctp
be97f7
 Display SCTP sockets.
be97f7
 .TP
be97f7
+.B \-\-vsock
be97f7
+Display vsock sockets (alias for -f vsock).
be97f7
+.TP
be97f7
 .B \-f FAMILY, \-\-family=FAMILY
be97f7
 Display sockets of type FAMILY.
be97f7
-Currently the following families are supported: unix, inet, inet6, link, netlink.
be97f7
+Currently the following families are supported: unix, inet, inet6, link, netlink, vsock.
be97f7
 .TP
be97f7
 .B \-A QUERY, \-\-query=QUERY, \-\-socket=QUERY
be97f7
 List of socket tables to dump, separated by commas. The following identifiers
be97f7
 are understood: all, inet, tcp, udp, raw, unix, packet, netlink, unix_dgram,
be97f7
-unix_stream, unix_seqpacket, packet_raw, packet_dgram, dccp, sctp.
be97f7
+unix_stream, unix_seqpacket, packet_raw, packet_dgram, dccp, sctp,
be97f7
+vsock_stream, vsock_dgram.
be97f7
 .TP
be97f7
 .B \-D FILE, \-\-diag=FILE
be97f7
 Do not display anything, just dump raw information about TCP sockets to FILE after applying filters. If FILE is - stdout is used.
be97f7
diff --git a/misc/ss.c b/misc/ss.c
be97f7
index 0d64527..e922665 100644
be97f7
--- a/misc/ss.c
be97f7
+++ b/misc/ss.c
be97f7
@@ -44,6 +44,7 @@
be97f7
 #include <linux/packet_diag.h>
be97f7
 #include <linux/netlink_diag.h>
be97f7
 #include <linux/sctp.h>
be97f7
+#include <linux/vm_sockets_diag.h>
be97f7
 
be97f7
 #define MAGIC_SEQ 123456
be97f7
 
be97f7
@@ -126,6 +127,8 @@ enum {
be97f7
 	PACKET_R_DB,
be97f7
 	NETLINK_DB,
be97f7
 	SCTP_DB,
be97f7
+	VSOCK_ST_DB,
be97f7
+	VSOCK_DG_DB,
be97f7
 	MAX_DB
be97f7
 };
be97f7
 
be97f7
@@ -134,6 +137,7 @@ enum {
be97f7
 #define ALL_DB ((1<<MAX_DB)-1)
be97f7
 #define INET_L4_DBM ((1<<TCP_DB)|(1<<UDP_DB)|(1<<DCCP_DB)|(1<<SCTP_DB))
be97f7
 #define INET_DBM (INET_L4_DBM | (1<<RAW_DB))
be97f7
+#define VSOCK_DBM ((1<<VSOCK_ST_DB)|(1<<VSOCK_DG_DB))
be97f7
 
be97f7
 enum {
be97f7
 	SS_UNKNOWN,
be97f7
@@ -222,6 +226,14 @@ static const struct filter default_dbs[MAX_DB] = {
be97f7
 		.states   = SS_CONN,
be97f7
 		.families = FAMILY_MASK(AF_INET) | FAMILY_MASK(AF_INET6),
be97f7
 	},
be97f7
+	[VSOCK_ST_DB] = {
be97f7
+		.states   = SS_CONN,
be97f7
+		.families = FAMILY_MASK(AF_VSOCK),
be97f7
+	},
be97f7
+	[VSOCK_DG_DB] = {
be97f7
+		.states   = SS_CONN,
be97f7
+		.families = FAMILY_MASK(AF_VSOCK),
be97f7
+	},
be97f7
 };
be97f7
 
be97f7
 static const struct filter default_afs[AF_MAX] = {
be97f7
@@ -245,6 +257,10 @@ static const struct filter default_afs[AF_MAX] = {
be97f7
 		.dbs    = (1 << NETLINK_DB),
be97f7
 		.states = (1 << SS_CLOSE),
be97f7
 	},
be97f7
+	[AF_VSOCK] = {
be97f7
+		.dbs    = VSOCK_DBM,
be97f7
+		.states = SS_CONN,
be97f7
+	},
be97f7
 };
be97f7
 
be97f7
 static int do_default = 1;
be97f7
@@ -283,6 +299,8 @@ static void filter_default_dbs(struct filter *f)
be97f7
 	filter_db_set(f, PACKET_DG_DB);
be97f7
 	filter_db_set(f, NETLINK_DB);
be97f7
 	filter_db_set(f, SCTP_DB);
be97f7
+	filter_db_set(f, VSOCK_ST_DB);
be97f7
+	filter_db_set(f, VSOCK_DG_DB);
be97f7
 }
be97f7
 
be97f7
 static void filter_states_set(struct filter *f, int states)
be97f7
@@ -792,6 +810,18 @@ static const char *proto_name(int protocol)
be97f7
 	return "???";
be97f7
 }
be97f7
 
be97f7
+static const char *vsock_netid_name(int type)
be97f7
+{
be97f7
+	switch (type) {
be97f7
+	case SOCK_STREAM:
be97f7
+		return "v_str";
be97f7
+	case SOCK_DGRAM:
be97f7
+		return "v_dgr";
be97f7
+	default:
be97f7
+		return "???";
be97f7
+	}
be97f7
+}
be97f7
+
be97f7
 static void sock_state_print(struct sockstat *s)
be97f7
 {
be97f7
 	const char *sock_name;
be97f7
@@ -824,6 +854,9 @@ static void sock_state_print(struct sockstat *s)
be97f7
 	case AF_NETLINK:
be97f7
 		sock_name = "nl";
be97f7
 		break;
be97f7
+	case AF_VSOCK:
be97f7
+		sock_name = vsock_netid_name(s->type);
be97f7
+		break;
be97f7
 	default:
be97f7
 		sock_name = "unknown";
be97f7
 	}
be97f7
@@ -1139,6 +1172,8 @@ static int run_ssfilter(struct ssfilter *f, struct sockstat *s)
be97f7
 			return s->lport == 0 && s->local.data[0] == 0;
be97f7
 		if (s->local.family == AF_NETLINK)
be97f7
 			return s->lport < 0;
be97f7
+		if (s->local.family == AF_VSOCK)
be97f7
+			return s->lport > 1023;
be97f7
 
be97f7
 		return is_ephemeral(s->lport);
be97f7
 	}
be97f7
@@ -1515,6 +1550,15 @@ void *parse_devcond(char *name)
be97f7
 	return res;
be97f7
 }
be97f7
 
be97f7
+static void vsock_set_inet_prefix(inet_prefix *a, __u32 cid)
be97f7
+{
be97f7
+	*a = (inet_prefix){
be97f7
+		.bytelen = sizeof(cid),
be97f7
+		.family = AF_VSOCK,
be97f7
+	};
be97f7
+	memcpy(a->data, &cid, sizeof(cid));
be97f7
+}
be97f7
+
be97f7
 void *parse_hostcond(char *addr, bool is_port)
be97f7
 {
be97f7
 	char *port = NULL;
be97f7
@@ -1589,6 +1633,37 @@ void *parse_hostcond(char *addr, bool is_port)
be97f7
 		goto out;
be97f7
 	}
be97f7
 
be97f7
+	if (fam == AF_VSOCK || strncmp(addr, "vsock:", 6) == 0) {
be97f7
+		__u32 cid = ~(__u32)0;
be97f7
+
be97f7
+		a.addr.family = AF_VSOCK;
be97f7
+		if (strncmp(addr, "vsock:", 6) == 0)
be97f7
+			addr += 6;
be97f7
+
be97f7
+		if (is_port)
be97f7
+			port = addr;
be97f7
+		else {
be97f7
+			port = strchr(addr, ':');
be97f7
+			if (port) {
be97f7
+				*port = '\0';
be97f7
+				port++;
be97f7
+			}
be97f7
+		}
be97f7
+
be97f7
+		if (port && strcmp(port, "*") &&
be97f7
+		    get_u32((__u32 *)&a.port, port, 0))
be97f7
+			return NULL;
be97f7
+
be97f7
+		if (addr[0] && strcmp(addr, "*")) {
be97f7
+			a.addr.bitlen = 32;
be97f7
+			if (get_u32(&cid, addr, 0))
be97f7
+				return NULL;
be97f7
+		}
be97f7
+		vsock_set_inet_prefix(&a.addr, cid);
be97f7
+		fam = AF_VSOCK;
be97f7
+		goto out;
be97f7
+	}
be97f7
+
be97f7
 	if (fam == AF_INET || !strncmp(addr, "inet:", 5)) {
be97f7
 		fam = AF_INET;
be97f7
 		if (!strncmp(addr, "inet:", 5))
be97f7
@@ -3653,6 +3728,88 @@ static int netlink_show(struct filter *f)
be97f7
 	return 0;
be97f7
 }
be97f7
 
be97f7
+static bool vsock_type_skip(struct sockstat *s, struct filter *f)
be97f7
+{
be97f7
+	if (s->type == SOCK_STREAM && !(f->dbs & (1 << VSOCK_ST_DB)))
be97f7
+		return true;
be97f7
+	if (s->type == SOCK_DGRAM && !(f->dbs & (1 << VSOCK_DG_DB)))
be97f7
+		return true;
be97f7
+	return false;
be97f7
+}
be97f7
+
be97f7
+static void vsock_addr_print(inet_prefix *a, __u32 port)
be97f7
+{
be97f7
+	char cid_str[sizeof("4294967295")];
be97f7
+	char port_str[sizeof("4294967295")];
be97f7
+	__u32 cid;
be97f7
+
be97f7
+	memcpy(&cid, a->data, sizeof(cid));
be97f7
+
be97f7
+	if (cid == ~(__u32)0)
be97f7
+		snprintf(cid_str, sizeof(cid_str), "*");
be97f7
+	else
be97f7
+		snprintf(cid_str, sizeof(cid_str), "%u", cid);
be97f7
+
be97f7
+	if (port == ~(__u32)0)
be97f7
+		snprintf(port_str, sizeof(port_str), "*");
be97f7
+	else
be97f7
+		snprintf(port_str, sizeof(port_str), "%u", port);
be97f7
+
be97f7
+	sock_addr_print(cid_str, ":", port_str, NULL);
be97f7
+}
be97f7
+
be97f7
+static void vsock_stats_print(struct sockstat *s, struct filter *f)
be97f7
+{
be97f7
+	sock_state_print(s);
be97f7
+
be97f7
+	vsock_addr_print(&s->local, s->lport);
be97f7
+	vsock_addr_print(&s->remote, s->rport);
be97f7
+
be97f7
+	proc_ctx_print(s);
be97f7
+
be97f7
+	printf("\n");
be97f7
+}
be97f7
+
be97f7
+static int vsock_show_sock(const struct sockaddr_nl *addr,
be97f7
+			   struct nlmsghdr *nlh, void *arg)
be97f7
+{
be97f7
+	struct filter *f = (struct filter *)arg;
be97f7
+	struct vsock_diag_msg *r = NLMSG_DATA(nlh);
be97f7
+	struct sockstat stat = {
be97f7
+		.type = r->vdiag_type,
be97f7
+		.lport = r->vdiag_src_port,
be97f7
+		.rport = r->vdiag_dst_port,
be97f7
+		.state = r->vdiag_state,
be97f7
+		.ino = r->vdiag_ino,
be97f7
+	};
be97f7
+
be97f7
+	vsock_set_inet_prefix(&stat.local, r->vdiag_src_cid);
be97f7
+	vsock_set_inet_prefix(&stat.remote, r->vdiag_dst_cid);
be97f7
+
be97f7
+	if (vsock_type_skip(&stat, f))
be97f7
+		return 0;
be97f7
+
be97f7
+	if (f->f && run_ssfilter(f->f, &stat) == 0)
be97f7
+		return 0;
be97f7
+
be97f7
+	vsock_stats_print(&stat, f);
be97f7
+
be97f7
+	return 0;
be97f7
+}
be97f7
+
be97f7
+static int vsock_show(struct filter *f)
be97f7
+{
be97f7
+	DIAG_REQUEST(req, struct vsock_diag_req r);
be97f7
+
be97f7
+	if (!filter_af_get(f, AF_VSOCK))
be97f7
+		return 0;
be97f7
+
be97f7
+	req.r.sdiag_family = AF_VSOCK;
be97f7
+	req.r.vdiag_states = f->states;
be97f7
+
be97f7
+	return handle_netlink_request(f, &req.nlh, sizeof(req), vsock_show_sock);
be97f7
+}
be97f7
+
be97f7
 struct sock_diag_msg {
be97f7
 	__u8 sdiag_family;
be97f7
 };
be97f7
@@ -3673,6 +3830,8 @@ static int generic_show_sock(const struct sockaddr_nl *addr,
be97f7
 		return packet_show_sock(addr, nlh, arg);
be97f7
 	case AF_NETLINK:
be97f7
 		return netlink_show_sock(addr, nlh, arg);
be97f7
+	case AF_VSOCK:
be97f7
+		return vsock_show_sock(addr, nlh, arg);
be97f7
 	default:
be97f7
 		return -1;
be97f7
 	}
be97f7
@@ -3900,14 +4059,15 @@ static void _usage(FILE *dest)
be97f7
 "   -d, --dccp          display only DCCP sockets\n"
be97f7
 "   -w, --raw           display only RAW sockets\n"
be97f7
 "   -x, --unix          display only Unix domain sockets\n"
be97f7
+"       --vsock         display only vsock sockets\n"
be97f7
 "   -f, --family=FAMILY display sockets of type FAMILY\n"
be97f7
-"       FAMILY := {inet|inet6|link|unix|netlink|help}\n"
be97f7
+"       FAMILY := {inet|inet6|link|unix|netlink|vsock|help}\n"
be97f7
 "\n"
be97f7
 "   -K, --kill          forcibly close sockets, display what was closed\n"
be97f7
 "   -H, --no-header     Suppress header line\n"
be97f7
 "\n"
be97f7
 "   -A, --query=QUERY, --socket=QUERY\n"
be97f7
-"       QUERY := {all|inet|tcp|udp|raw|unix|unix_dgram|unix_stream|unix_seqpacket|packet|netlink}[,QUERY]\n"
be97f7
+"       QUERY := {all|inet|tcp|udp|raw|unix|unix_dgram|unix_stream|unix_seqpacket|packet|netlink|vsock_stream|vsock_dgram}[,QUERY]\n"
be97f7
 "\n"
be97f7
 "   -D, --diag=FILE     Dump raw information about TCP sockets to FILE\n"
be97f7
 "   -F, --filter=FILE   read filter information from FILE\n"
be97f7
@@ -3980,6 +4140,9 @@ static int scan_state(const char *state)
be97f7
 	exit(-1);
be97f7
 }
be97f7
 
be97f7
+/* Values 'v' and 'V' are already used so a non-character is used */
be97f7
+#define OPT_VSOCK 256
be97f7
+
be97f7
 static const struct option long_opts[] = {
be97f7
 	{ "numeric", 0, 0, 'n' },
be97f7
 	{ "resolve", 0, 0, 'r' },
be97f7
@@ -3996,6 +4159,7 @@ static const struct option long_opts[] = {
be97f7
 	{ "udp", 0, 0, 'u' },
be97f7
 	{ "raw", 0, 0, 'w' },
be97f7
 	{ "unix", 0, 0, 'x' },
be97f7
+	{ "vsock", 0, 0, OPT_VSOCK },
be97f7
 	{ "all", 0, 0, 'a' },
be97f7
 	{ "listening", 0, 0, 'l' },
be97f7
 	{ "ipv4", 0, 0, '4' },
be97f7
@@ -4081,6 +4245,9 @@ int main(int argc, char *argv[])
be97f7
 		case 'x':
be97f7
 			filter_af_set(&current_filter, AF_UNIX);
be97f7
 			break;
be97f7
+		case OPT_VSOCK:
be97f7
+			filter_af_set(&current_filter, AF_VSOCK);
be97f7
+			break;
be97f7
 		case 'a':
be97f7
 			state_filter = SS_ALL;
be97f7
 			break;
be97f7
@@ -4107,6 +4274,8 @@ int main(int argc, char *argv[])
be97f7
 				filter_af_set(&current_filter, AF_UNIX);
be97f7
 			else if (strcmp(optarg, "netlink") == 0)
be97f7
 				filter_af_set(&current_filter, AF_NETLINK);
be97f7
+			else if (strcmp(optarg, "vsock") == 0)
be97f7
+				filter_af_set(&current_filter, AF_VSOCK);
be97f7
 			else if (strcmp(optarg, "help") == 0)
be97f7
 				help();
be97f7
 			else {
be97f7
@@ -4172,6 +4341,15 @@ int main(int argc, char *argv[])
be97f7
 					filter_db_set(&current_filter, PACKET_DG_DB);
be97f7
 				} else if (strcmp(p, "netlink") == 0) {
be97f7
 					filter_db_set(&current_filter, NETLINK_DB);
be97f7
+				} else if (strcmp(p, "vsock") == 0) {
be97f7
+					filter_db_set(&current_filter, VSOCK_ST_DB);
be97f7
+					filter_db_set(&current_filter, VSOCK_DG_DB);
be97f7
+				} else if (strcmp(p, "vsock_stream") == 0 ||
be97f7
+					   strcmp(p, "v_str") == 0) {
be97f7
+					filter_db_set(&current_filter, VSOCK_ST_DB);
be97f7
+				} else if (strcmp(p, "vsock_dgram") == 0 ||
be97f7
+					   strcmp(p, "v_dgr") == 0) {
be97f7
+					filter_db_set(&current_filter, VSOCK_DG_DB);
be97f7
 				} else {
be97f7
 					fprintf(stderr, "ss: \"%s\" is illegal socket table id\n", p);
be97f7
 					usage();
be97f7
@@ -4387,6 +4565,8 @@ int main(int argc, char *argv[])
be97f7
 		dccp_show(&current_filter);
be97f7
 	if (current_filter.dbs & (1<<SCTP_DB))
be97f7
 		sctp_show(&current_filter);
be97f7
+	if (current_filter.dbs & VSOCK_DBM)
be97f7
+		vsock_show(&current_filter);
be97f7
 
be97f7
 	if (show_users || show_proc_ctx || show_sock_ctx)
be97f7
 		user_ent_destroy();
be97f7
-- 
be97f7
1.8.3.1
be97f7