94084c
commit e098446037da532d4a250efac9a813bc22f3669f
94084c
Author: Adhemerval Zanella <adhemerval.zanella@linaro.org>
94084c
Date:   Mon Jan 24 08:55:53 2022 -0300
94084c
94084c
    linux: Fix ancillary 64-bit time timestamp conversion (BZ #28349, BZ#28350)
94084c
    
94084c
    The __convert_scm_timestamps only updates the control message last
94084c
    pointer for SOL_SOCKET type, so if the message control buffer contains
94084c
    multiple ancillary message types the converted timestamp one might
94084c
    overwrite a valid message.
94084c
    
94084c
    The test checks if the extra ancillary space is correctly handled
94084c
    by recvmsg/recvmmsg, where if there is no extra space for the 64-bit
94084c
    time_t converted message the control buffer should be marked with
94084c
    MSG_TRUNC.  It also checks if recvmsg/recvmmsg correctly handle multiple
94084c
    ancillary data.
94084c
    
94084c
    Checked on x86_64-linux and on i686-linux-gnu on both 5.11 and
94084c
    4.15 kernel.
94084c
    
94084c
    Co-authored-by: Fabian Vogt <fvogt@suse.de>
94084c
    
94084c
    Reviewed-by: Florian Weimer <fweimer@redhat.com>
94084c
    
94084c
    (cherry picked from commit 8fba672472ae0055387e9315fc2eddfa6775ca79)
94084c
94084c
diff --git a/sysdeps/unix/sysv/linux/Makefile b/sysdeps/unix/sysv/linux/Makefile
94084c
index cdc01a3f023ec09a..7c75e22c6d0e9ff5 100644
94084c
--- a/sysdeps/unix/sysv/linux/Makefile
94084c
+++ b/sysdeps/unix/sysv/linux/Makefile
94084c
@@ -273,6 +273,9 @@ sysdep_routines += cmsg_nxthdr
94084c
 CFLAGS-recvmmsg.c = -fexceptions -fasynchronous-unwind-tables
94084c
 CFLAGS-sendmmsg.c = -fexceptions -fasynchronous-unwind-tables
94084c
 
94084c
+tests += tst-socket-timestamp
94084c
+tests-time64 += tst-socket-timestamp-time64
94084c
+
94084c
 tests-special += $(objpfx)tst-socket-consts.out
94084c
 $(objpfx)tst-socket-consts.out: ../sysdeps/unix/sysv/linux/tst-socket-consts.py
94084c
 	PYTHONPATH=../scripts \
94084c
diff --git a/sysdeps/unix/sysv/linux/convert_scm_timestamps.c b/sysdeps/unix/sysv/linux/convert_scm_timestamps.c
94084c
index 00c934c4135f0d42..5d3c4199e0b32944 100644
94084c
--- a/sysdeps/unix/sysv/linux/convert_scm_timestamps.c
94084c
+++ b/sysdeps/unix/sysv/linux/convert_scm_timestamps.c
94084c
@@ -54,6 +54,8 @@ __convert_scm_timestamps (struct msghdr *msg, socklen_t msgsize)
94084c
        cmsg != NULL;
94084c
        cmsg = CMSG_NXTHDR (msg, cmsg))
94084c
     {
94084c
+      last = cmsg;
94084c
+
94084c
       if (cmsg->cmsg_level != SOL_SOCKET)
94084c
 	continue;
94084c
 
94084c
@@ -75,11 +77,9 @@ __convert_scm_timestamps (struct msghdr *msg, socklen_t msgsize)
94084c
 	  tvts[1] = tmp[1];
94084c
 	  break;
94084c
 	}
94084c
-
94084c
-      last = cmsg;
94084c
     }
94084c
 
94084c
-  if (last == NULL || type == 0)
94084c
+  if (type == 0)
94084c
     return;
94084c
 
94084c
   if (CMSG_SPACE (sizeof tvts) > msgsize - msg->msg_controllen)
94084c
@@ -88,10 +88,12 @@ __convert_scm_timestamps (struct msghdr *msg, socklen_t msgsize)
94084c
       return;
94084c
     }
94084c
 
94084c
+  /* Zero memory for the new cmsghdr, so reading cmsg_len field
94084c
+     by CMSG_NXTHDR does not trigger UB.  */
94084c
+  memset (msg->msg_control + msg->msg_controllen, 0,
94084c
+	  CMSG_SPACE (sizeof tvts));
94084c
   msg->msg_controllen += CMSG_SPACE (sizeof tvts);
94084c
-  cmsg = CMSG_NXTHDR(msg, last);
94084c
-  if (cmsg == NULL)
94084c
-    return;
94084c
+  cmsg = CMSG_NXTHDR (msg, last);
94084c
   cmsg->cmsg_level = SOL_SOCKET;
94084c
   cmsg->cmsg_type = type;
94084c
   cmsg->cmsg_len = CMSG_LEN (sizeof tvts);
94084c
diff --git a/sysdeps/unix/sysv/linux/tst-socket-timestamp-time64.c b/sysdeps/unix/sysv/linux/tst-socket-timestamp-time64.c
94084c
new file mode 100644
94084c
index 0000000000000000..ae424c2a70026cf5
94084c
--- /dev/null
94084c
+++ b/sysdeps/unix/sysv/linux/tst-socket-timestamp-time64.c
94084c
@@ -0,0 +1 @@
94084c
+#include "tst-socket-timestamp.c"
94084c
diff --git a/sysdeps/unix/sysv/linux/tst-socket-timestamp.c b/sysdeps/unix/sysv/linux/tst-socket-timestamp.c
94084c
new file mode 100644
94084c
index 0000000000000000..9c2e76f7e27bd312
94084c
--- /dev/null
94084c
+++ b/sysdeps/unix/sysv/linux/tst-socket-timestamp.c
94084c
@@ -0,0 +1,336 @@
94084c
+/* Check recvmsg/recvmmsg 64-bit timestamp support.
94084c
+   Copyright (C) 2022 Free Software Foundation, Inc.
94084c
+   This file is part of the GNU C Library.
94084c
+
94084c
+   The GNU C Library is free software; you can redistribute it and/or
94084c
+   modify it under the terms of the GNU Lesser General Public
94084c
+   License as published by the Free Software Foundation; either
94084c
+   version 2.1 of the License, or (at your option) any later version.
94084c
+
94084c
+   The GNU C Library is distributed in the hope that it will be useful,
94084c
+   but WITHOUT ANY WARRANTY; without even the implied warranty of
94084c
+   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
94084c
+   Lesser General Public License for more details.
94084c
+
94084c
+   You should have received a copy of the GNU Lesser General Public
94084c
+   License along with the GNU C Library; if not, see
94084c
+   <https://www.gnu.org/licenses/>.  */
94084c
+
94084c
+#include <array_length.h>
94084c
+#include <arpa/inet.h>
94084c
+#include <errno.h>
94084c
+#include <string.h>
94084c
+#include <stdio.h>
94084c
+#include <support/check.h>
94084c
+#include <support/next_to_fault.h>
94084c
+#include <support/support.h>
94084c
+#include <support/test-driver.h>
94084c
+#include <support/xunistd.h>
94084c
+#include <support/xsocket.h>
94084c
+#include <sys/mman.h>
94084c
+
94084c
+/* Some extra space added for ancillary data, it might be used to convert
94084c
+   32-bit timestamp to 64-bit for _TIME_BITS=64.  */
94084c
+enum { slack_max_size = 64 };
94084c
+static const int slack[] = { 0, 4, 8, 16, 32, slack_max_size };
94084c
+
94084c
+static bool support_64_timestamp;
94084c
+/* AF_INET socket and address used to receive data.  */
94084c
+static int srv;
94084c
+static struct sockaddr_in srv_addr;
94084c
+
94084c
+static int
94084c
+do_sendto (const struct sockaddr_in *addr, int nmsgs)
94084c
+{
94084c
+  int s = xsocket (AF_INET, SOCK_DGRAM | SOCK_CLOEXEC, 0);
94084c
+  xconnect (s, (const struct sockaddr *) addr, sizeof (*addr));
94084c
+
94084c
+  for (int i = 0; i < nmsgs; i++)
94084c
+    xsendto (s, &i, sizeof (i), 0, (const struct sockaddr *) addr,
94084c
+	     sizeof (*addr));
94084c
+
94084c
+  xclose (s);
94084c
+
94084c
+  return 0;
94084c
+}
94084c
+
94084c
+static void
94084c
+do_recvmsg_slack_ancillary (bool use_multi_call, int s, void *cmsg,
94084c
+			    size_t slack, size_t tsize, int exp_payload)
94084c
+{
94084c
+  int payload;
94084c
+  struct iovec iov =
94084c
+    {
94084c
+      .iov_base = &payload,
94084c
+      .iov_len = sizeof (payload)
94084c
+    };
94084c
+  size_t msg_controllen = CMSG_SPACE (tsize) + slack;
94084c
+  char *msg_control = cmsg - msg_controllen;
94084c
+  memset (msg_control, 0x55, msg_controllen);
94084c
+  struct mmsghdr mmhdr =
94084c
+    {
94084c
+      .msg_hdr =
94084c
+      {
94084c
+        .msg_name = NULL,
94084c
+        .msg_namelen = 0,
94084c
+        .msg_iov = &iov,
94084c
+        .msg_iovlen = 1,
94084c
+        .msg_control = msg_control,
94084c
+        .msg_controllen = msg_controllen
94084c
+      },
94084c
+    };
94084c
+
94084c
+  int r;
94084c
+  if (use_multi_call)
94084c
+    {
94084c
+      r = recvmmsg (s, &mmhdr, 1, 0, NULL);
94084c
+      if (r >= 0)
94084c
+	r = mmhdr.msg_len;
94084c
+    }
94084c
+  else
94084c
+    r = recvmsg (s, &mmhdr.msg_hdr, 0);
94084c
+  TEST_COMPARE (r, sizeof (int));
94084c
+  TEST_COMPARE (payload, exp_payload);
94084c
+
94084c
+  if (cmsg == NULL)
94084c
+    return;
94084c
+
94084c
+  /* A timestamp is expected if 32-bit timestamps are used (supported in every
94084c
+     configuration) or if the underlying kernel supports 64-bit timestamps.
94084c
+     Otherwise recvmsg will need extra space to add the 64-bit timestamp.  */
94084c
+  bool exp_timestamp;
94084c
+  if (sizeof (time_t) == 4 || support_64_timestamp)
94084c
+    exp_timestamp = true;
94084c
+   else
94084c
+    exp_timestamp = slack >= CMSG_SPACE (tsize);
94084c
+
94084c
+  bool timestamp = false;
94084c
+  for (struct cmsghdr *cmsg = CMSG_FIRSTHDR (&mmhdr.msg_hdr);
94084c
+       cmsg != NULL;
94084c
+       cmsg = CMSG_NXTHDR (&mmhdr.msg_hdr, cmsg))
94084c
+    {
94084c
+      if (cmsg->cmsg_level != SOL_SOCKET)
94084c
+	continue;
94084c
+      if (cmsg->cmsg_type == SCM_TIMESTAMP
94084c
+	  && cmsg->cmsg_len == CMSG_LEN (sizeof (struct timeval)))
94084c
+	{
94084c
+	  struct timeval tv;
94084c
+	  memcpy (&tv, CMSG_DATA (cmsg), sizeof (tv));
94084c
+	  if (test_verbose)
94084c
+	    printf ("SCM_TIMESTAMP:   {%jd, %jd}\n", (intmax_t)tv.tv_sec,
94084c
+		    (intmax_t)tv.tv_usec);
94084c
+	  timestamp = true;
94084c
+	}
94084c
+      else if (cmsg->cmsg_type == SCM_TIMESTAMPNS
94084c
+	       && cmsg->cmsg_len == CMSG_LEN (sizeof (struct timespec)))
94084c
+	{
94084c
+	  struct timespec ts;
94084c
+	  memcpy (&ts, CMSG_DATA (cmsg), sizeof (ts));
94084c
+	  if (test_verbose)
94084c
+	    printf ("SCM_TIMESTAMPNS: {%jd, %jd}\n", (intmax_t)ts.tv_sec,
94084c
+		    (intmax_t)ts.tv_nsec);
94084c
+	  timestamp = true;
94084c
+	}
94084c
+    }
94084c
+
94084c
+  TEST_COMPARE (timestamp, exp_timestamp);
94084c
+}
94084c
+
94084c
+/* Check if the extra ancillary space is correctly handled by recvmsg and
94084c
+   recvmmsg with different extra space for the ancillary buffer.  */
94084c
+static void
94084c
+do_test_slack_space (void)
94084c
+{
94084c
+  /* Setup the ancillary data buffer with an extra page with PROT_NONE to
94084c
+     check the possible timestamp conversion on some systems.  */
94084c
+  struct support_next_to_fault nf =
94084c
+    support_next_to_fault_allocate (slack_max_size);
94084c
+  void *msgbuf = nf.buffer + slack_max_size;
94084c
+
94084c
+  /* Enable the timestamp using struct timeval precision.  */
94084c
+  {
94084c
+    int r = setsockopt (srv, SOL_SOCKET, SO_TIMESTAMP, &(int){1},
94084c
+			sizeof (int));
94084c
+    TEST_VERIFY_EXIT (r != -1);
94084c
+  }
94084c
+  /* Check recvmsg.  */
94084c
+  do_sendto (&srv_addr, array_length (slack));
94084c
+  for (int s = 0; s < array_length (slack); s++)
94084c
+    {
94084c
+      memset (nf.buffer, 0x55, nf.length);
94084c
+      do_recvmsg_slack_ancillary (false, srv, msgbuf, slack[s],
94084c
+				  sizeof (struct timeval), s);
94084c
+    }
94084c
+  /* Check recvmmsg.  */
94084c
+  do_sendto (&srv_addr, array_length (slack));
94084c
+  for (int s = 0; s < array_length (slack); s++)
94084c
+    {
94084c
+      memset (nf.buffer, 0x55, nf.length);
94084c
+      do_recvmsg_slack_ancillary (true, srv, msgbuf, slack[s],
94084c
+				  sizeof (struct timeval), s);
94084c
+    }
94084c
+
94084c
+  /* Now enable timestamp using a higher precision, it overwrites the previous
94084c
+     precision.  */
94084c
+  {
94084c
+    int r = setsockopt (srv, SOL_SOCKET, SO_TIMESTAMPNS, &(int){1},
94084c
+			sizeof (int));
94084c
+    TEST_VERIFY_EXIT (r != -1);
94084c
+  }
94084c
+  /* Check recvmsg.  */
94084c
+  do_sendto (&srv_addr, array_length (slack));
94084c
+  for (int s = 0; s < array_length (slack); s++)
94084c
+    do_recvmsg_slack_ancillary (false, srv, msgbuf, slack[s],
94084c
+				sizeof (struct timespec), s);
94084c
+  /* Check recvmmsg.  */
94084c
+  do_sendto (&srv_addr, array_length (slack));
94084c
+  for (int s = 0; s < array_length (slack); s++)
94084c
+    do_recvmsg_slack_ancillary (true, srv, msgbuf, slack[s],
94084c
+				sizeof (struct timespec), s);
94084c
+
94084c
+  support_next_to_fault_free (&nf);
94084c
+}
94084c
+
94084c
+/* Check if the converted 64-bit timestamp is correctly appended when there
94084c
+   are multiple ancillary messages.  */
94084c
+static void
94084c
+do_recvmsg_multiple_ancillary (bool use_multi_call, int s, void *cmsg,
94084c
+			       size_t cmsgsize, int exp_msg)
94084c
+{
94084c
+  int msg;
94084c
+  struct iovec iov =
94084c
+    {
94084c
+      .iov_base = &msg,
94084c
+      .iov_len = sizeof (msg)
94084c
+    };
94084c
+  size_t msgs = cmsgsize;
94084c
+  struct mmsghdr mmhdr =
94084c
+    {
94084c
+      .msg_hdr =
94084c
+      {
94084c
+        .msg_name = NULL,
94084c
+        .msg_namelen = 0,
94084c
+        .msg_iov = &iov,
94084c
+        .msg_iovlen = 1,
94084c
+        .msg_controllen = msgs,
94084c
+        .msg_control = cmsg,
94084c
+      },
94084c
+    };
94084c
+
94084c
+  int r;
94084c
+  if (use_multi_call)
94084c
+    {
94084c
+      r = recvmmsg (s, &mmhdr, 1, 0, NULL);
94084c
+      if (r >= 0)
94084c
+	r = mmhdr.msg_len;
94084c
+    }
94084c
+  else
94084c
+    r = recvmsg (s, &mmhdr.msg_hdr, 0);
94084c
+  TEST_COMPARE (r, sizeof (int));
94084c
+  TEST_COMPARE (msg, exp_msg);
94084c
+
94084c
+  if (cmsg == NULL)
94084c
+    return;
94084c
+
94084c
+  bool timestamp = false;
94084c
+  bool origdstaddr = false;
94084c
+  for (struct cmsghdr *cmsg = CMSG_FIRSTHDR (&mmhdr.msg_hdr);
94084c
+       cmsg != NULL;
94084c
+       cmsg = CMSG_NXTHDR (&mmhdr.msg_hdr, cmsg))
94084c
+    {
94084c
+      if (cmsg->cmsg_level == SOL_IP
94084c
+	  && cmsg->cmsg_type == IP_ORIGDSTADDR
94084c
+	  && cmsg->cmsg_len >= CMSG_LEN (sizeof (struct sockaddr_in)))
94084c
+	{
94084c
+	  struct sockaddr_in sa;
94084c
+	  memcpy (&sa, CMSG_DATA (cmsg), sizeof (sa));
94084c
+	  if (test_verbose)
94084c
+	    {
94084c
+	      char str[INET_ADDRSTRLEN];
94084c
+	      inet_ntop (AF_INET, &sa.sin_addr, str, INET_ADDRSTRLEN);
94084c
+	      printf ("IP_ORIGDSTADDR:  %s:%d\n", str, ntohs (sa.sin_port));
94084c
+	    }
94084c
+	  origdstaddr = sa.sin_addr.s_addr == srv_addr.sin_addr.s_addr
94084c
+			&& sa.sin_port == srv_addr.sin_port;
94084c
+	}
94084c
+      if (cmsg->cmsg_level == SOL_SOCKET
94084c
+	  && cmsg->cmsg_type == SCM_TIMESTAMP
94084c
+	  && cmsg->cmsg_len >= CMSG_LEN (sizeof (struct timeval)))
94084c
+	{
94084c
+	  struct timeval tv;
94084c
+	  memcpy (&tv, CMSG_DATA (cmsg), sizeof (tv));
94084c
+	  if (test_verbose)
94084c
+	    printf ("SCM_TIMESTAMP:   {%jd, %jd}\n", (intmax_t)tv.tv_sec,
94084c
+		    (intmax_t)tv.tv_usec);
94084c
+	  timestamp = true;
94084c
+	}
94084c
+    }
94084c
+
94084c
+  TEST_COMPARE (timestamp, true);
94084c
+  TEST_COMPARE (origdstaddr, true);
94084c
+}
94084c
+
94084c
+static void
94084c
+do_test_multiple_ancillary (void)
94084c
+{
94084c
+  {
94084c
+    int r = setsockopt (srv, SOL_SOCKET, SO_TIMESTAMP, &(int){1},
94084c
+			sizeof (int));
94084c
+    TEST_VERIFY_EXIT (r != -1);
94084c
+  }
94084c
+  {
94084c
+    int r = setsockopt (srv, IPPROTO_IP, IP_RECVORIGDSTADDR, &(int){1},
94084c
+			sizeof (int));
94084c
+    TEST_VERIFY_EXIT (r != -1);
94084c
+  }
94084c
+
94084c
+  /* Enough data for default SO_TIMESTAMP, the IP_RECVORIGDSTADDR, and the
94084c
+     extra 64-bit SO_TIMESTAMP.  */
94084c
+  enum { msgbuflen = CMSG_SPACE (2 * sizeof (uint64_t))
94084c
+		     + CMSG_SPACE (sizeof (struct sockaddr_in))
94084c
+		     + CMSG_SPACE (2 * sizeof (uint64_t)) };
94084c
+  char msgbuf[msgbuflen];
94084c
+
94084c
+  enum { nmsgs = 8 };
94084c
+  /* Check recvmsg.  */
94084c
+  do_sendto (&srv_addr, nmsgs);
94084c
+  for (int s = 0; s < nmsgs; s++)
94084c
+    do_recvmsg_multiple_ancillary (false, srv, msgbuf, msgbuflen, s);
94084c
+  /* Check recvmmsg.  */
94084c
+  do_sendto (&srv_addr, nmsgs);
94084c
+  for (int s = 0; s < nmsgs; s++)
94084c
+    do_recvmsg_multiple_ancillary (true, srv, msgbuf, msgbuflen, s);
94084c
+}
94084c
+
94084c
+static int
94084c
+do_test (void)
94084c
+{
94084c
+  srv = xsocket (AF_INET, SOCK_DGRAM, 0);
94084c
+  srv_addr = (struct sockaddr_in) {
94084c
+    .sin_family = AF_INET,
94084c
+    .sin_addr = {.s_addr = htonl (INADDR_LOOPBACK) },
94084c
+  };
94084c
+  xbind (srv, (struct sockaddr *) &srv_addr, sizeof (srv_addr));
94084c
+  {
94084c
+    socklen_t sa_len = sizeof (srv_addr);
94084c
+    xgetsockname (srv, (struct sockaddr *) &srv_addr, &sa_len);
94084c
+    TEST_VERIFY (sa_len == sizeof (srv_addr));
94084c
+  }
94084c
+
94084c
+  TEST_COMPARE (recvmsg (-1, NULL, 0), -1);
94084c
+  TEST_COMPARE (errno, EBADF);
94084c
+  TEST_COMPARE (recvmmsg (-1, NULL, 0, 0, NULL), -1);
94084c
+  TEST_COMPARE (errno, EBADF);
94084c
+
94084c
+  /* Record whether the underlying kernel supports 64-bit timestamps.  */
94084c
+  support_64_timestamp = support_socket_so_timestamp_time64 (srv);
94084c
+
94084c
+  do_test_slack_space ();
94084c
+  do_test_multiple_ancillary ();
94084c
+
94084c
+  xclose (srv);
94084c
+
94084c
+  return 0;
94084c
+}
94084c
+
94084c
+#include <support/test-driver.c>