93dc2d
commit e098446037da532d4a250efac9a813bc22f3669f
93dc2d
Author: Adhemerval Zanella <adhemerval.zanella@linaro.org>
93dc2d
Date:   Mon Jan 24 08:55:53 2022 -0300
93dc2d
93dc2d
    linux: Fix ancillary 64-bit time timestamp conversion (BZ #28349, BZ#28350)
93dc2d
    
93dc2d
    The __convert_scm_timestamps only updates the control message last
93dc2d
    pointer for SOL_SOCKET type, so if the message control buffer contains
93dc2d
    multiple ancillary message types the converted timestamp one might
93dc2d
    overwrite a valid message.
93dc2d
    
93dc2d
    The test checks if the extra ancillary space is correctly handled
93dc2d
    by recvmsg/recvmmsg, where if there is no extra space for the 64-bit
93dc2d
    time_t converted message the control buffer should be marked with
93dc2d
    MSG_TRUNC.  It also checks if recvmsg/recvmmsg correctly handle multiple
93dc2d
    ancillary data.
93dc2d
    
93dc2d
    Checked on x86_64-linux and on i686-linux-gnu on both 5.11 and
93dc2d
    4.15 kernel.
93dc2d
    
93dc2d
    Co-authored-by: Fabian Vogt <fvogt@suse.de>
93dc2d
    
93dc2d
    Reviewed-by: Florian Weimer <fweimer@redhat.com>
93dc2d
    
93dc2d
    (cherry picked from commit 8fba672472ae0055387e9315fc2eddfa6775ca79)
93dc2d
93dc2d
diff --git a/sysdeps/unix/sysv/linux/Makefile b/sysdeps/unix/sysv/linux/Makefile
93dc2d
index cdc01a3f023ec09a..7c75e22c6d0e9ff5 100644
93dc2d
--- a/sysdeps/unix/sysv/linux/Makefile
93dc2d
+++ b/sysdeps/unix/sysv/linux/Makefile
93dc2d
@@ -273,6 +273,9 @@ sysdep_routines += cmsg_nxthdr
93dc2d
 CFLAGS-recvmmsg.c = -fexceptions -fasynchronous-unwind-tables
93dc2d
 CFLAGS-sendmmsg.c = -fexceptions -fasynchronous-unwind-tables
93dc2d
 
93dc2d
+tests += tst-socket-timestamp
93dc2d
+tests-time64 += tst-socket-timestamp-time64
93dc2d
+
93dc2d
 tests-special += $(objpfx)tst-socket-consts.out
93dc2d
 $(objpfx)tst-socket-consts.out: ../sysdeps/unix/sysv/linux/tst-socket-consts.py
93dc2d
 	PYTHONPATH=../scripts \
93dc2d
diff --git a/sysdeps/unix/sysv/linux/convert_scm_timestamps.c b/sysdeps/unix/sysv/linux/convert_scm_timestamps.c
93dc2d
index 00c934c4135f0d42..5d3c4199e0b32944 100644
93dc2d
--- a/sysdeps/unix/sysv/linux/convert_scm_timestamps.c
93dc2d
+++ b/sysdeps/unix/sysv/linux/convert_scm_timestamps.c
93dc2d
@@ -54,6 +54,8 @@ __convert_scm_timestamps (struct msghdr *msg, socklen_t msgsize)
93dc2d
        cmsg != NULL;
93dc2d
        cmsg = CMSG_NXTHDR (msg, cmsg))
93dc2d
     {
93dc2d
+      last = cmsg;
93dc2d
+
93dc2d
       if (cmsg->cmsg_level != SOL_SOCKET)
93dc2d
 	continue;
93dc2d
 
93dc2d
@@ -75,11 +77,9 @@ __convert_scm_timestamps (struct msghdr *msg, socklen_t msgsize)
93dc2d
 	  tvts[1] = tmp[1];
93dc2d
 	  break;
93dc2d
 	}
93dc2d
-
93dc2d
-      last = cmsg;
93dc2d
     }
93dc2d
 
93dc2d
-  if (last == NULL || type == 0)
93dc2d
+  if (type == 0)
93dc2d
     return;
93dc2d
 
93dc2d
   if (CMSG_SPACE (sizeof tvts) > msgsize - msg->msg_controllen)
93dc2d
@@ -88,10 +88,12 @@ __convert_scm_timestamps (struct msghdr *msg, socklen_t msgsize)
93dc2d
       return;
93dc2d
     }
93dc2d
 
93dc2d
+  /* Zero memory for the new cmsghdr, so reading cmsg_len field
93dc2d
+     by CMSG_NXTHDR does not trigger UB.  */
93dc2d
+  memset (msg->msg_control + msg->msg_controllen, 0,
93dc2d
+	  CMSG_SPACE (sizeof tvts));
93dc2d
   msg->msg_controllen += CMSG_SPACE (sizeof tvts);
93dc2d
-  cmsg = CMSG_NXTHDR(msg, last);
93dc2d
-  if (cmsg == NULL)
93dc2d
-    return;
93dc2d
+  cmsg = CMSG_NXTHDR (msg, last);
93dc2d
   cmsg->cmsg_level = SOL_SOCKET;
93dc2d
   cmsg->cmsg_type = type;
93dc2d
   cmsg->cmsg_len = CMSG_LEN (sizeof tvts);
93dc2d
diff --git a/sysdeps/unix/sysv/linux/tst-socket-timestamp-time64.c b/sysdeps/unix/sysv/linux/tst-socket-timestamp-time64.c
93dc2d
new file mode 100644
93dc2d
index 0000000000000000..ae424c2a70026cf5
93dc2d
--- /dev/null
93dc2d
+++ b/sysdeps/unix/sysv/linux/tst-socket-timestamp-time64.c
93dc2d
@@ -0,0 +1 @@
93dc2d
+#include "tst-socket-timestamp.c"
93dc2d
diff --git a/sysdeps/unix/sysv/linux/tst-socket-timestamp.c b/sysdeps/unix/sysv/linux/tst-socket-timestamp.c
93dc2d
new file mode 100644
93dc2d
index 0000000000000000..9c2e76f7e27bd312
93dc2d
--- /dev/null
93dc2d
+++ b/sysdeps/unix/sysv/linux/tst-socket-timestamp.c
93dc2d
@@ -0,0 +1,336 @@
93dc2d
+/* Check recvmsg/recvmmsg 64-bit timestamp support.
93dc2d
+   Copyright (C) 2022 Free Software Foundation, Inc.
93dc2d
+   This file is part of the GNU C Library.
93dc2d
+
93dc2d
+   The GNU C Library is free software; you can redistribute it and/or
93dc2d
+   modify it under the terms of the GNU Lesser General Public
93dc2d
+   License as published by the Free Software Foundation; either
93dc2d
+   version 2.1 of the License, or (at your option) any later version.
93dc2d
+
93dc2d
+   The GNU C Library is distributed in the hope that it will be useful,
93dc2d
+   but WITHOUT ANY WARRANTY; without even the implied warranty of
93dc2d
+   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
93dc2d
+   Lesser General Public License for more details.
93dc2d
+
93dc2d
+   You should have received a copy of the GNU Lesser General Public
93dc2d
+   License along with the GNU C Library; if not, see
93dc2d
+   <https://www.gnu.org/licenses/>.  */
93dc2d
+
93dc2d
+#include <array_length.h>
93dc2d
+#include <arpa/inet.h>
93dc2d
+#include <errno.h>
93dc2d
+#include <string.h>
93dc2d
+#include <stdio.h>
93dc2d
+#include <support/check.h>
93dc2d
+#include <support/next_to_fault.h>
93dc2d
+#include <support/support.h>
93dc2d
+#include <support/test-driver.h>
93dc2d
+#include <support/xunistd.h>
93dc2d
+#include <support/xsocket.h>
93dc2d
+#include <sys/mman.h>
93dc2d
+
93dc2d
+/* Some extra space added for ancillary data, it might be used to convert
93dc2d
+   32-bit timestamp to 64-bit for _TIME_BITS=64.  */
93dc2d
+enum { slack_max_size = 64 };
93dc2d
+static const int slack[] = { 0, 4, 8, 16, 32, slack_max_size };
93dc2d
+
93dc2d
+static bool support_64_timestamp;
93dc2d
+/* AF_INET socket and address used to receive data.  */
93dc2d
+static int srv;
93dc2d
+static struct sockaddr_in srv_addr;
93dc2d
+
93dc2d
+static int
93dc2d
+do_sendto (const struct sockaddr_in *addr, int nmsgs)
93dc2d
+{
93dc2d
+  int s = xsocket (AF_INET, SOCK_DGRAM | SOCK_CLOEXEC, 0);
93dc2d
+  xconnect (s, (const struct sockaddr *) addr, sizeof (*addr));
93dc2d
+
93dc2d
+  for (int i = 0; i < nmsgs; i++)
93dc2d
+    xsendto (s, &i, sizeof (i), 0, (const struct sockaddr *) addr,
93dc2d
+	     sizeof (*addr));
93dc2d
+
93dc2d
+  xclose (s);
93dc2d
+
93dc2d
+  return 0;
93dc2d
+}
93dc2d
+
93dc2d
+static void
93dc2d
+do_recvmsg_slack_ancillary (bool use_multi_call, int s, void *cmsg,
93dc2d
+			    size_t slack, size_t tsize, int exp_payload)
93dc2d
+{
93dc2d
+  int payload;
93dc2d
+  struct iovec iov =
93dc2d
+    {
93dc2d
+      .iov_base = &payload,
93dc2d
+      .iov_len = sizeof (payload)
93dc2d
+    };
93dc2d
+  size_t msg_controllen = CMSG_SPACE (tsize) + slack;
93dc2d
+  char *msg_control = cmsg - msg_controllen;
93dc2d
+  memset (msg_control, 0x55, msg_controllen);
93dc2d
+  struct mmsghdr mmhdr =
93dc2d
+    {
93dc2d
+      .msg_hdr =
93dc2d
+      {
93dc2d
+        .msg_name = NULL,
93dc2d
+        .msg_namelen = 0,
93dc2d
+        .msg_iov = &iov,
93dc2d
+        .msg_iovlen = 1,
93dc2d
+        .msg_control = msg_control,
93dc2d
+        .msg_controllen = msg_controllen
93dc2d
+      },
93dc2d
+    };
93dc2d
+
93dc2d
+  int r;
93dc2d
+  if (use_multi_call)
93dc2d
+    {
93dc2d
+      r = recvmmsg (s, &mmhdr, 1, 0, NULL);
93dc2d
+      if (r >= 0)
93dc2d
+	r = mmhdr.msg_len;
93dc2d
+    }
93dc2d
+  else
93dc2d
+    r = recvmsg (s, &mmhdr.msg_hdr, 0);
93dc2d
+  TEST_COMPARE (r, sizeof (int));
93dc2d
+  TEST_COMPARE (payload, exp_payload);
93dc2d
+
93dc2d
+  if (cmsg == NULL)
93dc2d
+    return;
93dc2d
+
93dc2d
+  /* A timestamp is expected if 32-bit timestamps are used (supported in every
93dc2d
+     configuration) or if the underlying kernel supports 64-bit timestamps.
93dc2d
+     Otherwise recvmsg will need extra space to add the 64-bit timestamp.  */
93dc2d
+  bool exp_timestamp;
93dc2d
+  if (sizeof (time_t) == 4 || support_64_timestamp)
93dc2d
+    exp_timestamp = true;
93dc2d
+   else
93dc2d
+    exp_timestamp = slack >= CMSG_SPACE (tsize);
93dc2d
+
93dc2d
+  bool timestamp = false;
93dc2d
+  for (struct cmsghdr *cmsg = CMSG_FIRSTHDR (&mmhdr.msg_hdr);
93dc2d
+       cmsg != NULL;
93dc2d
+       cmsg = CMSG_NXTHDR (&mmhdr.msg_hdr, cmsg))
93dc2d
+    {
93dc2d
+      if (cmsg->cmsg_level != SOL_SOCKET)
93dc2d
+	continue;
93dc2d
+      if (cmsg->cmsg_type == SCM_TIMESTAMP
93dc2d
+	  && cmsg->cmsg_len == CMSG_LEN (sizeof (struct timeval)))
93dc2d
+	{
93dc2d
+	  struct timeval tv;
93dc2d
+	  memcpy (&tv, CMSG_DATA (cmsg), sizeof (tv));
93dc2d
+	  if (test_verbose)
93dc2d
+	    printf ("SCM_TIMESTAMP:   {%jd, %jd}\n", (intmax_t)tv.tv_sec,
93dc2d
+		    (intmax_t)tv.tv_usec);
93dc2d
+	  timestamp = true;
93dc2d
+	}
93dc2d
+      else if (cmsg->cmsg_type == SCM_TIMESTAMPNS
93dc2d
+	       && cmsg->cmsg_len == CMSG_LEN (sizeof (struct timespec)))
93dc2d
+	{
93dc2d
+	  struct timespec ts;
93dc2d
+	  memcpy (&ts, CMSG_DATA (cmsg), sizeof (ts));
93dc2d
+	  if (test_verbose)
93dc2d
+	    printf ("SCM_TIMESTAMPNS: {%jd, %jd}\n", (intmax_t)ts.tv_sec,
93dc2d
+		    (intmax_t)ts.tv_nsec);
93dc2d
+	  timestamp = true;
93dc2d
+	}
93dc2d
+    }
93dc2d
+
93dc2d
+  TEST_COMPARE (timestamp, exp_timestamp);
93dc2d
+}
93dc2d
+
93dc2d
+/* Check if the extra ancillary space is correctly handled by recvmsg and
93dc2d
+   recvmmsg with different extra space for the ancillary buffer.  */
93dc2d
+static void
93dc2d
+do_test_slack_space (void)
93dc2d
+{
93dc2d
+  /* Setup the ancillary data buffer with an extra page with PROT_NONE to
93dc2d
+     check the possible timestamp conversion on some systems.  */
93dc2d
+  struct support_next_to_fault nf =
93dc2d
+    support_next_to_fault_allocate (slack_max_size);
93dc2d
+  void *msgbuf = nf.buffer + slack_max_size;
93dc2d
+
93dc2d
+  /* Enable the timestamp using struct timeval precision.  */
93dc2d
+  {
93dc2d
+    int r = setsockopt (srv, SOL_SOCKET, SO_TIMESTAMP, &(int){1},
93dc2d
+			sizeof (int));
93dc2d
+    TEST_VERIFY_EXIT (r != -1);
93dc2d
+  }
93dc2d
+  /* Check recvmsg.  */
93dc2d
+  do_sendto (&srv_addr, array_length (slack));
93dc2d
+  for (int s = 0; s < array_length (slack); s++)
93dc2d
+    {
93dc2d
+      memset (nf.buffer, 0x55, nf.length);
93dc2d
+      do_recvmsg_slack_ancillary (false, srv, msgbuf, slack[s],
93dc2d
+				  sizeof (struct timeval), s);
93dc2d
+    }
93dc2d
+  /* Check recvmmsg.  */
93dc2d
+  do_sendto (&srv_addr, array_length (slack));
93dc2d
+  for (int s = 0; s < array_length (slack); s++)
93dc2d
+    {
93dc2d
+      memset (nf.buffer, 0x55, nf.length);
93dc2d
+      do_recvmsg_slack_ancillary (true, srv, msgbuf, slack[s],
93dc2d
+				  sizeof (struct timeval), s);
93dc2d
+    }
93dc2d
+
93dc2d
+  /* Now enable timestamp using a higher precision, it overwrites the previous
93dc2d
+     precision.  */
93dc2d
+  {
93dc2d
+    int r = setsockopt (srv, SOL_SOCKET, SO_TIMESTAMPNS, &(int){1},
93dc2d
+			sizeof (int));
93dc2d
+    TEST_VERIFY_EXIT (r != -1);
93dc2d
+  }
93dc2d
+  /* Check recvmsg.  */
93dc2d
+  do_sendto (&srv_addr, array_length (slack));
93dc2d
+  for (int s = 0; s < array_length (slack); s++)
93dc2d
+    do_recvmsg_slack_ancillary (false, srv, msgbuf, slack[s],
93dc2d
+				sizeof (struct timespec), s);
93dc2d
+  /* Check recvmmsg.  */
93dc2d
+  do_sendto (&srv_addr, array_length (slack));
93dc2d
+  for (int s = 0; s < array_length (slack); s++)
93dc2d
+    do_recvmsg_slack_ancillary (true, srv, msgbuf, slack[s],
93dc2d
+				sizeof (struct timespec), s);
93dc2d
+
93dc2d
+  support_next_to_fault_free (&nf);
93dc2d
+}
93dc2d
+
93dc2d
+/* Check if the converted 64-bit timestamp is correctly appended when there
93dc2d
+   are multiple ancillary messages.  */
93dc2d
+static void
93dc2d
+do_recvmsg_multiple_ancillary (bool use_multi_call, int s, void *cmsg,
93dc2d
+			       size_t cmsgsize, int exp_msg)
93dc2d
+{
93dc2d
+  int msg;
93dc2d
+  struct iovec iov =
93dc2d
+    {
93dc2d
+      .iov_base = &msg,
93dc2d
+      .iov_len = sizeof (msg)
93dc2d
+    };
93dc2d
+  size_t msgs = cmsgsize;
93dc2d
+  struct mmsghdr mmhdr =
93dc2d
+    {
93dc2d
+      .msg_hdr =
93dc2d
+      {
93dc2d
+        .msg_name = NULL,
93dc2d
+        .msg_namelen = 0,
93dc2d
+        .msg_iov = &iov,
93dc2d
+        .msg_iovlen = 1,
93dc2d
+        .msg_controllen = msgs,
93dc2d
+        .msg_control = cmsg,
93dc2d
+      },
93dc2d
+    };
93dc2d
+
93dc2d
+  int r;
93dc2d
+  if (use_multi_call)
93dc2d
+    {
93dc2d
+      r = recvmmsg (s, &mmhdr, 1, 0, NULL);
93dc2d
+      if (r >= 0)
93dc2d
+	r = mmhdr.msg_len;
93dc2d
+    }
93dc2d
+  else
93dc2d
+    r = recvmsg (s, &mmhdr.msg_hdr, 0);
93dc2d
+  TEST_COMPARE (r, sizeof (int));
93dc2d
+  TEST_COMPARE (msg, exp_msg);
93dc2d
+
93dc2d
+  if (cmsg == NULL)
93dc2d
+    return;
93dc2d
+
93dc2d
+  bool timestamp = false;
93dc2d
+  bool origdstaddr = false;
93dc2d
+  for (struct cmsghdr *cmsg = CMSG_FIRSTHDR (&mmhdr.msg_hdr);
93dc2d
+       cmsg != NULL;
93dc2d
+       cmsg = CMSG_NXTHDR (&mmhdr.msg_hdr, cmsg))
93dc2d
+    {
93dc2d
+      if (cmsg->cmsg_level == SOL_IP
93dc2d
+	  && cmsg->cmsg_type == IP_ORIGDSTADDR
93dc2d
+	  && cmsg->cmsg_len >= CMSG_LEN (sizeof (struct sockaddr_in)))
93dc2d
+	{
93dc2d
+	  struct sockaddr_in sa;
93dc2d
+	  memcpy (&sa, CMSG_DATA (cmsg), sizeof (sa));
93dc2d
+	  if (test_verbose)
93dc2d
+	    {
93dc2d
+	      char str[INET_ADDRSTRLEN];
93dc2d
+	      inet_ntop (AF_INET, &sa.sin_addr, str, INET_ADDRSTRLEN);
93dc2d
+	      printf ("IP_ORIGDSTADDR:  %s:%d\n", str, ntohs (sa.sin_port));
93dc2d
+	    }
93dc2d
+	  origdstaddr = sa.sin_addr.s_addr == srv_addr.sin_addr.s_addr
93dc2d
+			&& sa.sin_port == srv_addr.sin_port;
93dc2d
+	}
93dc2d
+      if (cmsg->cmsg_level == SOL_SOCKET
93dc2d
+	  && cmsg->cmsg_type == SCM_TIMESTAMP
93dc2d
+	  && cmsg->cmsg_len >= CMSG_LEN (sizeof (struct timeval)))
93dc2d
+	{
93dc2d
+	  struct timeval tv;
93dc2d
+	  memcpy (&tv, CMSG_DATA (cmsg), sizeof (tv));
93dc2d
+	  if (test_verbose)
93dc2d
+	    printf ("SCM_TIMESTAMP:   {%jd, %jd}\n", (intmax_t)tv.tv_sec,
93dc2d
+		    (intmax_t)tv.tv_usec);
93dc2d
+	  timestamp = true;
93dc2d
+	}
93dc2d
+    }
93dc2d
+
93dc2d
+  TEST_COMPARE (timestamp, true);
93dc2d
+  TEST_COMPARE (origdstaddr, true);
93dc2d
+}
93dc2d
+
93dc2d
+static void
93dc2d
+do_test_multiple_ancillary (void)
93dc2d
+{
93dc2d
+  {
93dc2d
+    int r = setsockopt (srv, SOL_SOCKET, SO_TIMESTAMP, &(int){1},
93dc2d
+			sizeof (int));
93dc2d
+    TEST_VERIFY_EXIT (r != -1);
93dc2d
+  }
93dc2d
+  {
93dc2d
+    int r = setsockopt (srv, IPPROTO_IP, IP_RECVORIGDSTADDR, &(int){1},
93dc2d
+			sizeof (int));
93dc2d
+    TEST_VERIFY_EXIT (r != -1);
93dc2d
+  }
93dc2d
+
93dc2d
+  /* Enough data for default SO_TIMESTAMP, the IP_RECVORIGDSTADDR, and the
93dc2d
+     extra 64-bit SO_TIMESTAMP.  */
93dc2d
+  enum { msgbuflen = CMSG_SPACE (2 * sizeof (uint64_t))
93dc2d
+		     + CMSG_SPACE (sizeof (struct sockaddr_in))
93dc2d
+		     + CMSG_SPACE (2 * sizeof (uint64_t)) };
93dc2d
+  char msgbuf[msgbuflen];
93dc2d
+
93dc2d
+  enum { nmsgs = 8 };
93dc2d
+  /* Check recvmsg.  */
93dc2d
+  do_sendto (&srv_addr, nmsgs);
93dc2d
+  for (int s = 0; s < nmsgs; s++)
93dc2d
+    do_recvmsg_multiple_ancillary (false, srv, msgbuf, msgbuflen, s);
93dc2d
+  /* Check recvmmsg.  */
93dc2d
+  do_sendto (&srv_addr, nmsgs);
93dc2d
+  for (int s = 0; s < nmsgs; s++)
93dc2d
+    do_recvmsg_multiple_ancillary (true, srv, msgbuf, msgbuflen, s);
93dc2d
+}
93dc2d
+
93dc2d
+static int
93dc2d
+do_test (void)
93dc2d
+{
93dc2d
+  srv = xsocket (AF_INET, SOCK_DGRAM, 0);
93dc2d
+  srv_addr = (struct sockaddr_in) {
93dc2d
+    .sin_family = AF_INET,
93dc2d
+    .sin_addr = {.s_addr = htonl (INADDR_LOOPBACK) },
93dc2d
+  };
93dc2d
+  xbind (srv, (struct sockaddr *) &srv_addr, sizeof (srv_addr));
93dc2d
+  {
93dc2d
+    socklen_t sa_len = sizeof (srv_addr);
93dc2d
+    xgetsockname (srv, (struct sockaddr *) &srv_addr, &sa_len);
93dc2d
+    TEST_VERIFY (sa_len == sizeof (srv_addr));
93dc2d
+  }
93dc2d
+
93dc2d
+  TEST_COMPARE (recvmsg (-1, NULL, 0), -1);
93dc2d
+  TEST_COMPARE (errno, EBADF);
93dc2d
+  TEST_COMPARE (recvmmsg (-1, NULL, 0, 0, NULL), -1);
93dc2d
+  TEST_COMPARE (errno, EBADF);
93dc2d
+
93dc2d
+  /* Check if the underlying kernel supports 64-bit timestamps.  */
93dc2d
+  support_64_timestamp = support_socket_so_timestamp_time64 (srv);
93dc2d
+
93dc2d
+  do_test_slack_space ();
93dc2d
+  do_test_multiple_ancillary ();
93dc2d
+
93dc2d
+  xclose (srv);
93dc2d
+
93dc2d
+  return 0;
93dc2d
+}
93dc2d
+
93dc2d
+#include <support/test-driver.c>