[PATCH v4] socket: Check lengths before advancing pointer in CMSG_NXTHDR
Siddhesh Poyarekar
siddhesh@gotplt.org
Fri Jul 29 16:40:43 GMT 2022
On 2022-07-29 09:26, Arjun Shankar wrote:
> The inline and library functions that the CMSG_NXTHDR macro may expand
> to increment the pointer to the header before checking the stride of
> the increment against available space. Since C only allows incrementing
> pointers to one past the end of an array, the increment must be done
> after a length check. This commit fixes that and includes a regression
> test for CMSG_FIRSTHDR and CMSG_NXTHDR.
>
> The Linux, Hurd, and generic headers are all changed.
>
> Tested on Linux on armv7hl, i686, x86_64, aarch64, ppc64le, and s390x.
>
> [BZ #28846]
> ---
> v3: https://sourceware.org/pipermail/libc-alpha/2022-July/140854.html
>
> Notes on v4:
>
> * Addressed review comments from Siddhesh:
>
> 1. (sizeof (struct cmsghdr) + __CMSG_PADDING (cmsg_len)):
> defined as size_needed.
>
> 2.
>> OK, but I wonder if there's utility in making the padding a generic
>> macro, e.g.
>
>> #define ALIGN_PADDING(n, a) ((a - (n & (a - 1))) & (a - 1))
>
> This sounds useful, and actually it would be great to move *all* of the
> duplicate code between these versions into a separate file and include it
> in these variants. I'll try to do a follow-up with this soon. I'm going to
> note it down in my TODO.
>
> 3.
>> __msg_control_ptr doesn't really need the __ since it's a local variable.
>
> I thought so too. But Florian pointed out that it would interfere with
> things like users #define'ing msg_control_ptr before including socket.h.
> ---
> bits/socket.h | 40 ++++++++++--
> socket/Makefile | 1 +
> socket/tst-cmsghdr-skeleton.c | 92 +++++++++++++++++++++++++++
> socket/tst-cmsghdr.c | 56 ++++++++++++++++
> sysdeps/mach/hurd/bits/socket.h | 40 ++++++++++--
> sysdeps/unix/sysv/linux/bits/socket.h | 40 ++++++++++--
> sysdeps/unix/sysv/linux/cmsg_nxthdr.c | 36 ++++++++---
> 7 files changed, 276 insertions(+), 29 deletions(-)
> create mode 100644 socket/tst-cmsghdr-skeleton.c
> create mode 100644 socket/tst-cmsghdr.c
LGTM.
Reviewed-by: Siddhesh Poyarekar <siddhesh@sourceware.org>
>
> diff --git a/bits/socket.h b/bits/socket.h
> index 2b99dea33b..aac8c49b00 100644
> --- a/bits/socket.h
> +++ b/bits/socket.h
> @@ -245,6 +245,12 @@ struct cmsghdr
> + CMSG_ALIGN (sizeof (struct cmsghdr)))
> #define CMSG_LEN(len) (CMSG_ALIGN (sizeof (struct cmsghdr)) + (len))
>
> +/* Given a length, return the additional padding necessary such that
> + len + __CMSG_PADDING(len) == CMSG_ALIGN (len). */
> +#define __CMSG_PADDING(len) ((sizeof (size_t) \
> + - ((len) & (sizeof (size_t) - 1))) \
> + & (sizeof (size_t) - 1))
> +
> extern struct cmsghdr *__cmsg_nxthdr (struct msghdr *__mhdr,
> struct cmsghdr *__cmsg) __THROW;
> #ifdef __USE_EXTERN_INLINES
> @@ -254,18 +260,38 @@ extern struct cmsghdr *__cmsg_nxthdr (struct msghdr *__mhdr,
> _EXTERN_INLINE struct cmsghdr *
> __NTH (__cmsg_nxthdr (struct msghdr *__mhdr, struct cmsghdr *__cmsg))
> {
> + /* We may safely assume that __cmsg lies between __mhdr->msg_control and
> + __mhdr->msg_controllen because the user is required to obtain the first
> + cmsg via CMSG_FIRSTHDR, set its length, then obtain subsequent cmsgs
> + via CMSG_NXTHDR, setting lengths along the way. However, we don't yet
> + trust the value of __cmsg->cmsg_len and therefore do not use it in any
> + pointer arithmetic until we check its value. */
> +
> + unsigned char * __msg_control_ptr = (unsigned char *) __mhdr->msg_control;
> + unsigned char * __cmsg_ptr = (unsigned char *) __cmsg;
> +
> + size_t __size_needed = sizeof (struct cmsghdr)
> + + __CMSG_PADDING (__cmsg->cmsg_len);
> +
> + /* The current header is malformed, too small to be a full header. */
> if ((size_t) __cmsg->cmsg_len < sizeof (struct cmsghdr))
> - /* The kernel header does this so there may be a reason. */
> return (struct cmsghdr *) 0;
>
> + /* There isn't enough space between __cmsg and the end of the buffer to
> + hold the current cmsg *and* the next one. */
> + if (((size_t)
> + (__msg_control_ptr + __mhdr->msg_controllen - __cmsg_ptr)
> + < __size_needed)
> + || ((size_t)
> + (__msg_control_ptr + __mhdr->msg_controllen - __cmsg_ptr
> + - __size_needed)
> + < __cmsg->cmsg_len))
> +
> + return (struct cmsghdr *) 0;
> +
> + /* Now, we trust cmsg_len and can use it to find the next header. */
> __cmsg = (struct cmsghdr *) ((unsigned char *) __cmsg
> + CMSG_ALIGN (__cmsg->cmsg_len));
> - if ((unsigned char *) (__cmsg + 1) > ((unsigned char *) __mhdr->msg_control
> - + __mhdr->msg_controllen)
> - || ((unsigned char *) __cmsg + CMSG_ALIGN (__cmsg->cmsg_len)
> - > ((unsigned char *) __mhdr->msg_control + __mhdr->msg_controllen)))
> - /* No more entries. */
> - return (struct cmsghdr *) 0;
> return __cmsg;
> }
> #endif /* Use `extern inline'. */
> diff --git a/socket/Makefile b/socket/Makefile
> index 156eec6c85..2bde78387f 100644
> --- a/socket/Makefile
> +++ b/socket/Makefile
> @@ -34,6 +34,7 @@ routines := accept bind connect getpeername getsockname getsockopt \
> tests := \
> tst-accept4 \
> tst-sockopt \
> + tst-cmsghdr \
> # tests
>
> tests-internal := \
> diff --git a/socket/tst-cmsghdr-skeleton.c b/socket/tst-cmsghdr-skeleton.c
> new file mode 100644
> index 0000000000..4c6898569b
> --- /dev/null
> +++ b/socket/tst-cmsghdr-skeleton.c
> @@ -0,0 +1,92 @@
> +/* Test ancillary data header creation.
> + Copyright (C) 2022 Free Software Foundation, Inc.
> + This file is part of the GNU C Library.
> +
> + The GNU C Library is free software; you can redistribute it and/or
> + modify it under the terms of the GNU Lesser General Public
> + License as published by the Free Software Foundation; either
> + version 2.1 of the License, or (at your option) any later version.
> +
> + The GNU C Library is distributed in the hope that it will be useful,
> + but WITHOUT ANY WARRANTY; without even the implied warranty of
> + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
> + Lesser General Public License for more details.
> +
> + You should have received a copy of the GNU Lesser General Public
> + License along with the GNU C Library; if not, see
> + <https://www.gnu.org/licenses/>. */
> +
> +/* We use the preprocessor to generate the function/macro tests instead of
> + using indirection because having all the macro expansions alongside
> + each other lets the compiler warn us about suspicious pointer
> + arithmetic across subsequent CMSG_{FIRST,NXT}HDR expansions. */
> +
> +#include <stdint.h>
> +
> +#define RUN_TEST_CONCAT(suffix) run_test_##suffix
> +#define RUN_TEST_FUNCNAME(suffix) RUN_TEST_CONCAT (suffix)
> +
> +static void
> +RUN_TEST_FUNCNAME (CMSG_NXTHDR_IMPL) (void)
> +{
> + struct msghdr m = {0};
> + struct cmsghdr *cmsg;
> + char cmsgbuf[3 * CMSG_SPACE (sizeof (PAYLOAD))] = {0};
> +
> + m.msg_control = cmsgbuf;
> + m.msg_controllen = sizeof (cmsgbuf);
> +
> + /* First header should point to the start of the buffer. */
> + cmsg = CMSG_FIRSTHDR (&m);
> + TEST_VERIFY_EXIT ((char *) cmsg == cmsgbuf);
> +
> + /* If the first header length consumes the entire buffer, there is no
> + space remaining for additional headers. */
> + cmsg->cmsg_len = sizeof (cmsgbuf);
> + cmsg = CMSG_NXTHDR_IMPL (&m, cmsg);
> + TEST_VERIFY_EXIT (cmsg == NULL);
> +
> + /* The first header length is so big, using it would cause an overflow. */
> + cmsg = CMSG_FIRSTHDR (&m);
> + TEST_VERIFY_EXIT ((char *) cmsg == cmsgbuf);
> + cmsg->cmsg_len = SIZE_MAX;
> + cmsg = CMSG_NXTHDR_IMPL (&m, cmsg);
> + TEST_VERIFY_EXIT (cmsg == NULL);
> +
> + /* The first header leaves just enough space to hold another header. */
> + cmsg = CMSG_FIRSTHDR (&m);
> + TEST_VERIFY_EXIT ((char *) cmsg == cmsgbuf);
> + cmsg->cmsg_len = sizeof (cmsgbuf) - sizeof (struct cmsghdr);
> + cmsg = CMSG_NXTHDR_IMPL (&m, cmsg);
> + TEST_VERIFY_EXIT (cmsg != NULL);
> +
> + /* The first header leaves space but not enough for another header. */
> + cmsg = CMSG_FIRSTHDR (&m);
> + TEST_VERIFY_EXIT ((char *) cmsg == cmsgbuf);
> + cmsg->cmsg_len ++;
> + cmsg = CMSG_NXTHDR_IMPL (&m, cmsg);
> + TEST_VERIFY_EXIT (cmsg == NULL);
> +
> + /* The second header leaves just enough space to hold another header. */
> + cmsg = CMSG_FIRSTHDR (&m);
> + TEST_VERIFY_EXIT ((char *) cmsg == cmsgbuf);
> + cmsg->cmsg_len = CMSG_LEN (sizeof (PAYLOAD));
> + cmsg = CMSG_NXTHDR_IMPL (&m, cmsg);
> + TEST_VERIFY_EXIT (cmsg != NULL);
> + cmsg->cmsg_len = sizeof (cmsgbuf)
> + - CMSG_SPACE (sizeof (PAYLOAD)) /* First header. */
> + - sizeof (struct cmsghdr);
> + cmsg = CMSG_NXTHDR_IMPL (&m, cmsg);
> + TEST_VERIFY_EXIT (cmsg != NULL);
> +
> + /* The second header leaves space but not enough for another header. */
> + cmsg = CMSG_FIRSTHDR (&m);
> + TEST_VERIFY_EXIT ((char *) cmsg == cmsgbuf);
> + cmsg = CMSG_NXTHDR_IMPL (&m, cmsg);
> + TEST_VERIFY_EXIT (cmsg != NULL);
> + cmsg->cmsg_len ++;
> + cmsg = CMSG_NXTHDR_IMPL (&m, cmsg);
> + TEST_VERIFY_EXIT (cmsg == NULL);
> +
> + return;
> +}
> diff --git a/socket/tst-cmsghdr.c b/socket/tst-cmsghdr.c
> new file mode 100644
> index 0000000000..68c96d3c9d
> --- /dev/null
> +++ b/socket/tst-cmsghdr.c
> @@ -0,0 +1,56 @@
> +/* Test ancillary data header creation.
> + Copyright (C) 2022 Free Software Foundation, Inc.
> + This file is part of the GNU C Library.
> +
> + The GNU C Library is free software; you can redistribute it and/or
> + modify it under the terms of the GNU Lesser General Public
> + License as published by the Free Software Foundation; either
> + version 2.1 of the License, or (at your option) any later version.
> +
> + The GNU C Library is distributed in the hope that it will be useful,
> + but WITHOUT ANY WARRANTY; without even the implied warranty of
> + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
> + Lesser General Public License for more details.
> +
> + You should have received a copy of the GNU Lesser General Public
> + License along with the GNU C Library; if not, see
> + <https://www.gnu.org/licenses/>. */
> +
> +#include <sys/socket.h>
> +#include <gnu/lib-names.h>
> +#include <support/xdlfcn.h>
> +#include <support/check.h>
> +
> +#define PAYLOAD "Hello, World!"
> +
> +/* CMSG_NXTHDR is a macro that calls an inline function defined in
> + bits/socket.h. In case the function cannot be inlined, libc.so carries
> + a copy. Both versions need to be tested. */
> +
> +#define CMSG_NXTHDR_IMPL CMSG_NXTHDR
> +#include "tst-cmsghdr-skeleton.c"
> +#undef CMSG_NXTHDR_IMPL
> +
> +static struct cmsghdr * (* cmsg_nxthdr) (struct msghdr *, struct cmsghdr *);
> +
> +#define CMSG_NXTHDR_IMPL cmsg_nxthdr
> +#include "tst-cmsghdr-skeleton.c"
> +#undef CMSG_NXTHDR_IMPL
> +
> +static int
> +do_test (void)
> +{
> + static void *handle;
> +
> + run_test_CMSG_NXTHDR ();
> +
> + handle = xdlopen (LIBC_SO, RTLD_LAZY);
> + cmsg_nxthdr = (struct cmsghdr * (*) (struct msghdr *, struct cmsghdr *))
> + xdlsym (handle, "__cmsg_nxthdr");
> +
> + run_test_cmsg_nxthdr ();
> +
> + return 0;
> +}
> +
> +#include <support/test-driver.c>
> diff --git a/sysdeps/mach/hurd/bits/socket.h b/sysdeps/mach/hurd/bits/socket.h
> index 5b35ea81ec..70fce4fb27 100644
> --- a/sysdeps/mach/hurd/bits/socket.h
> +++ b/sysdeps/mach/hurd/bits/socket.h
> @@ -249,6 +249,12 @@ struct cmsghdr
> + CMSG_ALIGN (sizeof (struct cmsghdr)))
> #define CMSG_LEN(len) (CMSG_ALIGN (sizeof (struct cmsghdr)) + (len))
>
> +/* Given a length, return the additional padding necessary such that
> + len + __CMSG_PADDING(len) == CMSG_ALIGN (len). */
> +#define __CMSG_PADDING(len) ((sizeof (size_t) \
> + - ((len) & (sizeof (size_t) - 1))) \
> + & (sizeof (size_t) - 1))
> +
> extern struct cmsghdr *__cmsg_nxthdr (struct msghdr *__mhdr,
> struct cmsghdr *__cmsg) __THROW;
> #ifdef __USE_EXTERN_INLINES
> @@ -258,18 +264,38 @@ extern struct cmsghdr *__cmsg_nxthdr (struct msghdr *__mhdr,
> _EXTERN_INLINE struct cmsghdr *
> __NTH (__cmsg_nxthdr (struct msghdr *__mhdr, struct cmsghdr *__cmsg))
> {
> + /* We may safely assume that __cmsg lies between __mhdr->msg_control and
> + __mhdr->msg_controllen because the user is required to obtain the first
> + cmsg via CMSG_FIRSTHDR, set its length, then obtain subsequent cmsgs
> + via CMSG_NXTHDR, setting lengths along the way. However, we don't yet
> + trust the value of __cmsg->cmsg_len and therefore do not use it in any
> + pointer arithmetic until we check its value. */
> +
> + unsigned char * __msg_control_ptr = (unsigned char *) __mhdr->msg_control;
> + unsigned char * __cmsg_ptr = (unsigned char *) __cmsg;
> +
> + size_t __size_needed = sizeof (struct cmsghdr)
> + + __CMSG_PADDING (__cmsg->cmsg_len);
> +
> + /* The current header is malformed, too small to be a full header. */
> if ((size_t) __cmsg->cmsg_len < sizeof (struct cmsghdr))
> - /* The kernel header does this so there may be a reason. */
> return (struct cmsghdr *) 0;
>
> + /* There isn't enough space between __cmsg and the end of the buffer to
> + hold the current cmsg *and* the next one. */
> + if (((size_t)
> + (__msg_control_ptr + __mhdr->msg_controllen - __cmsg_ptr)
> + < __size_needed)
> + || ((size_t)
> + (__msg_control_ptr + __mhdr->msg_controllen - __cmsg_ptr
> + - __size_needed)
> + < __cmsg->cmsg_len))
> +
> + return (struct cmsghdr *) 0;
> +
> + /* Now, we trust cmsg_len and can use it to find the next header. */
> __cmsg = (struct cmsghdr *) ((unsigned char *) __cmsg
> + CMSG_ALIGN (__cmsg->cmsg_len));
> - if ((unsigned char *) (__cmsg + 1) > ((unsigned char *) __mhdr->msg_control
> - + __mhdr->msg_controllen)
> - || ((unsigned char *) __cmsg + CMSG_ALIGN (__cmsg->cmsg_len)
> - > ((unsigned char *) __mhdr->msg_control + __mhdr->msg_controllen)))
> - /* No more entries. */
> - return (struct cmsghdr *) 0;
> return __cmsg;
> }
> #endif /* Use `extern inline'. */
> diff --git a/sysdeps/unix/sysv/linux/bits/socket.h b/sysdeps/unix/sysv/linux/bits/socket.h
> index 4f1f810ea1..539b8d7716 100644
> --- a/sysdeps/unix/sysv/linux/bits/socket.h
> +++ b/sysdeps/unix/sysv/linux/bits/socket.h
> @@ -307,6 +307,12 @@ struct cmsghdr
> + CMSG_ALIGN (sizeof (struct cmsghdr)))
> #define CMSG_LEN(len) (CMSG_ALIGN (sizeof (struct cmsghdr)) + (len))
>
> +/* Given a length, return the additional padding necessary such that
> + len + __CMSG_PADDING(len) == CMSG_ALIGN (len). */
> +#define __CMSG_PADDING(len) ((sizeof (size_t) \
> + - ((len) & (sizeof (size_t) - 1))) \
> + & (sizeof (size_t) - 1))
> +
> extern struct cmsghdr *__cmsg_nxthdr (struct msghdr *__mhdr,
> struct cmsghdr *__cmsg) __THROW;
> #ifdef __USE_EXTERN_INLINES
> @@ -316,18 +322,38 @@ extern struct cmsghdr *__cmsg_nxthdr (struct msghdr *__mhdr,
> _EXTERN_INLINE struct cmsghdr *
> __NTH (__cmsg_nxthdr (struct msghdr *__mhdr, struct cmsghdr *__cmsg))
> {
> + /* We may safely assume that __cmsg lies between __mhdr->msg_control and
> + __mhdr->msg_controllen because the user is required to obtain the first
> + cmsg via CMSG_FIRSTHDR, set its length, then obtain subsequent cmsgs
> + via CMSG_NXTHDR, setting lengths along the way. However, we don't yet
> + trust the value of __cmsg->cmsg_len and therefore do not use it in any
> + pointer arithmetic until we check its value. */
> +
> + unsigned char * __msg_control_ptr = (unsigned char *) __mhdr->msg_control;
> + unsigned char * __cmsg_ptr = (unsigned char *) __cmsg;
> +
> + size_t __size_needed = sizeof (struct cmsghdr)
> + + __CMSG_PADDING (__cmsg->cmsg_len);
> +
> + /* The current header is malformed, too small to be a full header. */
> if ((size_t) __cmsg->cmsg_len < sizeof (struct cmsghdr))
> - /* The kernel header does this so there may be a reason. */
> return (struct cmsghdr *) 0;
>
> + /* There isn't enough space between __cmsg and the end of the buffer to
> + hold the current cmsg *and* the next one. */
> + if (((size_t)
> + (__msg_control_ptr + __mhdr->msg_controllen - __cmsg_ptr)
> + < __size_needed)
> + || ((size_t)
> + (__msg_control_ptr + __mhdr->msg_controllen - __cmsg_ptr
> + - __size_needed)
> + < __cmsg->cmsg_len))
> +
> + return (struct cmsghdr *) 0;
> +
> + /* Now, we trust cmsg_len and can use it to find the next header. */
> __cmsg = (struct cmsghdr *) ((unsigned char *) __cmsg
> + CMSG_ALIGN (__cmsg->cmsg_len));
> - if ((unsigned char *) (__cmsg + 1) > ((unsigned char *) __mhdr->msg_control
> - + __mhdr->msg_controllen)
> - || ((unsigned char *) __cmsg + CMSG_ALIGN (__cmsg->cmsg_len)
> - > ((unsigned char *) __mhdr->msg_control + __mhdr->msg_controllen)))
> - /* No more entries. */
> - return (struct cmsghdr *) 0;
> return __cmsg;
> }
> #endif /* Use `extern inline'. */
> diff --git a/sysdeps/unix/sysv/linux/cmsg_nxthdr.c b/sysdeps/unix/sysv/linux/cmsg_nxthdr.c
> index 15b7a3a925..24f72b797a 100644
> --- a/sysdeps/unix/sysv/linux/cmsg_nxthdr.c
> +++ b/sysdeps/unix/sysv/linux/cmsg_nxthdr.c
> @@ -23,18 +23,38 @@
> struct cmsghdr *
> __cmsg_nxthdr (struct msghdr *mhdr, struct cmsghdr *cmsg)
> {
> + /* We may safely assume that cmsg lies between mhdr->msg_control and
> + mhdr->msg_controllen because the user is required to obtain the first
> + cmsg via CMSG_FIRSTHDR, set its length, then obtain subsequent cmsgs
> + via CMSG_NXTHDR, setting lengths along the way. However, we don't yet
> + trust the value of cmsg->cmsg_len and therefore do not use it in any
> + pointer arithmetic until we check its value. */
> +
> + unsigned char * msg_control_ptr = (unsigned char *) mhdr->msg_control;
> + unsigned char * cmsg_ptr = (unsigned char *) cmsg;
> +
> + size_t size_needed = sizeof (struct cmsghdr)
> + + __CMSG_PADDING (cmsg->cmsg_len);
> +
> + /* The current header is malformed, too small to be a full header. */
> if ((size_t) cmsg->cmsg_len < sizeof (struct cmsghdr))
> - /* The kernel header does this so there may be a reason. */
> - return NULL;
> + return (struct cmsghdr *) 0;
> +
> + /* There isn't enough space between cmsg and the end of the buffer to
> + hold the current cmsg *and* the next one. */
> + if (((size_t)
> + (msg_control_ptr + mhdr->msg_controllen - cmsg_ptr)
> + < size_needed)
> + || ((size_t)
> + (msg_control_ptr + mhdr->msg_controllen - cmsg_ptr
> + - size_needed)
> + < cmsg->cmsg_len))
> +
> + return (struct cmsghdr *) 0;
>
> + /* Now, we trust cmsg_len and can use it to find the next header. */
> cmsg = (struct cmsghdr *) ((unsigned char *) cmsg
> + CMSG_ALIGN (cmsg->cmsg_len));
> - if ((unsigned char *) (cmsg + 1) > ((unsigned char *) mhdr->msg_control
> - + mhdr->msg_controllen)
> - || ((unsigned char *) cmsg + CMSG_ALIGN (cmsg->cmsg_len)
> - > ((unsigned char *) mhdr->msg_control + mhdr->msg_controllen)))
> - /* No more entries. */
> - return NULL;
> return cmsg;
> }
> libc_hidden_def (__cmsg_nxthdr)
More information about the Libc-alpha
mailing list