ed3f42
From bcab8c3cd877506de75f50e0f9ed98827ed554b0 Mon Sep 17 00:00:00 2001
ed3f42
From: Peter Zhu <peter@peterzhu.ca>
ed3f42
Date: Tue, 23 Feb 2021 16:28:56 -0500
ed3f42
Subject: [PATCH] Use mmap for allocating heap pages
ed3f42
ed3f42
---
ed3f42
 configure.ac                 |  16 ++++
ed3f42
 gc.c                         | 149 ++++++++++++++++++++++++++---------
ed3f42
 test/ruby/test_gc_compact.rb |  41 ++++++----
ed3f42
 3 files changed, 155 insertions(+), 51 deletions(-)
ed3f42
ed3f42
diff --git a/configure.ac b/configure.ac
ed3f42
index 2dcebdde9f..b1b190004d 100644
ed3f42
--- a/configure.ac
ed3f42
+++ b/configure.ac
ed3f42
@@ -1944,6 +1944,7 @@ AC_CHECK_FUNCS(memmem)
ed3f42
 AC_CHECK_FUNCS(mkfifo)
ed3f42
 AC_CHECK_FUNCS(mknod)
ed3f42
 AC_CHECK_FUNCS(mktime)
ed3f42
+AC_CHECK_FUNCS(mmap)
ed3f42
 AC_CHECK_FUNCS(openat)
ed3f42
 AC_CHECK_FUNCS(pipe2)
ed3f42
 AC_CHECK_FUNCS(poll)
ed3f42
@@ -2666,6 +2667,21 @@ main(int argc, char *argv[])
ed3f42
 	rb_cv_fork_with_pthread=yes)])
ed3f42
     test x$rb_cv_fork_with_pthread = xyes || AC_DEFINE(CANNOT_FORK_WITH_PTHREAD)
ed3f42
 ])
ed3f42
+
ed3f42
+AC_CHECK_HEADERS([sys/user.h])
ed3f42
+AS_IF([test "x$ac_cv_func_mmap" = xyes], [
ed3f42
+    AC_CACHE_CHECK([whether PAGE_SIZE is compile-time const], rb_cv_const_page_size,
ed3f42
+	[malloc_headers=`sed -n '/MALLOC_HEADERS_BEGIN/,/MALLOC_HEADERS_END/p' ${srcdir}/gc.c`
ed3f42
+	AC_COMPILE_IFELSE([AC_LANG_PROGRAM([[$malloc_headers
ed3f42
+            typedef char conftest_page[PAGE_SIZE];
ed3f42
+        ]], [[]])],
ed3f42
+        [rb_cv_const_page_size=yes],
ed3f42
+        [rb_cv_const_page_size=no])])
ed3f42
+])
ed3f42
+AS_IF([test "x$rb_cv_const_page_size" = xyes],
ed3f42
+    [AC_DEFINE(HAVE_CONST_PAGE_SIZE, 1)],
ed3f42
+    [AC_DEFINE(HAVE_CONST_PAGE_SIZE, 0)]
ed3f42
+)
ed3f42
 }
ed3f42
 
ed3f42
 : "runtime section" && {
ed3f42
diff --git a/gc.c b/gc.c
ed3f42
index f6acf3e117..6f8e5f242d 100644
ed3f42
--- a/gc.c
ed3f42
+++ b/gc.c
ed3f42
@@ -32,6 +32,7 @@
ed3f42
 #include <stdarg.h>
ed3f42
 #include <stdio.h>
ed3f42
 
ed3f42
+/* MALLOC_HEADERS_BEGIN */
ed3f42
 #ifndef HAVE_MALLOC_USABLE_SIZE
ed3f42
 # ifdef _WIN32
ed3f42
 #  define HAVE_MALLOC_USABLE_SIZE
ed3f42
@@ -54,6 +55,12 @@
ed3f42
 # endif
ed3f42
 #endif
ed3f42
 
ed3f42
+#if !defined(PAGE_SIZE) && defined(HAVE_SYS_USER_H)
ed3f42
+/* LIST_HEAD conflicts with sys/queue.h on macOS */
ed3f42
+# include <sys/user.h>
ed3f42
+#endif
ed3f42
+/* MALLOC_HEADERS_END */
ed3f42
+
ed3f42
 #ifdef HAVE_SYS_TIME_H
ed3f42
 # include <sys/time.h>
ed3f42
 #endif
ed3f42
@@ -821,6 +828,25 @@ enum {
ed3f42
     HEAP_PAGE_BITMAP_SIZE = (BITS_SIZE * HEAP_PAGE_BITMAP_LIMIT),
ed3f42
     HEAP_PAGE_BITMAP_PLANES = 4 /* RGENGC: mark, unprotected, uncollectible, marking */
ed3f42
 };
ed3f42
+#define HEAP_PAGE_ALIGN (1 << HEAP_PAGE_ALIGN_LOG)
ed3f42
+#define HEAP_PAGE_SIZE HEAP_PAGE_ALIGN
ed3f42
+
ed3f42
+#ifdef HAVE_MMAP
ed3f42
+# if HAVE_CONST_PAGE_SIZE
ed3f42
+/* If PAGE_SIZE is defined and is a compile-time constant, we can use it directly. */
ed3f42
+static const bool USE_MMAP_ALIGNED_ALLOC = (PAGE_SIZE <= HEAP_PAGE_SIZE);
ed3f42
+# elif defined(PAGE_MAX_SIZE) && (PAGE_MAX_SIZE <= HEAP_PAGE_SIZE)
ed3f42
+/* PAGE_SIZE <= HEAP_PAGE_SIZE */
ed3f42
+static const bool USE_MMAP_ALIGNED_ALLOC = true;
ed3f42
+# else
ed3f42
+/* Otherwise, fall back to determining if we can use mmap during runtime. */
ed3f42
+#  define USE_MMAP_ALIGNED_ALLOC (use_mmap_aligned_alloc != false)
ed3f42
+
ed3f42
+static bool use_mmap_aligned_alloc;
ed3f42
+# endif
ed3f42
+#elif !defined(__MINGW32__) && !defined(_WIN32)
ed3f42
+static const bool USE_MMAP_ALIGNED_ALLOC = false;
ed3f42
+#endif
ed3f42
 
ed3f42
 struct heap_page {
ed3f42
     short total_slots;
ed3f42
@@ -1760,14 +1786,14 @@ heap_unlink_page(rb_objspace_t *objspace, rb_heap_t *heap, struct heap_page *pag
ed3f42
     heap->total_slots -= page->total_slots;
ed3f42
 }
ed3f42
 
ed3f42
-static void rb_aligned_free(void *ptr);
ed3f42
+static void rb_aligned_free(void *ptr, size_t size);
ed3f42
 
ed3f42
 static void
ed3f42
 heap_page_free(rb_objspace_t *objspace, struct heap_page *page)
ed3f42
 {
ed3f42
     heap_allocated_pages--;
ed3f42
     objspace->profile.total_freed_pages++;
ed3f42
-    rb_aligned_free(GET_PAGE_BODY(page->start));
ed3f42
+    rb_aligned_free(GET_PAGE_BODY(page->start), HEAP_PAGE_SIZE);
ed3f42
     free(page);
ed3f42
 }
ed3f42
 
ed3f42
@@ -1819,7 +1845,7 @@ heap_page_allocate(rb_objspace_t *objspace)
ed3f42
     /* assign heap_page entry */
ed3f42
     page = calloc1(sizeof(struct heap_page));
ed3f42
     if (page == 0) {
ed3f42
-        rb_aligned_free(page_body);
ed3f42
+        rb_aligned_free(page_body, HEAP_PAGE_SIZE);
ed3f42
 	rb_memerror();
ed3f42
     }
ed3f42
 
ed3f42
@@ -3159,15 +3185,18 @@ Init_heap(void)
ed3f42
 {
ed3f42
     rb_objspace_t *objspace = &rb_objspace;
ed3f42
 
ed3f42
-#if defined(HAVE_SYSCONF) && defined(_SC_PAGE_SIZE)
ed3f42
-    /* If Ruby's heap pages are not a multiple of the system page size, we
ed3f42
-     * cannot use mprotect for the read barrier, so we must disable automatic
ed3f42
-     * compaction. */
ed3f42
-    int pagesize;
ed3f42
-    pagesize = (int)sysconf(_SC_PAGE_SIZE);
ed3f42
-    if ((HEAP_PAGE_SIZE % pagesize) != 0) {
ed3f42
-        ruby_enable_autocompact = 0;
ed3f42
-    }
ed3f42
+#if defined(HAVE_MMAP) && !HAVE_CONST_PAGE_SIZE && !defined(PAGE_MAX_SIZE)
ed3f42
+    /* Need to determine if we can use mmap at runtime. */
ed3f42
+# ifdef PAGE_SIZE
ed3f42
+    /* If the PAGE_SIZE macro can be used. */
ed3f42
+    use_mmap_aligned_alloc = PAGE_SIZE <= HEAP_PAGE_SIZE;
ed3f42
+# elif defined(HAVE_SYSCONF) && defined(_SC_PAGE_SIZE)
ed3f42
+    /* If we can use sysconf to determine the page size. */
ed3f42
+    use_mmap_aligned_alloc = sysconf(_SC_PAGE_SIZE) <= HEAP_PAGE_SIZE;
ed3f42
+# else
ed3f42
+    /* Otherwise we can't determine the system page size, so don't use mmap. */
ed3f42
+    use_mmap_aligned_alloc = FALSE;
ed3f42
+# endif
ed3f42
 #endif
ed3f42
 
ed3f42
     objspace->next_object_id = INT2FIX(OBJ_ID_INITIAL);
ed3f42
@@ -8533,6 +8562,14 @@ gc_start_internal(rb_execution_context_t *ec, VALUE self, VALUE full_mark, VALUE
ed3f42
 
ed3f42
     /* For now, compact implies full mark / sweep, so ignore other flags */
ed3f42
     if (RTEST(compact)) {
ed3f42
+        /* On platforms other than MinGW and Windows, if heap pages are not allocated
ed3f42
+         * with mmap, we cannot use mprotect for the read barrier, so compaction is unavailable. */
ed3f42
+#if !defined(__MINGW32__) && !defined(_WIN32)
ed3f42
+        if (!USE_MMAP_ALIGNED_ALLOC) {
ed3f42
+            rb_raise(rb_eNotImpError, "Compaction isn't available on this platform");
ed3f42
+        }
ed3f42
+#endif
ed3f42
+
ed3f42
         reason |= GPR_FLAG_COMPACT;
ed3f42
     } else {
ed3f42
         if (!RTEST(full_mark))       reason &= ~GPR_FLAG_FULL_MARK;
ed3f42
@@ -9944,16 +9981,14 @@ gc_disable(rb_execution_context_t *ec, VALUE _)
ed3f42
 static VALUE
ed3f42
 gc_set_auto_compact(rb_execution_context_t *ec, VALUE _, VALUE v)
ed3f42
 {
ed3f42
-#if defined(HAVE_SYSCONF) && defined(_SC_PAGE_SIZE)
ed3f42
-    /* If Ruby's heap pages are not a multiple of the system page size, we
ed3f42
-     * cannot use mprotect for the read barrier, so we must disable automatic
ed3f42
-     * compaction. */
ed3f42
-    int pagesize;
ed3f42
-    pagesize = (int)sysconf(_SC_PAGE_SIZE);
ed3f42
-    if ((HEAP_PAGE_SIZE % pagesize) != 0) {
ed3f42
+    /* On platforms other than MinGW and Windows, if heap pages are not allocated with mmap,
ed3f42
+     * we cannot use mprotect for the read barrier, so automatic compaction is unavailable. */
ed3f42
+#if !defined(__MINGW32__) && !defined(_WIN32)
ed3f42
+    if (!USE_MMAP_ALIGNED_ALLOC) {
ed3f42
         rb_raise(rb_eNotImpError, "Automatic compaction isn't available on this platform");
ed3f42
     }
ed3f42
 #endif
ed3f42
+
ed3f42
     ruby_enable_autocompact = RTEST(v);
ed3f42
     return v;
ed3f42
 }
ed3f42
@@ -10350,22 +10385,54 @@ rb_aligned_malloc(size_t alignment, size_t size)
ed3f42
 #elif defined _WIN32
ed3f42
     void *_aligned_malloc(size_t, size_t);
ed3f42
     res = _aligned_malloc(size, alignment);
ed3f42
-#elif defined(HAVE_POSIX_MEMALIGN)
ed3f42
-    if (posix_memalign(&res, alignment, size) == 0) {
ed3f42
-        return res;
ed3f42
+#else
ed3f42
+    if (USE_MMAP_ALIGNED_ALLOC) {
ed3f42
+        GC_ASSERT(alignment % sysconf(_SC_PAGE_SIZE) == 0);
ed3f42
+
ed3f42
+        char *ptr = mmap(NULL, alignment + size, PROT_READ | PROT_WRITE, MAP_PRIVATE | MAP_ANONYMOUS, -1, 0);
ed3f42
+        if (ptr == MAP_FAILED) {
ed3f42
+            return NULL;
ed3f42
+        }
ed3f42
+
ed3f42
+        char *aligned = ptr + alignment;
ed3f42
+        aligned -= ((VALUE)aligned & (alignment - 1));
ed3f42
+        GC_ASSERT(aligned > ptr);
ed3f42
+        GC_ASSERT(aligned <= ptr + alignment);
ed3f42
+
ed3f42
+        size_t start_out_of_range_size = aligned - ptr;
ed3f42
+        GC_ASSERT(start_out_of_range_size % sysconf(_SC_PAGE_SIZE) == 0);
ed3f42
+        if (start_out_of_range_size > 0) {
ed3f42
+            if (munmap(ptr, start_out_of_range_size)) {
ed3f42
+                rb_bug("rb_aligned_malloc: munmap failed for start");
ed3f42
+            }
ed3f42
+        }
ed3f42
+
ed3f42
+        size_t end_out_of_range_size = alignment - start_out_of_range_size;
ed3f42
+        GC_ASSERT(end_out_of_range_size % sysconf(_SC_PAGE_SIZE) == 0);
ed3f42
+        if (end_out_of_range_size > 0) {
ed3f42
+            if (munmap(aligned + size, end_out_of_range_size)) {
ed3f42
+                rb_bug("rb_aligned_malloc: munmap failed for end");
ed3f42
+            }
ed3f42
+        }
ed3f42
+
ed3f42
+        res = (void *)aligned;
ed3f42
     }
ed3f42
     else {
ed3f42
-        return NULL;
ed3f42
+# if defined(HAVE_POSIX_MEMALIGN)
ed3f42
+        if (posix_memalign(&res, alignment, size) != 0) {
ed3f42
+            return NULL;
ed3f42
+        }
ed3f42
+# elif defined(HAVE_MEMALIGN)
ed3f42
+        res = memalign(alignment, size);
ed3f42
+# else
ed3f42
+        char* aligned;
ed3f42
+        res = malloc(alignment + size + sizeof(void*));
ed3f42
+        aligned = (char*)res + alignment + sizeof(void*);
ed3f42
+        aligned -= ((VALUE)aligned & (alignment - 1));
ed3f42
+        ((void**)aligned)[-1] = res;
ed3f42
+        res = (void*)aligned;
ed3f42
+# endif
ed3f42
     }
ed3f42
-#elif defined(HAVE_MEMALIGN)
ed3f42
-    res = memalign(alignment, size);
ed3f42
-#else
ed3f42
-    char* aligned;
ed3f42
-    res = malloc(alignment + size + sizeof(void*));
ed3f42
-    aligned = (char*)res + alignment + sizeof(void*);
ed3f42
-    aligned -= ((VALUE)aligned & (alignment - 1));
ed3f42
-    ((void**)aligned)[-1] = res;
ed3f42
-    res = (void*)aligned;
ed3f42
 #endif
ed3f42
 
ed3f42
     /* alignment must be a power of 2 */
ed3f42
@@ -10375,16 +10442,26 @@ rb_aligned_malloc(size_t alignment, size_t size)
ed3f42
 }
ed3f42
 
ed3f42
 static void
ed3f42
-rb_aligned_free(void *ptr)
ed3f42
+rb_aligned_free(void *ptr, size_t size)
ed3f42
 {
ed3f42
 #if defined __MINGW32__
ed3f42
     __mingw_aligned_free(ptr);
ed3f42
 #elif defined _WIN32
ed3f42
     _aligned_free(ptr);
ed3f42
-#elif defined(HAVE_MEMALIGN) || defined(HAVE_POSIX_MEMALIGN)
ed3f42
-    free(ptr);
ed3f42
 #else
ed3f42
-    free(((void**)ptr)[-1]);
ed3f42
+    if (USE_MMAP_ALIGNED_ALLOC) {
ed3f42
+        GC_ASSERT(size % sysconf(_SC_PAGE_SIZE) == 0);
ed3f42
+        if (munmap(ptr, size)) {
ed3f42
+            rb_bug("rb_aligned_free: munmap failed");
ed3f42
+        }
ed3f42
+    }
ed3f42
+    else {
ed3f42
+# if defined(HAVE_POSIX_MEMALIGN) || defined(HAVE_MEMALIGN)
ed3f42
+        free(ptr);
ed3f42
+# else
ed3f42
+        free(((void**)ptr)[-1]);
ed3f42
+# endif
ed3f42
+    }
ed3f42
 #endif
ed3f42
 }
ed3f42
 
ed3f42
diff --git a/test/ruby/test_gc_compact.rb b/test/ruby/test_gc_compact.rb
ed3f42
index 4a8cff33f4..f5cab55ba7 100644
ed3f42
--- a/test/ruby/test_gc_compact.rb
ed3f42
+++ b/test/ruby/test_gc_compact.rb
ed3f42
@@ -4,12 +4,32 @@
ed3f42
 require 'etc'
ed3f42
 
ed3f42
 class TestGCCompact < Test::Unit::TestCase
ed3f42
-  class AutoCompact < Test::Unit::TestCase
ed3f42
+  module SupportsCompact
ed3f42
     def setup
ed3f42
       skip "autocompact not supported on this platform" unless supports_auto_compact?
ed3f42
       super
ed3f42
     end
ed3f42
 
ed3f42
+    private
ed3f42
+
ed3f42
+    def supports_auto_compact?
ed3f42
+      return true unless defined?(Etc::SC_PAGE_SIZE)
ed3f42
+
ed3f42
+      begin
ed3f42
+        return GC::INTERNAL_CONSTANTS[:HEAP_PAGE_SIZE] % Etc.sysconf(Etc::SC_PAGE_SIZE) == 0
ed3f42
+      rescue NotImplementedError
ed3f42
+      rescue ArgumentError
ed3f42
+      end
ed3f42
+
ed3f42
+      true
ed3f42
+    end
ed3f42
+  end
ed3f42
+
ed3f42
+  include SupportsCompact
ed3f42
+
ed3f42
+  class AutoCompact < Test::Unit::TestCase
ed3f42
+    include SupportsCompact
ed3f42
+
ed3f42
     def test_enable_autocompact
ed3f42
       before = GC.auto_compact
ed3f42
       GC.auto_compact = true
ed3f42
@@ -59,26 +79,17 @@ def test_implicit_compaction_does_something
ed3f42
     ensure
ed3f42
       GC.auto_compact = before
ed3f42
     end
ed3f42
-
ed3f42
-    private
ed3f42
-
ed3f42
-    def supports_auto_compact?
ed3f42
-      return true unless defined?(Etc::SC_PAGE_SIZE)
ed3f42
-
ed3f42
-      begin
ed3f42
-        return GC::INTERNAL_CONSTANTS[:HEAP_PAGE_SIZE] % Etc.sysconf(Etc::SC_PAGE_SIZE) == 0
ed3f42
-      rescue NotImplementedError
ed3f42
-      rescue ArgumentError
ed3f42
-      end
ed3f42
-
ed3f42
-      true
ed3f42
-    end
ed3f42
   end
ed3f42
 
ed3f42
   def os_page_size
ed3f42
     return true unless defined?(Etc::SC_PAGE_SIZE)
ed3f42
   end
ed3f42
 
ed3f42
+  def setup
ed3f42
+    skip "autocompact not supported on this platform" unless supports_auto_compact?
ed3f42
+    super
ed3f42
+  end
ed3f42
+
ed3f42
   def test_gc_compact_stats
ed3f42
     list = []
ed3f42
 
ed3f42
-- 
ed3f42
2.30.1 (Apple Git-130)
ed3f42