Blame SOURCES/memcached-restart-shutdown-segfault.patch

a2abc3
commit e360e34b1fd2cd69c3a08bfb7fa4fe75281b942a
a2abc3
Author: Tomas Korbar <tkorbar@redhat.com>
a2abc3
Date:   Tue May 19 08:42:12 2020 +0200
a2abc3
a2abc3
    restart: fix rare segfault on shutdown
a2abc3
a2abc3
diff --git a/memcached.c b/memcached.c
a2abc3
index d769b4a..ac03b93 100644
a2abc3
--- a/memcached.c
a2abc3
+++ b/memcached.c
a2abc3
@@ -1009,6 +1009,18 @@ static void conn_shrink(conn *c) {
a2abc3
     }
a2abc3
 }
a2abc3
 
a2abc3
+// Since some connections might be off on side threads and some are managed as
a2abc3
+// listeners we need to walk through them all from a central point.
a2abc3
+// Must be called with all worker threads hung or in the process of closing.
a2abc3
+void conn_close_all(void) {
a2abc3
+    int i;
a2abc3
+    for (i = 0; i < max_fds; i++) {
a2abc3
+        if (conns[i] && conns[i]->state != conn_closed) {
a2abc3
+            conn_close(conns[i]);
a2abc3
+        }
a2abc3
+    }
a2abc3
+}
a2abc3
+
a2abc3
 /**
a2abc3
  * Convert a state name to a human readable form.
a2abc3
  */
a2abc3
@@ -9860,13 +9872,6 @@ int main (int argc, char **argv) {
a2abc3
     }
a2abc3
 
a2abc3
     stop_threads();
a2abc3
-    int i;
a2abc3
-    // FIXME: make a function callable from threads.c
a2abc3
-    for (i = 0; i < max_fds; i++) {
a2abc3
-        if (conns[i] && conns[i]->state != conn_closed) {
a2abc3
-            conn_close(conns[i]);
a2abc3
-        }
a2abc3
-    }
a2abc3
     if (memory_file != NULL && stop_main_loop == GRACE_STOP) {
a2abc3
         restart_mmap_close();
a2abc3
     }
a2abc3
diff --git a/memcached.h b/memcached.h
a2abc3
index 6b1fe4a..bc2b395 100644
a2abc3
--- a/memcached.h
a2abc3
+++ b/memcached.h
a2abc3
@@ -814,9 +814,8 @@ enum delta_result_type add_delta(conn *c, const char *key,
a2abc3
                                  const int64_t delta, char *buf,
a2abc3
                                  uint64_t *cas);
a2abc3
 void accept_new_conns(const bool do_accept);
a2abc3
-conn *conn_from_freelist(void);
a2abc3
-bool  conn_add_to_freelist(conn *c);
a2abc3
 void  conn_close_idle(conn *c);
a2abc3
+void  conn_close_all(void);
a2abc3
 item *item_alloc(char *key, size_t nkey, int flags, rel_time_t exptime, int nbytes);
a2abc3
 #define DO_UPDATE true
a2abc3
 #define DONT_UPDATE false
a2abc3
diff --git a/thread.c b/thread.c
a2abc3
index 7cba01e..6e19a2e 100644
a2abc3
--- a/thread.c
a2abc3
+++ b/thread.c
a2abc3
@@ -205,6 +205,7 @@ void stop_threads(void) {
a2abc3
     if (settings.verbose > 0)
a2abc3
         fprintf(stderr, "asking workers to stop\n");
a2abc3
     buf[0] = 's';
a2abc3
+    pthread_mutex_lock(&worker_hang_lock);
a2abc3
     pthread_mutex_lock(&init_lock);
a2abc3
     init_count = 0;
a2abc3
     for (i = 0; i < settings.num_threads; i++) {
a2abc3
@@ -216,6 +217,8 @@ void stop_threads(void) {
a2abc3
     wait_for_thread_registration(settings.num_threads);
a2abc3
     pthread_mutex_unlock(&init_lock);
a2abc3
 
a2abc3
+    // All of the workers are hung but haven't done cleanup yet.
a2abc3
+
a2abc3
     if (settings.verbose > 0)
a2abc3
         fprintf(stderr, "asking background threads to stop\n");
a2abc3
 
a2abc3
@@ -237,6 +240,17 @@ void stop_threads(void) {
a2abc3
     if (settings.verbose > 0)
a2abc3
         fprintf(stderr, "stopped idle timeout thread\n");
a2abc3
 
a2abc3
+    // Close all connections then let the workers finally exit.
a2abc3
+    if (settings.verbose > 0)
a2abc3
+        fprintf(stderr, "closing connections\n");
a2abc3
+    conn_close_all();
a2abc3
+    pthread_mutex_unlock(&worker_hang_lock);
a2abc3
+    if (settings.verbose > 0)
a2abc3
+        fprintf(stderr, "reaping worker threads\n");
a2abc3
+    for (i = 0; i < settings.num_threads; i++) {
a2abc3
+        pthread_join(threads[i].thread_id, NULL);
a2abc3
+    }
a2abc3
+
a2abc3
     if (settings.verbose > 0)
a2abc3
         fprintf(stderr, "all background threads stopped\n");
a2abc3