Blame SOURCES/bz1231032-redis-update.patch.patch

659c12
From c982683ac8c2de64f69c5f47727242c65e00df90 Mon Sep 17 00:00:00 2001
659c12
From: David Vossel <dvossel@redhat.com>
659c12
Date: Mon, 29 Jun 2015 13:07:14 -0500
659c12
Subject: [PATCH 2/3] bz1231032-redis-update.patch
659c12
659c12
---
659c12
 heartbeat/redis | 51 ++++++++++++++++++++++++++++++++++++++++++++++-----
659c12
 1 file changed, 46 insertions(+), 5 deletions(-)
659c12
659c12
diff --git a/heartbeat/redis b/heartbeat/redis
659c12
index 6b479b2..b63a2b9 100644
659c12
--- a/heartbeat/redis
659c12
+++ b/heartbeat/redis
659c12
@@ -20,6 +20,7 @@ fi
659c12
 
659c12
 CHECK_SLAVE_STATE=0
659c12
 
659c12
+REDIS_CHECK_DUMP="/usr/bin/redis-check-dump"
659c12
 REDIS_SERVER="$OCF_RESKEY_bin"
659c12
 REDIS_CLIENT="$OCF_RESKEY_client_bin"
659c12
 REDIS_CONFIG="$OCF_RESKEY_config"
659c12
@@ -29,6 +30,17 @@ REDIS_PIDFILE="$OCF_RESKEY_rundir/$OCF_RESKEY_pidfile_name"
659c12
 REDIS_SOCKET="$OCF_RESKEY_rundir/$OCF_RESKEY_socket_name"
659c12
 REDIS_REPLICATION_PORT="$OCF_RESKEY_port"
659c12
 
659c12
+if ! [ -f $REDIS_CHECK_DUMP ]; then
659c12
+	REDIS_CHECK_DUMP="$(which redis-check-dump 2>/dev/null)"
659c12
+fi
659c12
+
659c12
+if [ -f "$REDIS_CONFIG" ]; then
659c12
+	REDIS_DUMP_DIR="$(cat $REDIS_CONFIG | grep "^\s*dir\s" | awk '{ print $2 }' 2>/dev/null)"
659c12
+	REDIS_DUMP_FILE="$(cat $REDIS_CONFIG | grep "^\s*dbfilename\s" | awk '{ print $2 }' 2>/dev/null)"
659c12
+fi
659c12
+: ${REDIS_DUMP_DIR:=/var/lib/redis/}
659c12
+: ${REDIS_DUMP_FILE:=dump.rdb}
659c12
+
659c12
 function meta_data() {
659c12
 	cat <
659c12
 
659c12
@@ -289,6 +301,14 @@ function monitor() {
659c12
 	return $OCF_SUCCESS
659c12
 }
659c12
 
659c12
+function check_dump_file()
659c12
+{
659c12
+	if ! have_binary "$REDIS_CHECK_DUMP"; then
659c12
+		return 0
659c12
+	fi
659c12
+	$REDIS_CHECK_DUMP ${REDIS_DUMP_DIR}/${REDIS_DUMP_FILE} 2>&1
659c12
+}
659c12
+
659c12
 function start() {
659c12
 	monitor
659c12
 	status=$?
659c12
@@ -301,6 +321,16 @@ function start() {
659c12
 	[[ ! -d "$REDIS_RUNDIR" ]] && mkdir -p "$REDIS_RUNDIR"
659c12
 	chown -R "$REDIS_USER" "$REDIS_RUNDIR"
659c12
 
659c12
+	# check for 0 byte database dump file. This is an unrecoverable start
659c12
+	# condition that we can avoid by deleting the 0 byte database file.
659c12
+	if [ -f "${REDIS_DUMP_DIR}/${REDIS_DUMP_FILE}" ]; then
659c12
+		local size="$(stat --format "%s" ${REDIS_DUMP_DIR}/${REDIS_DUMP_FILE})"
659c12
+		if [ "$?" -eq "0" ] && [ "$size" -eq "0" ]; then
659c12
+			ocf_log notice "Detected 0 byte ${REDIS_DUMP_FILE}, deleting zero length file to avoid start failure."
659c12
+			rm -f ${REDIS_DUMP_DIR}/${REDIS_DUMP_FILE}
659c12
+		fi
659c12
+	fi
659c12
+
659c12
 	ocf_log info "start: $REDIS_SERVER --daemonize yes --unixsocket '$REDIS_SOCKET' --pidfile '$REDIS_PIDFILE'"
659c12
 	output="$(su "$REDIS_USER" -s /bin/sh -c "cd '$REDIS_RUNDIR'; exec '$REDIS_SERVER' '$REDIS_CONFIG' --daemonize yes --unixsocket '$REDIS_SOCKET' --pidfile '$REDIS_PIDFILE'" 2>&1)"
659c12
 
659c12
@@ -325,7 +355,8 @@ function start() {
659c12
 			# It's possible that the `pidof` will pick up a different redis, but in that case, the start operation will just time out
659c12
 			sleep 1
659c12
 		else
659c12
-			ocf_log err "start: Unknown error waiting for redis to start"
659c12
+			check_output="$(check_dump_file)"
659c12
+			ocf_log err "start: Unknown error waiting for redis to start. redis-check-dump output=${check_output//$'\n'/; }"
659c12
 			return $OCF_ERR_GENERIC
659c12
 		fi
659c12
 	done
659c12
@@ -338,7 +369,8 @@ function start() {
659c12
 		return $OCF_SUCCESS
659c12
 	fi
659c12
 
659c12
-	ocf_log err "start: Unknown error starting redis. output=${output//$'\n'/; }"
659c12
+	check_output="$(check_dump_file)"
659c12
+	ocf_log err "start: Unknown error starting redis. redis-server output=${output//$'\n'/; } redis-check-dump output=${check_output//$'\n'/; }"
659c12
 	return $status
659c12
 }
659c12
 
659c12
@@ -427,14 +459,23 @@ function demote() {
659c12
 
659c12
 	redis_client slaveof "$master_host" "$master_port"
659c12
 
659c12
-	# wait briefly for the slave to connect to the master	
659c12
-	for (( c=1; c <= 20; c++ ))
659c12
-	do
659c12
+	# Wait forever for the slave to connect to the master and finish the 
659c12
+	# sync. Timeout is controlled by Pacemaker "op start timeout=XX".
659c12
+	#
659c12
+	# hint: redis master_link_status will only come "up" when 
659c12
+	#       the SYNC with the master has completed.
659c12
+	#       This can take an arbitraty time (data) and should 
659c12
+	#       only be parametrized by the start operation timeout
659c12
+	#	by the administrator, not by this resource agent code
659c12
+	while true; do 
659c12
+		# Wait infinite if replication is syncing
659c12
+		# Then start/demote operation timeout determines timeout
659c12
 		monitor
659c12
 		status=$?
659c12
 		if (( status == OCF_SUCCESS )); then
659c12
 			return $OCF_SUCCESS
659c12
 		fi
659c12
+		
659c12
 		sleep 1
659c12
 	done
659c12
 
659c12
-- 
659c12
1.8.4.2
659c12