In my case the PIDFILE is created, but it is empty. bash -x output is below for a start.
I only see this behaviour on one arbiter. On the other arbiters that I have, it always works.
If I add a sleep of, for example, 1 second before the PID is gathered and written to the PID file, it also always works on this problematic node.
garb version is Percona-XtraDB-Cluster-garbd-2-2.11-1.2675.rhel6.x86_64
In my case the PIDFILE is created, but it is empty. bash -x output is below for a start.
I only see this behaviour on one arbiter. On the other arbiters that I have, it always works.
If I add a sleep of, for example, 1 second before the PID is gathered and written to the PID file, it also always works on this problematic node.
garb version is Percona-XtraDB-Cluster-garbd-2-2.11-1.2675.rhel6.x86_64
[root@arbiter40 ~]# bash -x /etc/init.d/garb start
+ echo -n '['
+ '[' -f /etc/redhat-release ']'
+ . /etc/init.d/functions
++ TEXTDOMAIN=initscripts
++ umask 022
++ PATH=/sbin:/usr/sbin:/bin:/usr/bin
++ export PATH
++ '[' -z '' ']'
++ COLUMNS=80
++ '[' -z '' ']'
+++ /sbin/consoletype
++ CONSOLETYPE=pty
++ '[' -f /etc/sysconfig/i18n -a -z '' -a -z '' ']'
++ . /etc/profile.d/lang.sh
++ unset LANGSH_SOURCED
++ '[' -z '' ']'
++ '[' -f /etc/sysconfig/init ']'
++ . /etc/sysconfig/init
+++ BOOTUP=color
+++ RES_COL=60
+++ MOVE_TO_COL='echo -en \033[60G'
+++ SETCOLOR_SUCCESS='echo -en \033[0;32m'
+++ SETCOLOR_FAILURE='echo -en \033[0;31m'
+++ SETCOLOR_WARNING='echo -en \033[0;33m'
+++ SETCOLOR_NORMAL='echo -en \033[0;39m'
+++ PROMPT=yes
+++ AUTOSWAP=no
+++ ACTIVE_CONSOLES='/dev/tty[1-6]'
+++ SINGLE=/sbin/sushell
++ '[' pty = serial ']'
++ __sed_discard_ignored_files='/\(~\|\.bak\|\.orig\|\.rpmnew\|\.rpmorig\|\.rpmsave\)$/d'
+ . /etc/sysconfig/network
++ NETWORKING=yes
++ NETWORKING_IPV6=no
++ HOSTNAME=arbiter40.exmaple.com
++ GATEWAY=10.28.33.250
+ config=/etc/sysconfig/garb
+ PIDFILE=/var/run/garbd
++ which garbd
+ prog=/usr/bin/garbd
+ case "$1" in
+ start
+ '[' 0 '!=' 0 ']'
+ '[' yes = no ']'
+ grep -q -E '^# REMOVE' /etc/sysconfig/garb
+ '[' -r /var/run/garbd ']'
+ '[' -x /usr/bin/garbd ']'
+ '[' -f /etc/sysconfig/garb ']'
+ . /etc/sysconfig/garb
++ GALERA_NODES='10.6.166.235:4010 10.6.166.221:4010 10.115.20.166:4010 10.115.20.167:4010'
++ GALERA_GROUP=OProdLRCluster
++ GALERA_OPTIONS='evs.keepalive_period=PT3S;evs.suspect_timeout=PT30S;evs.inactive_timeout=PT1M;evs.install_timeout=PT1M;evs.send_window=64;evs.user_send_window=32;evs.debug_log_mask=EVS_DEBUG'
++ LOG_FILE=/var/log/garbd.log
++ GALERA_PORT=4010
+ '[' -z '10.6.166.235:4010 10.6.166.221:4010 10.115.20.166:4010 10.115.20.167:4010' ']'
+ '[' -z OProdLRCluster ']'
+ GALERA_PORT=4010
+ for ADDRESS in '${GALERA_NODES}' 0
++ cut -d : -f 1
++ echo 10.6.166.235:4010
+ HOST=10.6.166.235
++ cut -d : -f 2
++ echo 10.6.166.235:4010
+ PORT=4010
+ PORT=4010
++ which nc
+ [[ -x /usr/bin/nc ]]
+ grep -q -- -z
+ nc -h
+ nc -z 10.6.166.235 4010
+ break
+ '[' 10.6.166.235:4010 == 0 ']'
+ OPTIONS='-d -a gcomm://10.6.166.235:4010'
+ '[' -n OProdLRCluster ']'
+ OPTIONS='-d -a gcomm://10.6.166.235:4010 -g OProdLRCluster'
+ '[' -n 'evs.keepalive_period=PT3S;evs.suspect_timeout=PT30S;evs.inactive_timeout=PT1M;evs.install_timeout=PT1M;evs.send_window=64;evs.user_send_window=32;evs.debug_log_mask=EVS_DEBUG' ']'
+ OPTIONS='-d -a gcomm://10.6.166.235:4010 -g OProdLRCluster -o evs.keepalive_period=PT3S;evs.suspect_timeout=PT30S;evs.inactive_timeout=PT1M;evs.install_timeout=PT1M;evs.send_window=64;evs.user_send_window=32;evs.debug_log_mask=EVS_DEBUG'
+ '[' -n /var/log/garbd.log ']'
+ OPTIONS='-d -a gcomm://10.6.166.235:4010 -g OProdLRCluster -o evs.keepalive_period=PT3S;evs.suspect_timeout=PT30S;evs.inactive_timeout=PT1M;evs.install_timeout=PT1M;evs.send_window=64;evs.user_send_window=32;evs.debug_log_mask=EVS_DEBUG -l /var/log/garbd.log'
+ program_start -d -a gcomm://10.6.166.235:4010 -g OProdLRCluster -o 'evs.keepalive_period=PT3S;evs.suspect_timeout=PT30S;evs.inactive_timeout=PT1M;evs.install_timeout=PT1M;evs.send_window=64;evs.user_send_window=32;evs.debug_log_mask=EVS_DEBUG' -l /var/log/garbd.log
+ local rcode
+ '[' -f /etc/redhat-release ']'
+ echo -n 'Starting /usr/bin/garbd: '
Starting /usr/bin/garbd: + sudo -u nobody /usr/bin/garbd -d -a gcomm://10.6.166.235:4010 -g OProdLRCluster -o 'evs.keepalive_period=PT3S;evs.suspect_timeout=PT30S;evs.inactive_timeout=PT1M;evs.install_timeout=PT1M;evs.send_window=64;evs.user_send_window=32;evs.debug_log_mask=EVS_DEBUG' -l /var/log/garbd.log
+ rcode=0
+ '[' 0 -eq 0 ']'
+ pidof /usr/bin/garbd
+ echo_failure
+ '[' color = color ']'
+ echo -en '\033[60G'
[+ '[' color = color ']'
+ echo -en '\033[0;31m'
+ echo -n FAILED
FAILED+ '[' color = color ']'
+ echo -en '\033[0;39m'
+ echo -n ']'
]+ echo -ne '\r'
+ return 1
+ echo
+ return 0
+ exit 0
[root@arbiter40 ~]# cat /var/run/garbd
[root@arbiter40 ~]#