Controller=10.80.0.4
Node=10.80.0.5
HABind=10.10.10.1
HAPeer=10.10.10.2
Fence=/usr/sbin/fence_idrac -a 192.168.100.2 -l root -p vsphereroot -o reboot
Node Type: Controller
Controller: 10.80.0.4
HA Peer: 10.10.10.2
HA Bind: 10.10.10.1
Node Status: Controller Inited
Node Role: Master
Sync Status: Sync Done
Nodes: 10.80.0.5
Controller=10.80.0.4
Node=10.80.0.5
Type=Master
HABind=10.10.10.2
HAPeer=10.10.10.1
Fence=/usr/sbin/fence_idrac -a 192.168.100.1 -l root -p vsphereroot -o reboot
Node Type: Client
Controller: 10.80.0.4
Node: 10.80.0.5
HA Peer: 10.10.10.1
HA Bind: 10.10.10.2
Node Status: Master Inited
Node Role: Standby
Sync Status: Sync Done
[root@fileserver1 ~]# /quadstor/bin/vdconfig -l
Name Pool Serial Number Size(GB) LUN Status
infra-backups Default 6e340bdadcca0d25d25e0e01ed15d0af 10000 2 D C E
cln0 Default 6e38124216698641e6271b4942579d8e 5000 1 D C
cln1 Default 6edc37e2b5294e1e0092067f5a418e74 5000 3 D C
cln2 Default 6e31c9affed295dbfe8c522394571c46 5000 4 D C
shared Default 6eb1656d67181df7f8def6627d206962 10000 5 D C
/dev/sdj on /mnt/shared type ocfs2 (rw,_netdev,noatime,data=writeback,commit=30,heartbeat=local)
/dev/sdk on /mnt/cln0 type ocfs2 (rw,_netdev,noatime,data=writeback,commit=30,heartbeat=local)
/dev/sdl on /mnt/cln1 type ocfs2 (rw,_netdev,noatime,data=writeback,commit=30,heartbeat=local)
/dev/sdm on /mnt/cln2 type ocfs2 (rw,_netdev,noatime,data=writeback,commit=30,heartbeat=local)
/dev/sdm on /mnt/shared type ocfs2 (rw,_netdev,noatime,data=writeback,commit=30,heartbeat=local)
/dev/sdj on /mnt/cln0 type ocfs2 (rw,_netdev,noatime,data=writeback,commit=30,heartbeat=local)
/dev/sdk on /mnt/cln1 type ocfs2 (rw,_netdev,noatime,data=writeback,commit=30,heartbeat=local)
/dev/sdl on /mnt/cln2 type ocfs2 (rw,_netdev,noatime,data=writeback,commit=30,heartbeat=local)
node:
ip_port=7777
ip_address=10.10.10.1
number=0
name=fileserver1
cluster=ocfs2
node:
ip_port=7777
ip_address=10.10.10.2
number=1
name=fileserver2
cluster=ocfs2
cluster:
node_count=2
name=ocfs2
[root@fileserver1 ~]# /usr/sbin/fence_idrac -a 192.168.100.2 -l root -p vsphereroot -o reboot
Rebooting machine @ IPMI:192.168.100.2...Done
[root@fileserver1 ~]#
Aug 30 15:15:30 fileserver2 kernel: WARN: node_msg_wait:48 msg timedout ticks 2956155 msg timestamp 2932155 cmd 10 msg_id 7521 xchg id 0 timo 24000
Aug 30 15:15:30 fileserver2 kernel: WARN: node_msg_wait:48 msg timedout ticks 2956160 msg timestamp 2932160 cmd 10 msg_id 7522 xchg id 0 timo 24000
Aug 30 15:15:30 fileserver2 kernel: WARN: node_msg_wait:48 msg timedout ticks 2956164 msg timestamp 2932164 cmd 10 msg_id 7523 xchg id 0 timo 24000
Aug 30 15:15:30 fileserver2 kernel: WARN: node_msg_wait:48 msg timedout ticks 2956168 msg timestamp 2932168 cmd 10 msg_id 7524 xchg id 0 timo 24000
Aug 30 15:15:35 fileserver2 kernel: o2net: Connection to node fileserver1 (num 0) at 10.10.10.1:7777 has been idle for 30.60 secs, shutting it down.
Aug 30 15:15:35 fileserver2 kernel: o2net: No longer connected to node fileserver1 (num 0) at 10.10.10.1:7777
Aug 30 15:15:35 fileserver2 kernel: (kworker/u:3,243,0):dlm_do_master_request:1332 ERROR: link to 0 went down!
Aug 30 15:15:35 fileserver2 kernel: (kworker/u:3,243,0):dlm_get_lock_resource:917 ERROR: status = -112
Aug 30 15:15:36 fileserver2 kernel: bnx2 0000:03:00.0: eth2: NIC Copper Link is Down
Aug 30 15:15:38 fileserver2 kernel: bnx2 0000:03:00.0: eth2: NIC Copper Link is Up, 1000 Mbps full duplex, receive & transmit flow control ON
Aug 30 15:15:40 fileserver2 smbd[10901]: [2014/08/30 15:15:40.797359, 0] lib/ctdbd_conn.c:624(ctdb_handle_message)
Aug 30 15:15:40 fileserver2 smbd[10901]: Got cluster reconfigure message
Aug 30 15:15:41 fileserver2 ntpd[4292]: Listen normally on 13 eth0 10.80.0.7 UDP 123
Aug 30 15:15:41 fileserver2 ntpd[4292]: peers refreshed
Aug 30 15:15:45 fileserver2 kernel: o2net: Connection to node fileserver1 (num 0) at 10.10.10.1:7777 shutdown, state 7
Aug 30 15:15:48 fileserver2 kernel: o2net: Connection to node fileserver1 (num 0) at 10.10.10.1:7777 shutdown, state 7
Aug 30 15:15:51 fileserver2 kernel: o2net: Connection to node fileserver1 (num 0) at 10.10.10.1:7777 shutdown, state 7
Aug 30 15:15:54 fileserver2 kernel: o2net: Connection to node fileserver1 (num 0) at 10.10.10.1:7777 shutdown, state 7
Aug 30 15:15:57 fileserver2 kernel: o2net: Connection to node fileserver1 (num 0) at 10.10.10.1:7777 shutdown, state 7
Aug 30 15:16:00 fileserver2 kernel: o2net: Connection to node fileserver1 (num 0) at 10.10.10.1:7777 shutdown, state 7
Aug 30 15:16:03 fileserver2 kernel: o2net: Connection to node fileserver1 (num 0) at 10.10.10.1:7777 shutdown, state 7
Aug 30 15:16:05 fileserver2 kernel: o2net: No connection established with node 0 after 30.0 seconds, giving up.
Aug 30 15:16:06 fileserver2 kernel: o2net: Connection to node fileserver1 (num 0) at 10.10.10.1:7777 shutdown, state 7
Aug 30 15:16:10 fileserver2 kernel: o2net: Connection to node fileserver1 (num 0) at 10.10.10.1:7777 shutdown, state 7
Aug 30 15:16:13 fileserver2 kernel: o2net: Connection to node fileserver1 (num 0) at 10.10.10.1:7777 shutdown, state 7
Aug 30 15:16:16 fileserver2 kernel: o2net: Connection to node fileserver1 (num 0) at 10.10.10.1:7777 shutdown, state 7
Aug 30 15:16:19 fileserver2 kernel: o2net: Connection to node fileserver1 (num 0) at 10.10.10.1:7777 shutdown, state 7
Aug 30 15:16:22 fileserver2 kernel: o2net: Connection to node fileserver1 (num 0) at 10.10.10.1:7777 shutdown, state 7
Aug 30 15:16:25 fileserver2 kernel: o2net: Connection to node fileserver1 (num 0) at 10.10.10.1:7777 shutdown, state 7
Aug 30 15:16:28 fileserver2 kernel: o2net: Connection to node fileserver1 (num 0) at 10.10.10.1:7777 shutdown, state 7
Aug 30 15:16:31 fileserver2 kernel: o2net: Connection to node fileserver1 (num 0) at 10.10.10.1:7777 shutdown, state 7
Aug 30 15:16:34 fileserver2 kernel: o2net: Connection to node fileserver1 (num 0) at 10.10.10.1:7777 shutdown, state 7
Aug 30 15:16:35 fileserver2 kernel: o2net: No connection established with node 0 after 30.0 seconds, giving up.
Aug 30 15:16:37 fileserver2 kernel: o2net: Connection to node fileserver1 (num 0) at 10.10.10.1:7777 shutdown, state 7
Aug 30 15:16:41 fileserver2 kernel: o2net: Connection to node fileserver1 (num 0) at 10.10.10.1:7777 shutdown, state 7
Aug 30 15:16:44 fileserver2 kernel: o2net: Connection to node fileserver1 (num 0) at 10.10.10.1:7777 shutdown, state 7
Aug 30 15:16:47 fileserver2 kernel: o2net: Connection to node fileserver1 (num 0) at 10.10.10.1:7777 shutdown, state 7
Aug 30 15:16:50 fileserver2 kernel: o2net: Connection to node fileserver1 (num 0) at 10.10.10.1:7777 shutdown, state 7
Aug 30 15:16:53 fileserver2 kernel: o2net: Connection to node fileserver1 (num 0) at 10.10.10.1:7777 shutdown, state 7
Aug 30 15:16:54 fileserver2 kernel: WARN: node_msg_wait:48 msg timedout ticks 3040155 msg timestamp 3016155 cmd 10 msg_id 7525 xchg id 0 timo 24000
Aug 30 15:16:54 fileserver2 kernel: WARN: node_msg_wait:48 msg timedout ticks 3040160 msg timestamp 3016160 cmd 10 msg_id 7526 xchg id 0 timo 24000
Aug 30 15:16:54 fileserver2 kernel: WARN: node_msg_wait:48 msg timedout ticks 3040164 msg timestamp 3016164 cmd 10 msg_id 7527 xchg id 0 timo 24000
Aug 30 15:16:54 fileserver2 kernel: WARN: node_msg_wait:48 msg timedout ticks 3040168 msg timestamp 3016168 cmd 10 msg_id 7528 xchg id 0 timo 24000
Aug 30 15:16:56 fileserver2 kernel: o2net: Connection to node fileserver1 (num 0) at 10.10.10.1:7777 shutdown, state 7
Aug 30 15:16:59 fileserver2 kernel: o2net: Connection to node fileserver1 (num 0) at 10.10.10.1:7777 shutdown, state 7
# machine reboots here, boot-up logs start 6 minutes later
[root@fileserver2 ~]# /quadstor/bin/ndconfig
Node Type: Client
Controller: 10.80.0.4
Node: 10.80.0.5
HA Peer: 10.10.10.1
HA Bind: 10.10.10.2
Node Status: Master Inited
Node Role: Standby
Sync Status: Sync Error