Here is a similar case I found on Google.
I have a Galera cluster with 4 nodes and a single garbd (Galera Arbitrator). High packet loss on the garbd network alone will bring all the other nodes to the Initialized state. It is easy to reproduce. The provider options in use and the log from one of the nodes follow.
wsrep_provider_options="pc.weight=1;evs.join_retrans_period=PT2S;evs.keepalive_period=PT3S;evs.inactive_check_period=PT10S;evs.suspect_timeout=PT30S;evs.inactive_timeout=PT1M;evs.install_timeout=PT1M"
131031 15:25:07 [Warning] WSREP: evs::proto(b138644e-3a4f-11e3-a890-cbf6831de099, GATHER, view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497)) install timer expired
evs::proto(evs::proto(b138644e-3a4f-11e3-a890-cbf6831de099, GATHER, view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497)), GATHER) {
current_view=view(view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497) memb {
2853b263-3a4c-11e3-8d08-bb69a1cadba2,
4e6e7b63-3a59-11e3-83c8-4b32aeffee17,
63e5752e-3a4d-11e3-a457-76d5146fbfb5,
b138644e-3a4f-11e3-a890-cbf6831de099,
e4fb10ff-3a77-11e3-9767-863d8c1156cd,
} joined {
} left {
} partitioned {
}),
input_map=evs::input_map: {aru_seq=4216,safe_seq=4187,node_index=node: {idx=0,range=[4217,4216],safe_seq=4216} node: {idx=1,range=[4217,4216],safe_seq=4216
} node: {idx=2,range=[4217,4216],safe_seq=4216} node: {idx=3,range=[4217,4216],safe_seq=4216} node: {idx=4,range=[4217,4216],safe_seq=4187} },
fifo_seq=8055201,
last_sent=4216,
known={
2853b263-3a4c-11e3-8d08-bb69a1cadba2,evs::node{operational=1,suspected=0,installed=0,fifo_seq=8062200,join_message=
evs::msg{version=0,type=4,user_type=255,order=1,seq=4187,seq_range=-1,aru_seq=4216,flags=4,source=2853b263-3a4c-11e3-8d08-bb69a1cadba2,source_view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),range_uuid=00000000-0000-0000-0000-000000000000,range=[-1,-1],fifo_seq=8062200,node_list=( 2853b263-3a4c-11e3-8d08-bb69a1cadba2,node: {operational=1,suspected=0,leave_seq=-1,view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),safe_seq=4216,im_range=[4217,4216],}
4e6e7b63-3a59-11e3-83c8-4b32aeffee17,node: {operational=1,suspected=0,leave_seq=-1,view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),safe_seq=4216,im_range=[4217,4216],}
63e5752e-3a4d-11e3-a457-76d5146fbfb5,node: {operational=1,suspected=0,leave_seq=-1,view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),safe_seq=4216,im_range=[4217,4216],}
b138644e-3a4f-11e3-a890-cbf6831de099,node: {operational=1,suspected=0,leave_seq=-1,view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),safe_seq=4216,im_range=[4217,4216],}
e4fb10ff-3a77-11e3-9767-863d8c1156cd,node: {operational=1,suspected=0,leave_seq=-1,view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),safe_seq=4187,im_range=[4217,4216],}
)
},
}
4e6e7b63-3a59-11e3-83c8-4b32aeffee17,evs::node{operational=1,suspected=0,installed=0,fifo_seq=8011820,join_message=
evs::msg{version=0,type=4,user_type=255,order=1,seq=4187,seq_range=-1,aru_seq=4216,flags=4,source=4e6e7b63-3a59-11e3-83c8-4b32aeffee17,source_view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),range_uuid=00000000-0000-0000-0000-000000000000,range=[-1,-1],fifo_seq=8011820,node_list=( 2853b263-3a4c-11e3-8d08-bb69a1cadba2,node: {operational=1,suspected=0,leave_seq=-1,view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),safe_seq=4216,im_range=[4217,4216],}
4e6e7b63-3a59-11e3-83c8-4b32aeffee17,node: {operational=1,suspected=0,leave_seq=-1,view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),safe_seq=4216,im_range=[4217,4216],}
63e5752e-3a4d-11e3-a457-76d5146fbfb5,node: {operational=1,suspected=0,leave_seq=-1,view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),safe_seq=4216,im_range=[4217,4216],}
b138644e-3a4f-11e3-a890-cbf6831de099,node: {operational=1,suspected=0,leave_seq=-1,view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),safe_seq=4216,im_range=[4217,4216],}
e4fb10ff-3a77-11e3-9767-863d8c1156cd,node: {operational=1,suspected=0,leave_seq=-1,view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),safe_seq=4187,im_range=[4217,4216],}
)
},
}
63e5752e-3a4d-11e3-a457-76d5146fbfb5,evs::node{operational=1,suspected=0,installed=0,fifo_seq=7999212,join_message=
evs::msg{version=0,type=4,user_type=255,order=1,seq=4187,seq_range=-1,aru_seq=4216,flags=4,source=63e5752e-3a4d-11e3-a457-76d5146fbfb5,source_view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),range_uuid=00000000-0000-0000-0000-000000000000,range=[-1,-1],fifo_seq=7999212,node_list=( 2853b263-3a4c-11e3-8d08-bb69a1cadba2,node: {operational=1,suspected=0,leave_seq=-1,view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),safe_seq=4216,im_range=[4217,4216],}
4e6e7b63-3a59-11e3-83c8-4b32aeffee17,node: {operational=1,suspected=0,leave_seq=-1,view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),safe_seq=4216,im_range=[4217,4216],}
63e5752e-3a4d-11e3-a457-76d5146fbfb5,node: {operational=1,suspected=0,leave_seq=-1,view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),safe_seq=4216,im_range=[4217,4216],}
b138644e-3a4f-11e3-a890-cbf6831de099,node: {operational=1,suspected=0,leave_seq=-1,view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),safe_seq=4216,im_range=[4217,4216],}
e4fb10ff-3a77-11e3-9767-863d8c1156cd,node: {operational=1,suspected=0,leave_seq=-1,view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),safe_seq=4187,im_range=[4217,4216],}
)
},
}
b138644e-3a4f-11e3-a890-cbf6831de099,evs::node{operational=1,suspected=0,installed=0,fifo_seq=-1,join_message=
evs::msg{version=0,type=4,user_type=255,order=1,seq=4187,seq_range=-1,aru_seq=4216,flags=0,source=b138644e-3a4f-11e3-a890-cbf6831de099,source_view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),range_uuid=00000000-0000-0000-0000-000000000000,range=[-1,-1],fifo_seq=8055201,node_list=( 2853b263-3a4c-11e3-8d08-bb69a1cadba2,node: {operational=1,suspected=0,leave_seq=-1,view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),safe_seq=4216,im_range=[4217,4216],}
4e6e7b63-3a59-11e3-83c8-4b32aeffee17,node: {operational=1,suspected=0,leave_seq=-1,view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),safe_seq=4216,im_range=[4217,4216],}
63e5752e-3a4d-11e3-a457-76d5146fbfb5,node: {operational=1,suspected=0,leave_seq=-1,view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),safe_seq=4216,im_range=[4217,4216],}
b138644e-3a4f-11e3-a890-cbf6831de099,node: {operational=1,suspected=0,leave_seq=-1,view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),safe_seq=4216,im_range=[4217,4216],}
e4fb10ff-3a77-11e3-9767-863d8c1156cd,node: {operational=1,suspected=0,leave_seq=-1,view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),safe_seq=4187,im_range=[4217,4216],}
)
},
}
e4fb10ff-3a77-11e3-9767-863d8c1156cd,evs::node{operational=1,suspected=0,installed=0,fifo_seq=7929206,join_message=
evs::msg{version=0,type=4,user_type=255,order=1,seq=4187,seq_range=-1,aru_seq=4187,flags=4,source=e4fb10ff-3a77-11e3-9767-863d8c1156cd,source_view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),range_uuid=00000000-0000-0000-0000-000000000000,range=[-1,-1],fifo_seq=7929206,node_list=( 2853b263-3a4c-11e3-8d08-bb69a1cadba2,node: {operational=1,suspected=0,leave_seq=-1,view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),safe_seq=4190,im_range=[4217,4216],}
4e6e7b63-3a59-11e3-83c8-4b32aeffee17,node: {operational=1,suspected=1,leave_seq=-1,view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),safe_seq=4190,im_range=[4191,4190],}
63e5752e-3a4d-11e3-a457-76d5146fbfb5,node: {operational=1,suspected=0,leave_seq=-1,view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),safe_seq=4190,im_range=[4188,4216],}
b138644e-3a4f-11e3-a890-cbf6831de099,node: {operational=1,suspected=0,leave_seq=-1,view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),safe_seq=4190,im_range=[4217,4216],}
e4fb10ff-3a77-11e3-9767-863d8c1156cd,node: {operational=1,suspected=0,leave_seq=-1,view_id=view_id(REG,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497),safe_seq=4187,im_range=[4217,4216],}
)
},
}
}
}
131031 15:25:07 [Note] WSREP: no install message received
131031 15:25:07 [Note] WSREP: view(view_id(NON_PRIM,2853b263-3a4c-11e3-8d08-bb69a1cadba2,497) memb {
b138644e-3a4f-11e3-a890-cbf6831de099,
} joined {
} left {
} partitioned {
2853b263-3a4c-11e3-8d08-bb69a1cadba2,
4e6e7b63-3a59-11e3-83c8-4b32aeffee17,
63e5752e-3a4d-11e3-a457-76d5146fbfb5,
e4fb10ff-3a77-11e3-9767-863d8c1156cd,
})
131031 15:25:07 [Note] WSREP: New COMPONENT: primary = no, bootstrap = no, my_idx = 0, memb_num = 1
131031 15:25:07 [Note] WSREP: Flow-control interval: [16, 16]
131031 15:25:07 [Note] WSREP: Received NON-PRIMARY.
131031 15:25:07 [Note] WSREP: Shifting SYNCED -> OPEN (TO: 2021088)
131031 15:25:07 [Note] WSREP: New cluster view: global state: 1ddd4eed-ee2e-11e2-0800-45d2899001c9:2021088, view# -1: non-Primary, number of nodes: 1, my index: 0, protocol version 2
131031 15:25:07 [Note] WSREP: wsrep_notify_cmd is not defined, skipping notification.
131031 15:25:07 [Note] WSREP: view(view_id(NON_PRIM,b138644e-3a4f-11e3-a890-cbf6831de099,498) memb {
b138644e-3a4f-11e3-a890-cbf6831de099,
} joined {
} left {
} partitioned {
2853b263-3a4c-11e3-8d08-bb69a1cadba2,
4e6e7b63-3a59-11e3-83c8-4b32aeffee17,
63e5752e-3a4d-11e3-a457-76d5146fbfb5,
e4fb10ff-3a77-11e3-9767-863d8c1156cd,
})
131031 15:25:07 [Note] WSREP: New COMPONENT: primary = no, bootstrap = no, my_idx = 0, memb_num = 1
131031 15:25:07 [Note] WSREP: Flow-control interval: [16, 16]
131031 15:25:07 [Note] WSREP: Received NON-PRIMARY.
131031 15:25:07 [Note] WSREP: New cluster view: global state: 1ddd4eed-ee2e-11e2-0800-45d2899001c9:2021088, view# -1: non-Primary, number of nodes: 1, my index: 0, protocol version 2
131031 15:25:07 [Note] WSREP: wsrep_notify_cmd is not defined, skipping notification.
131031 15:25:07 [Note] WSREP: declaring 2853b263-3a4c-11e3-8d08-bb69a1cadba2 stable
131031 15:25:07 [Note] WSREP: view(view_id(NON_PRIM,2853b263-3a4c-11e3-8d08-bb69a1cadba2,499) memb {
2853b263-3a4c-11e3-8d08-bb69a1cadba2,
b138644e-3a4f-11e3-a890-cbf6831de099,
} joined {
} left {
} partitioned {
4e6e7b63-3a59-11e3-83c8-4b32aeffee17,
63e5752e-3a4d-11e3-a457-76d5146fbfb5,
e4fb10ff-3a77-11e3-9767-863d8c1156cd,
})
131031 15:25:07 [Note] WSREP: New COMPONENT: primary = no, bootstrap = no, my_idx = 1, memb_num = 2
131031 15:25:07 [Note] WSREP: Flow-control interval: [23, 23]
131031 15:25:07 [Note] WSREP: Received NON-PRIMARY.
131031 15:25:07 [Note] WSREP: New cluster view: global state: 1ddd4eed-ee2e-11e2-0800-45d2899001c9:2021088, view# -1: non-Primary, number of nodes: 2, my index: 1, protocol version 2
131031 15:25:07 [Note] WSREP: wsrep_notify_cmd is not defined, skipping notification.
131031 15:25:07 [Note] WSREP: declaring 2853b263-3a4c-11e3-8d08-bb69a1cadba2 stable
131031 15:25:07 [Note] WSREP: declaring 63e5752e-3a4d-11e3-a457-76d5146fbfb5 stable
131031 15:25:07 [Note] WSREP: view(view_id(NON_PRIM,2853b263-3a4c-11e3-8d08-bb69a1cadba2,500) memb {
2853b263-3a4c-11e3-8d08-bb69a1cadba2,
63e5752e-3a4d-11e3-a457-76d5146fbfb5,
b138644e-3a4f-11e3-a890-cbf6831de099,
} joined {
} left {
} partitioned {
4e6e7b63-3a59-11e3-83c8-4b32aeffee17,
e4fb10ff-3a77-11e3-9767-863d8c1156cd,
})
131031 15:25:07 [Note] WSREP: New COMPONENT: primary = no, bootstrap = no, my_idx = 2, memb_num = 3
131031 15:25:07 [Note] WSREP: Flow-control interval: [28, 28]
131031 15:25:07 [Note] WSREP: Received NON-PRIMARY.
131031 15:25:07 [Note] WSREP: New cluster view: global state: 1ddd4eed-ee2e-11e2-0800-45d2899001c9:2021088, view# -1: non-Primary, number of nodes: 3, my index: 2, protocol version 2
131031 15:25:07 [Note] WSREP: wsrep_notify_cmd is not defined, skipping notification.
Thanks in advance.