[ClusterLabs] drbd9 3 node "neverending" sync?

Mevo Govo govomevo at gmail.com
Mon Oct 8 05:20:25 EDT 2018


Hi,

We are testing DRBD 9 with 3 nodes. After a test (network disabled, then
re-enabled, on one host), the synchronization never finishes.
As a recovery, I switched Pacemaker off, and I tried "primary --force"
on one node and "--discard-my-data" on the other nodes. That seemed to solve
the problem (everything was UpToDate), but after I down/up the resource, the
"neverending" synchronization starts again (while the resource is Secondary
on all 3 nodes).
Why is the sync restarted after the UpToDate state was reached? How can I solve this problem?
The nodes are xetest1, xetest2 and xetest3. Here is a check loop (wait 10
seconds, then run "drbdadm status" on every node; this is repeated 10 times):

Thanks for answers: Laci.


# Poll the DRBD state of every cluster node ten times in a row.
# Each round waits 10 seconds, prints a timestamp, and then runs
# "drbdadm status" over ssh on xetest1, xetest2 and xetest3 in that order.
for round in {1..10}; do
  printf '%s\n' "################## check $round ##################"
  sleep 10
  date
  for node in xetest1 xetest2 xetest3; do
    printf '%s\n' "################## on node $node"
    ssh "$node" sudo drbdadm status
  done
done

################## check 1 ##################



Mon Oct  8 09:11:12 GMT 2018
################## on node xetest1
r0 role:Secondary
  disk:UpToDate
  xetest2 role:Secondary
    peer-disk:UpToDate
  xetest3 role:Secondary
    peer-disk:UpToDate

################## on node xetest2
r0 role:Secondary
  disk:UpToDate
  xetest1 role:Secondary
    peer-disk:UpToDate
  xetest3 role:Secondary
    peer-disk:Inconsistent resync-suspended:peer

################## on node xetest3
r0 role:Secondary
  disk:Outdated blocked:upper
  xetest1 role:Secondary
    replication:WFBitMapT peer-disk:UpToDate
  xetest2 role:Secondary
    peer-disk:UpToDate

################## check 2 ##################
Mon Oct  8 09:11:23 GMT 2018
################## on node xetest1
r0 role:Secondary
  disk:UpToDate
  xetest2 role:Secondary
    peer-disk:UpToDate
  xetest3 role:Secondary
    peer-disk:Inconsistent resync-suspended:peer

################## on node xetest2
r0 role:Secondary
  disk:UpToDate
  xetest1 role:Secondary
    peer-disk:UpToDate
  xetest3 role:Secondary
    replication:SyncSource peer-disk:Inconsistent

################## on node xetest3
r0 role:Secondary
  disk:Outdated blocked:upper
  xetest1 role:Secondary
    peer-disk:UpToDate
  xetest2 role:Secondary
    replication:WFBitMapT peer-disk:UpToDate

################## check 3 ##################
Mon Oct  8 09:11:35 GMT 2018
################## on node xetest1
r0 role:Secondary
  disk:UpToDate
  xetest2 role:Secondary
    peer-disk:UpToDate
  xetest3 role:Secondary
    replication:SyncSource peer-disk:Inconsistent

################## on node xetest2
r0 role:Secondary
  disk:UpToDate
  xetest1 role:Secondary
    peer-disk:UpToDate
  xetest3 role:Secondary
    replication:SyncSource peer-disk:Inconsistent

################## on node xetest3
r0 role:Secondary
  disk:UpToDate
  xetest1 role:Secondary
    peer-disk:UpToDate
  xetest2 role:Secondary
    peer-disk:UpToDate

################## check 4 ##################
Mon Oct  8 09:11:46 GMT 2018
################## on node xetest1
r0 role:Secondary
  disk:UpToDate
  xetest2 role:Secondary
    peer-disk:UpToDate
  xetest3 role:Secondary
    replication:WFBitMapS peer-disk:Outdated

################## on node xetest2
r0 role:Secondary
  disk:UpToDate
  xetest1 role:Secondary
    peer-disk:UpToDate
  xetest3 role:Secondary
    replication:SyncSource peer-disk:Inconsistent

################## on node xetest3
r0 role:Secondary
  disk:Inconsistent
  xetest1 role:Secondary
    replication:SyncTarget peer-disk:UpToDate
  xetest2 role:Secondary
    peer-disk:UpToDate

################## check 5 ##################
Mon Oct  8 09:11:58 GMT 2018
################## on node xetest1
r0 role:Secondary
  disk:UpToDate
  xetest2 role:Secondary
    peer-disk:UpToDate
  xetest3 role:Secondary
    peer-disk:Outdated

################## on node xetest2
r0 role:Secondary
  disk:UpToDate
  xetest1 role:Secondary
    peer-disk:UpToDate
  xetest3 role:Secondary
    replication:SyncSource peer-disk:Inconsistent

################## on node xetest3
r0 role:Secondary
  disk:Outdated blocked:upper
  xetest1 role:Secondary
    replication:WFBitMapT peer-disk:UpToDate
  xetest2 role:Secondary
    peer-disk:UpToDate

################## check 6 ##################
Mon Oct  8 09:12:09 GMT 2018
################## on node xetest1
r0 role:Secondary
  disk:UpToDate
  xetest2 role:Secondary
    peer-disk:UpToDate
  xetest3 role:Secondary
    peer-disk:UpToDate

################## on node xetest2
r0 role:Secondary
  disk:UpToDate
  xetest1 role:Secondary
    peer-disk:UpToDate
  xetest3 role:Secondary
    peer-disk:Inconsistent resync-suspended:peer

################## on node xetest3
r0 role:Secondary
  disk:Inconsistent
  xetest1 role:Secondary
    replication:SyncTarget peer-disk:UpToDate
  xetest2 role:Secondary
    peer-disk:UpToDate

################## check 7 ##################
Mon Oct  8 09:12:21 GMT 2018
################## on node xetest1
r0 role:Secondary
  disk:UpToDate
  xetest2 role:Secondary
    peer-disk:UpToDate
  xetest3 role:Secondary
    peer-disk:UpToDate

################## on node xetest2
r0 role:Secondary
  disk:UpToDate
  xetest1 role:Secondary
    peer-disk:UpToDate
  xetest3 role:Secondary
    replication:SyncSource peer-disk:Inconsistent

################## on node xetest3
r0 role:Secondary
  disk:Outdated blocked:upper
  xetest1 role:Secondary
    peer-disk:UpToDate
  xetest2 role:Secondary
    replication:WFBitMapT peer-disk:UpToDate

################## check 8 ##################
Mon Oct  8 09:12:32 GMT 2018
################## on node xetest1
r0 role:Secondary
  disk:UpToDate
  xetest2 role:Secondary
    peer-disk:UpToDate
  xetest3 role:Secondary
    peer-disk:Outdated

################## on node xetest2
r0 role:Secondary
  disk:UpToDate
  xetest1 role:Secondary
    peer-disk:UpToDate
  xetest3 role:Secondary
    replication:SyncSource peer-disk:Inconsistent

################## on node xetest3
r0 role:Secondary
  disk:Inconsistent
  xetest1 role:Secondary
    replication:SyncTarget peer-disk:UpToDate
  xetest2 role:Secondary
    peer-disk:UpToDate

################## check 9 ##################
Mon Oct  8 09:12:44 GMT 2018
################## on node xetest1
r0 role:Secondary
  disk:UpToDate
  xetest2 role:Secondary
    peer-disk:UpToDate
  xetest3 role:Secondary
    peer-disk:Outdated

################## on node xetest2
r0 role:Secondary
  disk:UpToDate
  xetest1 role:Secondary
    peer-disk:UpToDate
  xetest3 role:Secondary
    replication:SyncSource peer-disk:Inconsistent

################## on node xetest3
r0 role:Secondary
  disk:Outdated blocked:upper
  xetest1 role:Secondary
    replication:WFBitMapT peer-disk:UpToDate
  xetest2 role:Secondary
    peer-disk:UpToDate

################## check 10 ##################
Mon Oct  8 09:12:55 GMT 2018
################## on node xetest1
r0 role:Secondary
  disk:UpToDate
  xetest2 role:Secondary
    peer-disk:UpToDate
  xetest3 role:Secondary
    peer-disk:UpToDate

################## on node xetest2
r0 role:Secondary
  disk:UpToDate
  xetest1 role:Secondary
    peer-disk:UpToDate
  xetest3 role:Secondary
    replication:SyncSource peer-disk:Inconsistent

################## on node xetest3
r0 role:Secondary
  disk:Outdated blocked:upper
  xetest1 role:Secondary
    replication:WFBitMapT peer-disk:UpToDate
  xetest2 role:Secondary
    peer-disk:UpToDate

[oracle at xetest1 ~]$






####### our config file is:
[oracle at xetest1 ~]$ cat /etc/drbd.conf
include "drbd.d/global_common.conf";

# Resource r0: device /dev/drbd0, backed on each of the three hosts
# (xetest1, xetest2, xetest3) by /dev/sdb1 with internal metadata.
resource r0 {
 protocol C;
 meta-disk internal;
 device /dev/drbd0;
 # Promotion is manual (auto-promote no). Quorum is set to "majority" and
 # the configured reaction to losing quorum is "io-error".
 options {
   auto-promote no;
   quorum majority;
   on-no-quorum io-error;
#   quorum-minimum-redundancy 2;
 }
 # NOTE(review): "syncer" is the section name from the older DRBD 8.3
 # configuration syntax; in 8.4+/9 syntax verify-alg is normally placed in
 # the "net" section. Confirm that the installed drbdadm accepts and applies
 # this section as intended.
 syncer {
  verify-alg sha1;
 }
 # Split-brain policies: with zero primaries use discard-zero-changes;
 # with one or two primaries, disconnect.
 net {
  ping-int 5;
  after-sb-0pri discard-zero-changes;
  after-sb-1pri disconnect;
  after-sb-2pri disconnect;
 }
 # Per-host sections. All hosts use port 7790 and the same backing disk name.
 # NOTE(review): the three addresses are 10.0.1.2, 10.0.2.2 and 10.0.0.2,
 # which look like three different subnets. Presumably these are routed to
 # each other; verify that every pair of nodes can reach each other directly.
 on xetest1 {
  disk   /dev/sdb1;
  address  10.0.1.2:7790;
  node-id  1;
 }
 on xetest2 {
  disk   /dev/sdb1;
  address  10.0.2.2:7790;
  node-id  2;
 }
 on xetest3 {
  disk   /dev/sdb1;
  address  10.0.0.2:7790;
  node-id  3;
 }
 # Connection mesh listing all three hosts.
 connection-mesh {
        hosts     xetest1 xetest2 xetest3;
 }
}
[oracle at xetest1 ~]$
-------------- next part --------------
An HTML attachment was scrubbed...
URL: <https://lists.clusterlabs.org/pipermail/users/attachments/20181008/b7d35ec9/attachment.html>


More information about the Users mailing list