DRBD: ensure peers are UpToDate for dual-primary
author    Apollon Oikonomopoulos <apoikos@gmail.com>
          Tue, 5 Nov 2013 14:30:45 +0000 (16:30 +0200)
committer Michele Tartara <mtartara@google.com>
          Wed, 6 Nov 2013 10:25:21 +0000 (10:25 +0000)
DrbdAttachNet supports both normal primary/secondary node operation and
(during live migration) dual-primary operation. When resources are newly
attached, we poll until we find all of them in a connected or syncing state.
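
For reference, the condition being polled on amounts to the following
(a condensed sketch; the actual retry/timeout handling in lib/backend.py is
elided and the helper name is made up):

  import time

  def _WaitForConnection(bdevs):  # hypothetical helper name
    """Poll until every resource is either connected or syncing."""
    while True:
      all_connected = True
      for rd in bdevs:
        stats = rd.GetProcStatus()
        all_connected = (all_connected and
                         (stats.is_connected or stats.is_in_resync))
      if all_connected:
        return
      time.sleep(1)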

Although lenient, this check is enough for primary/secondary operation,
because the primary/secondary roles are not changed from within DrbdAttachNet.
In the dual-primary ("multimaster") case, however, both peers are subsequently
promoted to the primary role. If, for unspecified reasons, the disks are not
both UpToDate at that point, a resync may be triggered after both peers have
switched to primary, causing the resource to disconnect:

  kernel: [1465514.164009] block drbd2: I shall become SyncTarget, but I am
    primary!
  kernel: [1465514.171562] block drbd2: ASSERT( os.conn == C_WF_REPORT_PARAMS )
    in /build/linux-rrsxby/linux-3.2.51/drivers/block/drbd/drbd_receiver.c:3245

This seems to be extremely racy and is possibly triggered by underlying
network issues (e.g. high latency), but it has been observed in the wild. By
logging the DRBD resource state on the old secondary, we managed to catch a
resource being promoted to primary while it was in the following state:

  WFSyncUUID Secondary/Primary Outdated/UpToDate
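
A minimal sketch of how such a state triple can be sampled from /proc/drbd
(illustrative only; this is not Ganeti's DRBD8Status parser):

  import re

  _STATE_RE = re.compile(r"cs:(\S+)\s+ro:(\S+)\s+ds:(\S+)")

  def SampleDrbdState(minor):
    """Return (cstate, roles, disk_states) for a DRBD minor, or None."""
    with open("/proc/drbd") as fd:
      for line in fd:
        if line.strip().startswith("%d:" % minor):
          m = _STATE_RE.search(line)
          if m:
            # e.g. ("WFSyncUUID", "Secondary/Primary", "Outdated/UpToDate")
            return m.groups()
    return None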

We fix this by explicitly waiting for a "Connected" cstate and
"UpToDate/UpToDate" disks, as advised in [1]:

  "For this purpose and scenario,
   you only want to promote once you are Connected UpToDate/UpToDate."

[1] http://lists.linbit.com/pipermail/drbd-user/2013-July/020173.html
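
Condensed, the new pre-promotion check amounts to the following (the helper
name is made up; the real logic lives in the DrbdAttachNet hunk below):

  def _SafeToPromoteBoth(bdevs):
    """Only promote both peers once every resource is fully synced."""
    for rd in bdevs:
      stats = rd.GetProcStatus()
      # Connected *and* UpToDate on both sides; merely being in resync
      # is not enough, as one disk may still be Outdated.
      if not (stats.is_connected and
              stats.is_disk_uptodate and
              stats.peer_disk_uptodate):
        return False
    return True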

Signed-off-by: Apollon Oikonomopoulos <apoikos@gmail.com>
Signed-off-by: Michele Tartara <mtartara@google.com>
Reviewed-by: Michele Tartara <mtartara@google.com>
Reviewed-by: Klaus Aehlig <aehlig@google.com>

diff --git a/lib/backend.py b/lib/backend.py
index a75432b..9e12639 100644
--- a/lib/backend.py
+++ b/lib/backend.py
@@ -3622,8 +3622,20 @@ def DrbdAttachNet(nodes_ip, disks, instance_name, multimaster):
     for rd in bdevs:
       stats = rd.GetProcStatus()
 
-      all_connected = (all_connected and
-                       (stats.is_connected or stats.is_in_resync))
+      if multimaster:
+        # In the multimaster case we have to wait explicitly until
+        # the resource is Connected and UpToDate/UpToDate, because
+        # we promote *both nodes* to primary directly afterwards.
+        # Being in resync is not enough, since there is a race during which we
+        # may promote a node with an Outdated disk to primary, effectively
+        # tearing down the connection.
+        all_connected = (all_connected and
+                         stats.is_connected and
+                         stats.is_disk_uptodate and
+                         stats.peer_disk_uptodate)
+      else:
+        all_connected = (all_connected and
+                         (stats.is_connected or stats.is_in_resync))
 
       if stats.is_standalone:
         # peer had different config info and this node became
diff --git a/lib/bdev.py b/lib/bdev.py
index 7623869..7226f1f 100644
--- a/lib/bdev.py
+++ b/lib/bdev.py
@@ -1050,7 +1050,7 @@ class LogicalVolume(BlockDev):
     _ThrowError("Can't grow LV %s: %s", self.dev_path, result.output)
 
 
-class DRBD8Status(object):
+class DRBD8Status(object): # pylint: disable=R0902
   """A DRBD status representation class.
 
   Note that this doesn't support unconfigured devices (cs:Unconfigured).
@@ -1135,6 +1135,7 @@ class DRBD8Status(object):
 
     self.is_diskless = self.ldisk == self.DS_DISKLESS
     self.is_disk_uptodate = self.ldisk == self.DS_UPTODATE
+    self.peer_disk_uptodate = self.rdisk == self.DS_UPTODATE
 
     self.is_in_resync = self.cstatus in self.CSET_SYNC
     self.is_in_use = self.cstatus != self.CS_UNCONFIGURED
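
For context, the ds: field in /proc/drbd reads "local/peer", so the new
peer_disk_uptodate flag is simply the UpToDate test applied to the right-hand
side. A standalone illustration (not the actual DRBD8Status parsing code):

  DS_UPTODATE = "UpToDate"

  def SplitDiskStates(ds_field):
    """Split a ds: value like "Outdated/UpToDate" into (local, peer)."""
    local, peer = ds_field.split("/")
    return local, peer

  ldisk, rdisk = SplitDiskStates("Outdated/UpToDate")
  is_disk_uptodate = (ldisk == DS_UPTODATE)    # False: local disk Outdated
  peer_disk_uptodate = (rdisk == DS_UPTODATE)  # True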