backend.DemoteFromMC: don't fail for missing files

[ganeti-local] / lib / backend.py
diff --git a/lib/backend.py b/lib/backend.py

index 9ebab3b..bca3512 100644 (file)
--- a/lib/backend.py
+++ b/lib/backend.py
@@ -437,9 +437,9 @@ def VerifyNode(what, cluster_name):
    if constants.NV_DRBDLIST in what:
      try:
        used_minors = bdev.DRBD8.GetUsedDevs().keys()
-    except errors.BlockDeviceError:
+    except errors.BlockDeviceError, err:
        logging.warning("Can't get used minors list", exc_info=True)
-      used_minors = []
+      used_minors = str(err)
      result[constants.NV_DRBDLIST] = used_minors
  
    return result
@@ -575,7 +575,6 @@ def GetInstanceList(hypervisor_list):
        results.extend(names)
      except errors.HypervisorError, err:
        logging.exception("Error enumerating instances for hypevisor %s", hname)
-      # FIXME: should we somehow not propagate this to the master?
        raise
  
    return results
@@ -661,9 +660,14 @@ def GetAllInstancesInfo(hypervisor_list):
            'state': state,
            'time': times,
            }
-        if name in output and output[name] != value:
-          raise errors.HypervisorError("Instance %s running duplicate"
-                                       " with different parameters" % name)
+        if name in output:
+          # we only check static parameters, like memory and vcpus,
+          # and not state and time which can change between the
+          # invocations of the different hypervisors
+          for key in 'memory', 'vcpus':
+            if value[key] != output[name][key]:
+              raise errors.HypervisorError("Instance %s is running twice"
+                                           " with different parameters" % name)
          output[name] = value
  
    return output
@@ -857,7 +861,7 @@ def _GatherAndLinkBlockDevs(instance):
    return block_devices
  
  
-def StartInstance(instance, extra_args):
+def StartInstance(instance):
    """Start an instance.
  
    @type instance: L{objects.Instance}
@@ -874,7 +878,7 @@ def StartInstance(instance, extra_args):
    try:
      block_devices = _GatherAndLinkBlockDevs(instance)
      hyper = hypervisor.GetHypervisor(instance.hypervisor)
-    hyper.StartInstance(instance, block_devices, extra_args)
+    hyper.StartInstance(instance, block_devices)
    except errors.BlockDeviceError, err:
      logging.exception("Failed to start instance")
      return (False, "Block device error: %s" % str(err))
@@ -886,7 +890,7 @@ def StartInstance(instance, extra_args):
    return (True, "Instance started successfully")
  
  
-def ShutdownInstance(instance):
+def InstanceShutdown(instance):
    """Shut an instance down.
  
    @note: this function uses polling with a hardcoded timeout.
@@ -901,14 +905,15 @@ def ShutdownInstance(instance):
    running_instances = GetInstanceList([hv_name])
  
    if instance.name not in running_instances:
-    return True
+    return (True, "Instance already stopped")
  
    hyper = hypervisor.GetHypervisor(hv_name)
    try:
      hyper.StopInstance(instance)
    except errors.HypervisorError, err:
-    logging.error("Failed to stop instance: %s" % err)
-    return False
+    msg = "Failed to stop instance %s: %s" % (instance.name, err)
+    logging.error(msg)
+    return (False, msg)
  
    # test every 10secs for 2min
  
@@ -925,21 +930,23 @@ def ShutdownInstance(instance):
      try:
        hyper.StopInstance(instance, force=True)
      except errors.HypervisorError, err:
-      logging.exception("Failed to stop instance: %s" % err)
-      return False
+      msg = "Failed to force stop instance %s: %s" % (instance.name, err)
+      logging.error(msg)
+      return (False, msg)
  
      time.sleep(1)
      if instance.name in GetInstanceList([hv_name]):
-      logging.error("Could not shutdown instance '%s' even by destroy",
-                    instance.name)
-      return False
+      msg = ("Could not shutdown instance %s even by destroy" %
+             instance.name)
+      logging.error(msg)
+      return (False, msg)
  
    _RemoveBlockDevLinks(instance.name, instance.disks)
  
-  return True
+  return (True, "Instance has been shutdown successfully")
  
  
-def RebootInstance(instance, reboot_type, extra_args):
+def InstanceReboot(instance, reboot_type):
    """Reboot an instance.
  
    @type instance: L{objects.Instance}
@@ -951,9 +958,10 @@ def RebootInstance(instance, reboot_type, extra_args):
          instance OS, do not recreate the VM
        - L{constants.INSTANCE_REBOOT_HARD}: tear down and
          restart the VM (at the hypervisor level)
-      - the other reboot type (L{constants.INSTANCE_REBOOT_HARD})
-        is not accepted here, since that mode is handled
-        differently
+      - the other reboot type (L{constants.INSTANCE_REBOOT_FULL}) is
+        not accepted here, since that mode is handled differently, in
+        cmdlib, and translates into full stop and start of the
+        instance (instead of a call_instance_reboot RPC)
    @rtype: boolean
    @return: the success of the operation
  
@@ -961,27 +969,32 @@ def RebootInstance(instance, reboot_type, extra_args):
    running_instances = GetInstanceList([instance.hypervisor])
  
    if instance.name not in running_instances:
-    logging.error("Cannot reboot instance that is not running")
-    return False
+    msg = "Cannot reboot instance %s that is not running" % instance.name
+    logging.error(msg)
+    return (False, msg)
  
    hyper = hypervisor.GetHypervisor(instance.hypervisor)
    if reboot_type == constants.INSTANCE_REBOOT_SOFT:
      try:
        hyper.RebootInstance(instance)
      except errors.HypervisorError, err:
-      logging.exception("Failed to soft reboot instance")
-      return False
+      msg = "Failed to soft reboot instance %s: %s" % (instance.name, err)
+      logging.error(msg)
+      return (False, msg)
    elif reboot_type == constants.INSTANCE_REBOOT_HARD:
      try:
-      ShutdownInstance(instance)
-      StartInstance(instance, extra_args)
+      stop_result = InstanceShutdown(instance)
+      if not stop_result[0]:
+        return stop_result
+      return StartInstance(instance)
      except errors.HypervisorError, err:
-      logging.exception("Failed to hard reboot instance")
-      return False
+      msg = "Failed to hard reboot instance %s: %s" % (instance.name, err)
+      logging.error(msg)
+      return (False, msg)
    else:
-    raise errors.ParameterError("reboot_type invalid")
+    return (False, "Invalid reboot_type received: %s" % (reboot_type,))
  
-  return True
+  return (True, "Reboot successful")
  
  
  def MigrationInfo(instance):
@@ -1112,7 +1125,7 @@ def BlockdevCreate(disk, size, owner, on_primary, info):
        clist.append(crdev)
  
    try:
-    device = bdev.Create(disk.dev_type, disk.physical_id, clist, size)
+    device = bdev.Create(disk.dev_type, disk.physical_id, clist, disk.size)
    except errors.BlockDeviceError, err:
      return False, "Can't create block device: %s" % str(err)
  
@@ -1222,7 +1235,7 @@ def _RecursiveAssembleBD(disk, owner, as_primary):
        children.append(cdev)
  
    if as_primary or disk.AssembleOnSecondary():
-    r_dev = bdev.Assemble(disk.dev_type, disk.physical_id, children)
+    r_dev = bdev.Assemble(disk.dev_type, disk.physical_id, children, disk.size)
      r_dev.SetSyncSpeed(constants.SYNC_SPEED)
      result = r_dev
      if as_primary or disk.OpenOnSecondary():
@@ -1392,7 +1405,7 @@ def _RecursiveFindBD(disk):
      for chdisk in disk.children:
        children.append(_RecursiveFindBD(chdisk))
  
-  return bdev.FindDevice(disk.dev_type, disk.physical_id, children)
+  return bdev.FindDevice(disk.dev_type, disk.physical_id, children, disk.size)
  
  
  def BlockdevFind(disk):
@@ -1660,7 +1673,6 @@ def OSEnvironment(instance, debug=0):
                                      str(disk))
      real_disk.Open()
      result['DISK_%d_PATH' % idx] = real_disk.dev_path
-    # FIXME: When disks will have read-only mode, populate this
      result['DISK_%d_ACCESS' % idx] = disk.mode
      if constants.HV_DISK_TYPE in instance.hvparams:
        result['DISK_%d_FRONTEND_TYPE' % idx] = \
@@ -1679,6 +1691,10 @@ def OSEnvironment(instance, debug=0):
        result['NIC_%d_FRONTEND_TYPE' % idx] = \
          instance.hvparams[constants.HV_NIC_TYPE]
  
+  for source, kind in [(instance.beparams, "BE"), (instance.hvparams, "HV")]:
+    for key, value in source.items():
+      result["INSTANCE_%s_%s" % (kind, key)] = str(value)
+
    return result
  
  def BlockdevGrow(disk, amount):
@@ -2292,7 +2308,8 @@ def DemoteFromMC():
    if utils.IsProcessAlive(utils.ReadPidFile(pid_file)):
      return (False, "The master daemon is running, will not demote")
    try:
-    utils.CreateBackup(constants.CLUSTER_CONF_FILE)
+    if os.path.isfile(constants.CLUSTER_CONF_FILE):
+      utils.CreateBackup(constants.CLUSTER_CONF_FILE)
    except EnvironmentError, err:
      if err.errno != errno.ENOENT:
        return (False, "Error while backing up cluster file: %s" % str(err))
@@ -2377,7 +2394,7 @@ def DrbdAttachNet(nodes_ip, disks, instance_name, multimaster):
          # standalone, even though this should not happen with the
          # new staged way of changing disk configs
          try:
-          rd.ReAttachNet(multimaster)
+          rd.AttachNet(multimaster)
          except errors.BlockDeviceError, err:
            return (False, "Can't change network configuration: %s" % str(err))
      if all_connected: