node_current)
for node, n_img in node_image.items():
- if (not node == node_current):
+ if node != node_current:
test = instance in n_img.instances
_ErrorIf(test, self.EINSTANCEWRONGNODE, instance,
"instance should not run on node %s", node)
for idx, (success, status) in enumerate(disks)]
for nname, success, bdev_status, idx in diskdata:
- _ErrorIf(instanceconfig.admin_up and not success,
+ # the 'ghost node' construction in Exec() ensures that we have a
+ # node here
+ snode = node_image[nname]
+ bad_snode = snode.ghost or snode.offline
+ _ErrorIf(instanceconfig.admin_up and not success and not bad_snode,
self.EINSTANCEFAULTYDISK, instance,
"couldn't retrieve status for disk/%s on %s: %s",
idx, nname, bdev_status)
# WARNING: we currently take into account down instances as well
# as up ones, considering that even if they're down, someone
# might want to start them in the event of a node failure.
+ if n_img.offline:
+ # we're skipping offline nodes from the N+1 warning, since
+ # most likely we don't have good memory information from them;
+ # we already list instances living on such nodes, and that's
+ # enough warning
+ continue
for prinode, instances in n_img.sbp.items():
needed_mem = 0
for instance in instances:
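For reference, the N+1 warning discussed in the comment above boils down to summing the memory of the instances that would fail over onto a node and comparing it with that node's free memory. A minimal standalone sketch of the idea (all names and numbers below are made up for illustration; this is not the code of this patch):

def n_plus_one_ok(free_mem, secondary_map, instance_mem):
  # secondary_map: primary node -> instances this node is secondary for
  for prinode, instances in secondary_map.items():
    needed = sum(instance_mem[inst] for inst in instances)
    if free_mem < needed:
      return (False, prinode)
  return (True, None)

# 4096 MB free vs 2048 + 3072 MB needed on failover -> not N+1 compliant
print(n_plus_one_ok(4096, {"node1": ["inst1", "inst2"]},
                    {"inst1": 2048, "inst2": 3072}))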
self.ENODERPC, pnode, "instance %s, connection to"
" primary node failed", instance)
- if pnode_img.offline:
- inst_nodes_offline.append(pnode)
+ _ErrorIf(pnode_img.offline, self.EINSTANCEBADNODE, instance,
+ "instance lives on offline node %s", inst_config.primary_node)
# If the instance is non-redundant we cannot survive losing its primary
# node, so we are not N+1 compliant. On the other hand we have no disk
# warn that the instance lives on offline nodes
_ErrorIf(inst_nodes_offline, self.EINSTANCEBADNODE, instance,
- "instance lives on offline node(s) %s",
+ "instance has offline secondary node(s) %s",
utils.CommaJoin(inst_nodes_offline))
# ... or ghost/non-vm_capable nodes
for node in inst_config.all_nodes:
utils.ForceDictType(self.op.ndparams, constants.NDS_PARAMETER_TYPES)
self.new_ndparams = cluster.SimpleFillND(self.op.ndparams)
+ # TODO: we need a more general way to handle resetting
+ # cluster-level parameters to default values
+ if self.new_ndparams["oob_program"] == "":
+ self.new_ndparams["oob_program"] = \
+ constants.NDC_DEFAULTS[constants.ND_OOB_PROGRAM]
+
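The TODO above asks for a more general reset mechanism. One possible shape, sketched purely for illustration (the helper name _ResetEmptyParams and the convention of treating an empty string as "reset to default" are assumptions, not part of this patch):

# Illustrative sketch: fall back to the default for any parameter
# submitted as the empty string, instead of special-casing single keys.
def _ResetEmptyParams(params, defaults):
  return dict((key, defaults.get(key, value) if value == "" else value)
              for key, value in params.items())

# hypothetical defaults dict, standing in for constants.NDC_DEFAULTS
defaults = {"oob_program": "/usr/lib/ganeti/oob"}
print(_ResetEmptyParams({"oob_program": ""}, defaults))
# -> {'oob_program': '/usr/lib/ganeti/oob'}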
if self.op.nicparams:
utils.ForceDictType(self.op.nicparams, constants.NICS_PARAMETER_TYPES)
self.new_nicparams = cluster.SimpleFillNIC(self.op.nicparams)
# Gather data as requested
if query.NQ_LIVE in self.requested_data:
- node_data = lu.rpc.call_node_info(nodenames, lu.cfg.GetVGName(),
+ # filter out non-vm_capable nodes
+ toquery_nodes = [name for name in nodenames if all_info[name].vm_capable]
+
+ node_data = lu.rpc.call_node_info(toquery_nodes, lu.cfg.GetVGName(),
lu.cfg.GetHypervisorType())
live_data = dict((name, nresult.payload)
for (name, nresult) in node_data.items()
bad_nodes.append(name)
elif result.payload:
for inst in result.payload:
- if all_info[inst].primary_node == name:
- live_data.update(result.payload)
+ if inst in all_info:
+ if all_info[inst].primary_node == name:
+ live_data.update(result.payload)
+ else:
+ wrongnode_inst.add(inst)
else:
- wrongnode_inst.add(inst)
+ # orphan instance; we don't list it here as we don't
+ # handle this case yet in the output of instance listing
+ logging.warning("Orphan instance '%s' found on node %s",
+ inst, name)
# else no instance is alive
else:
live_data = {}
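The branch structure above sorts what a node reports into three buckets. A self-contained sketch of the same classification, with made-up data (none of these names come from the patch):

# live: configured with this node as primary; wrongnode: configured elsewhere;
# orphan: reported by the node but not present in the configuration at all.
def classify(node, reported, configured_primary):
  live, wrongnode, orphan = set(), set(), set()
  for inst in reported:
    if inst not in configured_primary:
      orphan.add(inst)
    elif configured_primary[inst] == node:
      live.add(inst)
    else:
      wrongnode.add(inst)
  return live, wrongnode, orphan

print(classify("node1", ["i1", "i2", "i3"], {"i1": "node1", "i2": "node2"}))
# -> ({'i1'}, {'i2'}, {'i3'})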
"""
node = instance.primary_node
+
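+ # resolve the disks' node-specific (physical) IDs before passing them over RPC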
+ for device in instance.disks:
+ lu.cfg.SetDiskID(device, node)
+
logging.info("Pause sync of instance %s disks", instance.name)
result = lu.rpc.call_blockdev_pause_resume_sync(node, instance.disks, True)
try:
for idx, device in enumerate(instance.disks):
lu.LogInfo("* Wiping disk %d", idx)
- logging.info("Wiping disk %d for instance %s", idx, instance.name)
+ logging.info("Wiping disk %d for instance %s, node %s",
+ idx, instance.name, node)
# The wipe size is MIN_WIPE_CHUNK_PERCENT % of the instance disk but
# MAX_WIPE_CHUNK at max
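Stated as a tiny computation, the sizing rule from the comment above is a percentage capped at a maximum; the constant values here are illustrative only and not taken from this patch:

MIN_WIPE_CHUNK_PERCENT = 10   # illustrative value
MAX_WIPE_CHUNK = 1024         # illustrative value, MiB

def wipe_chunk_size(disk_size):
  # MIN_WIPE_CHUNK_PERCENT % of the disk, but never more than MAX_WIPE_CHUNK
  return min(MAX_WIPE_CHUNK, disk_size * MIN_WIPE_CHUNK_PERCENT / 100.0)

print(wipe_chunk_size(2048))    # 204.8 -> the percentage dominates
print(wipe_chunk_size(204800))  # 1024  -> the cap dominates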
return req_size_dict[disk_template]
+def _FilterVmNodes(lu, nodenames):
+ """Filters out non-vm_capable nodes from a list.
+
+ @type lu: L{LogicalUnit}
+ @param lu: the logical unit for which we check
+ @type nodenames: list
+ @param nodenames: the list of nodes on which we should check
+ @rtype: list
+ @return: the list of vm-capable nodes
+
+ """
+ non_vm_nodes = frozenset(lu.cfg.GetNonVmCapableNodeList())
+ return [name for name in nodenames if name not in non_vm_nodes]
+
+
def _CheckHVParams(lu, nodenames, hvname, hvparams):
"""Hypervisor parameter validation.
@raise errors.OpPrereqError: if the parameters are not valid
"""
+ nodenames = _FilterVmNodes(lu, nodenames)
hvinfo = lu.rpc.call_hypervisor_validate_params(nodenames,
hvname,
hvparams)
@raise errors.OpPrereqError: if the parameters are not valid
"""
+ nodenames = _FilterVmNodes(lu, nodenames)
result = lu.rpc.call_os_validate(required, nodenames, osname,
[constants.OS_VALIDATE_PARAMETERS],
osparams)