Convert os_diagnose rpc to new style result

[ganeti-local] / lib / cmdlib.py
diff --git a/lib/cmdlib.py b/lib/cmdlib.py

index e4e7b71..ea36327 100644 (file)
--- a/lib/cmdlib.py
+++ b/lib/cmdlib.py
@@ -610,11 +610,10 @@ def _CheckNicsBridgesExist(lu, target_nics, target_node,
              if params[constants.NIC_MODE] == constants.NIC_MODE_BRIDGED]
    if brlist:
      result = lu.rpc.call_bridges_exist(target_node, brlist)
-    result.Raise()
-    if not result.data:
-      raise errors.OpPrereqError("One or more target bridges %s does not"
-                                 " exist on destination node '%s'" %
-                                 (brlist, target_node))
+    msg = result.RemoteFailMsg()
+    if msg:
+      raise errors.OpPrereqError("Error checking bridges on destination node"
+                                 " '%s': %s" % (target_node, msg))
  
  
  def _CheckInstanceBridgesExist(lu, instance, node=None):
@@ -657,9 +656,9 @@ class LUDestroyCluster(NoHooksLU):
      """
      master = self.cfg.GetMasterNode()
      result = self.rpc.call_node_stop_master(master, False)
-    result.Raise()
-    if not result.data:
-      raise errors.OpExecError("Could not disable the master role")
+    msg = result.RemoteFailMsg()
+    if msg:
+      raise errors.OpExecError("Could not disable the master role: %s" % msg)
      priv_key, pub_key, _ = ssh.GetUserFiles(constants.GANETI_RUNAS)
      utils.CreateBackup(priv_key)
      utils.CreateBackup(pub_key)
@@ -1023,7 +1022,6 @@ class LUVerifyCluster(LogicalUnit):
  
      for node_i in nodeinfo:
        node = node_i.name
-      nresult = all_nvinfo[node].data
  
        if node_i.offline:
          feedback_fn("* Skipping offline node %s" % (node,))
@@ -1041,11 +1039,13 @@ class LUVerifyCluster(LogicalUnit):
          ntype = "regular"
        feedback_fn("* Verifying node %s (%s)" % (node, ntype))
  
-      if all_nvinfo[node].failed or not isinstance(nresult, dict):
-        feedback_fn("  - ERROR: connection to %s failed" % (node,))
+      msg = all_nvinfo[node].RemoteFailMsg()
+      if msg:
+        feedback_fn("  - ERROR: while contacting node %s: %s" % (node, msg))
          bad = True
          continue
  
+      nresult = all_nvinfo[node].payload
        node_drbd = {}
        for minor, instance in all_drbd_map[node].items():
          if instance not in instanceinfo:
@@ -1289,8 +1289,13 @@ class LUVerifyDisks(NoHooksLU):
    def Exec(self, feedback_fn):
      """Verify integrity of cluster disks.
  
+    @rtype: tuple of three items
+    @return: a tuple of (dict of node-to-node_error, list of instances
+        which need activate-disks, dict of instance: (node, volume) for
+        missing volumes
+
      """
-    result = res_nodes, res_nlvm, res_instances, res_missing = [], {}, [], {}
+    result = res_nodes, res_instances, res_missing = {}, [], {}
  
      vg_name = self.cfg.GetVGName()
      nodes = utils.NiceSort(self.cfg.GetNodeList())
@@ -1317,24 +1322,17 @@ class LUVerifyDisks(NoHooksLU):
      to_act = set()
      for node in nodes:
        # node_volume
-      lvs = node_lvs[node]
-      if lvs.failed:
-        if not lvs.offline:
-          self.LogWarning("Connection to node %s failed: %s" %
-                          (node, lvs.data))
-        continue
-      lvs = lvs.data
-      if isinstance(lvs, basestring):
-        logging.warning("Error enumerating LVs on node %s: %s", node, lvs)
-        res_nlvm[node] = lvs
+      node_res = node_lvs[node]
+      if node_res.offline:
          continue
-      elif not isinstance(lvs, dict):
-        logging.warning("Connection to node %s failed or invalid data"
-                        " returned", node)
-        res_nodes.append(node)
+      msg = node_res.RemoteFailMsg()
+      if msg:
+        logging.warning("Error enumerating LVs on node %s: %s", node, msg)
+        res_nodes[node] = msg
          continue
  
-      for lv_name, (_, lv_inactive, lv_online) in lvs.iteritems():
+      lvs = node_res.payload
+      for lv_name, (_, lv_inactive, lv_online) in lvs.items():
          inst = nv_dict.pop((node, lv_name), None)
          if (not lv_online and inst is not None
              and inst.name not in res_instances):
@@ -1400,8 +1398,9 @@ class LURenameCluster(LogicalUnit):
      # shutdown the master IP
      master = self.cfg.GetMasterNode()
      result = self.rpc.call_node_stop_master(master, False)
-    if result.failed or not result.data:
-      raise errors.OpExecError("Could not disable the master role")
+    msg = result.RemoteFailMsg()
+    if msg:
+      raise errors.OpExecError("Could not disable the master role: %s" % msg)
  
      try:
        cluster = self.cfg.GetClusterInfo()
@@ -1427,9 +1426,10 @@ class LURenameCluster(LogicalUnit):
  
      finally:
        result = self.rpc.call_node_start_master(master, False)
-      if result.failed or not result.data:
+      msg = result.RemoteFailMsg()
+      if msg:
          self.LogWarning("Could not re-enable the master role on"
-                        " the master, please restart manually.")
+                        " the master, please restart manually: %s", msg)
  
  
  def _RecursiveCheckIfLVMBased(disk):
@@ -1512,11 +1512,13 @@ class LUSetClusterParams(LogicalUnit):
      if self.op.vg_name:
        vglist = self.rpc.call_vg_list(node_list)
        for node in node_list:
-        if vglist[node].failed:
+        msg = vglist[node].RemoteFailMsg()
+        if msg:
            # ignoring down node
-          self.LogWarning("Node %s unreachable/error, ignoring" % node)
+          self.LogWarning("Error while gathering data on node %s"
+                          " (ignoring node): %s", node, msg)
            continue
-        vgstatus = utils.CheckVolumeGroupSize(vglist[node].data,
+        vgstatus = utils.CheckVolumeGroupSize(vglist[node].payload,
                                                self.op.vg_name,
                                                constants.MIN_VG_SIZE)
          if vgstatus:
@@ -1809,11 +1811,12 @@ class LUDiagnoseOS(NoHooksLU):
      # level), so that nodes with a non-responding node daemon don't
      # make all OSes invalid
      good_nodes = [node_name for node_name in rlist
-                  if not rlist[node_name].failed]
-    for node_name, nr in rlist.iteritems():
-      if nr.failed or not nr.data:
+                  if not rlist[node_name].RemoteFailMsg()]
+    for node_name, nr in rlist.items():
+      if nr.RemoteFailMsg() or not nr.payload:
          continue
-      for os_obj in nr.data:
+      for os_serialized in nr.payload:
+        os_obj = objects.OS.FromDict(os_serialized)
          if os_obj.name not in all_os:
            # build a list of nodes for this os containing empty lists
            # for each node in node_list
@@ -1829,11 +1832,9 @@ class LUDiagnoseOS(NoHooksLU):
      """
      valid_nodes = [node for node in self.cfg.GetOnlineNodeList()]
      node_data = self.rpc.call_os_diagnose(valid_nodes)
-    if node_data == False:
-      raise errors.OpExecError("Can't gather the list of OSes")
      pol = self._DiagnoseByOS(valid_nodes, node_data)
      output = []
-    for os_name, os_data in pol.iteritems():
+    for os_name, os_data in pol.items():
        row = []
        for field in self.op.output_fields:
          if field == "name":
@@ -1915,7 +1916,11 @@ class LURemoveNode(LogicalUnit):
  
      self.context.RemoveNode(node.name)
  
-    self.rpc.call_node_leave_cluster(node.name)
+    result = self.rpc.call_node_leave_cluster(node.name)
+    msg = result.RemoteFailMsg()
+    if msg:
+      self.LogWarning("Errors encountered on the remote node while leaving"
+                      " the cluster: %s", msg)
  
      # Promote nodes to master candidate as needed
      _AdjustCandidatePool(self)
@@ -2000,8 +2005,8 @@ class LUQueryNodes(NoHooksLU):
                                            self.cfg.GetHypervisorType())
        for name in nodenames:
          nodeinfo = node_data[name]
-        if not nodeinfo.failed and nodeinfo.data:
-          nodeinfo = nodeinfo.data
+        if not nodeinfo.RemoteFailMsg() and nodeinfo.payload:
+          nodeinfo = nodeinfo.payload
            fn = utils.TryConvert
            live_data[name] = {
              "mtotal": fn(int, nodeinfo.get('memory_total', None)),
@@ -2123,10 +2128,15 @@ class LUQueryNodeVolumes(NoHooksLU):
  
      output = []
      for node in nodenames:
-      if node not in volumes or volumes[node].failed or not volumes[node].data:
+      nresult = volumes[node]
+      if nresult.offline:
+        continue
+      msg = nresult.RemoteFailMsg()
+      if msg:
+        self.LogWarning("Can't compute volume data on node %s: %s", node, msg)
          continue
  
-      node_vols = volumes[node].data[:]
+      node_vols = nresult.payload[:]
        node_vols.sort(key=lambda vol: vol['dev'])
  
        for vol in node_vols:
@@ -2276,17 +2286,17 @@ class LUAddNode(LogicalUnit):
  
      # check connectivity
      result = self.rpc.call_version([node])[node]
-    result.Raise()
-    if result.data:
-      if constants.PROTOCOL_VERSION == result.data:
-        logging.info("Communication to node %s fine, sw version %s match",
-                     node, result.data)
-      else:
-        raise errors.OpExecError("Version mismatch master version %s,"
-                                 " node version %s" %
-                                 (constants.PROTOCOL_VERSION, result.data))
+    msg = result.RemoteFailMsg()
+    if msg:
+      raise errors.OpExecError("Can't get version information from"
+                               " node %s: %s" % (node, msg))
+    if constants.PROTOCOL_VERSION == result.payload:
+      logging.info("Communication to node %s fine, sw version %s match",
+                   node, result.payload)
      else:
-      raise errors.OpExecError("Cannot get version from the new node")
+      raise errors.OpExecError("Version mismatch master version %s,"
+                               " node version %s" %
+                               (constants.PROTOCOL_VERSION, result.payload))
  
      # setup ssh on node
      logging.info("Copy ssh key to node %s", node)
@@ -2319,7 +2329,11 @@ class LUAddNode(LogicalUnit):
      if new_node.secondary_ip != new_node.primary_ip:
        result = self.rpc.call_node_has_ip_address(new_node.name,
                                                   new_node.secondary_ip)
-      if result.failed or not result.data:
+      msg = result.RemoteFailMsg()
+      if msg:
+        raise errors.OpPrereqError("Failure checking secondary ip"
+                                   " on node %s: %s" % (new_node.name, msg))
+      if not result.payload:
          raise errors.OpExecError("Node claims it doesn't have the secondary ip"
                                   " you gave (%s). Please fix and re-run this"
                                   " command." % new_node.secondary_ip)
@@ -2333,13 +2347,15 @@ class LUAddNode(LogicalUnit):
      result = self.rpc.call_node_verify(node_verify_list, node_verify_param,
                                         self.cfg.GetClusterName())
      for verifier in node_verify_list:
-      if result[verifier].failed or not result[verifier].data:
-        raise errors.OpExecError("Cannot communicate with %s's node daemon"
-                                 " for remote verification" % verifier)
-      if result[verifier].data['nodelist']:
-        for failed in result[verifier].data['nodelist']:
+      msg = result[verifier].RemoteFailMsg()
+      if msg:
+        raise errors.OpExecError("Cannot communicate with node %s: %s" %
+                                 (verifier, msg))
+      nl_payload = result[verifier].payload['nodelist']
+      if nl_payload:
+        for failed in nl_payload:
            feedback_fn("ssh/hostname verification failed %s -> %s" %
-                      (verifier, result[verifier].data['nodelist'][failed]))
+                      (verifier, nl_payload[failed]))
          raise errors.OpExecError("ssh/hostname verification failed.")
  
      if self.op.readd:
@@ -2770,14 +2786,14 @@ def _SafeShutdownInstanceDisks(lu, instance):
    _ShutdownInstanceDisks.
  
    """
-  ins_l = lu.rpc.call_instance_list([instance.primary_node],
-                                      [instance.hypervisor])
-  ins_l = ins_l[instance.primary_node]
-  if ins_l.failed or not isinstance(ins_l.data, list):
-    raise errors.OpExecError("Can't contact node '%s'" %
-                             instance.primary_node)
-
-  if instance.name in ins_l.data:
+  pnode = instance.primary_node
+  ins_l = lu.rpc.call_instance_list([pnode], [instance.hypervisor])
+  ins_l = ins_l[pnode]
+  msg = ins_l.RemoteFailMsg()
+  if msg:
+    raise errors.OpExecError("Can't contact node %s: %s" % (pnode, msg))
+
+  if instance.name in ins_l.payload:
      raise errors.OpExecError("Instance is running, can't shutdown"
                               " block devices.")
  
@@ -2830,15 +2846,17 @@ def _CheckNodeFreeMemory(lu, node, reason, requested, hypervisor_name):
  
    """
    nodeinfo = lu.rpc.call_node_info([node], lu.cfg.GetVGName(), hypervisor_name)
-  nodeinfo[node].Raise()
-  free_mem = nodeinfo[node].data.get('memory_free')
+  msg = nodeinfo[node].RemoteFailMsg()
+  if msg:
+    raise errors.OpPrereqError("Can't get data from node %s: %s" % (node, msg))
+  free_mem = nodeinfo[node].payload.get('memory_free', None)
    if not isinstance(free_mem, int):
      raise errors.OpPrereqError("Can't compute free memory on node %s, result"
-                             " was '%s'" % (node, free_mem))
+                               " was '%s'" % (node, free_mem))
    if requested > free_mem:
      raise errors.OpPrereqError("Not enough memory on node %s for %s:"
-                             " needed %s MiB, available %s MiB" %
-                             (node, reason, requested, free_mem))
+                               " needed %s MiB, available %s MiB" %
+                               (node, reason, requested, free_mem))
  
  
  class LUStartupInstance(LogicalUnit):
@@ -2913,8 +2931,11 @@ class LUStartupInstance(LogicalUnit):
      remote_info = self.rpc.call_instance_info(instance.primary_node,
                                                instance.name,
                                                instance.hypervisor)
-    remote_info.Raise()
-    if not remote_info.data:
+    msg = remote_info.RemoteFailMsg()
+    if msg:
+      raise errors.OpPrereqError("Error checking node %s: %s" %
+                                 (instance.primary_node, msg))
+    if not remote_info.payload: # not running already
        _CheckNodeFreeMemory(self, instance.primary_node,
                             "starting instance %s" % instance.name,
                             bep[constants.BE_MEMORY], instance.hypervisor)
@@ -3115,8 +3136,11 @@ class LUReinstallInstance(LogicalUnit):
      remote_info = self.rpc.call_instance_info(instance.primary_node,
                                                instance.name,
                                                instance.hypervisor)
-    remote_info.Raise()
-    if remote_info.data:
+    msg = remote_info.RemoteFailMsg()
+    if msg:
+      raise errors.OpPrereqError("Error checking node %s: %s" %
+                                 (instance.primary_node, msg))
+    if remote_info.payload:
        raise errors.OpPrereqError("Instance '%s' is running on the node %s" %
                                   (self.op.instance_name,
                                    instance.primary_node))
@@ -3199,8 +3223,11 @@ class LURenameInstance(LogicalUnit):
      remote_info = self.rpc.call_instance_info(instance.primary_node,
                                                instance.name,
                                                instance.hypervisor)
-    remote_info.Raise()
-    if remote_info.data:
+    msg = remote_info.RemoteFailMsg()
+    if msg:
+      raise errors.OpPrereqError("Error checking node %s: %s" %
+                                 (instance.primary_node, msg))
+    if remote_info.payload:
        raise errors.OpPrereqError("Instance '%s' is running on the node %s" %
                                   (self.op.instance_name,
                                    instance.primary_node))
@@ -3438,12 +3465,12 @@ class LUQueryInstances(NoHooksLU):
          if result.offline:
            # offline nodes will be in both lists
            off_nodes.append(name)
-        if result.failed:
+        if result.failed or result.RemoteFailMsg():
            bad_nodes.append(name)
          else:
-          if result.data:
-            live_data.update(result.data)
-            # else no instance is alive
+          if result.payload:
+            live_data.update(result.payload)
+          # else no instance is alive
      else:
        live_data = dict([(name, {}) for name in instance_names])
  
@@ -3882,12 +3909,12 @@ class LUMigrateInstance(LogicalUnit):
                       " a bad state)")
      ins_l = self.rpc.call_instance_list(self.all_nodes, [instance.hypervisor])
      for node, result in ins_l.items():
-      result.Raise()
-      if not isinstance(result.data, list):
-        raise errors.OpExecError("Can't contact node '%s'" % node)
+      msg = result.RemoteFailMsg()
+      if msg:
+        raise errors.OpExecError("Can't contact node %s: %s" % (node, msg))
  
-    runningon_source = instance.name in ins_l[source_node].data
-    runningon_target = instance.name in ins_l[target_node].data
+    runningon_source = instance.name in ins_l[source_node].payload
+    runningon_target = instance.name in ins_l[target_node].payload
  
      if runningon_source and runningon_target:
        raise errors.OpExecError("Instance seems to be running on two nodes,"
@@ -4672,11 +4699,13 @@ class LUCreateInstance(LogicalUnit):
        src_path = self.op.src_path
  
        if src_node is None:
-        exp_list = self.rpc.call_export_list(
-          self.acquired_locks[locking.LEVEL_NODE])
+        locked_nodes = self.acquired_locks[locking.LEVEL_NODE]
+        exp_list = self.rpc.call_export_list(locked_nodes)
          found = False
          for node in exp_list:
-          if not exp_list[node].failed and src_path in exp_list[node].data:
+          if exp_list[node].RemoteFailMsg():
+            continue
+          if src_path in exp_list[node].payload:
              found = True
              self.op.src_node = src_node = node
              self.op.src_path = src_path = os.path.join(constants.EXPORT_DIR,
@@ -4688,11 +4717,12 @@ class LUCreateInstance(LogicalUnit):
  
        _CheckNodeOnline(self, src_node)
        result = self.rpc.call_export_info(src_node, src_path)
-      result.Raise()
-      if not result.data:
-        raise errors.OpPrereqError("No export found in dir %s" % src_path)
+      msg = result.RemoteFailMsg()
+      if msg:
+        raise errors.OpPrereqError("No export or invalid export found in"
+                                   " dir %s: %s" % (src_path, msg))
  
-      export_info = result.data
+      export_info = objects.SerializableConfigParser.Loads(str(result.payload))
        if not export_info.has_section(constants.INISECT_EXP):
          raise errors.ProgrammerError("Corrupted export config")
  
@@ -4798,19 +4828,19 @@ class LUCreateInstance(LogicalUnit):
                                           self.op.hypervisor)
        for node in nodenames:
          info = nodeinfo[node]
-        info.Raise()
-        info = info.data
-        if not info:
+        msg = info.RemoteFailMsg()
+        if msg:
            raise errors.OpPrereqError("Cannot get current information"
-                                     " from node '%s'" % node)
+                                     " from node %s: %s" % (node, msg))
+        info = info.payload
          vg_free = info.get('vg_free', None)
          if not isinstance(vg_free, int):
            raise errors.OpPrereqError("Can't compute free disk space on"
                                       " node %s" % node)
-        if req_size > info['vg_free']:
+        if req_size > vg_free:
            raise errors.OpPrereqError("Not enough disk space on target node %s."
                                       " %d MB available, %d MB required" %
-                                     (node, info['vg_free'], req_size))
+                                     (node, vg_free, req_size))
  
      _CheckHVParams(self, nodenames, self.op.hypervisor, self.op.hvparams)
  
@@ -4945,12 +4975,10 @@ class LUCreateInstance(LogicalUnit):
          import_result = self.rpc.call_instance_os_import(pnode_name, iobj,
                                                           src_node, src_images,
                                                           cluster_name)
-        import_result.Raise()
-        for idx, result in enumerate(import_result.data):
-          if not result:
-            self.LogWarning("Could not import the image %s for instance"
-                            " %s, disk %d, on node %s" %
-                            (src_images[idx], instance, idx, pnode_name))
+        msg = import_result.RemoteFailMsg()
+        if msg:
+          self.LogWarning("Error while importing the disk images for instance"
+                          " %s on node %s: %s" % (instance, pnode_name, msg))
        else:
          # also checked in the prereq part
          raise errors.ProgrammerError("Unknown OS initialization mode '%s'"
@@ -5001,9 +5029,12 @@ class LUConnectConsole(NoHooksLU):
  
      node_insts = self.rpc.call_instance_list([node],
                                               [instance.hypervisor])[node]
-    node_insts.Raise()
+    msg = node_insts.RemoteFailMsg()
+    if msg:
+      raise errors.OpExecError("Can't get node information from %s: %s" %
+                               (node, msg))
  
-    if instance.name not in node_insts.data:
+    if instance.name not in node_insts.payload:
        raise errors.OpExecError("Instance %s is not running." % instance.name)
  
      logging.debug("Connecting to console of %s on %s", instance.name, node)
@@ -5225,7 +5256,10 @@ class LUReplaceDisks(LogicalUnit):
        raise errors.OpExecError("Can't list volume groups on the nodes")
      for node in oth_node, tgt_node:
        res = results[node]
-      if res.failed or not res.data or my_vg not in res.data:
+      msg = res.RemoteFailMsg()
+      if msg:
+        raise errors.OpExecError("Error checking node %s: %s" % (node, msg))
+      if my_vg not in res.payload:
          raise errors.OpExecError("Volume group '%s' not found on %s" %
                                   (my_vg, node))
      for idx, dev in enumerate(instance.disks):
@@ -5421,7 +5455,10 @@ class LUReplaceDisks(LogicalUnit):
      results = self.rpc.call_vg_list([pri_node, new_node])
      for node in pri_node, new_node:
        res = results[node]
-      if res.failed or not res.data or my_vg not in res.data:
+      msg = res.RemoteFailMsg()
+      if msg:
+        raise errors.OpExecError("Error checking node %s: %s" % (node, msg))
+      if my_vg not in res.payload:
          raise errors.OpExecError("Volume group '%s' not found on %s" %
                                   (my_vg, node))
      for idx, dev in enumerate(instance.disks):
@@ -5651,10 +5688,11 @@ class LUGrowDisk(LogicalUnit):
                                         instance.hypervisor)
      for node in nodenames:
        info = nodeinfo[node]
-      if info.failed or not info.data:
+      msg = info.RemoteFailMsg()
+      if msg:
          raise errors.OpPrereqError("Cannot get current information"
-                                   " from node '%s'" % node)
-      vg_free = info.data.get('vg_free', None)
+                                   " from node %s:" % (node, msg))
+      vg_free = info.payload.get('vg_free', None)
        if not isinstance(vg_free, int):
          raise errors.OpPrereqError("Can't compute free disk space on"
                                     " node %s" % node)
@@ -5801,8 +5839,11 @@ class LUQueryInstanceData(NoHooksLU):
          remote_info = self.rpc.call_instance_info(instance.primary_node,
                                                    instance.name,
                                                    instance.hypervisor)
-        remote_info.Raise()
-        remote_info = remote_info.data
+        msg = remote_info.RemoteFailMsg()
+        if msg:
+          raise errors.OpExecError("Error checking node %s: %s" %
+                                   (instance.primary_node, msg))
+        remote_info = remote_info.payload
          if remote_info and "state" in remote_info:
            remote_state = "up"
          else:
@@ -6090,31 +6131,45 @@ class LUSetInstanceParams(LogicalUnit):
                                                    instance.hypervisor)
        nodeinfo = self.rpc.call_node_info(mem_check_list, self.cfg.GetVGName(),
                                           instance.hypervisor)
-      if nodeinfo[pnode].failed or not isinstance(nodeinfo[pnode].data, dict):
+      pninfo = nodeinfo[pnode]
+      msg = pninfo.RemoteFailMsg()
+      if msg:
          # Assume the primary node is unreachable and go ahead
-        self.warn.append("Can't get info from primary node %s" % pnode)
+        self.warn.append("Can't get info from primary node %s: %s" %
+                         (pnode,  msg))
+      elif not isinstance(pninfo.payload.get('memory_free', None), int):
+        self.warn.append("Node data from primary node %s doesn't contain"
+                         " free memory information" % pnode)
+      elif instance_info.RemoteFailMsg():
+        self.warn.append("Can't get instance runtime information: %s" %
+                        instance_info.RemoteFailMsg())
        else:
-        if not instance_info.failed and instance_info.data:
-          current_mem = int(instance_info.data['memory'])
+        if instance_info.payload:
+          current_mem = int(instance_info.payload['memory'])
          else:
            # Assume instance not running
            # (there is a slight race condition here, but it's not very probable,
            # and we have no other way to check)
            current_mem = 0
          miss_mem = (be_new[constants.BE_MEMORY] - current_mem -
-                    nodeinfo[pnode].data['memory_free'])
+                    pninfo.payload['memory_free'])
          if miss_mem > 0:
            raise errors.OpPrereqError("This change will prevent the instance"
                                       " from starting, due to %d MB of memory"
                                       " missing on its primary node" % miss_mem)
  
        if be_new[constants.BE_AUTO_BALANCE]:
-        for node, nres in nodeinfo.iteritems():
+        for node, nres in nodeinfo.items():
            if node not in instance.secondary_nodes:
              continue
-          if nres.failed or not isinstance(nres.data, dict):
-            self.warn.append("Can't get info from secondary node %s" % node)
-          elif be_new[constants.BE_MEMORY] > nres.data['memory_free']:
+          msg = nres.RemoteFailMsg()
+          if msg:
+            self.warn.append("Can't get info from secondary node %s: %s" %
+                             (node, msg))
+          elif not isinstance(nres.payload.get('memory_free', None), int):
+            self.warn.append("Secondary node %s didn't return free"
+                             " memory information" % node)
+          elif be_new[constants.BE_MEMORY] > nres.payload['memory_free']:
              self.warn.append("Not enough memory to failover instance to"
                               " secondary node %s" % node)
  
@@ -6157,10 +6212,9 @@ class LUSetInstanceParams(LogicalUnit):
        if new_nic_mode == constants.NIC_MODE_BRIDGED:
          nic_bridge = new_filled_nic_params[constants.NIC_LINK]
          result = self.rpc.call_bridges_exist(pnode, [nic_bridge])
-        result.Raise()
-        if not result.data:
-          msg = ("Bridge '%s' doesn't exist on one of"
-                 " the instance nodes" % nic_bridge)
+        msg = result.RemoteFailMsg()
+        if msg:
+          msg = "Error checking bridges on node %s: %s" % (pnode, msg)
            if self.force:
              self.warn.append(msg)
            else:
@@ -6197,9 +6251,11 @@ class LUSetInstanceParams(LogicalUnit):
                                       " an instance")
          ins_l = self.rpc.call_instance_list([pnode], [instance.hypervisor])
          ins_l = ins_l[pnode]
-        if ins_l.failed or not isinstance(ins_l.data, list):
-          raise errors.OpPrereqError("Can't contact node '%s'" % pnode)
-        if instance.name in ins_l.data:
+        msg = ins_l.RemoteFailMsg()
+        if msg:
+          raise errors.OpPrereqError("Can't contact node %s: %s" %
+                                     (pnode, msg))
+        if instance.name in ins_l.payload:
            raise errors.OpPrereqError("Instance is running, can't remove"
                                       " disks.")
  
@@ -6360,10 +6416,10 @@ class LUQueryExports(NoHooksLU):
      rpcresult = self.rpc.call_export_list(self.nodes)
      result = {}
      for node in rpcresult:
-      if rpcresult[node].failed:
+      if rpcresult[node].RemoteFailMsg():
          result[node] = False
        else:
-        result[node] = rpcresult[node].data
+        result[node] = rpcresult[node].payload
  
      return result
  
@@ -6491,19 +6547,21 @@ class LUExportInstance(LogicalUnit):
        if dev:
          result = self.rpc.call_snapshot_export(src_node, dev, dst_node.name,
                                                 instance, cluster_name, idx)
-        if result.failed or not result.data:
+        msg = result.RemoteFailMsg()
+        if msg:
            self.LogWarning("Could not export block device %s from node %s to"
-                          " node %s", dev.logical_id[1], src_node,
-                          dst_node.name)
+                          " node %s: %s", dev.logical_id[1], src_node,
+                          dst_node.name, msg)
          msg = self.rpc.call_blockdev_remove(src_node, dev).RemoteFailMsg()
          if msg:
            self.LogWarning("Could not remove snapshot block device %s from node"
                            " %s: %s", dev.logical_id[1], src_node, msg)
  
      result = self.rpc.call_finalize_export(dst_node.name, instance, snap_disks)
-    if result.failed or not result.data:
-      self.LogWarning("Could not finalize export for instance %s on node %s",
-                      instance.name, dst_node.name)
+    msg = result.RemoteFailMsg()
+    if msg:
+      self.LogWarning("Could not finalize export for instance %s"
+                      " on node %s: %s", instance.name, dst_node.name, msg)
  
      nodelist = self.cfg.GetNodeList()
      nodelist.remove(dst_node.name)
@@ -6511,15 +6569,17 @@ class LUExportInstance(LogicalUnit):
      # on one-node clusters nodelist will be empty after the removal
      # if we proceed the backup would be removed because OpQueryExports
      # substitutes an empty list with the full cluster node list.
+    iname = instance.name
      if nodelist:
        exportlist = self.rpc.call_export_list(nodelist)
        for node in exportlist:
-        if exportlist[node].failed:
+        if exportlist[node].RemoteFailMsg():
            continue
-        if instance.name in exportlist[node].data:
-          if not self.rpc.call_export_remove(node, instance.name):
+        if iname in exportlist[node].payload:
+          msg = self.rpc.call_export_remove(node, iname).RemoteFailMsg()
+          if msg:
              self.LogWarning("Could not remove older export for instance %s"
-                            " on node %s", instance.name, node)
+                            " on node %s: %s", iname, node, msg)
  
  
  class LURemoveExport(NoHooksLU):
@@ -6553,19 +6613,21 @@ class LURemoveExport(NoHooksLU):
        fqdn_warn = True
        instance_name = self.op.instance_name
  
-    exportlist = self.rpc.call_export_list(self.acquired_locks[
-      locking.LEVEL_NODE])
+    locked_nodes = self.acquired_locks[locking.LEVEL_NODE]
+    exportlist = self.rpc.call_export_list(locked_nodes)
      found = False
      for node in exportlist:
-      if exportlist[node].failed:
-        self.LogWarning("Failed to query node %s, continuing" % node)
+      msg = exportlist[node].RemoteFailMsg()
+      if msg:
+        self.LogWarning("Failed to query node %s (continuing): %s", node, msg)
          continue
-      if instance_name in exportlist[node].data:
+      if instance_name in exportlist[node].payload:
          found = True
          result = self.rpc.call_export_remove(node, instance_name)
-        if result.failed or not result.data:
+        msg = result.RemoteFailMsg()
+        if msg:
            logging.error("Could not remove export for instance %s"
-                        " on node %s", instance_name, node)
+                        " on node %s: %s", instance_name, node, msg)
  
      if fqdn_warn and not found:
        feedback_fn("Export not found. If trying to remove an export belonging"
@@ -6885,29 +6947,33 @@ class IAllocator(object):
          }
  
        if not ninfo.offline:
-        nresult.Raise()
-        if not isinstance(nresult.data, dict):
-          raise errors.OpExecError("Can't get data for node %s" % nname)
-        remote_info = nresult.data
+        msg = nresult.RemoteFailMsg()
+        if msg:
+          raise errors.OpExecError("Can't get data for node %s: %s" %
+                                   (nname, msg))
+        msg = node_iinfo[nname].RemoteFailMsg()
+        if msg:
+          raise errors.OpExecError("Can't get node instance info"
+                                   " from node %s: %s" % (nname, msg))
+        remote_info = nresult.payload
          for attr in ['memory_total', 'memory_free', 'memory_dom0',
                       'vg_size', 'vg_free', 'cpu_total']:
            if attr not in remote_info:
              raise errors.OpExecError("Node '%s' didn't return attribute"
                                       " '%s'" % (nname, attr))
-          try:
-            remote_info[attr] = int(remote_info[attr])
-          except ValueError, err:
+          if not isinstance(remote_info[attr], int):
              raise errors.OpExecError("Node '%s' returned invalid value"
-                                     " for '%s': %s" % (nname, attr, err))
+                                     " for '%s': %s" %
+                                     (nname, attr, remote_info[attr]))
          # compute memory used by primary instances
          i_p_mem = i_p_up_mem = 0
          for iinfo, beinfo in i_list:
            if iinfo.primary_node == nname:
              i_p_mem += beinfo[constants.BE_MEMORY]
-            if iinfo.name not in node_iinfo[nname].data:
+            if iinfo.name not in node_iinfo[nname].payload:
                i_used_mem = 0
              else:
-              i_used_mem = int(node_iinfo[nname].data[iinfo.name]['memory'])
+              i_used_mem = int(node_iinfo[nname].payload[iinfo.name]['memory'])
              i_mem_diff = beinfo[constants.BE_MEMORY] - i_used_mem
              remote_info['memory_free'] -= max(0, i_mem_diff)