Convert bdev.py to the logging module
[ganeti-local] / lib / cmdlib.py
index ae9a302..8c8f4f7 100644
@@ -1,7 +1,7 @@
 #
 #
 
-# Copyright (C) 2006, 2007 Google Inc.
+# Copyright (C) 2006, 2007, 2008 Google Inc.
 #
 # This program is free software; you can redistribute it and/or modify
 # it under the terms of the GNU General Public License as published by
@@ -37,32 +37,40 @@ from ganeti import logger
 from ganeti import utils
 from ganeti import errors
 from ganeti import hypervisor
+from ganeti import locking
 from ganeti import config
 from ganeti import constants
 from ganeti import objects
 from ganeti import opcodes
 from ganeti import ssconf
+from ganeti import serializer
+
 
 class LogicalUnit(object):
   """Logical Unit base class.
 
   Subclasses must follow these rules:
-    - implement CheckPrereq which also fills in the opcode instance
-      with all the fields (even if as None)
+    - implement ExpandNames
+    - implement CheckPrereq
     - implement Exec
     - implement BuildHooksEnv
     - redefine HPATH and HTYPE
-    - optionally redefine their run requirements (REQ_CLUSTER,
-      REQ_MASTER); note that all commands require root permissions
+    - optionally redefine their run requirements:
+        REQ_MASTER: the LU needs to run on the master node
+        REQ_WSSTORE: the LU needs a writable SimpleStore
+        REQ_BGL: the LU needs to hold the Big Ganeti Lock exclusively
+
+  Note that all commands require root permissions.
 
   """
   HPATH = None
   HTYPE = None
   _OP_REQP = []
-  REQ_CLUSTER = True
   REQ_MASTER = True
+  REQ_WSSTORE = False
+  REQ_BGL = True
 
-  def __init__(self, processor, op, cfg, sstore):
+  def __init__(self, processor, op, context, sstore):
     """Constructor for LogicalUnit.
 
     This needs to be overridden in derived classes in order to check op
     """Constructor for LogicalUnit.
 
     This needs to be overriden in derived classes in order to check op
@@ -71,22 +79,76 @@ class LogicalUnit(object):
     """
     self.proc = processor
     self.op = op
-    self.cfg = cfg
+    self.cfg = context.cfg
     self.sstore = sstore
     self.sstore = sstore
+    self.context = context
+    self.needed_locks = None
+    self.__ssh = None
+
     for attr_name in self._OP_REQP:
       attr_val = getattr(op, attr_name, None)
       if attr_val is None:
         raise errors.OpPrereqError("Required parameter '%s' missing" %
                                    attr_name)
-    if self.REQ_CLUSTER:
-      if not cfg.IsCluster():
-        raise errors.OpPrereqError("Cluster not initialized yet,"
-                                   " use 'gnt-cluster init' first.")
-      if self.REQ_MASTER:
-        master = sstore.GetMasterNode()
-        if master != utils.HostInfo().name:
-          raise errors.OpPrereqError("Commands must be run on the master"
-                                     " node %s" % master)
+
+    if not self.cfg.IsCluster():
+      raise errors.OpPrereqError("Cluster not initialized yet,"
+                                 " use 'gnt-cluster init' first.")
+    if self.REQ_MASTER:
+      master = sstore.GetMasterNode()
+      if master != utils.HostInfo().name:
+        raise errors.OpPrereqError("Commands must be run on the master"
+                                   " node %s" % master)
+
+  def __GetSSH(self):
+    """Returns the SshRunner object
+
+    """
+    if not self.__ssh:
+      self.__ssh = ssh.SshRunner(self.sstore)
+    return self.__ssh
+
+  ssh = property(fget=__GetSSH)
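
The private getter above memoizes the SshRunner so it is only constructed on
first use. The same lazy-property pattern in isolation (illustrative names,
not part of the patch):

    class LazyExample(object):
      """Memoize an expensive attribute on first access."""
      def __init__(self):
        self.__runner = None

      def __GetRunner(self):
        if not self.__runner:
          self.__runner = list()  # stand-in for an expensive constructor
        return self.__runner

      runner = property(fget=__GetRunner)
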
+
+  def ExpandNames(self):
+    """Expand names for this LU.
+
+    This method is called before starting to execute the opcode, and it should
+    update all the parameters of the opcode to their canonical form (e.g. a
+    short node name must be fully expanded after this method has successfully
+    completed). This way locking, hooks, logging, etc. can work correctly.
+
+    LUs which implement this method must also populate the self.needed_locks
+    member, as a dict with lock levels as keys, and a list of needed lock names
+    as values. Rules:
+      - Use an empty dict if you don't need any lock
+      - If you don't need any lock at a particular level omit that level
+      - Don't put anything for the BGL level
+      - If you want all locks at a level use None as a value
+        (this reflects what LockSet does, and will be replaced before
+        CheckPrereq with the full list of nodes that have been locked)
+
+    Examples:
+    # Acquire all nodes and one instance
+    self.needed_locks = {
+      locking.LEVEL_NODE: None,
+      locking.LEVEL_INSTANCES: ['instance1.example.tld'],
+    }
+    # Acquire just two nodes
+    self.needed_locks = {
+      locking.LEVEL_NODE: ['node1.example.tld', 'node2.example.tld'],
+    }
+    # Acquire no locks
+    self.needed_locks = {} # No, you can't leave it to the default value None
+
+    """
+    # The implementation of this method is mandatory only if the new LU is
+    # concurrent, so that old LUs don't need to be changed all at the same
+    # time.
+    if self.REQ_BGL:
+      self.needed_locks = {} # Exclusive LUs don't need locks.
+    else:
+      raise NotImplementedError
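
As an illustration of the contract above, a hypothetical concurrent LU (names
invented, not part of this patch) could opt out of the BGL and declare
node-level locks like this:

    class LUExampleNodeQuery(NoHooksLU):
      """Hypothetical concurrent LU, shown only to illustrate ExpandNames."""
      _OP_REQP = ["nodes"]
      REQ_BGL = False  # run without the Big Ganeti Lock

      def ExpandNames(self):
        # Canonicalize the opcode's node names, then lock exactly those nodes.
        self.op.nodes = _GetWantedNodes(self, self.op.nodes)
        self.needed_locks = {locking.LEVEL_NODE: self.op.nodes}
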
 
   def CheckPrereq(self):
     """Check prerequisites for this LU.
 
@@ -100,9 +162,7 @@ class LogicalUnit(object):
     not fulfilled. Its return value is ignored.
 
     This method should also update all the parameters of the opcode to
-    their canonical form; e.g. a short node name must be fully
-    expanded after this method has successfully completed (so that
-    hooks, logging, etc. work correctly).
+    their canonical form if it hasn't been done by ExpandNames before.
 
     """
     raise NotImplementedError
@@ -131,11 +191,7 @@ class LogicalUnit(object):
     added by the hooks runner. If the LU doesn't define any
     environment, an empty dict (and not None) should be returned.
 
-    As for the node lists, the master should not be included in the
-    them, as it will be added by the hooks runner in case this LU
-    requires a cluster to run on (otherwise we don't have a node
-    list). No nodes should be returned as an empty list (and not
-    None).
+    No nodes should be returned as an empty list (and not None).
 
     Note that if the HPATH for a LU class is None, this function will
     not be called.
@@ -143,6 +199,24 @@ class LogicalUnit(object):
     """
     raise NotImplementedError
 
+  def HooksCallBack(self, phase, hook_results, feedback_fn, lu_result):
+    """Notify the LU about the results of its hooks.
+
+    This method is called every time a hooks phase is executed, and notifies
+    the Logical Unit about the hooks' result. The LU can then use it to alter
+    its result based on the hooks.  By default the method does nothing and the
+    previous result is passed back unchanged, but any LU can override it if it
+    wants to use the local cluster hook-scripts somehow.
+
+    Args:
+      phase: the hooks phase that has just been run
+      hook_results: the results of the multi-node hooks rpc call
+      feedback_fn: function to send feedback back to the caller
+      lu_result: the previous result this LU had, or None in the PRE phase.
+
+    """
+    return lu_result
+
 
 class NoHooksLU(LogicalUnit):
   """Simple LU which runs no hooks.
@@ -154,31 +228,6 @@ class NoHooksLU(LogicalUnit):
   HPATH = None
   HTYPE = None
 
-  def BuildHooksEnv(self):
-    """Build hooks env.
-
-    This is a no-op, since we don't run hooks.
-
-    """
-    return {}, [], []
-
-
-def _AddHostToEtcHosts(hostname):
-  """Wrapper around utils.SetEtcHostsEntry.
-
-  """
-  hi = utils.HostInfo(name=hostname)
-  utils.SetEtcHostsEntry(constants.ETC_HOSTS, hi.ip, hi.name, [hi.ShortName()])
-
-
-def _RemoveHostFromEtcHosts(hostname):
-  """Wrapper around utils.RemoveEtcHostsEntry.
-
-  """
-  hi = utils.HostInfo(name=hostname)
-  utils.RemoveEtcHostsEntry(constants.ETC_HOSTS, hi.name)
-  utils.RemoveEtcHostsEntry(constants.ETC_HOSTS, hi.ShortName())
-
 
 def _GetWantedNodes(lu, nodes):
   """Returns list of checked and expanded node names.
 
 
   if nics:
     nic_count = len(nics)
 
+    for idx, (ip, bridge, mac) in enumerate(nics):
       if ip is None:
         ip = ""
       env["INSTANCE_NIC%d_IP" % idx] = ip
       env["INSTANCE_NIC%d_BRIDGE" % idx] = bridge
+      env["INSTANCE_NIC%d_HWADDR" % idx] = mac
   else:
     nic_count = 0
 
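
To make the added HWADDR variable concrete, this is the mapping the loop above
produces for a sample one-NIC instance (sample values only):

    nics = [("192.0.2.10", "br0", "aa:00:00:4f:2e:7a")]  # (ip, bridge, mac)
    env = {}
    for idx, (ip, bridge, mac) in enumerate(nics):
      env["INSTANCE_NIC%d_IP" % idx] = ip or ""
      env["INSTANCE_NIC%d_BRIDGE" % idx] = bridge
      env["INSTANCE_NIC%d_HWADDR" % idx] = mac
    # env: INSTANCE_NIC0_IP, INSTANCE_NIC0_BRIDGE, INSTANCE_NIC0_HWADDR
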
@@ -295,171 +345,13 @@ def _BuildInstanceHookEnvByObject(instance, override=None):
     'status': instance.os,
     'memory': instance.memory,
     'vcpus': instance.vcpus,
-    'nics': [(nic.ip, nic.bridge) for nic in instance.nics],
+    'nics': [(nic.ip, nic.bridge, nic.mac) for nic in instance.nics],
   }
   if override:
     args.update(override)
   return _BuildInstanceHookEnv(**args)
 
 
 
-def _UpdateKnownHosts(fullnode, ip, pubkey):
-  """Ensure a node has a correct known_hosts entry.
-
-  Args:
-    fullnode - Fully qualified domain name of host. (str)
-    ip       - IPv4 address of host (str)
-    pubkey   - the public key of the cluster
-
-  """
-  if os.path.exists(constants.SSH_KNOWN_HOSTS_FILE):
-    f = open(constants.SSH_KNOWN_HOSTS_FILE, 'r+')
-  else:
-    f = open(constants.SSH_KNOWN_HOSTS_FILE, 'w+')
-
-  inthere = False
-
-  save_lines = []
-  add_lines = []
-  removed = False
-
-  for rawline in f:
-    logger.Debug('read %s' % (repr(rawline),))
-
-    parts = rawline.rstrip('\r\n').split()
-
-    # Ignore unwanted lines
-    if len(parts) >= 3 and not rawline.lstrip()[0] == '#':
-      fields = parts[0].split(',')
-      key = parts[2]
-
-      haveall = True
-      havesome = False
-      for spec in [ ip, fullnode ]:
-        if spec not in fields:
-          haveall = False
-        if spec in fields:
-          havesome = True
-
-      logger.Debug("key, pubkey = %s." % (repr((key, pubkey)),))
-      if haveall and key == pubkey:
-        inthere = True
-        save_lines.append(rawline)
-        logger.Debug("Keeping known_hosts '%s'." % (repr(rawline),))
-        continue
-
-      if havesome and (not haveall or key != pubkey):
-        removed = True
-        logger.Debug("Discarding known_hosts '%s'." % (repr(rawline),))
-        continue
-
-    save_lines.append(rawline)
-
-  if not inthere:
-    add_lines.append('%s,%s ssh-rsa %s\n' % (fullnode, ip, pubkey))
-    logger.Debug("Adding known_hosts '%s'." % (repr(add_lines[-1]),))
-
-  if removed:
-    save_lines = save_lines + add_lines
-
-    # Write a new file and replace old.
-    fd, tmpname = tempfile.mkstemp('.tmp', 'known_hosts.',
-                                   constants.DATA_DIR)
-    newfile = os.fdopen(fd, 'w')
-    try:
-      newfile.write(''.join(save_lines))
-    finally:
-      newfile.close()
-    logger.Debug("Wrote new known_hosts.")
-    os.rename(tmpname, constants.SSH_KNOWN_HOSTS_FILE)
-
-  elif add_lines:
-    # Simply appending a new line will do the trick.
-    f.seek(0, 2)
-    for add in add_lines:
-      f.write(add)
-
-  f.close()
-
-
-def _HasValidVG(vglist, vgname):
-  """Checks if the volume group list is valid.
-
-  A non-None return value means there's an error, and the return value
-  is the error message.
-
-  """
-  vgsize = vglist.get(vgname, None)
-  if vgsize is None:
-    return "volume group '%s' missing" % vgname
-  elif vgsize < 20480:
-    return ("volume group '%s' too small (20480MiB required, %dMib found)" %
-            (vgname, vgsize))
-  return None
-
-
-def _InitSSHSetup(node):
-  """Setup the SSH configuration for the cluster.
-
-
-  This generates a dsa keypair for root, adds the pub key to the
-  permitted hosts and adds the hostkey to its own known hosts.
-
-  Args:
-    node: the name of this host as a fqdn
-
-  """
-  priv_key, pub_key, auth_keys = ssh.GetUserFiles(constants.GANETI_RUNAS)
-
-  for name in priv_key, pub_key:
-    if os.path.exists(name):
-      utils.CreateBackup(name)
-    utils.RemoveFile(name)
-
-  result = utils.RunCmd(["ssh-keygen", "-t", "dsa",
-                         "-f", priv_key,
-                         "-q", "-N", ""])
-  if result.failed:
-    raise errors.OpExecError("Could not generate ssh keypair, error %s" %
-                             result.output)
-
-  f = open(pub_key, 'r')
-  try:
-    utils.AddAuthorizedKey(auth_keys, f.read(8192))
-  finally:
-    f.close()
-
-
-def _InitGanetiServerSetup(ss):
-  """Setup the necessary configuration for the initial node daemon.
-
-  This creates the nodepass file containing the shared password for
-  the cluster and also generates the SSL certificate.
-
-  """
-  # Create pseudo random password
-  randpass = sha.new(os.urandom(64)).hexdigest()
-  # and write it into sstore
-  ss.SetKey(ss.SS_NODED_PASS, randpass)
-
-  result = utils.RunCmd(["openssl", "req", "-new", "-newkey", "rsa:1024",
-                         "-days", str(365*5), "-nodes", "-x509",
-                         "-keyout", constants.SSL_CERT_FILE,
-                         "-out", constants.SSL_CERT_FILE, "-batch"])
-  if result.failed:
-    raise errors.OpExecError("could not generate server ssl cert, command"
-                             " %s had exitcode %s and error message %s" %
-                             (result.cmd, result.exit_code, result.output))
-
-  os.chmod(constants.SSL_CERT_FILE, 0400)
-
-  result = utils.RunCmd([constants.NODE_INITD_SCRIPT, "restart"])
-
-  if result.failed:
-    raise errors.OpExecError("Could not start the node daemon, command %s"
-                             " had exitcode %s and error %s" %
-                             (result.cmd, result.exit_code, result.output))
-
-
 def _CheckInstanceBridgesExist(instance):
   """Check that the brigdes needed by an instance exist.
 
@@ -472,129 +364,6 @@ def _CheckInstanceBridgesExist(instance):
                                (brlist, instance.primary_node))
 
 
-class LUInitCluster(LogicalUnit):
-  """Initialise the cluster.
-
-  """
-  HPATH = "cluster-init"
-  HTYPE = constants.HTYPE_CLUSTER
-  _OP_REQP = ["cluster_name", "hypervisor_type", "vg_name", "mac_prefix",
-              "def_bridge", "master_netdev"]
-  REQ_CLUSTER = False
-
-  def BuildHooksEnv(self):
-    """Build hooks env.
-
-    Notes: Since we don't require a cluster, we must manually add
-    ourselves in the post-run node list.
-
-    """
-    env = {"OP_TARGET": self.op.cluster_name}
-    return env, [], [self.hostname.name]
-
-  def CheckPrereq(self):
-    """Verify that the passed name is a valid one.
-
-    """
-    if config.ConfigWriter.IsCluster():
-      raise errors.OpPrereqError("Cluster is already initialised")
-
-    self.hostname = hostname = utils.HostInfo()
-
-    if hostname.ip.startswith("127."):
-      raise errors.OpPrereqError("This host's IP resolves to the private"
-                                 " range (%s). Please fix DNS or /etc/hosts." %
-                                 (hostname.ip,))
-
-    self.clustername = clustername = utils.HostInfo(self.op.cluster_name)
-
-    if not utils.TcpPing(constants.LOCALHOST_IP_ADDRESS, hostname.ip,
-                         constants.DEFAULT_NODED_PORT):
-      raise errors.OpPrereqError("Inconsistency: this host's name resolves"
-                                 " to %s,\nbut this ip address does not"
-                                 " belong to this host."
-                                 " Aborting." % hostname.ip)
-
-    secondary_ip = getattr(self.op, "secondary_ip", None)
-    if secondary_ip and not utils.IsValidIP(secondary_ip):
-      raise errors.OpPrereqError("Invalid secondary ip given")
-    if (secondary_ip and
-        secondary_ip != hostname.ip and
-        (not utils.TcpPing(constants.LOCALHOST_IP_ADDRESS, secondary_ip,
-                           constants.DEFAULT_NODED_PORT))):
-      raise errors.OpPrereqError("You gave %s as secondary IP,\n"
-                                 "but it does not belong to this host." %
-                                 secondary_ip)
-    self.secondary_ip = secondary_ip
-
-    # checks presence of the volume group given
-    vgstatus = _HasValidVG(utils.ListVolumeGroups(), self.op.vg_name)
-
-    if vgstatus:
-      raise errors.OpPrereqError("Error: %s" % vgstatus)
-
-    if not re.match("^[0-9a-z]{2}:[0-9a-z]{2}:[0-9a-z]{2}$",
-                    self.op.mac_prefix):
-      raise errors.OpPrereqError("Invalid mac prefix given '%s'" %
-                                 self.op.mac_prefix)
-
-    if self.op.hypervisor_type not in hypervisor.VALID_HTYPES:
-      raise errors.OpPrereqError("Invalid hypervisor type given '%s'" %
-                                 self.op.hypervisor_type)
-
-    result = utils.RunCmd(["ip", "link", "show", "dev", self.op.master_netdev])
-    if result.failed:
-      raise errors.OpPrereqError("Invalid master netdev given (%s): '%s'" %
-                                 (self.op.master_netdev,
-                                  result.output.strip()))
-
-    if not (os.path.isfile(constants.NODE_INITD_SCRIPT) and
-            os.access(constants.NODE_INITD_SCRIPT, os.X_OK)):
-      raise errors.OpPrereqError("Init.d script '%s' missing or not "
-                                 "executable." % constants.NODE_INITD_SCRIPT)
-
-  def Exec(self, feedback_fn):
-    """Initialize the cluster.
-
-    """
-    clustername = self.clustername
-    hostname = self.hostname
-
-    # set up the simple store
-    self.sstore = ss = ssconf.SimpleStore()
-    ss.SetKey(ss.SS_HYPERVISOR, self.op.hypervisor_type)
-    ss.SetKey(ss.SS_MASTER_NODE, hostname.name)
-    ss.SetKey(ss.SS_MASTER_IP, clustername.ip)
-    ss.SetKey(ss.SS_MASTER_NETDEV, self.op.master_netdev)
-    ss.SetKey(ss.SS_CLUSTER_NAME, clustername.name)
-
-    # set up the inter-node password and certificate
-    _InitGanetiServerSetup(ss)
-
-    # start the master ip
-    rpc.call_node_start_master(hostname.name)
-
-    # set up ssh config and /etc/hosts
-    f = open(constants.SSH_HOST_RSA_PUB, 'r')
-    try:
-      sshline = f.read()
-    finally:
-      f.close()
-    sshkey = sshline.split(" ")[1]
-
-    _AddHostToEtcHosts(hostname.name)
-
-    _UpdateKnownHosts(hostname.name, hostname.ip, sshkey)
-
-    _InitSSHSetup(hostname.name)
-
-    # init of cluster config file
-    self.cfg = cfgw = config.ConfigWriter()
-    cfgw.InitConfig(hostname.name, hostname.ip, self.secondary_ip,
-                    sshkey, self.op.mac_prefix,
-                    self.op.vg_name, self.op.def_bridge)
-
-
 class LUDestroyCluster(NoHooksLU):
   """Logical unit for destroying the cluster.
 
@@ -625,18 +394,21 @@ class LUDestroyCluster(NoHooksLU):
 
     """
     master = self.sstore.GetMasterNode()
+    if not rpc.call_node_stop_master(master):
+      raise errors.OpExecError("Could not disable the master role")
     priv_key, pub_key, _ = ssh.GetUserFiles(constants.GANETI_RUNAS)
     utils.CreateBackup(priv_key)
     utils.CreateBackup(pub_key)
     rpc.call_node_leave_cluster(master)
-    _RemoveHostFromEtcHosts(master)
 
 
-class LUVerifyCluster(NoHooksLU):
+class LUVerifyCluster(LogicalUnit):
   """Verifies the cluster status.
 
   """
   """Verifies the cluster status.
 
   """
-  _OP_REQP = []
+  HPATH = "cluster-verify"
+  HTYPE = constants.HTYPE_CLUSTER
+  _OP_REQP = ["skip_checks"]
 
   def _VerifyNode(self, node, file_list, local_cksum, vglist, node_result,
                   remote_version, feedback_fn):
@@ -657,7 +429,7 @@ class LUVerifyCluster(NoHooksLU):
     # compares ganeti version
     local_version = constants.PROTOCOL_VERSION
     if not remote_version:
-      feedback_fn(" - ERROR: connection to %s failed" % (node))
+      feedback_fn("  - ERROR: connection to %s failed" % (node))
       return True
 
     if local_version != remote_version:
@@ -673,7 +445,8 @@ class LUVerifyCluster(NoHooksLU):
                       (node,))
       bad = True
     else:
-      vgstatus = _HasValidVG(vglist, self.cfg.GetVGName())
+      vgstatus = utils.CheckVolumeGroupSize(vglist, self.cfg.GetVGName(),
+                                            constants.MIN_VG_SIZE)
       if vgstatus:
         feedback_fn("  - ERROR: %s on node %s" % (vgstatus, node))
         bad = True
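
The per-LU _HasValidVG helper is gone in favour of utils.CheckVolumeGroupSize,
which is assumed here to keep the semantics of the removed check: an error
string on problems, None on success. A sketch with sample data:

    from ganeti import utils, constants

    # vglist as returned by the nodes: {vg_name: size_in_MiB}
    err = utils.CheckVolumeGroupSize({"xenvg": 40960}, "xenvg",
                                     constants.MIN_VG_SIZE)
    assert err is None  # a missing or too-small VG yields a message instead
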
@@ -696,19 +469,31 @@ class LUVerifyCluster(NoHooksLU):
 
     if 'nodelist' not in node_result:
       bad = True
-      feedback_fn("  - ERROR: node hasn't returned node connectivity data")
+      feedback_fn("  - ERROR: node hasn't returned node ssh connectivity data")
     else:
       if node_result['nodelist']:
         bad = True
         for node in node_result['nodelist']:
-          feedback_fn("  - ERROR: communication with node '%s': %s" %
+          feedback_fn("  - ERROR: ssh communication with node '%s': %s" %
                           (node, node_result['nodelist'][node]))
+    if 'node-net-test' not in node_result:
+      bad = True
+      feedback_fn("  - ERROR: node hasn't returned node tcp connectivity data")
+    else:
+      if node_result['node-net-test']:
+        bad = True
+        nlist = utils.NiceSort(node_result['node-net-test'].keys())
+        for node in nlist:
+          feedback_fn("  - ERROR: tcp communication with node '%s': %s" %
+                          (node, node_result['node-net-test'][node]))
+
     hyp_result = node_result.get('hypervisor', None)
     if hyp_result is not None:
       feedback_fn("  - ERROR: hypervisor verify failure: '%s'" % hyp_result)
     return bad
 
-  def _VerifyInstance(self, instance, node_vol_is, node_instance, feedback_fn):
+  def _VerifyInstance(self, instance, instanceconfig, node_vol_is,
+                      node_instance, feedback_fn):
     """Verify an instance.
 
     This function checks to see if the required block devices are
     """Verify an instance.
 
     This function checks to see if the required block devices are
@@ -717,13 +502,6 @@ class LUVerifyCluster(NoHooksLU):
     """
     bad = False
 
-    instancelist = self.cfg.GetInstanceList()
-    if not instance in instancelist:
-      feedback_fn("  - ERROR: instance %s not in instance list %s" %
-                      (instance, instancelist))
-      bad = True
-
-    instanceconfig = self.cfg.GetInstanceInfo(instance)
     node_current = instanceconfig.primary_node
 
     node_vol_should = {}
@@ -737,7 +515,8 @@ class LUVerifyCluster(NoHooksLU):
           bad = True
 
     if not instanceconfig.status == 'down':
-      if not instance in node_instance[node_current]:
+      if (node_current not in node_instance or
+          not instance in node_instance[node_current]):
         feedback_fn("  - ERROR: instance %s not running on node %s" %
                         (instance, node_current))
         bad = True
@@ -783,13 +562,56 @@ class LUVerifyCluster(NoHooksLU):
           bad = True
     return bad
 
+  def _VerifyNPlusOneMemory(self, node_info, instance_cfg, feedback_fn):
+    """Verify N+1 Memory Resilience.
+
+    Check that if one single node dies we can still start all the instances it
+    was primary for.
+
+    """
+    bad = False
+
+    for node, nodeinfo in node_info.iteritems():
+      # This code checks that every node which is now listed as secondary has
+      # enough memory to host all the instances it is supposed to, should a
+      # single other node in the cluster fail.
+      # FIXME: not ready for failover to an arbitrary node
+      # FIXME: does not support file-backed instances
+      # WARNING: we currently take into account down instances as well as up
+      # ones, considering that even if they're down someone might want to start
+      # them even in the event of a node failure.
+      for prinode, instances in nodeinfo['sinst-by-pnode'].iteritems():
+        needed_mem = 0
+        for instance in instances:
+          needed_mem += instance_cfg[instance].memory
+        if nodeinfo['mfree'] < needed_mem:
+          feedback_fn("  - ERROR: not enough memory on node %s to accommodate"
+                      " failovers should node %s fail" % (node, prinode))
+          bad = True
+    return bad
+
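
A toy walk-through of the check above, with made-up numbers: node B is
secondary for two instances whose primary is node A, so B must be able to
absorb their combined memory should A die:

    node_info = {"B": {"mfree": 1200, "sinst-by-pnode": {"A": ["i1", "i2"]}}}
    instance_mem = {"i1": 1024, "i2": 512}  # simplified stand-in for instance_cfg

    for prinode, instances in node_info["B"]["sinst-by-pnode"].items():
      needed_mem = sum(instance_mem[name] for name in instances)
      if node_info["B"]["mfree"] < needed_mem:  # 1200 < 1536: not N+1 compliant
        print "node B cannot accommodate failovers from node %s" % prinode
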
   def CheckPrereq(self):
     """Check prerequisites.
 
-    This has no prerequisites.
+    Transform the list of checks we're going to skip into a set and check that
+    all its members are valid.
 
     """
-    pass
+    self.skip_set = frozenset(self.op.skip_checks)
+    if not constants.VERIFY_OPTIONAL_CHECKS.issuperset(self.skip_set):
+      raise errors.OpPrereqError("Invalid checks to be skipped specified")
+
+  def BuildHooksEnv(self):
+    """Build hooks env.
+
+    Cluster-Verify hooks are run only in the post phase; their failure is
+    logged in the verify output and makes the verification fail.
+
+    """
+    all_nodes = self.cfg.GetNodeList()
+    # TODO: populate the environment with useful information for verify hooks
+    env = {}
+    return env, [], all_nodes
 
   def Exec(self, feedback_fn):
     """Verify integrity of cluster, performing various test on nodes.
@@ -797,13 +619,18 @@ class LUVerifyCluster(NoHooksLU):
     """
     bad = False
     feedback_fn("* Verifying global settings")
-    self.cfg.VerifyConfig()
+    for msg in self.cfg.VerifyConfig():
+      feedback_fn("  - ERROR: %s" % msg)
 
     vg_name = self.cfg.GetVGName()
     nodelist = utils.NiceSort(self.cfg.GetNodeList())
+    nodeinfo = [self.cfg.GetNodeInfo(nname) for nname in nodelist]
     instancelist = utils.NiceSort(self.cfg.GetInstanceList())
+    i_non_redundant = [] # Non redundant instances
     node_volume = {}
     node_instance = {}
+    node_info = {}
+    instance_cfg = {}
 
     # FIXME: verify OS list
     # do local checksums
@@ -820,9 +647,12 @@ class LUVerifyCluster(NoHooksLU):
       'filelist': file_names,
       'nodelist': nodelist,
       'hypervisor': None,
+      'node-net-test': [(node.name, node.primary_ip, node.secondary_ip)
+                        for node in nodeinfo]
       }
     all_nvinfo = rpc.call_node_verify(nodelist, node_verify_param)
     all_rversion = rpc.call_version(nodelist)
+    all_ninfo = rpc.call_node_info(nodelist, self.cfg.GetVGName())
 
     for node in nodelist:
       feedback_fn("* Verifying node %s" % node)
@@ -834,12 +664,17 @@ class LUVerifyCluster(NoHooksLU):
       # node_volume
       volumeinfo = all_volumeinfo[node]
 
-      if type(volumeinfo) != dict:
+      if isinstance(volumeinfo, basestring):
+        feedback_fn("  - ERROR: LVM problem on node %s: %s" %
+                    (node, volumeinfo[-400:].encode('string_escape')))
+        bad = True
+        node_volume[node] = {}
+      elif not isinstance(volumeinfo, dict):
         feedback_fn("  - ERROR: connection to %s failed" % (node,))
         bad = True
         continue
         feedback_fn("  - ERROR: connection to %s failed" % (node,))
         bad = True
         continue
-
-      node_volume[node] = volumeinfo
+      else:
+        node_volume[node] = volumeinfo
 
       # node_instance
       nodeinstance = all_instanceinfo[node]
@@ -850,18 +685,74 @@ class LUVerifyCluster(NoHooksLU):
 
       node_instance[node] = nodeinstance
 
+      # node_info
+      nodeinfo = all_ninfo[node]
+      if not isinstance(nodeinfo, dict):
+        feedback_fn("  - ERROR: connection to %s failed" % (node,))
+        bad = True
+        continue
+
+      try:
+        node_info[node] = {
+          "mfree": int(nodeinfo['memory_free']),
+          "dfree": int(nodeinfo['vg_free']),
+          "pinst": [],
+          "sinst": [],
+          # dictionary holding all instances this node is secondary for,
+          # grouped by their primary node. Each key is a cluster node, and each
+          # value is a list of instances which have the key as primary and the
+          # current node as secondary.  this is handy to calculate N+1 memory
+          # availability if you can only failover from a primary to its
+          # secondary.
+          "sinst-by-pnode": {},
+        }
+      except ValueError:
+        feedback_fn("  - ERROR: invalid value returned from node %s" % (node,))
+        bad = True
+        continue
+
     node_vol_should = {}
 
     for instance in instancelist:
       feedback_fn("* Verifying instance %s" % instance)
-      result =  self._VerifyInstance(instance, node_volume, node_instance,
-                                     feedback_fn)
-      bad = bad or result
-
       inst_config = self.cfg.GetInstanceInfo(instance)
+      result =  self._VerifyInstance(instance, inst_config, node_volume,
+                                     node_instance, feedback_fn)
+      bad = bad or result
 
       inst_config.MapLVsByNode(node_vol_should)
 
+      instance_cfg[instance] = inst_config
+
+      pnode = inst_config.primary_node
+      if pnode in node_info:
+        node_info[pnode]['pinst'].append(instance)
+      else:
+        feedback_fn("  - ERROR: instance %s, connection to primary node"
+                    " %s failed" % (instance, pnode))
+        bad = True
+
+      # If the instance is non-redundant we cannot survive losing its primary
+      # node, so we are not N+1 compliant. On the other hand we have no disk
+      # templates with more than one secondary so that situation is not well
+      # supported either.
+      # FIXME: does not support file-backed instances
+      if len(inst_config.secondary_nodes) == 0:
+        i_non_redundant.append(instance)
+      elif len(inst_config.secondary_nodes) > 1:
+        feedback_fn("  - WARNING: multiple secondaries for instance %s"
+                    % instance)
+
+      for snode in inst_config.secondary_nodes:
+        if snode in node_info:
+          node_info[snode]['sinst'].append(instance)
+          if pnode not in node_info[snode]['sinst-by-pnode']:
+            node_info[snode]['sinst-by-pnode'][pnode] = []
+          node_info[snode]['sinst-by-pnode'][pnode].append(instance)
+        else:
+          feedback_fn("  - ERROR: instance %s, connection to secondary node"
+                      " %s failed" % (instance, snode))
+
     feedback_fn("* Verifying orphan volumes")
     result = self._VerifyOrphanVolumes(node_vol_should, node_volume,
                                        feedback_fn)
@@ -872,8 +763,131 @@ class LUVerifyCluster(NoHooksLU):
                                          feedback_fn)
     bad = bad or result
 
+    if constants.VERIFY_NPLUSONE_MEM not in self.skip_set:
+      feedback_fn("* Verifying N+1 Memory redundancy")
+      result = self._VerifyNPlusOneMemory(node_info, instance_cfg, feedback_fn)
+      bad = bad or result
+
+    feedback_fn("* Other Notes")
+    if i_non_redundant:
+      feedback_fn("  - NOTICE: %d non-redundant instance(s) found."
+                  % len(i_non_redundant))
+
     return int(bad)
 
+  def HooksCallBack(self, phase, hooks_results, feedback_fn, lu_result):
+    """Analize the post-hooks' result, handle it, and send some
+    nicely-formatted feedback back to the user.
+
+    Args:
+      phase: the hooks phase that has just been run
+      hooks_results: the results of the multi-node hooks rpc call
+      feedback_fn: function to send feedback back to the caller
+      lu_result: previous Exec result
+
+    """
+    # We only really run POST phase hooks, and are only interested in their results
+    if phase == constants.HOOKS_PHASE_POST:
+      # Used to change hooks' output to proper indentation
+      indent_re = re.compile('^', re.M)
+      feedback_fn("* Hooks Results")
+      if not hooks_results:
+        feedback_fn("  - ERROR: general communication failure")
+        lu_result = 1
+      else:
+        for node_name in hooks_results:
+          show_node_header = True
+          res = hooks_results[node_name]
+          if res is False or not isinstance(res, list):
+            feedback_fn("    Communication failure")
+            lu_result = 1
+            continue
+          for script, hkr, output in res:
+            if hkr == constants.HKR_FAIL:
+              # The node header is only shown once, if there are
+              # failing hooks on that node
+              if show_node_header:
+                feedback_fn("  Node %s:" % node_name)
+                show_node_header = False
+              feedback_fn("    ERROR: Script %s failed, output:" % script)
+              output = indent_re.sub('      ', output)
+              feedback_fn("%s" % output)
+              lu_result = 1
+
+      return lu_result
+
+
+class LUVerifyDisks(NoHooksLU):
+  """Verifies the cluster disks status.
+
+  """
+  _OP_REQP = []
+
+  def CheckPrereq(self):
+    """Check prerequisites.
+
+    This has no prerequisites.
+
+    """
+    pass
+
+  def Exec(self, feedback_fn):
+    """Verify integrity of cluster disks.
+
+    """
+    result = res_nodes, res_nlvm, res_instances, res_missing = [], {}, [], {}
+
+    vg_name = self.cfg.GetVGName()
+    nodes = utils.NiceSort(self.cfg.GetNodeList())
+    instances = [self.cfg.GetInstanceInfo(name)
+                 for name in self.cfg.GetInstanceList()]
+
+    nv_dict = {}
+    for inst in instances:
+      inst_lvs = {}
+      if (inst.status != "up" or
+          inst.disk_template not in constants.DTS_NET_MIRROR):
+        continue
+      inst.MapLVsByNode(inst_lvs)
+      # transform { iname: {node: [vol,],},} to {(node, vol): iname}
+      for node, vol_list in inst_lvs.iteritems():
+        for vol in vol_list:
+          nv_dict[(node, vol)] = inst
+
+    if not nv_dict:
+      return result
+
+    node_lvs = rpc.call_volume_list(nodes, vg_name)
+
+    to_act = set()
+    for node in nodes:
+      # node_volume
+      lvs = node_lvs[node]
+
+      if isinstance(lvs, basestring):
+        logger.Info("error enumerating LVs on node %s: %s" % (node, lvs))
+        res_nlvm[node] = lvs
+      elif not isinstance(lvs, dict):
+        logger.Info("connection to node %s failed or invalid data returned" %
+                    (node,))
+        res_nodes.append(node)
+        continue
+
+      for lv_name, (_, lv_inactive, lv_online) in lvs.iteritems():
+        inst = nv_dict.pop((node, lv_name), None)
+        if (not lv_online and inst is not None
+            and inst.name not in res_instances):
+          res_instances.append(inst.name)
+
+    # any leftover items in nv_dict are missing LVs, let's arrange the
+    # data better
+    for key, inst in nv_dict.iteritems():
+      if inst.name not in res_missing:
+        res_missing[inst.name] = []
+      res_missing[inst.name].append(key)
+
+    return result
+
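
A note on the chained assignment at the top of Exec: result is bound to the
same four objects the res_* names point at, so values appended later are
visible through result without rebuilding the tuple. In isolation:

    res_nodes, res_nlvm, res_instances, res_missing = [], {}, [], {}
    result = (res_nodes, res_nlvm, res_instances, res_missing)
    res_instances.append("inst1")  # made-up instance name
    assert result[2] == ["inst1"]  # the tuple sees the mutation
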
 
 class LURenameCluster(LogicalUnit):
   """Rename the cluster.
@@ -882,13 +896,14 @@ class LURenameCluster(LogicalUnit):
   HPATH = "cluster-rename"
   HTYPE = constants.HTYPE_CLUSTER
   _OP_REQP = ["name"]
+  REQ_WSSTORE = True
 
   def BuildHooksEnv(self):
     """Build hooks env.
 
     """
     env = {
-      "OP_TARGET": self.op.sstore.GetClusterName(),
+      "OP_TARGET": self.sstore.GetClusterName(),
       "NEW_NAME": self.op.name,
       }
     mn = self.sstore.GetMasterNode()
       "NEW_NAME": self.op.name,
       }
     mn = self.sstore.GetMasterNode()
@@ -908,8 +923,7 @@ class LURenameCluster(LogicalUnit):
       raise errors.OpPrereqError("Neither the name nor the IP address of the"
                                  " cluster has changed")
     if new_ip != old_ip:
-      result = utils.RunCmd(["fping", "-q", new_ip])
-      if not result.failed:
+      if utils.TcpPing(new_ip, constants.DEFAULT_NODED_PORT):
         raise errors.OpPrereqError("The given cluster IP address (%s) is"
                                    " reachable on the network. Aborting." %
                                    new_ip)
@@ -950,8 +964,82 @@ class LURenameCluster(LogicalUnit):
                          (fname, to_node))
     finally:
       if not rpc.call_node_start_master(master):
-        logger.Error("Could not re-enable the master role on the master,\n"
-                     "please restart manually.")
+        logger.Error("Could not re-enable the master role on the master,"
+                     " please restart manually.")
+
+
+def _RecursiveCheckIfLVMBased(disk):
+  """Check if the given disk or its children are lvm-based.
+
+  Args:
+    disk: ganeti.objects.Disk object
+
+  Returns:
+    boolean indicating whether a LD_LV dev_type was found or not
+
+  """
+  if disk.children:
+    for chdisk in disk.children:
+      if _RecursiveCheckIfLVMBased(chdisk):
+        return True
+  return disk.dev_type == constants.LD_LV
+
+
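
A small usage sketch, assuming objects.Disk accepts dev_type and children
keyword arguments as elsewhere in Ganeti (disk tree simplified):

    lv_a = objects.Disk(dev_type=constants.LD_LV, children=[])
    lv_b = objects.Disk(dev_type=constants.LD_LV, children=[])
    mirror = objects.Disk(dev_type=constants.LD_DRBD8, children=[lv_a, lv_b])
    assert _RecursiveCheckIfLVMBased(mirror)  # True: the leaves are LVs
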
+class LUSetClusterParams(LogicalUnit):
+  """Change the parameters of the cluster.
+
+  """
+  HPATH = "cluster-modify"
+  HTYPE = constants.HTYPE_CLUSTER
+  _OP_REQP = []
+
+  def BuildHooksEnv(self):
+    """Build hooks env.
+
+    """
+    env = {
+      "OP_TARGET": self.sstore.GetClusterName(),
+      "NEW_VG_NAME": self.op.vg_name,
+      }
+    mn = self.sstore.GetMasterNode()
+    return env, [mn], [mn]
+
+  def CheckPrereq(self):
+    """Check prerequisites.
+
+    This checks whether the given params don't conflict and
+    if the given volume group is valid.
+
+    """
+    if not self.op.vg_name:
+      instances = [self.cfg.GetInstanceInfo(name)
+                   for name in self.cfg.GetInstanceList()]
+      for inst in instances:
+        for disk in inst.disks:
+          if _RecursiveCheckIfLVMBased(disk):
+            raise errors.OpPrereqError("Cannot disable lvm storage while"
+                                       " lvm-based instances exist")
+
+    # if vg_name not None, checks given volume group on all nodes
+    if self.op.vg_name:
+      node_list = self.cfg.GetNodeList()
+      vglist = rpc.call_vg_list(node_list)
+      for node in node_list:
+        vgstatus = utils.CheckVolumeGroupSize(vglist[node], self.op.vg_name,
+                                              constants.MIN_VG_SIZE)
+        if vgstatus:
+          raise errors.OpPrereqError("Error on node '%s': %s" %
+                                     (node, vgstatus))
+
+  def Exec(self, feedback_fn):
+    """Change the parameters of the cluster.
+
+    """
+    if self.op.vg_name != self.cfg.GetVGName():
+      self.cfg.SetVGName(self.op.vg_name)
+    else:
+      feedback_fn("Cluster LVM configuration already in desired"
+                  " state, not changing")
 
 
 def _WaitForSync(cfgw, instance, proc, oneshot=False, unlock=False):
@@ -1005,13 +1093,7 @@ def _WaitForSync(cfgw, instance, proc, oneshot=False, unlock=False):
     if done or oneshot:
       break
 
-    if unlock:
-      utils.Unlock('cmd')
-    try:
-      time.sleep(min(60, max_time))
-    finally:
-      if unlock:
-        utils.Lock('cmd')
+    time.sleep(min(60, max_time))
 
   if done:
     proc.LogInfo("Instance %s's disks are in sync." % instance.name)
@@ -1036,7 +1118,7 @@ def _CheckDiskConsistency(cfgw, dev, node, on_primary, ldisk=False):
   if on_primary or dev.AssembleOnSecondary():
     rstats = rpc.call_blockdev_find(node, dev)
     if not rstats:
-      logger.ToStderr("Can't get any data from node %s" % node)
+      logger.ToStderr("Node %s: Disk degraded, not found or node down" % node)
       result = False
     else:
       result = result and (not rstats[idx])
@@ -1051,7 +1133,7 @@ class LUDiagnoseOS(NoHooksLU):
   """Logical unit for OS diagnose/query.
 
   """
   """Logical unit for OS diagnose/query.
 
   """
-  _OP_REQP = []
+  _OP_REQP = ["output_fields", "names"]
 
   def CheckPrereq(self):
     """Check prerequisites.
@@ -1059,7 +1141,44 @@ class LUDiagnoseOS(NoHooksLU):
     This always succeeds, since this is a pure query LU.
 
     """
-    return
+    if self.op.names:
+      raise errors.OpPrereqError("Selective OS query not supported")
+
+    self.dynamic_fields = frozenset(["name", "valid", "node_status"])
+    _CheckOutputFields(static=[],
+                       dynamic=self.dynamic_fields,
+                       selected=self.op.output_fields)
+
+  @staticmethod
+  def _DiagnoseByOS(node_list, rlist):
+    """Remaps a per-node return list into an a per-os per-node dictionary
+
+      Args:
+        node_list: a list with the names of all nodes
+        rlist: a map with node names as keys and OS objects as values
+
+      Returns:
+        map: a map with osnames as keys and as value another map, with
+             nodes as keys and list of OS objects as values
+             e.g. {"debian-etch": {"node1": [<object>,...],
+                                   "node2": [<object>,]}
+                  }
+
+    """
+    all_os = {}
+    for node_name, nr in rlist.iteritems():
+      if not nr:
+        continue
+      for os_obj in nr:
+        if os_obj.name not in all_os:
+          # build a list of nodes for this os containing empty lists
+          # for each node in node_list
+          all_os[os_obj.name] = {}
+          for nname in node_list:
+            all_os[os_obj.name][nname] = []
+        all_os[os_obj.name][node_name].append(os_obj)
+    return all_os
 
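
The shape of the remapping, using a throwaway stand-in for the OS objects
(FakeOS is invented for the example):

    class FakeOS(object):
      def __init__(self, name):
        self.name = name

    rlist = {"node1": [FakeOS("debian-etch")], "node2": []}
    pol = LUDiagnoseOS._DiagnoseByOS(["node1", "node2"], rlist)
    # pol == {"debian-etch": {"node1": [<FakeOS>], "node2": []}}
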
   def Exec(self, feedback_fn):
     """Compute the list of OSes.
@@ -1069,11 +1188,29 @@ class LUDiagnoseOS(NoHooksLU):
     node_data = rpc.call_os_diagnose(node_list)
     if node_data == False:
       raise errors.OpExecError("Can't gather the list of OSes")
-    return node_data
-
-
-class LURemoveNode(LogicalUnit):
-  """Logical unit for removing a node.
+    pol = self._DiagnoseByOS(node_list, node_data)
+    output = []
+    for os_name, os_data in pol.iteritems():
+      row = []
+      for field in self.op.output_fields:
+        if field == "name":
+          val = os_name
+        elif field == "valid":
+          val = utils.all([osl and osl[0] for osl in os_data.values()])
+        elif field == "node_status":
+          val = {}
+          for node_name, nos_list in os_data.iteritems():
+            val[node_name] = [(v.status, v.path) for v in nos_list]
+        else:
+          raise errors.ParameterError(field)
+        row.append(val)
+      output.append(row)
+
+    return output
+
+
+class LURemoveNode(LogicalUnit):
+  """Logical unit for removing a node.
 
   """
   HPATH = "node-remove"
@@ -1084,7 +1221,7 @@ class LURemoveNode(LogicalUnit):
     """Build hooks env.
 
     This doesn't run on the target node in the pre phase as a failed
     """Build hooks env.
 
     This doesn't run on the target node in the pre phase as a failed
-    node would not allows itself to run.
+    node would then be impossible to remove.
 
     """
     env = {
@@ -1138,13 +1275,13 @@ class LURemoveNode(LogicalUnit):
 
     rpc.call_node_leave_cluster(node.name)
 
-    ssh.SSHCall(node.name, 'root', "%s stop" % constants.NODE_INITD_SCRIPT)
-
     logger.Info("Removing node %s from config" % node.name)
 
     self.cfg.RemoveNode(node.name)
+    # Remove the node from the Ganeti Lock Manager
+    self.context.glm.remove(locking.LEVEL_NODE, node.name)
 
 
-    _RemoveHostFromEtcHosts(node.name)
+    utils.RemoveHostFromEtcHosts(node.name)
 
 
 class LUQueryNodes(NoHooksLU):
@@ -1159,13 +1296,16 @@ class LUQueryNodes(NoHooksLU):
     This checks that the fields required are valid output fields.
 
     """
-    self.dynamic_fields = frozenset(["dtotal", "dfree",
-                                     "mtotal", "mnode", "mfree",
-                                     "bootid"])
+    self.dynamic_fields = frozenset([
+      "dtotal", "dfree",
+      "mtotal", "mnode", "mfree",
+      "bootid",
+      "ctotal",
+      ])
 
     _CheckOutputFields(static=["name", "pinst_cnt", "sinst_cnt",
                                "pinst_list", "sinst_list",
 
+                               "pip", "sip", "tags"],
                        dynamic=self.dynamic_fields,
                        selected=self.op.output_fields)
 
@@ -1192,6 +1332,7 @@ class LUQueryNodes(NoHooksLU):
             "mfree": utils.TryConvert(int, nodeinfo['memory_free']),
             "dtotal": utils.TryConvert(int, nodeinfo['vg_size']),
             "dfree": utils.TryConvert(int, nodeinfo['vg_free']),
             "mfree": utils.TryConvert(int, nodeinfo['memory_free']),
             "dtotal": utils.TryConvert(int, nodeinfo['vg_size']),
             "dfree": utils.TryConvert(int, nodeinfo['vg_free']),
+            "ctotal": utils.TryConvert(int, nodeinfo['cpu_total']),
             "bootid": nodeinfo['bootid'],
             }
         else:
             "bootid": nodeinfo['bootid'],
             }
         else:
@@ -1235,6 +1376,8 @@ class LUQueryNodes(NoHooksLU):
           val = node.primary_ip
         elif field == "sip":
           val = node.secondary_ip
+        elif field == "tags":
+          val = list(node.GetTags())
         elif field in self.dynamic_fields:
           val = live_data[node.name].get(field, None)
         else:
@@ -1363,13 +1506,24 @@ class LUAddNode(LogicalUnit):
     if not utils.IsValidIP(secondary_ip):
       raise errors.OpPrereqError("Invalid secondary IP given")
     self.op.secondary_ip = secondary_ip
+
     node_list = cfg.GetNodeList()
-    if node in node_list:
-      raise errors.OpPrereqError("Node %s is already in the configuration"
-                                 % node)
+    if not self.op.readd and node in node_list:
+      raise errors.OpPrereqError("Node %s is already in the configuration" %
+                                 node)
+    elif self.op.readd and node not in node_list:
+      raise errors.OpPrereqError("Node %s is not in the configuration" % node)
 
     for existing_node_name in node_list:
       existing_node = cfg.GetNodeInfo(existing_node_name)
 
+      if self.op.readd and node == existing_node_name:
+        if (existing_node.primary_ip != primary_ip or
+            existing_node.secondary_ip != secondary_ip):
+          raise errors.OpPrereqError("Readded node doesn't have the same IP"
+                                     " address configuration as before")
+        continue
+
       if (existing_node.primary_ip == primary_ip or
           existing_node.secondary_ip == primary_ip or
           existing_node.primary_ip == secondary_ip or
@@ -1391,18 +1545,15 @@ class LUAddNode(LogicalUnit):
                                    " new node doesn't have one")
 
     # checks reachability
                                    " new node doesn't have one")
 
     # checks reachablity
-    if not utils.TcpPing(utils.HostInfo().name,
-                         primary_ip,
-                         constants.DEFAULT_NODED_PORT):
+    if not utils.TcpPing(primary_ip, constants.DEFAULT_NODED_PORT):
       raise errors.OpPrereqError("Node not reachable by ping")
 
     if not newbie_singlehomed:
       # check reachability from my secondary ip to newbie's secondary ip
       raise errors.OpPrereqError("Node not reachable by ping")
 
     if not newbie_singlehomed:
       # check reachability from my secondary ip to newbie's secondary ip
-      if not utils.TcpPing(myself.secondary_ip,
-                           secondary_ip,
-                           constants.DEFAULT_NODED_PORT):
-        raise errors.OpPrereqError(
-          "Node secondary ip not reachable by TCP based ping to noded port")
+      if not utils.TcpPing(secondary_ip, constants.DEFAULT_NODED_PORT,
+                           source=myself.secondary_ip):
+        raise errors.OpPrereqError("Node secondary ip not reachable by TCP"
+                                   " based ping to noded port")
 
     self.new_node = objects.Node(name=node,
                                  primary_ip=primary_ip,
@@ -1415,46 +1566,7 @@ class LUAddNode(LogicalUnit):
     new_node = self.new_node
     node = new_node.name
 
-    # set up inter-node password and certificate and restarts the node daemon
-    gntpass = self.sstore.GetNodeDaemonPassword()
-    if not re.match('^[a-zA-Z0-9.]{1,64}$', gntpass):
-      raise errors.OpExecError("ganeti password corruption detected")
-    f = open(constants.SSL_CERT_FILE)
-    try:
-      gntpem = f.read(8192)
-    finally:
-      f.close()
-    # in the base64 pem encoding, neither '!' nor '.' are valid chars,
-    # so we use this to detect an invalid certificate; as long as the
-    # cert doesn't contain this, the here-document will be correctly
-    # parsed by the shell sequence below
-    if re.search('^!EOF\.', gntpem, re.MULTILINE):
-      raise errors.OpExecError("invalid PEM encoding in the SSL certificate")
-    if not gntpem.endswith("\n"):
-      raise errors.OpExecError("PEM must end with newline")
-    logger.Info("copy cluster pass to %s and starting the node daemon" % node)
-
-    # and then connect with ssh to set password and start ganeti-noded
-    # note that all the below variables are sanitized at this point,
-    # either by being constants or by the checks above
-    ss = self.sstore
-    mycommand = ("umask 077 && "
-                 "echo '%s' > '%s' && "
-                 "cat > '%s' << '!EOF.' && \n"
-                 "%s!EOF.\n%s restart" %
-                 (gntpass, ss.KeyToFilename(ss.SS_NODED_PASS),
-                  constants.SSL_CERT_FILE, gntpem,
-                  constants.NODE_INITD_SCRIPT))
-
-    result = ssh.SSHCall(node, 'root', mycommand, batch=False, ask_key=True)
-    if result.failed:
-      raise errors.OpExecError("Remote command on node %s, error: %s,"
-                               " output: %s" %
-                               (node, result.fail_reason, result.output))
-
     # check connectivity
-    time.sleep(4)
-
     result = rpc.call_version([node])[node]
     if result:
       if constants.PROTOCOL_VERSION == result:
@@ -1489,10 +1601,7 @@ class LUAddNode(LogicalUnit):
       raise errors.OpExecError("Cannot transfer ssh keys to the new node")
 
     # Add node to our /etc/hosts, and add key to known_hosts
       raise errors.OpExecError("Cannot transfer ssh keys to the new node")
 
     # Add node to our /etc/hosts, and add key to known_hosts
-    _AddHostToEtcHosts(new_node.name)
-
-    _UpdateKnownHosts(new_node.name, new_node.primary_ip,
-                      self.cfg.GetHostKey())
+    utils.AddHostToEtcHosts(new_node.name)
 
     if new_node.secondary_ip != new_node.primary_ip:
       if not rpc.call_node_tcp_ping(new_node.name,
@@ -1500,40 +1609,57 @@ class LUAddNode(LogicalUnit):
                                     new_node.secondary_ip,
                                     constants.DEFAULT_NODED_PORT,
                                     10, False):
-        raise errors.OpExecError("Node claims it doesn't have the"
-                                 " secondary ip you gave (%s).\n"
-                                 "Please fix and re-run this command." %
-                                 new_node.secondary_ip)
-
-    success, msg = ssh.VerifyNodeHostname(node)
-    if not success:
-      raise errors.OpExecError("Node '%s' claims it has a different hostname"
-                               " than the one the resolver gives: %s.\n"
-                               "Please fix and re-run this command." %
-                               (node, msg))
+        raise errors.OpExecError("Node claims it doesn't have the secondary ip"
+                                 " you gave (%s). Please fix and re-run this"
+                                 " command." % new_node.secondary_ip)
+
+    node_verify_list = [self.sstore.GetMasterNode()]
+    node_verify_param = {
+      'nodelist': [node],
+      # TODO: do a node-net-test as well?
+    }
+
+    result = rpc.call_node_verify(node_verify_list, node_verify_param)
+    for verifier in node_verify_list:
+      if not result[verifier]:
+        raise errors.OpExecError("Cannot communicate with %s's node daemon"
+                                 " for remote verification" % verifier)
+      if result[verifier]['nodelist']:
+        for failed in result[verifier]['nodelist']:
+          feedback_fn("ssh/hostname verification failed %s -> %s" %
+                      (verifier, result[verifier]['nodelist'][failed]))
+        raise errors.OpExecError("ssh/hostname verification failed.")
 
     # Distribute updated /etc/hosts and known_hosts to all nodes,
     # including the node just added
     myself = self.cfg.GetNodeInfo(self.sstore.GetMasterNode())
-    dist_nodes = self.cfg.GetNodeList() + [node]
+    dist_nodes = self.cfg.GetNodeList()
+    if not self.op.readd:
+      dist_nodes.append(node)
     if myself.name in dist_nodes:
       dist_nodes.remove(myself.name)
 
     logger.Debug("Copying hosts and known_hosts to all nodes")
-    for fname in ("/etc/hosts", constants.SSH_KNOWN_HOSTS_FILE):
+    for fname in (constants.ETC_HOSTS, constants.SSH_KNOWN_HOSTS_FILE):
       result = rpc.call_upload_file(dist_nodes, fname)
       for to_node in dist_nodes:
         if not result[to_node]:
           logger.Error("copy of file %s to node %s failed" %
                        (fname, to_node))
 
-    to_copy = ss.GetFileList()
+    to_copy = self.sstore.GetFileList()
+    if self.sstore.GetHypervisorType() == constants.HT_XEN_HVM31:
+      to_copy.append(constants.VNC_PASSWORD_FILE)
     for fname in to_copy:
-      if not ssh.CopyFileToNode(node, fname):
+      result = rpc.call_upload_file([node], fname)
+      if not result[node]:
         logger.Error("could not copy file %s to node %s" % (fname, node))
 
         logger.Error("could not copy file %s to node %s" % (fname, node))
 
-    logger.Info("adding node %s to cluster.conf" % node)
-    self.cfg.AddNode(new_node)
+    if not self.op.readd:
+      logger.Info("adding node %s to cluster.conf" % node)
+      self.cfg.AddNode(new_node)
+      # Add the new node to the Ganeti Lock Manager
+      self.context.glm.add(locking.LEVEL_NODE, node)
 
 
 class LUMasterFailover(LogicalUnit):
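
The verification loop in the hunk above relies on a particular reply shape from rpc.call_node_verify: one entry per verifier, whose 'nodelist' value maps each node that failed the ssh/hostname check to an error message, an empty dict meaning success. A stand-alone sketch of that shape, with invented host names:

    result = {
      "master.example.com": {"nodelist": {"node9.example.com": "ssh failed"}},
    }
    for verifier, answer in result.items():
      for failed, msg in answer["nodelist"].items():
        print("ssh/hostname verification failed %s -> %s" % (verifier, msg))
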
@@ -1545,6 +1671,7 @@ class LUMasterFailover(LogicalUnit):
   HPATH = "master-failover"
   HTYPE = constants.HTYPE_CLUSTER
   REQ_MASTER = False
   HPATH = "master-failover"
   HTYPE = constants.HTYPE_CLUSTER
   REQ_MASTER = False
+  REQ_WSSTORE = True
   _OP_REQP = []
 
   def BuildHooksEnv(self):
@@ -1572,8 +1699,8 @@ class LUMasterFailover(LogicalUnit):
 
     if self.old_master == self.new_master:
       raise errors.OpPrereqError("This commands must be run on the node"
-                                 " where you want the new master to be.\n"
-                                 "%s is already the master" %
+                                 " where you want the new master to be."
+                                 " %s is already the master" %
                                  self.old_master)
 
   def Exec(self, feedback_fn):
@@ -1602,8 +1729,8 @@ class LUMasterFailover(LogicalUnit):
     if not rpc.call_node_start_master(self.new_master):
       logger.Error("could not start the master role on the new master"
                    " %s, please check" % self.new_master)
-      feedback_fn("Error in activating the master IP on the new master,\n"
-                  "please fix manually.")
+      feedback_fn("Error in activating the master IP on the new master,"
+                  " please fix manually.")
 
 
 
@@ -1633,50 +1760,12 @@ class LUQueryClusterInfo(NoHooksLU):
       "export_version": constants.EXPORT_VERSION,
       "master": self.sstore.GetMasterNode(),
       "architecture": (platform.architecture()[0], platform.machine()),
       "export_version": constants.EXPORT_VERSION,
       "master": self.sstore.GetMasterNode(),
       "architecture": (platform.architecture()[0], platform.machine()),
+      "hypervisor_type": self.sstore.GetHypervisorType(),
       }
 
     return result
 
 
-class LUClusterCopyFile(NoHooksLU):
-  """Copy file to cluster.
-
-  """
-  _OP_REQP = ["nodes", "filename"]
-
-  def CheckPrereq(self):
-    """Check prerequisites.
-
-    It should check that the named file exists and that the given list
-    of nodes is valid.
-
-    """
-    if not os.path.exists(self.op.filename):
-      raise errors.OpPrereqError("No such filename '%s'" % self.op.filename)
-
-    self.nodes = _GetWantedNodes(self, self.op.nodes)
-
-  def Exec(self, feedback_fn):
-    """Copy a file from master to some nodes.
-
-    Args:
-      opts - class with options as members
-      args - list containing a single element, the file name
-    Opts used:
-      nodes - list containing the name of target nodes; if empty, all nodes
-
-    """
-    filename = self.op.filename
-
-    myname = utils.HostInfo().name
-
-    for node in self.nodes:
-      if node == myname:
-        continue
-      if not ssh.CopyFileToNode(node, filename):
-        logger.Error("Copy of file %s to node %s failed" % (filename, node))
-
-
 class LUDumpClusterConfig(NoHooksLU):
   """Return a text-representation of the cluster-config.
 
@@ -1696,32 +1785,6 @@ class LUDumpClusterConfig(NoHooksLU):
     return self.cfg.DumpConfig()
 
 
-class LURunClusterCommand(NoHooksLU):
-  """Run a command on some nodes.
-
-  """
-  _OP_REQP = ["command", "nodes"]
-
-  def CheckPrereq(self):
-    """Check prerequisites.
-
-    It checks that the given list of nodes is valid.
-
-    """
-    self.nodes = _GetWantedNodes(self, self.op.nodes)
-
-  def Exec(self, feedback_fn):
-    """Run a command on some nodes.
-
-    """
-    data = []
-    for node in self.nodes:
-      result = ssh.SSHCall(node, "root", self.op.command)
-      data.append((node, result.output, result.exit_code))
-
-    return data
-
-
 class LUActivateInstanceDisks(NoHooksLU):
   """Bring up an instance's disks.
 
@@ -1770,22 +1833,41 @@ def _AssembleInstanceDisks(instance, cfg, ignore_secondaries=False):
   """
   device_info = []
   disks_ok = True
   """
   device_info = []
   disks_ok = True
+  iname = instance.name
+  # With the two-pass mechanism we try to reduce the window of
+  # opportunity for the race condition of switching DRBD to primary
+  # before handshaking has occurred, but we do not eliminate it
+
+  # The proper fix would be to wait (with some limits) until the
+  # connection has been made and drbd transitions from WFConnection
+  # into any other network-connected state (Connected, SyncTarget,
+  # SyncSource, etc.)
+
+  # 1st pass, assemble on all nodes in secondary mode
   for inst_disk in instance.disks:
-    master_result = None
     for node, node_disk in inst_disk.ComputeNodeTree(instance.primary_node):
       cfg.SetDiskID(node_disk, node)
-      is_primary = node == instance.primary_node
-      result = rpc.call_blockdev_assemble(node, node_disk,
-                                          instance.name, is_primary)
+      result = rpc.call_blockdev_assemble(node, node_disk, iname, False)
       if not result:
-        logger.Error("could not prepare block device %s on node %s (is_pri"
-                     "mary=%s)" % (inst_disk.iv_name, node, is_primary))
-        if is_primary or not ignore_secondaries:
+        logger.Error("could not prepare block device %s on node %s"
+                     " (is_primary=False, pass=1)" % (inst_disk.iv_name, node))
+        if not ignore_secondaries:
           disks_ok = False
-      if is_primary:
-        master_result = result
-    device_info.append((instance.primary_node, inst_disk.iv_name,
-                        master_result))
+
+  # FIXME: race condition on drbd migration to primary
+
+  # 2nd pass, do only the primary node
+  for inst_disk in instance.disks:
+    for node, node_disk in inst_disk.ComputeNodeTree(instance.primary_node):
+      if node != instance.primary_node:
+        continue
+      cfg.SetDiskID(node_disk, node)
+      result = rpc.call_blockdev_assemble(node, node_disk, iname, True)
+      if not result:
+        logger.Error("could not prepare block device %s on node %s"
+                     " (is_primary=True, pass=2)" % (inst_disk.iv_name, node))
+        disks_ok = False
+    device_info.append((instance.primary_node, inst_disk.iv_name, result))
 
   # leave the disks configured for the primary node
   # this is a workaround that would be fixed better by
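
The comments in this hunk also name the proper fix: before switching to primary, wait until the DRBD device has left WFConnection for a network-connected state. A minimal stand-alone sketch of such a bounded wait, assuming a hypothetical get_state() callable that reports the device's current connection state as a string:

    import time

    def wait_for_drbd_connection(get_state, timeout=60, step=2):
      # Poll until the device reports any network-connected state
      # (Connected, SyncSource, SyncTarget, ...) or the limit expires.
      deadline = time.time() + timeout
      while time.time() < deadline:
        state = get_state()
        if state != "WFConnection":
          return state
        time.sleep(step)
      return "WFConnection"  # still waiting; the caller decides what to do
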
@@ -1868,6 +1950,36 @@ def _ShutdownInstanceDisks(instance, cfg, ignore_primary=False):
   return result
 
 
+def _CheckNodeFreeMemory(cfg, node, reason, requested):
+  """Checks if a node has enough free memory.
+
+  This function checks if a given node has the needed amount of free
+  memory. In case the node has less memory or we cannot get the
+  information from the node, this function raises an OpPrereqError
+  exception.
+
+  Args:
+    - cfg: a ConfigWriter instance
+    - node: the node name
+    - reason: string to use in the error message
+    - requested: the amount of memory in MiB
+
+  """
+  nodeinfo = rpc.call_node_info([node], cfg.GetVGName())
+  if not nodeinfo or not isinstance(nodeinfo, dict):
+    raise errors.OpPrereqError("Could not contact node %s for resource"
+                             " information" % (node,))
+
+  free_mem = nodeinfo[node].get('memory_free')
+  if not isinstance(free_mem, int):
+    raise errors.OpPrereqError("Can't compute free memory on node %s, result"
+                             " was '%s'" % (node, free_mem))
+  if requested > free_mem:
+    raise errors.OpPrereqError("Not enough memory on node %s for %s:"
+                             " needed %s MiB, available %s MiB" %
+                             (node, reason, requested, free_mem))
+
+
 class LUStartupInstance(LogicalUnit):
   """Starts an instance.
 
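
_CheckNodeFreeMemory deliberately treats a missing or malformed RPC answer as a failed prerequisite instead of letting a KeyError escape. The same validation pattern as a stand-alone toy, with an invented nodeinfo dict:

    def check_free_memory(nodeinfo, node, requested):
      info = nodeinfo.get(node) if isinstance(nodeinfo, dict) else None
      free = info.get("memory_free") if isinstance(info, dict) else None
      if not isinstance(free, int):
        raise ValueError("can't determine free memory on %s" % node)
      if requested > free:
        raise ValueError("need %d MiB on %s, only %d MiB free" %
                         (requested, node, free))

    check_free_memory({"node1": {"memory_free": 4096}}, "node1", 2048)  # ok
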
@@ -1905,6 +2017,10 @@ class LUStartupInstance(LogicalUnit):
     # check bridges existance
     _CheckInstanceBridgesExist(instance)
 
+    _CheckNodeFreeMemory(self.cfg, instance.primary_node,
+                         "starting instance %s" % instance.name,
+                         instance.memory)
+
     self.instance = instance
     self.op.instance_name = instance.name
 
@@ -1916,21 +2032,9 @@ class LUStartupInstance(LogicalUnit):
     force = self.op.force
     extra_args = getattr(self.op, "extra_args", "")
 
-    node_current = instance.primary_node
-
-    nodeinfo = rpc.call_node_info([node_current], self.cfg.GetVGName())
-    if not nodeinfo:
-      raise errors.OpExecError("Could not contact node %s for infos" %
-                               (node_current))
+    self.cfg.MarkInstanceUp(instance.name)
 
-    freememory = nodeinfo[node_current]['memory_free']
-    memory = instance.memory
-    if memory > freememory:
-      raise errors.OpExecError("Not enough memory to start instance"
-                               " %s on node %s"
-                               " needed %s MiB, available %s MiB" %
-                               (instance.name, node_current, memory,
-                                freememory))
+    node_current = instance.primary_node
 
     _StartInstanceDisks(self.cfg, instance, force)
 
@@ -1938,8 +2042,6 @@ class LUStartupInstance(LogicalUnit):
       _ShutdownInstanceDisks(instance, self.cfg)
       raise errors.OpExecError("Could not start instance")
 
-    self.cfg.MarkInstanceUp(instance.name)
-
 
 class LURebootInstance(LogicalUnit):
   """Reboot an instance.
@@ -2055,10 +2157,10 @@ class LUShutdownInstance(LogicalUnit):
     """
     instance = self.instance
     node_current = instance.primary_node
     """
     instance = self.instance
     node_current = instance.primary_node
+    self.cfg.MarkInstanceDown(instance.name)
     if not rpc.call_instance_shutdown(node_current, instance):
       logger.Error("could not shutdown instance")
 
-    self.cfg.MarkInstanceDown(instance.name)
     _ShutdownInstanceDisks(instance, self.cfg)
 
 
@@ -2134,8 +2236,8 @@ class LUReinstallInstance(LogicalUnit):
     try:
       feedback_fn("Running the instance OS create scripts...")
       if not rpc.call_instance_os_add(inst.primary_node, inst, "sda", "sdb"):
-        raise errors.OpExecError("Could not install OS for instance %s "
-                                 "on node %s" %
+        raise errors.OpExecError("Could not install OS for instance %s"
+                                 " on node %s" %
                                  (inst.name, inst.primary_node))
     finally:
       _ShutdownInstanceDisks(inst, self.cfg)
@@ -2186,10 +2288,13 @@ class LURenameInstance(LogicalUnit):
     name_info = utils.HostInfo(self.op.new_name)
 
     self.op.new_name = new_name = name_info.name
+    instance_list = self.cfg.GetInstanceList()
+    if new_name in instance_list:
+      raise errors.OpPrereqError("Instance '%s' is already in the cluster" %
+                                 new_name)
+
     if not getattr(self.op, "ignore_ip", False):
     if not getattr(self.op, "ignore_ip", False):
-      command = ["fping", "-q", name_info.ip]
-      result = utils.RunCmd(command)
-      if not result.failed:
+      if utils.TcpPing(name_info.ip, constants.DEFAULT_NODED_PORT):
         raise errors.OpPrereqError("IP %s of instance %s already in use" %
                                    (name_info.ip, new_name))
 
         raise errors.OpPrereqError("IP %s of instance %s already in use" %
                                    (name_info.ip, new_name))
 
@@ -2201,18 +2306,39 @@ class LURenameInstance(LogicalUnit):
     inst = self.instance
     old_name = inst.name
 
+    if inst.disk_template == constants.DT_FILE:
+      old_file_storage_dir = os.path.dirname(inst.disks[0].logical_id[1])
+
     self.cfg.RenameInstance(inst.name, self.op.new_name)
 
     # re-read the instance from the configuration after rename
     inst = self.cfg.GetInstanceInfo(self.op.new_name)
 
+    if inst.disk_template == constants.DT_FILE:
+      new_file_storage_dir = os.path.dirname(inst.disks[0].logical_id[1])
+      result = rpc.call_file_storage_dir_rename(inst.primary_node,
+                                                old_file_storage_dir,
+                                                new_file_storage_dir)
+
+      if not result:
+        raise errors.OpExecError("Could not connect to node '%s' to rename"
+                                 " directory '%s' to '%s' (but the instance"
+                                 " has been renamed in Ganeti)" % (
+                                 inst.primary_node, old_file_storage_dir,
+                                 new_file_storage_dir))
+
+      if not result[0]:
+        raise errors.OpExecError("Could not rename directory '%s' to '%s'"
+                                 " (but the instance has been renamed in"
+                                 " Ganeti)" % (old_file_storage_dir,
+                                               new_file_storage_dir))
+
     _StartInstanceDisks(self.cfg, inst, None)
     try:
       if not rpc.call_instance_run_rename(inst.primary_node, inst, old_name,
                                           "sda", "sdb"):
-        msg = ("Could run OS rename script for instance %s\n"
-               "on node %s\n"
-               "(but the instance has been renamed in Ganeti)" %
+        msg = ("Could run OS rename script for instance %s on node %s (but the"
+               " instance has been renamed in Ganeti)" %
                (inst.name, inst.primary_node))
         logger.Error(msg)
     finally:
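
The file-storage branch added in this hunk checks the rename RPC twice: a false result means the node could not be contacted at all, and a false result[0] means the node answered but the directory rename itself failed. A stand-alone illustration of that two-level convention (the answer value is invented):

    answer = [False]  # node reached, but the remote rename failed
    if not answer:
      print("could not connect to the node")
    elif not answer[0]:
      print("node reached, but the directory rename failed")
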
@@ -2225,7 +2351,7 @@ class LURemoveInstance(LogicalUnit):
   """
   HPATH = "instance-remove"
   HTYPE = constants.HTYPE_INSTANCE
   """
   HPATH = "instance-remove"
   HTYPE = constants.HTYPE_INSTANCE
-  _OP_REQP = ["instance_name"]
+  _OP_REQP = ["instance_name", "ignore_failures"]
 
   def BuildHooksEnv(self):
     """Build hooks env.
@@ -2276,6 +2402,8 @@ class LURemoveInstance(LogicalUnit):
     logger.Info("removing instance %s out of cluster config" % instance.name)
 
     self.cfg.RemoveInstance(instance.name)
     logger.Info("removing instance %s out of cluster config" % instance.name)
 
     self.cfg.RemoveInstance(instance.name)
+    # Remove the instance from the Ganeti Lock Manager
+    self.context.glm.remove(locking.LEVEL_INSTANCE, instance.name)
 
 
 class LUQueryInstances(NoHooksLU):
@@ -2290,11 +2418,11 @@ class LUQueryInstances(NoHooksLU):
     This checks that the fields required are valid output fields.
 
     """
-    self.dynamic_fields = frozenset(["oper_state", "oper_ram"])
+    self.dynamic_fields = frozenset(["oper_state", "oper_ram", "status"])
     _CheckOutputFields(static=["name", "os", "pnode", "snodes",
                                "admin_state", "admin_ram",
                                "disk_template", "ip", "mac", "bridge",
     _CheckOutputFields(static=["name", "os", "pnode", "snodes",
                                "admin_state", "admin_ram",
                                "disk_template", "ip", "mac", "bridge",
-                               "sda_size", "sdb_size"],
+                               "sda_size", "sdb_size", "vcpus", "tags"],
                        dynamic=self.dynamic_fields,
                        selected=self.op.output_fields)
 
@@ -2347,6 +2475,21 @@ class LUQueryInstances(NoHooksLU):
             val = None
           else:
             val = bool(live_data.get(instance.name))
+        elif field == "status":
+          if instance.primary_node in bad_nodes:
+            val = "ERROR_nodedown"
+          else:
+            running = bool(live_data.get(instance.name))
+            if running:
+              if instance.status != "down":
+                val = "running"
+              else:
+                val = "ERROR_up"
+            else:
+              if instance.status != "down":
+                val = "ERROR_down"
+              else:
+                val = "ADMIN_down"
         elif field == "admin_ram":
           val = instance.memory
         elif field == "oper_ram":
         elif field == "admin_ram":
           val = instance.memory
         elif field == "oper_ram":
@@ -2370,6 +2513,10 @@ class LUQueryInstances(NoHooksLU):
             val = None
           else:
             val = disk.size
+        elif field == "vcpus":
+          val = instance.vcpus
+        elif field == "tags":
+          val = list(instance.GetTags())
         else:
           raise errors.ParameterError(field)
         iout.append(val)
@@ -2418,20 +2565,12 @@ class LUFailoverInstance(LogicalUnit):
     secondary_nodes = instance.secondary_nodes
     if not secondary_nodes:
       raise errors.ProgrammerError("no secondary node but using "
-                                   "DT_REMOTE_RAID1 template")
+                                   "a mirrored disk template")
 
-    # check memory requirements on the secondary node
     target_node = secondary_nodes[0]
-    nodeinfo = rpc.call_node_info([target_node], self.cfg.GetVGName())
-    info = nodeinfo.get(target_node, None)
-    if not info:
-      raise errors.OpPrereqError("Cannot get current information"
-                                 " from node '%s'" % nodeinfo)
-    if instance.memory > info['memory_free']:
-      raise errors.OpPrereqError("Not enough memory on target node %s."
-                                 " %d MB available, %d MB required" %
-                                 (target_node, info['memory_free'],
-                                  instance.memory))
+    # check memory requirements on the secondary node
+    _CheckNodeFreeMemory(self.cfg, target_node, "failing over instance %s" %
+                         instance.name, instance.memory)
 
     # check bridge existance
     brlist = [nic.bridge for nic in instance.nics]
@@ -2456,27 +2595,12 @@ class LUFailoverInstance(LogicalUnit):
 
     feedback_fn("* checking disk consistency between source and target")
     for dev in instance.disks:
-      # for remote_raid1, these are md over drbd
+      # for drbd, these are drbd over lvm
       if not _CheckDiskConsistency(self.cfg, dev, target_node, False):
-        if not self.op.ignore_consistency:
+        if instance.status == "up" and not self.op.ignore_consistency:
           raise errors.OpExecError("Disk %s is degraded on target node,"
                                    " aborting failover." % dev.iv_name)
 
           raise errors.OpExecError("Disk %s is degraded on target node,"
                                    " aborting failover." % dev.iv_name)
 
-    feedback_fn("* checking target node resource availability")
-    nodeinfo = rpc.call_node_info([target_node], self.cfg.GetVGName())
-
-    if not nodeinfo:
-      raise errors.OpExecError("Could not contact target node %s." %
-                               target_node)
-
-    free_memory = int(nodeinfo[target_node]['memory_free'])
-    memory = instance.memory
-    if memory > free_memory:
-      raise errors.OpExecError("Not enough memory to create instance %s on"
-                               " node %s. needed %s MiB, available %s MiB" %
-                               (instance.name, target_node, memory,
-                                free_memory))
-
     feedback_fn("* shutting down instance on source node")
     logger.Info("Shutting down instance %s on node %s" %
                 (instance.name, source_node))
     feedback_fn("* shutting down instance on source node")
     logger.Info("Shutting down instance %s on node %s" %
                 (instance.name, source_node))
@@ -2496,23 +2620,25 @@ class LUFailoverInstance(LogicalUnit):
 
     instance.primary_node = target_node
     # distribute new instance config to the other nodes
-    self.cfg.AddInstance(instance)
+    self.cfg.Update(instance)
 
-    feedback_fn("* activating the instance's disks on target node")
-    logger.Info("Starting instance %s on node %s" %
-                (instance.name, target_node))
+    # Only start the instance if it's marked as up
+    if instance.status == "up":
+      feedback_fn("* activating the instance's disks on target node")
+      logger.Info("Starting instance %s on node %s" %
+                  (instance.name, target_node))
 
-    disks_ok, dummy = _AssembleInstanceDisks(instance, self.cfg,
-                                             ignore_secondaries=True)
-    if not disks_ok:
-      _ShutdownInstanceDisks(instance, self.cfg)
-      raise errors.OpExecError("Can't activate the instance's disks")
+      disks_ok, dummy = _AssembleInstanceDisks(instance, self.cfg,
+                                               ignore_secondaries=True)
+      if not disks_ok:
+        _ShutdownInstanceDisks(instance, self.cfg)
+        raise errors.OpExecError("Can't activate the instance's disks")
 
-    feedback_fn("* starting the instance on the target node")
-    if not rpc.call_instance_start(target_node, instance, None):
-      _ShutdownInstanceDisks(instance, self.cfg)
-      raise errors.OpExecError("Could not start instance %s on node %s." %
-                               (instance.name, target_node))
+      feedback_fn("* starting the instance on the target node")
+      if not rpc.call_instance_start(target_node, instance, None):
+        _ShutdownInstanceDisks(instance, self.cfg)
+        raise errors.OpExecError("Could not start instance %s on node %s." %
+                                 (instance.name, target_node))
 
 
 def _CreateBlockDevOnPrimary(cfg, node, instance, device, info):
@@ -2578,22 +2704,6 @@ def _GenerateUniqueNames(cfg, exts):
   return results
 
 
-def _GenerateMDDRBDBranch(cfg, primary, secondary, size, names):
-  """Generate a drbd device complete with its children.
-
-  """
-  port = cfg.AllocatePort()
-  vgname = cfg.GetVGName()
-  dev_data = objects.Disk(dev_type=constants.LD_LV, size=size,
-                          logical_id=(vgname, names[0]))
-  dev_meta = objects.Disk(dev_type=constants.LD_LV, size=128,
-                          logical_id=(vgname, names[1]))
-  drbd_dev = objects.Disk(dev_type=constants.LD_DRBD7, size=size,
-                          logical_id = (primary, secondary, port),
-                          children = [dev_data, dev_meta])
-  return drbd_dev
-
-
 def _GenerateDRBD8Branch(cfg, primary, secondary, size, names, iv_name):
   """Generate a drbd8 device complete with its children.
 
@@ -2610,18 +2720,20 @@ def _GenerateDRBD8Branch(cfg, primary, secondary, size, names, iv_name):
                           iv_name=iv_name)
   return drbd_dev
 
+
 def _GenerateDiskTemplate(cfg, template_name,
                           instance_name, primary_node,
-                          secondary_nodes, disk_sz, swap_sz):
+                          secondary_nodes, disk_sz, swap_sz,
+                          file_storage_dir, file_driver):
   """Generate the entire disk layout for a given template type.
 
   """
   #TODO: compute space requirements
 
   vgname = cfg.GetVGName()
   """Generate the entire disk layout for a given template type.
 
   """
   #TODO: compute space requirements
 
   vgname = cfg.GetVGName()
-  if template_name == "diskless":
+  if template_name == constants.DT_DISKLESS:
     disks = []
-  elif template_name == "plain":
+  elif template_name == constants.DT_PLAIN:
     if len(secondary_nodes) != 0:
       raise errors.ProgrammerError("Wrong template configuration")
 
@@ -2633,43 +2745,6 @@ def _GenerateDiskTemplate(cfg, template_name,
                            logical_id=(vgname, names[1]),
                            iv_name = "sdb")
     disks = [sda_dev, sdb_dev]
-  elif template_name == "local_raid1":
-    if len(secondary_nodes) != 0:
-      raise errors.ProgrammerError("Wrong template configuration")
-
-
-    names = _GenerateUniqueNames(cfg, [".sda_m1", ".sda_m2",
-                                       ".sdb_m1", ".sdb_m2"])
-    sda_dev_m1 = objects.Disk(dev_type=constants.LD_LV, size=disk_sz,
-                              logical_id=(vgname, names[0]))
-    sda_dev_m2 = objects.Disk(dev_type=constants.LD_LV, size=disk_sz,
-                              logical_id=(vgname, names[1]))
-    md_sda_dev = objects.Disk(dev_type=constants.LD_MD_R1, iv_name = "sda",
-                              size=disk_sz,
-                              children = [sda_dev_m1, sda_dev_m2])
-    sdb_dev_m1 = objects.Disk(dev_type=constants.LD_LV, size=swap_sz,
-                              logical_id=(vgname, names[2]))
-    sdb_dev_m2 = objects.Disk(dev_type=constants.LD_LV, size=swap_sz,
-                              logical_id=(vgname, names[3]))
-    md_sdb_dev = objects.Disk(dev_type=constants.LD_MD_R1, iv_name = "sdb",
-                              size=swap_sz,
-                              children = [sdb_dev_m1, sdb_dev_m2])
-    disks = [md_sda_dev, md_sdb_dev]
-  elif template_name == constants.DT_REMOTE_RAID1:
-    if len(secondary_nodes) != 1:
-      raise errors.ProgrammerError("Wrong template configuration")
-    remote_node = secondary_nodes[0]
-    names = _GenerateUniqueNames(cfg, [".sda_data", ".sda_meta",
-                                       ".sdb_data", ".sdb_meta"])
-    drbd_sda_dev = _GenerateMDDRBDBranch(cfg, primary_node, remote_node,
-                                         disk_sz, names[0:2])
-    md_sda_dev = objects.Disk(dev_type=constants.LD_MD_R1, iv_name="sda",
-                              children = [drbd_sda_dev], size=disk_sz)
-    drbd_sdb_dev = _GenerateMDDRBDBranch(cfg, primary_node, remote_node,
-                                         swap_sz, names[2:4])
-    md_sdb_dev = objects.Disk(dev_type=constants.LD_MD_R1, iv_name="sdb",
-                              children = [drbd_sdb_dev], size=swap_sz)
-    disks = [md_sda_dev, md_sdb_dev]
   elif template_name == constants.DT_DRBD8:
     if len(secondary_nodes) != 1:
       raise errors.ProgrammerError("Wrong template configuration")
@@ -2681,6 +2756,17 @@ def _GenerateDiskTemplate(cfg, template_name,
     drbd_sdb_dev = _GenerateDRBD8Branch(cfg, primary_node, remote_node,
                                          swap_sz, names[2:4], "sdb")
     disks = [drbd_sda_dev, drbd_sdb_dev]
+  elif template_name == constants.DT_FILE:
+    if len(secondary_nodes) != 0:
+      raise errors.ProgrammerError("Wrong template configuration")
+
+    file_sda_dev = objects.Disk(dev_type=constants.LD_FILE, size=disk_sz,
+                                iv_name="sda", logical_id=(file_driver,
+                                "%s/sda" % file_storage_dir))
+    file_sdb_dev = objects.Disk(dev_type=constants.LD_FILE, size=swap_sz,
+                                iv_name="sdb", logical_id=(file_driver,
+                                "%s/sdb" % file_storage_dir))
+    disks = [file_sda_dev, file_sdb_dev]
   else:
     raise errors.ProgrammerError("Invalid disk template '%s'" % template_name)
   return disks
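
The new DT_FILE branch encodes the file driver and the full path into each disk's logical_id; other parts of this change (_CreateDisks, _RemoveDisks, LURenameInstance) later recover the storage directory from it with os.path.dirname. An illustration with invented paths:

    import os

    file_driver = "loop"
    file_storage_dir = "/srv/ganeti/file-storage/web1.example.com"
    sda_logical_id = (file_driver, "%s/sda" % file_storage_dir)
    assert os.path.dirname(sda_logical_id[1]) == file_storage_dir
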
@@ -2707,9 +2793,22 @@ def _CreateDisks(cfg, instance):
   """
   info = _GetInstanceInfoText(instance)
 
   """
   info = _GetInstanceInfoText(instance)
 
+  if instance.disk_template == constants.DT_FILE:
+    file_storage_dir = os.path.dirname(instance.disks[0].logical_id[1])
+    result = rpc.call_file_storage_dir_create(instance.primary_node,
+                                              file_storage_dir)
+
+    if not result:
+      logger.Error("Could not connect to node '%s'" % instance.primary_node)
+      return False
+
+    if not result[0]:
+      logger.Error("failed to create directory '%s'" % file_storage_dir)
+      return False
+
   for device in instance.disks:
     logger.Info("creating volume %s for instance %s" %
-              (device.iv_name, instance.name))
+                (device.iv_name, instance.name))
     #HARDCODE
     for secondary_node in instance.secondary_nodes:
       if not _CreateBlockDevOnSecondary(cfg, secondary_node, instance,
@@ -2723,6 +2822,7 @@ def _CreateDisks(cfg, instance):
       logger.Error("failed to create volume %s on primary!" %
                    device.iv_name)
       return False
       logger.Error("failed to create volume %s on primary!" %
                    device.iv_name)
       return False
+
   return True
 
 
@@ -2752,18 +2852,86 @@ def _RemoveDisks(instance, cfg):
                      " continuing anyway" %
                      (device.iv_name, node))
         result = False
                      " continuing anyway" %
                      (device.iv_name, node))
         result = False
+
+  if instance.disk_template == constants.DT_FILE:
+    file_storage_dir = os.path.dirname(instance.disks[0].logical_id[1])
+    if not rpc.call_file_storage_dir_remove(instance.primary_node,
+                                            file_storage_dir):
+      logger.Error("could not remove directory '%s'" % file_storage_dir)
+      result = False
+
   return result
 
 
+def _ComputeDiskSize(disk_template, disk_size, swap_size):
+  """Compute disk size requirements in the volume group
+
+  This is currently hard-coded for the two-drive layout.
+
+  """
+  # Required free disk space as a function of disk and swap space
+  req_size_dict = {
+    constants.DT_DISKLESS: None,
+    constants.DT_PLAIN: disk_size + swap_size,
+    # 256 MB are added for drbd metadata, 128MB for each drbd device
+    constants.DT_DRBD8: disk_size + swap_size + 256,
+    constants.DT_FILE: None,
+  }
+
+  if disk_template not in req_size_dict:
+    raise errors.ProgrammerError("Disk template '%s' size requirement"
+                                 " is unknown" %  disk_template)
+
+  return req_size_dict[disk_template]
+
+
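
A worked example for the helper above (sizes invented): DRBD8 adds 256 MiB on top of disk plus swap for the metadata volumes, while the diskless and file-backed templates need no volume group space and return None:

    assert _ComputeDiskSize(constants.DT_PLAIN, 10240, 4096) == 14336
    assert _ComputeDiskSize(constants.DT_DRBD8, 10240, 4096) == 14592
    assert _ComputeDiskSize(constants.DT_FILE, 10240, 4096) is None
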
 class LUCreateInstance(LogicalUnit):
   """Create an instance.
 
   """
   HPATH = "instance-add"
   HTYPE = constants.HTYPE_INSTANCE
-  _OP_REQP = ["instance_name", "mem_size", "disk_size", "pnode",
+  _OP_REQP = ["instance_name", "mem_size", "disk_size",
               "disk_template", "swap_size", "mode", "start", "vcpus",
               "disk_template", "swap_size", "mode", "start", "vcpus",
-              "wait_for_sync", "ip_check"]
+              "wait_for_sync", "ip_check", "mac"]
+
+  def _RunAllocator(self):
+    """Run the allocator based on input opcode.
+
+    """
+    disks = [{"size": self.op.disk_size, "mode": "w"},
+             {"size": self.op.swap_size, "mode": "w"}]
+    nics = [{"mac": self.op.mac, "ip": getattr(self.op, "ip", None),
+             "bridge": self.op.bridge}]
+    ial = IAllocator(self.cfg, self.sstore,
+                     mode=constants.IALLOCATOR_MODE_ALLOC,
+                     name=self.op.instance_name,
+                     disk_template=self.op.disk_template,
+                     tags=[],
+                     os=self.op.os_type,
+                     vcpus=self.op.vcpus,
+                     mem_size=self.op.mem_size,
+                     disks=disks,
+                     nics=nics,
+                     )
+
+    ial.Run(self.op.iallocator)
+
+    if not ial.success:
+      raise errors.OpPrereqError("Can't compute nodes using"
+                                 " iallocator '%s': %s" % (self.op.iallocator,
+                                                           ial.info))
+    if len(ial.nodes) != ial.required_nodes:
+      raise errors.OpPrereqError("iallocator '%s' returned invalid number"
+                                 " of nodes (%s), required %s" %
+                                 (len(ial.nodes), ial.required_nodes))
+    self.op.pnode = ial.nodes[0]
+    logger.ToStdout("Selected nodes for the instance: %s" %
+                    (", ".join(ial.nodes),))
+    logger.Info("Selected nodes for instance %s via iallocator %s: %s" %
+                (self.op.instance_name, self.op.iallocator, ial.nodes))
+    if ial.required_nodes == 2:
+      self.op.snode = ial.nodes[1]
 
   def BuildHooksEnv(self):
     """Build hooks env.
@@ -2789,7 +2957,7 @@ class LUCreateInstance(LogicalUnit):
       os_type=self.op.os_type,
       memory=self.op.mem_size,
       vcpus=self.op.vcpus,
-      nics=[(self.inst_ip, self.op.bridge)],
+      nics=[(self.inst_ip, self.op.bridge, self.op.mac)],
     ))
 
     nl = ([self.sstore.GetMasterNode(), self.op.pnode] +
@@ -2801,11 +2969,23 @@ class LUCreateInstance(LogicalUnit):
     """Check prerequisites.
 
     """
     """Check prerequisites.
 
     """
+    # set optional parameters to none if they don't exist
+    for attr in ["kernel_path", "initrd_path", "hvm_boot_order", "pnode",
+                 "iallocator", "hvm_acpi", "hvm_pae", "hvm_cdrom_image_path",
+                 "vnc_bind_address"]:
+      if not hasattr(self.op, attr):
+        setattr(self.op, attr, None)
+
     if self.op.mode not in (constants.INSTANCE_CREATE,
                             constants.INSTANCE_IMPORT):
       raise errors.OpPrereqError("Invalid instance creation mode '%s'" %
                                  self.op.mode)
 
+    if (not self.cfg.GetVGName() and
+        self.op.disk_template not in constants.DTS_NOT_LVM):
+      raise errors.OpPrereqError("Cluster does not support lvm-based"
+                                 " instances")
+
     if self.op.mode == constants.INSTANCE_IMPORT:
       src_node = getattr(self.op, "src_node", None)
       src_path = getattr(self.op, "src_path", None)
@@ -2846,69 +3026,13 @@ class LUCreateInstance(LogicalUnit):
       if getattr(self.op, "os_type", None) is None:
         raise errors.OpPrereqError("No guest OS specified")
 
       if getattr(self.op, "os_type", None) is None:
         raise errors.OpPrereqError("No guest OS specified")
 
-    # check primary node
-    pnode = self.cfg.GetNodeInfo(self.cfg.ExpandNodeName(self.op.pnode))
-    if pnode is None:
-      raise errors.OpPrereqError("Primary node '%s' is unknown" %
-                                 self.op.pnode)
-    self.op.pnode = pnode.name
-    self.pnode = pnode
-    self.secondaries = []
+    #### instance parameters check
+
     # disk template and mirror node verification
     if self.op.disk_template not in constants.DISK_TEMPLATES:
       raise errors.OpPrereqError("Invalid disk template name")
 
-    if self.op.disk_template in constants.DTS_NET_MIRROR:
-      if getattr(self.op, "snode", None) is None:
-        raise errors.OpPrereqError("The networked disk templates need"
-                                   " a mirror node")
-
-      snode_name = self.cfg.ExpandNodeName(self.op.snode)
-      if snode_name is None:
-        raise errors.OpPrereqError("Unknown secondary node '%s'" %
-                                   self.op.snode)
-      elif snode_name == pnode.name:
-        raise errors.OpPrereqError("The secondary node cannot be"
-                                   " the primary node.")
-      self.secondaries.append(snode_name)
-
-    # Check lv size requirements
-    nodenames = [pnode.name] + self.secondaries
-    nodeinfo = rpc.call_node_info(nodenames, self.cfg.GetVGName())
-
-    # Required free disk space as a function of disk and swap space
-    req_size_dict = {
-      constants.DT_DISKLESS: 0,
-      constants.DT_PLAIN: self.op.disk_size + self.op.swap_size,
-      constants.DT_LOCAL_RAID1: (self.op.disk_size + self.op.swap_size) * 2,
-      # 256 MB are added for drbd metadata, 128MB for each drbd device
-      constants.DT_REMOTE_RAID1: self.op.disk_size + self.op.swap_size + 256,
-      constants.DT_DRBD8: self.op.disk_size + self.op.swap_size + 256,
-    }
-
-    if self.op.disk_template not in req_size_dict:
-      raise errors.ProgrammerError("Disk template '%s' size requirement"
-                                   " is unknown" %  self.op.disk_template)
-
-    req_size = req_size_dict[self.op.disk_template]
-
-    for node in nodenames:
-      info = nodeinfo.get(node, None)
-      if not info:
-        raise errors.OpPrereqError("Cannot get current information"
-                                   " from node '%s'" % nodeinfo)
-      if req_size > info['vg_free']:
-        raise errors.OpPrereqError("Not enough disk space on target node %s."
-                                   " %d MB available, %d MB required" %
-                                   (node, info['vg_free'], req_size))
-
-    # os verification
-    os_obj = rpc.call_os_get(pnode.name, self.op.os_type)
-    if not os_obj:
-      raise errors.OpPrereqError("OS '%s' not in supported os list for"
-                                 " primary node"  % self.op.os_type)
-
-    # instance verification
+    # instance name verification
     hostname1 = utils.HostInfo(self.op.instance_name)
 
     self.op.instance_name = instance_name = hostname1.name
@@ -2917,6 +3041,7 @@ class LUCreateInstance(LogicalUnit):
       raise errors.OpPrereqError("Instance '%s' is already in the cluster" %
                                  instance_name)
 
       raise errors.OpPrereqError("Instance '%s' is already in the cluster" %
                                  instance_name)
 
+    # ip validity checks
     ip = getattr(self.op, "ip", None)
     if ip is None or ip.lower() == "none":
       inst_ip = None
     ip = getattr(self.op, "ip", None)
     if ip is None or ip.lower() == "none":
       inst_ip = None
@@ -2927,18 +3052,23 @@ class LUCreateInstance(LogicalUnit):
         raise errors.OpPrereqError("given IP address '%s' doesn't look"
                                    " like a valid IP" % ip)
       inst_ip = ip
         raise errors.OpPrereqError("given IP address '%s' doesn't look"
                                    " like a valid IP" % ip)
       inst_ip = ip
-    self.inst_ip = inst_ip
+    self.inst_ip = self.op.ip = inst_ip
 
     if self.op.start and not self.op.ip_check:
       raise errors.OpPrereqError("Cannot ignore IP address conflicts when"
                                  " adding an instance in start mode")
 
     if self.op.ip_check:
-      if utils.TcpPing(utils.HostInfo().name, hostname1.ip,
-                       constants.DEFAULT_NODED_PORT):
+      if utils.TcpPing(hostname1.ip, constants.DEFAULT_NODED_PORT):
         raise errors.OpPrereqError("IP %s of instance %s already in use" %
                                    (hostname1.ip, instance_name))
 
         raise errors.OpPrereqError("IP %s of instance %s already in use" %
                                    (hostname1.ip, instance_name))
 
+    # MAC address verification
+    if self.op.mac != "auto":
+      if not utils.IsValidMac(self.op.mac.lower()):
+        raise errors.OpPrereqError("invalid MAC address specified: %s" %
+                                   self.op.mac)
+
     # bridge verification
     bridge = getattr(self.op, "bridge", None)
     if bridge is None:
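
The MAC check above lower-cases the value and defers to utils.IsValidMac. A rough stand-alone equivalent (the regex is an assumption about the accepted format, not utils.IsValidMac's actual implementation):

    import re

    _MAC_RE = re.compile(r"^([0-9a-f]{2}:){5}[0-9a-f]{2}$")

    def looks_like_mac(mac):
      # Six colon-separated hex octets, case-insensitive.
      return bool(_MAC_RE.match(mac.lower()))

    assert looks_like_mac("AA:00:00:FE:12:34")
    assert not looks_like_mac("aa:00:00:fe:12")
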
@@ -2946,11 +3076,117 @@ class LUCreateInstance(LogicalUnit):
     else:
       self.op.bridge = bridge
 
+    # boot order verification
+    if self.op.hvm_boot_order is not None:
+      if len(self.op.hvm_boot_order.strip("acdn")) != 0:
+        raise errors.OpPrereqError("invalid boot order specified,"
+                                   " must be one or more of [acdn]")
+    # file storage checks
+    if (self.op.file_driver and
+        not self.op.file_driver in constants.FILE_DRIVER):
+      raise errors.OpPrereqError("Invalid file driver name '%s'" %
+                                 self.op.file_driver)
+
+    if self.op.file_storage_dir and os.path.isabs(self.op.file_storage_dir):
+      raise errors.OpPrereqError("File storage directory not a relative"
+                                 " path")
+    #### allocator run
+
+    if [self.op.iallocator, self.op.pnode].count(None) != 1:
+      raise errors.OpPrereqError("One and only one of iallocator and primary"
+                                 " node must be given")
+
+    if self.op.iallocator is not None:
+      self._RunAllocator()
+
+    #### node related checks
+
+    # check primary node
+    pnode = self.cfg.GetNodeInfo(self.cfg.ExpandNodeName(self.op.pnode))
+    if pnode is None:
+      raise errors.OpPrereqError("Primary node '%s' is unknown" %
+                                 self.op.pnode)
+    self.op.pnode = pnode.name
+    self.pnode = pnode
+    self.secondaries = []
+
+    # mirror node verification
+    if self.op.disk_template in constants.DTS_NET_MIRROR:
+      if getattr(self.op, "snode", None) is None:
+        raise errors.OpPrereqError("The networked disk templates need"
+                                   " a mirror node")
+
+      snode_name = self.cfg.ExpandNodeName(self.op.snode)
+      if snode_name is None:
+        raise errors.OpPrereqError("Unknown secondary node '%s'" %
+                                   self.op.snode)
+      elif snode_name == pnode.name:
+        raise errors.OpPrereqError("The secondary node cannot be"
+                                   " the primary node.")
+      self.secondaries.append(snode_name)
+
+    req_size = _ComputeDiskSize(self.op.disk_template,
+                                self.op.disk_size, self.op.swap_size)
+
+    # Check lv size requirements
+    if req_size is not None:
+      nodenames = [pnode.name] + self.secondaries
+      nodeinfo = rpc.call_node_info(nodenames, self.cfg.GetVGName())
+      for node in nodenames:
+        info = nodeinfo.get(node, None)
+        if not info:
+          raise errors.OpPrereqError("Cannot get current information"
+                                     " from node '%s'" % node)
+        vg_free = info.get('vg_free', None)
+        if not isinstance(vg_free, int):
+          raise errors.OpPrereqError("Can't compute free disk space on"
+                                     " node %s" % node)
+        if req_size > info['vg_free']:
+          raise errors.OpPrereqError("Not enough disk space on target node %s."
+                                     " %d MB available, %d MB required" %
+                                     (node, info['vg_free'], req_size))
+
+    # os verification
+    os_obj = rpc.call_os_get(pnode.name, self.op.os_type)
+    if not os_obj:
+      raise errors.OpPrereqError("OS '%s' not in supported os list for"
+                                 " primary node"  % self.op.os_type)
+
+    if self.op.kernel_path == constants.VALUE_NONE:
+      raise errors.OpPrereqError("Can't set instance kernel to none")
+
+
+    # bridge check on primary node
     if not rpc.call_bridges_exist(self.pnode.name, [self.op.bridge]):
       raise errors.OpPrereqError("target bridge '%s' does not exist on"
                                  " destination node '%s'" %
                                  (self.op.bridge, pnode.name))
 
+    # memory check on primary node
+    if self.op.start:
+      _CheckNodeFreeMemory(self.cfg, self.pnode.name,
+                           "creating instance %s" % self.op.instance_name,
+                           self.op.mem_size)
+
+    # hvm_cdrom_image_path verification
+    if self.op.hvm_cdrom_image_path is not None:
+      if not os.path.isabs(self.op.hvm_cdrom_image_path):
+        raise errors.OpPrereqError("The path to the HVM CDROM image must"
+                                   " be an absolute path or None, not %s" %
+                                   self.op.hvm_cdrom_image_path)
+      if not os.path.isfile(self.op.hvm_cdrom_image_path):
+        raise errors.OpPrereqError("The HVM CDROM image must either be a"
+                                   " regular file or a symlink pointing to"
+                                   " an existing regular file, not %s" %
+                                   self.op.hvm_cdrom_image_path)
+
+    # vnc_bind_address verification
+    if self.op.vnc_bind_address is not None:
+      if not utils.IsValidIP(self.op.vnc_bind_address):
+        raise errors.OpPrereqError("given VNC bind address '%s' doesn't look"
+                                   " like a valid IP address" %
+                                   self.op.vnc_bind_address)
+
     if self.op.start:
       self.instance_status = 'up'
     else:
@@ -2963,15 +3199,43 @@ class LUCreateInstance(LogicalUnit):
     instance = self.op.instance_name
     pnode_name = self.pnode.name
 
-    nic = objects.NIC(bridge=self.op.bridge, mac=self.cfg.GenerateMAC())
+    if self.op.mac == "auto":
+      mac_address = self.cfg.GenerateMAC()
+    else:
+      mac_address = self.op.mac
+
+    nic = objects.NIC(bridge=self.op.bridge, mac=mac_address)
     if self.inst_ip is not None:
       nic.ip = self.inst_ip
 
+    ht_kind = self.sstore.GetHypervisorType()
+    if ht_kind in constants.HTS_REQ_PORT:
+      network_port = self.cfg.AllocatePort()
+    else:
+      network_port = None
+
+    if self.op.vnc_bind_address is None:
+      self.op.vnc_bind_address = constants.VNC_DEFAULT_BIND_ADDRESS
+
+    # this is needed because os.path.join does not accept None arguments
+    if self.op.file_storage_dir is None:
+      string_file_storage_dir = ""
+    else:
+      string_file_storage_dir = self.op.file_storage_dir
+
+    # build the full file storage dir path
+    file_storage_dir = os.path.normpath(os.path.join(
+                                        self.sstore.GetFileStorageDir(),
+                                        string_file_storage_dir, instance))
+
     disks = _GenerateDiskTemplate(self.cfg,
                                   self.op.disk_template,
                                   instance, pnode_name,
                                   self.secondaries, self.op.disk_size,
-                                  self.op.swap_size)
+                                  self.op.swap_size,
+                                  file_storage_dir,
+                                  self.op.file_driver)
 
     iobj = objects.Instance(name=instance, os=self.op.os_type,
                             primary_node=pnode_name,
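The None-to-empty-string dance for file_storage_dir above exists because os.path.join raises TypeError on None components; a quick check of how the possible values normalize (paths invented):

import os.path

base = "/srv/ganeti/file-storage"   # stand-in for sstore.GetFileStorageDir()
for subdir in (None, "", "mydir"):  # possible op.file_storage_dir values
  if subdir is None:
    subdir = ""                     # os.path.join(None, ...) raises TypeError
  print os.path.normpath(os.path.join(base, subdir, "instance1.example.com"))
# -> /srv/ganeti/file-storage/instance1.example.com
# -> /srv/ganeti/file-storage/instance1.example.com
# -> /srv/ganeti/file-storage/mydir/instance1.example.com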
@@ -2980,6 +3244,14 @@ class LUCreateInstance(LogicalUnit):
                             nics=[nic], disks=disks,
                             disk_template=self.op.disk_template,
                             status=self.instance_status,
+                            network_port=network_port,
+                            kernel_path=self.op.kernel_path,
+                            initrd_path=self.op.initrd_path,
+                            hvm_boot_order=self.op.hvm_boot_order,
+                            hvm_acpi=self.op.hvm_acpi,
+                            hvm_pae=self.op.hvm_pae,
+                            hvm_cdrom_image_path=self.op.hvm_cdrom_image_path,
+                            vnc_bind_address=self.op.vnc_bind_address,
                             )
 
     feedback_fn("* creating instance disks...")
@@ -2990,6 +3262,8 @@ class LUCreateInstance(LogicalUnit):
     feedback_fn("adding instance %s to cluster config" % instance)
 
     self.cfg.AddInstance(iobj)
+    # Add the new instance to the Ganeti Lock Manager
+    self.context.glm.add(locking.LEVEL_INSTANCE, instance)
 
     if self.op.wait_for_sync:
       disk_abort = not _WaitForSync(self.cfg, iobj, self.proc)
@@ -3004,6 +3278,8 @@ class LUCreateInstance(LogicalUnit):
     if disk_abort:
       _RemoveDisks(iobj, self.cfg)
       self.cfg.RemoveInstance(iobj.name)
+      # Remove the new instance from the Ganeti Lock Manager
+      self.context.glm.remove(locking.LEVEL_INSTANCE, iobj.name)
       raise errors.OpExecError("There are some degraded disks for"
                                " this instance")
 
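The glm.add/glm.remove pair added in these two hunks mirrors the existing config rollback: whatever Exec registers on success must be unregistered on the disk-abort path, or a stale instance lock would outlive the failed creation. The pattern, condensed into a sketch (glm stands in for self.context.glm, create_disks_fn for the disk creation step; the real code checks sync status rather than catching exceptions):

from ganeti import locking

def create_with_rollback(cfg, glm, iobj, create_disks_fn):
  cfg.AddInstance(iobj)
  glm.add(locking.LEVEL_INSTANCE, iobj.name)  # now visible to other LUs
  try:
    create_disks_fn(iobj)
  except Exception:
    # undo both registrations before propagating the failure
    cfg.RemoveInstance(iobj.name)
    glm.remove(locking.LEVEL_INSTANCE, iobj.name)
    raise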
@@ -3042,191 +3318,12 @@ class LUCreateInstance(LogicalUnit):
 class LUConnectConsole(NoHooksLU):
   """Connect to an instance's console.
 
-  This is somewhat special in that it returns the command line that
-  you need to run on the master node in order to connect to the
-  console.
-
-  """
-  _OP_REQP = ["instance_name"]
-
-  def CheckPrereq(self):
-    """Check prerequisites.
-
-    This checks that the instance is in the cluster.
-
-    """
-    instance = self.cfg.GetInstanceInfo(
-      self.cfg.ExpandInstanceName(self.op.instance_name))
-    if instance is None:
-      raise errors.OpPrereqError("Instance '%s' not known" %
-                                 self.op.instance_name)
-    self.instance = instance
-
-  def Exec(self, feedback_fn):
-    """Connect to the console of an instance
-
-    """
-    instance = self.instance
-    node = instance.primary_node
-
-    node_insts = rpc.call_instance_list([node])[node]
-    if node_insts is False:
-      raise errors.OpExecError("Can't connect to node %s." % node)
-
-    if instance.name not in node_insts:
-      raise errors.OpExecError("Instance %s is not running." % instance.name)
-
-    logger.Debug("connecting to console of %s on %s" % (instance.name, node))
-
-    hyper = hypervisor.GetHypervisor()
-    console_cmd = hyper.GetShellCommandForConsole(instance.name)
-    # build ssh cmdline
-    argv = ["ssh", "-q", "-t"]
-    argv.extend(ssh.KNOWN_HOSTS_OPTS)
-    argv.extend(ssh.BATCH_MODE_OPTS)
-    argv.append(node)
-    argv.append(console_cmd)
-    return "ssh", argv
-
-
-class LUAddMDDRBDComponent(LogicalUnit):
-  """Adda new mirror member to an instance's disk.
-
-  """
-  HPATH = "mirror-add"
-  HTYPE = constants.HTYPE_INSTANCE
-  _OP_REQP = ["instance_name", "remote_node", "disk_name"]
-
-  def BuildHooksEnv(self):
-    """Build hooks env.
-
-    This runs on the master, the primary and all the secondaries.
-
-    """
-    env = {
-      "NEW_SECONDARY": self.op.remote_node,
-      "DISK_NAME": self.op.disk_name,
-      }
-    env.update(_BuildInstanceHookEnvByObject(self.instance))
-    nl = [self.sstore.GetMasterNode(), self.instance.primary_node,
-          self.op.remote_node,] + list(self.instance.secondary_nodes)
-    return env, nl, nl
-
-  def CheckPrereq(self):
-    """Check prerequisites.
-
-    This checks that the instance is in the cluster.
-
-    """
-    instance = self.cfg.GetInstanceInfo(
-      self.cfg.ExpandInstanceName(self.op.instance_name))
-    if instance is None:
-      raise errors.OpPrereqError("Instance '%s' not known" %
-                                 self.op.instance_name)
-    self.instance = instance
-
-    remote_node = self.cfg.ExpandNodeName(self.op.remote_node)
-    if remote_node is None:
-      raise errors.OpPrereqError("Node '%s' not known" % self.op.remote_node)
-    self.remote_node = remote_node
-
-    if remote_node == instance.primary_node:
-      raise errors.OpPrereqError("The specified node is the primary node of"
-                                 " the instance.")
-
-    if instance.disk_template != constants.DT_REMOTE_RAID1:
-      raise errors.OpPrereqError("Instance's disk layout is not"
-                                 " remote_raid1.")
-    for disk in instance.disks:
-      if disk.iv_name == self.op.disk_name:
-        break
-    else:
-      raise errors.OpPrereqError("Can't find this device ('%s') in the"
-                                 " instance." % self.op.disk_name)
-    if len(disk.children) > 1:
-      raise errors.OpPrereqError("The device already has two slave"
-                                 " devices.\n"
-                                 "This would create a 3-disk raid1"
-                                 " which we don't allow.")
-    self.disk = disk
-
-  def Exec(self, feedback_fn):
-    """Add the mirror component
-
-    """
-    disk = self.disk
-    instance = self.instance
-
-    remote_node = self.remote_node
-    lv_names = [".%s_%s" % (disk.iv_name, suf) for suf in ["data", "meta"]]
-    names = _GenerateUniqueNames(self.cfg, lv_names)
-    new_drbd = _GenerateMDDRBDBranch(self.cfg, instance.primary_node,
-                                     remote_node, disk.size, names)
-
-    logger.Info("adding new mirror component on secondary")
-    #HARDCODE
-    if not _CreateBlockDevOnSecondary(self.cfg, remote_node, instance,
-                                      new_drbd, False,
-                                      _GetInstanceInfoText(instance)):
-      raise errors.OpExecError("Failed to create new component on secondary"
-                               " node %s" % remote_node)
-
-    logger.Info("adding new mirror component on primary")
-    #HARDCODE
-    if not _CreateBlockDevOnPrimary(self.cfg, instance.primary_node,
-                                    instance, new_drbd,
-                                    _GetInstanceInfoText(instance)):
-      # remove secondary dev
-      self.cfg.SetDiskID(new_drbd, remote_node)
-      rpc.call_blockdev_remove(remote_node, new_drbd)
-      raise errors.OpExecError("Failed to create volume on primary")
-
-    # the device exists now
-    # call the primary node to add the mirror to md
-    logger.Info("adding new mirror component to md")
-    if not rpc.call_blockdev_addchildren(instance.primary_node,
-                                         disk, [new_drbd]):
-      logger.Error("Can't add mirror compoment to md!")
-      self.cfg.SetDiskID(new_drbd, remote_node)
-      if not rpc.call_blockdev_remove(remote_node, new_drbd):
-        logger.Error("Can't rollback on secondary")
-      self.cfg.SetDiskID(new_drbd, instance.primary_node)
-      if not rpc.call_blockdev_remove(instance.primary_node, new_drbd):
-        logger.Error("Can't rollback on primary")
-      raise errors.OpExecError("Can't add mirror component to md array")
-
-    disk.children.append(new_drbd)
-
-    self.cfg.AddInstance(instance)
-
-    _WaitForSync(self.cfg, instance, self.proc)
-
-    return 0
-
-
-class LURemoveMDDRBDComponent(LogicalUnit):
-  """Remove a component from a remote_raid1 disk.
-
-  """
-  HPATH = "mirror-remove"
-  HTYPE = constants.HTYPE_INSTANCE
-  _OP_REQP = ["instance_name", "disk_name", "disk_id"]
-
-  def BuildHooksEnv(self):
-    """Build hooks env.
-
-    This runs on the master, the primary and all the secondaries.
-
-    """
-    env = {
-      "DISK_NAME": self.op.disk_name,
-      "DISK_ID": self.op.disk_id,
-      "OLD_SECONDARY": self.old_secondary,
-      }
-    env.update(_BuildInstanceHookEnvByObject(self.instance))
-    nl = [self.sstore.GetMasterNode(),
-          self.instance.primary_node] + list(self.instance.secondary_nodes)
-    return env, nl, nl
+  This is somewhat special in that it returns the command line that
+  you need to run on the master node in order to connect to the
+  console.
+
+  """
+  _OP_REQP = ["instance_name"]
 
   def CheckPrereq(self):
     """Check prerequisites.
 
@@ -3241,54 +3338,27 @@ class LURemoveMDDRBDComponent(LogicalUnit):
                                  self.op.instance_name)
     self.instance = instance
 
-    if instance.disk_template != constants.DT_REMOTE_RAID1:
-      raise errors.OpPrereqError("Instance's disk layout is not"
-                                 " remote_raid1.")
-    for disk in instance.disks:
-      if disk.iv_name == self.op.disk_name:
-        break
-    else:
-      raise errors.OpPrereqError("Can't find this device ('%s') in the"
-                                 " instance." % self.op.disk_name)
-    for child in disk.children:
-      if (child.dev_type == constants.LD_DRBD7 and
-          child.logical_id[2] == self.op.disk_id):
-        break
-    else:
-      raise errors.OpPrereqError("Can't find the device with this port.")
-
-    if len(disk.children) < 2:
-      raise errors.OpPrereqError("Cannot remove the last component from"
-                                 " a mirror.")
-    self.disk = disk
-    self.child = child
-    if self.child.logical_id[0] == instance.primary_node:
-      oid = 1
-    else:
-      oid = 0
-    self.old_secondary = self.child.logical_id[oid]
-
   def Exec(self, feedback_fn):
-    """Remove the mirror component
+    """Connect to the console of an instance
 
     """
     instance = self.instance
-    disk = self.disk
-    child = self.child
-    logger.Info("remove mirror component")
-    self.cfg.SetDiskID(disk, instance.primary_node)
-    if not rpc.call_blockdev_removechildren(instance.primary_node,
-                                            disk, [child]):
-      raise errors.OpExecError("Can't remove child from mirror.")
-
-    for node in child.logical_id[:2]:
-      self.cfg.SetDiskID(child, node)
-      if not rpc.call_blockdev_remove(node, child):
-        logger.Error("Warning: failed to remove device from node %s,"
-                     " continuing operation." % node)
-
-    disk.children.remove(child)
-    self.cfg.AddInstance(instance)
+    node = instance.primary_node
+
+    node_insts = rpc.call_instance_list([node])[node]
+    if node_insts is False:
+      raise errors.OpExecError("Can't connect to node %s." % node)
+
+    if instance.name not in node_insts:
+      raise errors.OpExecError("Instance %s is not running." % instance.name)
+
+    logger.Debug("connecting to console of %s on %s" % (instance.name, node))
+
+    hyper = hypervisor.GetHypervisor()
+    console_cmd = hyper.GetShellCommandForConsole(instance)
+
+    # build ssh cmdline
+    return self.ssh.BuildCmd(node, "root", console_cmd, batch=True, tty=True)
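The removed inline argv construction shows roughly what ssh.BuildCmd has to produce for batch=True, tty=True; a rough standalone equivalent (the exact contents of the KNOWN_HOSTS_OPTS/BATCH_MODE_OPTS option lists are an assumption):

def build_console_cmd(node, user, remote_cmd):
  # approximates ssh.BuildCmd(node, "root", cmd, batch=True, tty=True)
  argv = ["ssh", "-q", "-t"]       # -t forces the tty the console needs
  argv.append("-oBatchMode=yes")   # assumed BATCH_MODE_OPTS content
  argv.append("%s@%s" % (user, node))
  argv.append(remote_cmd)
  return argv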
 
 
 class LUReplaceDisks(LogicalUnit):
@@ -3299,6 +3369,29 @@ class LUReplaceDisks(LogicalUnit):
   HTYPE = constants.HTYPE_INSTANCE
   _OP_REQP = ["instance_name", "mode", "disks"]
 
+  def _RunAllocator(self):
+    """Compute a new secondary node using an IAllocator.
+
+    """
+    ial = IAllocator(self.cfg, self.sstore,
+                     mode=constants.IALLOCATOR_MODE_RELOC,
+                     name=self.op.instance_name,
+                     relocate_from=[self.sec_node])
+
+    ial.Run(self.op.iallocator)
+
+    if not ial.success:
+      raise errors.OpPrereqError("Can't compute nodes using"
+                                 " iallocator '%s': %s" % (self.op.iallocator,
+                                                           ial.info))
+    if len(ial.nodes) != ial.required_nodes:
+      raise errors.OpPrereqError("iallocator '%s' returned invalid number"
+                                 " of nodes (%s), required %s" %
+                                 (self.op.iallocator, len(ial.nodes),
+                                  ial.required_nodes))
+    self.op.remote_node = ial.nodes[0]
+    logger.ToStdout("Selected new secondary for the instance: %s" %
+                    self.op.remote_node)
+
   def BuildHooksEnv(self):
     """Build hooks env.
 
@@ -3325,6 +3418,9 @@ class LUReplaceDisks(LogicalUnit):
     This checks that the instance is in the cluster.
 
     """
+    if not hasattr(self.op, "remote_node"):
+      self.op.remote_node = None
+
     instance = self.cfg.GetInstanceInfo(
       self.cfg.ExpandInstanceName(self.op.instance_name))
     if instance is None:
@@ -3344,7 +3440,14 @@ class LUReplaceDisks(LogicalUnit):
 
     self.sec_node = instance.secondary_nodes[0]
 
-    remote_node = getattr(self.op, "remote_node", None)
+    ia_name = getattr(self.op, "iallocator", None)
+    if ia_name is not None:
+      if self.op.remote_node is not None:
+        raise errors.OpPrereqError("Give either the iallocator or the new"
+                                   " secondary, not both")
+      self._RunAllocator()
+
+    remote_node = self.op.remote_node
     if remote_node is not None:
       remote_node = self.cfg.ExpandNodeName(remote_node)
       if remote_node is None:
@@ -3362,13 +3465,6 @@ class LUReplaceDisks(LogicalUnit):
         # replacement as for drbd7 (no different port allocated)
         raise errors.OpPrereqError("Same secondary given, cannot execute"
                                    " replacement")
-      # the user gave the current secondary, switch to
-      # 'no-replace-secondary' mode for drbd7
-      remote_node = None
-    if (instance.disk_template == constants.DT_REMOTE_RAID1 and
-        self.op.mode != constants.REPLACE_DISK_ALL):
-      raise errors.OpPrereqError("Template 'remote_raid1' only allows all"
-                                 " disks replacement, not individual ones")
     if instance.disk_template == constants.DT_DRBD8:
       if (self.op.mode == constants.REPLACE_DISK_ALL and
           remote_node is not None):
@@ -3376,12 +3472,12 @@ class LUReplaceDisks(LogicalUnit):
         self.op.mode = constants.REPLACE_DISK_SEC
 
       if self.op.mode == constants.REPLACE_DISK_ALL:
-        raise errors.OpPrereqError("Template 'drbd8' only allows primary or"
+        raise errors.OpPrereqError("Template 'drbd' only allows primary or"
                                    " secondary disk replacement, not"
                                    " both at once")
       elif self.op.mode == constants.REPLACE_DISK_PRI:
         if remote_node is not None:
-          raise errors.OpPrereqError("Template 'drbd8' does not allow changing"
+          raise errors.OpPrereqError("Template 'drbd' does not allow changing"
                                      " the secondary while doing a primary"
                                      " node disk replacement")
         self.tgt_node = instance.primary_node
@@ -3400,102 +3496,6 @@ class LUReplaceDisks(LogicalUnit):
                                    (name, instance.name))
     self.op.remote_node = remote_node
 
-  def _ExecRR1(self, feedback_fn):
-    """Replace the disks of an instance.
-
-    """
-    instance = self.instance
-    iv_names = {}
-    # start of work
-    if self.op.remote_node is None:
-      remote_node = self.sec_node
-    else:
-      remote_node = self.op.remote_node
-    cfg = self.cfg
-    for dev in instance.disks:
-      size = dev.size
-      lv_names = [".%s_%s" % (dev.iv_name, suf) for suf in ["data", "meta"]]
-      names = _GenerateUniqueNames(cfg, lv_names)
-      new_drbd = _GenerateMDDRBDBranch(cfg, instance.primary_node,
-                                       remote_node, size, names)
-      iv_names[dev.iv_name] = (dev, dev.children[0], new_drbd)
-      logger.Info("adding new mirror component on secondary for %s" %
-                  dev.iv_name)
-      #HARDCODE
-      if not _CreateBlockDevOnSecondary(cfg, remote_node, instance,
-                                        new_drbd, False,
-                                        _GetInstanceInfoText(instance)):
-        raise errors.OpExecError("Failed to create new component on"
-                                 " secondary node %s\n"
-                                 "Full abort, cleanup manually!" %
-                                 remote_node)
-
-      logger.Info("adding new mirror component on primary")
-      #HARDCODE
-      if not _CreateBlockDevOnPrimary(cfg, instance.primary_node,
-                                      instance, new_drbd,
-                                      _GetInstanceInfoText(instance)):
-        # remove secondary dev
-        cfg.SetDiskID(new_drbd, remote_node)
-        rpc.call_blockdev_remove(remote_node, new_drbd)
-        raise errors.OpExecError("Failed to create volume on primary!\n"
-                                 "Full abort, cleanup manually!!")
-
-      # the device exists now
-      # call the primary node to add the mirror to md
-      logger.Info("adding new mirror component to md")
-      if not rpc.call_blockdev_addchildren(instance.primary_node, dev,
-                                           [new_drbd]):
-        logger.Error("Can't add mirror compoment to md!")
-        cfg.SetDiskID(new_drbd, remote_node)
-        if not rpc.call_blockdev_remove(remote_node, new_drbd):
-          logger.Error("Can't rollback on secondary")
-        cfg.SetDiskID(new_drbd, instance.primary_node)
-        if not rpc.call_blockdev_remove(instance.primary_node, new_drbd):
-          logger.Error("Can't rollback on primary")
-        raise errors.OpExecError("Full abort, cleanup manually!!")
-
-      dev.children.append(new_drbd)
-      cfg.AddInstance(instance)
-
-    # this can fail as the old devices are degraded and _WaitForSync
-    # does a combined result over all disks, so we don't check its
-    # return value
-    _WaitForSync(cfg, instance, self.proc, unlock=True)
-
-    # so check manually all the devices
-    for name in iv_names:
-      dev, child, new_drbd = iv_names[name]
-      cfg.SetDiskID(dev, instance.primary_node)
-      is_degr = rpc.call_blockdev_find(instance.primary_node, dev)[5]
-      if is_degr:
-        raise errors.OpExecError("MD device %s is degraded!" % name)
-      cfg.SetDiskID(new_drbd, instance.primary_node)
-      is_degr = rpc.call_blockdev_find(instance.primary_node, new_drbd)[5]
-      if is_degr:
-        raise errors.OpExecError("New drbd device %s is degraded!" % name)
-
-    for name in iv_names:
-      dev, child, new_drbd = iv_names[name]
-      logger.Info("remove mirror %s component" % name)
-      cfg.SetDiskID(dev, instance.primary_node)
-      if not rpc.call_blockdev_removechildren(instance.primary_node,
-                                              dev, [child]):
-        logger.Error("Can't remove child from mirror, aborting"
-                     " *this device cleanup*.\nYou need to cleanup manually!!")
-        continue
-
-      for node in child.logical_id[:2]:
-        logger.Info("remove child device on %s" % node)
-        cfg.SetDiskID(child, node)
-        if not rpc.call_blockdev_remove(node, child):
-          logger.Error("Warning: failed to remove device from node %s,"
-                       " continuing operation." % node)
-
-      dev.children.remove(child)
-
-      cfg.AddInstance(instance)
-
   def _ExecD8DiskOnly(self, feedback_fn):
     """Replace a disk on the primary or secondary for drbd8.
 
@@ -3598,7 +3598,7 @@ class LUReplaceDisks(LogicalUnit):
       # ok, we created the new LVs, so now we know we have the needed
       # storage; as such, we proceed on the target node to rename
       # old_lv to _old, and new_lv to old_lv; note that we rename LVs
-      # using the assumption than logical_id == physical_id (which in
+      # using the assumption that logical_id == physical_id (which in
       # turn is the unique_id on that node)
 
       # FIXME(iustin): use a better name for the replaced LVs
@@ -3634,7 +3634,7 @@ class LUReplaceDisks(LogicalUnit):
       if not rpc.call_blockdev_addchildren(tgt_node, dev, new_lvs):
         for new_lv in new_lvs:
           if not rpc.call_blockdev_remove(tgt_node, new_lv):
-            warning("Can't rollback device %s", "manually cleanup unused"
+            warning("Can't rollback device %s", hint="manually cleanup unused"
                     " logical volumes")
         raise errors.OpExecError("Can't add local storage to drbd")
 
@@ -3663,7 +3663,7 @@ class LUReplaceDisks(LogicalUnit):
       for lv in old_lvs:
         cfg.SetDiskID(lv, tgt_node)
         if not rpc.call_blockdev_remove(tgt_node, lv):
-          warning("Can't remove old LV", "manually remove unused LVs")
+          warning("Can't remove old LV", hint="manually remove unused LVs")
           continue
 
   def _ExecD8Secondary(self, feedback_fn):
@@ -3766,23 +3766,47 @@ class LUReplaceDisks(LogicalUnit):
       cfg.SetDiskID(dev, old_node)
       if not rpc.call_blockdev_shutdown(old_node, dev):
         warning("Failed to shutdown drbd for %s on old node" % dev.iv_name,
-                "Please cleanup this device manuall as soon as possible")
+                hint="Please cleanup this device manually as soon as possible")
 
 
-      # we have new storage, we 'rename' the network on the primary
-      info("switching primary drbd for %s to new secondary node" % dev.iv_name)
+    info("detaching primary drbds from the network (=> standalone)")
+    done = 0
+    for dev in instance.disks:
       cfg.SetDiskID(dev, pri_node)
-      # rename to the ip of the new node
-      new_uid = list(dev.physical_id)
-      new_uid[2] = self.remote_node_info.secondary_ip
-      rlist = [(dev, tuple(new_uid))]
-      if not rpc.call_blockdev_rename(pri_node, rlist):
-        raise errors.OpExecError("Can't detach & re-attach drbd %s on node"
-                                 " %s from %s to %s" %
-                                 (dev.iv_name, pri_node, old_node, new_node))
-      dev.logical_id = (pri_node, new_node, dev.logical_id[2])
+      # set the physical (unique in bdev terms) id to None, meaning
+      # detach from network
+      dev.physical_id = (None,) * len(dev.physical_id)
+      # and 'find' the device, which will 'fix' it to match the
+      # standalone state
+      if rpc.call_blockdev_find(pri_node, dev):
+        done += 1
+      else:
+        warning("Failed to detach drbd %s from network, unusual case" %
+                dev.iv_name)
+
+    if not done:
+      # no detaches succeeded (very unlikely)
+      raise errors.OpExecError("Failed to detach any DRBD from the old node")
+
+    # if we managed to detach at least one, we update all the disks of
+    # the instance to point to the new secondary
+    info("updating instance configuration")
+    for dev in instance.disks:
+      dev.logical_id = (pri_node, new_node) + dev.logical_id[2:]
       cfg.SetDiskID(dev, pri_node)
-      cfg.Update(instance)
+    cfg.Update(instance)
 
+    # and now perform the drbd attach
+    info("attaching primary drbds to new secondary (standalone => connected)")
+    failures = []
+    for dev in instance.disks:
+      info("attaching primary drbd for %s to new secondary node" % dev.iv_name)
+      # since the attach is smart, it's enough to 'find' the device,
+      # it will automatically activate the network, if the physical_id
+      # is correct
+      cfg.SetDiskID(dev, pri_node)
+      if not rpc.call_blockdev_find(pri_node, dev):
+        warning("can't attach drbd %s to new secondary!" % dev.iv_name,
+                hint="please do a gnt-instance info to see the status"
+                     " of disks")
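The detach/re-attach dance works because call_blockdev_find 'fixes' a DRBD device to match its ids: with the physical_id blanked out it drops to standalone, and once the ids point at the new secondary the same call re-establishes the network. Schematically (find_fn stands in for rpc.call_blockdev_find; error handling elided):

def switch_secondary(cfg, pri_node, new_node, disks, find_fn):
  # 1. blank the physical ids => find reconfigures each drbd standalone
  for dev in disks:
    dev.physical_id = (None,) * len(dev.physical_id)
    find_fn(pri_node, dev)
  # 2. point the logical ids at the new secondary, refresh physical ids
  for dev in disks:
    dev.logical_id = (pri_node, new_node) + dev.logical_id[2:]
    cfg.SetDiskID(dev, pri_node)
  # 3. find again: with correct ids the backend re-attaches the network
  for dev in disks:
    find_fn(pri_node, dev)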
 
     # this can fail as the old devices are degraded and _WaitForSync
     # does a combined result over all disks, so we don't check its
@@ -3804,7 +3828,7 @@ class LUReplaceDisks(LogicalUnit):
         cfg.SetDiskID(lv, old_node)
         if not rpc.call_blockdev_remove(old_node, lv):
           warning("Can't remove LV on old secondary",
-                  "Cleanup stale volumes by hand")
+                  hint="Cleanup stale volumes by hand")
 
   def Exec(self, feedback_fn):
     """Execute disk replacement.
@@ -3813,16 +3837,110 @@ class LUReplaceDisks(LogicalUnit):
 
     """
     instance = self.instance
-    if instance.disk_template == constants.DT_REMOTE_RAID1:
-      fn = self._ExecRR1
-    elif instance.disk_template == constants.DT_DRBD8:
+
+    # Activate the instance disks if we're replacing them on a down instance
+    if instance.status == "down":
+      op = opcodes.OpActivateInstanceDisks(instance_name=instance.name)
+      self.proc.ChainOpCode(op)
+
+    if instance.disk_template == constants.DT_DRBD8:
       if self.op.remote_node is None:
         fn = self._ExecD8DiskOnly
       else:
         fn = self._ExecD8Secondary
     else:
       raise errors.ProgrammerError("Unhandled disk replacement case")
-    return fn(feedback_fn)
+
+    ret = fn(feedback_fn)
+
+    # Deactivate the instance disks if we're replacing them on a down instance
+    if instance.status == "down":
+      op = opcodes.OpDeactivateInstanceDisks(instance_name=instance.name)
+      self.proc.ChainOpCode(op)
+
+    return ret
+
+
+class LUGrowDisk(LogicalUnit):
+  """Grow a disk of an instance.
+
+  """
+  HPATH = "disk-grow"
+  HTYPE = constants.HTYPE_INSTANCE
+  _OP_REQP = ["instance_name", "disk", "amount"]
+
+  def BuildHooksEnv(self):
+    """Build hooks env.
+
+    This runs on the master, the primary and all the secondaries.
+
+    """
+    env = {
+      "DISK": self.op.disk,
+      "AMOUNT": self.op.amount,
+      }
+    env.update(_BuildInstanceHookEnvByObject(self.instance))
+    nl = [
+      self.sstore.GetMasterNode(),
+      self.instance.primary_node,
+      ]
+    return env, nl, nl
+
+  def CheckPrereq(self):
+    """Check prerequisites.
+
+    This checks that the instance is in the cluster.
+
+    """
+    instance = self.cfg.GetInstanceInfo(
+      self.cfg.ExpandInstanceName(self.op.instance_name))
+    if instance is None:
+      raise errors.OpPrereqError("Instance '%s' not known" %
+                                 self.op.instance_name)
+    self.instance = instance
+    self.op.instance_name = instance.name
+
+    if instance.disk_template not in (constants.DT_PLAIN, constants.DT_DRBD8):
+      raise errors.OpPrereqError("Instance's disk layout does not support"
+                                 " growing.")
+
+    if instance.FindDisk(self.op.disk) is None:
+      raise errors.OpPrereqError("Disk '%s' not found for instance '%s'" %
+                                 (self.op.disk, instance.name))
+
+    nodenames = [instance.primary_node] + list(instance.secondary_nodes)
+    nodeinfo = rpc.call_node_info(nodenames, self.cfg.GetVGName())
+    for node in nodenames:
+      info = nodeinfo.get(node, None)
+      if not info:
+        raise errors.OpPrereqError("Cannot get current information"
+                                   " from node '%s'" % node)
+      vg_free = info.get('vg_free', None)
+      if not isinstance(vg_free, int):
+        raise errors.OpPrereqError("Can't compute free disk space on"
+                                   " node %s" % node)
+      if self.op.amount > info['vg_free']:
+        raise errors.OpPrereqError("Not enough disk space on target node %s:"
+                                   " %d MiB available, %d MiB required" %
+                                   (node, info['vg_free'], self.op.amount))
+
+  def Exec(self, feedback_fn):
+    """Execute disk grow.
+
+    """
+    instance = self.instance
+    disk = instance.FindDisk(self.op.disk)
+    for node in (instance.secondary_nodes + (instance.primary_node,)):
+      self.cfg.SetDiskID(disk, node)
+      result = rpc.call_blockdev_grow(node, disk, self.op.amount)
+      if not result or not isinstance(result, tuple) or len(result) != 2:
+        raise errors.OpExecError("grow request failed to node %s" % node)
+      elif not result[0]:
+        raise errors.OpExecError("grow request failed to node %s: %s" %
+                                 (node, result[1]))
+    disk.RecordGrow(self.op.amount)
+    self.cfg.Update(instance)
+    return
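Assuming the matching opcode is named along the lines of OpGrowDisk (the opcode itself is not part of this hunk), growing a data disk by a gigabyte would be submitted as:

from ganeti import opcodes

# opcode name and field names mirror _OP_REQP above, but are an assumption
op = opcodes.OpGrowDisk(instance_name="instance1.example.com",
                        disk="sda", amount=1024)
# Exec then issues rpc.call_blockdev_grow(node, disk, 1024) on the primary
# and every secondary, expecting a (success, message) tuple from each node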
 
 
 class LUQueryInstanceData(NoHooksLU):
@@ -3846,7 +3964,7 @@ class LUQueryInstanceData(NoHooksLU):
         instance = self.cfg.GetInstanceInfo(self.cfg.ExpandInstanceName(name))
         if instance is None:
           raise errors.OpPrereqError("No such instance name '%s'" % name)
-      self.wanted_instances.append(instance)
+        self.wanted_instances.append(instance)
     else:
       self.wanted_instances = [self.cfg.GetInstanceInfo(name) for name
                                in self.cfg.GetInstanceList()]
@@ -3921,12 +4039,27 @@ class LUQueryInstanceData(NoHooksLU):
         "vcpus": instance.vcpus,
         }
 
+      htkind = self.sstore.GetHypervisorType()
+      if htkind == constants.HT_XEN_PVM30:
+        idict["kernel_path"] = instance.kernel_path
+        idict["initrd_path"] = instance.initrd_path
+
+      if htkind == constants.HT_XEN_HVM31:
+        idict["hvm_boot_order"] = instance.hvm_boot_order
+        idict["hvm_acpi"] = instance.hvm_acpi
+        idict["hvm_pae"] = instance.hvm_pae
+        idict["hvm_cdrom_image_path"] = instance.hvm_cdrom_image_path
+
+      if htkind in constants.HTS_REQ_PORT:
+        idict["vnc_bind_address"] = instance.vnc_bind_address
+        idict["network_port"] = instance.network_port
+
       result[instance.name] = idict
 
     return result
 
 
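On an HVM cluster the per-instance dict therefore gains the HVM and VNC members on top of the common fields; an invented sample entry:

# hypothetical idict for one instance on a HT_XEN_HVM31 cluster
idict_sample = {
  "vcpus": 1,                      # ...other common fields elided...
  "hvm_boot_order": "cd",
  "hvm_acpi": True,
  "hvm_pae": False,
  "hvm_cdrom_image_path": "/srv/iso/install.iso",
  "vnc_bind_address": "0.0.0.0",
  "network_port": 11000,
}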
-class LUSetInstanceParms(LogicalUnit):
+class LUSetInstanceParams(LogicalUnit):
   """Modifies an instance's parameters.
 
   """
@@ -3945,7 +4078,7 @@ class LUSetInstanceParms(LogicalUnit):
       args['memory'] = self.mem
     if self.vcpus:
       args['vcpus'] = self.vcpus
-    if self.do_ip or self.do_bridge:
+    if self.do_ip or self.do_bridge or self.mac:
       if self.do_ip:
         ip = self.ip
       else:
@@ -3954,7 +4087,11 @@ class LUSetInstanceParms(LogicalUnit):
         bridge = self.bridge
       else:
         bridge = self.instance.nics[0].bridge
-      args['nics'] = [(ip, bridge)]
+      if self.mac:
+        mac = self.mac
+      else:
+        mac = self.instance.nics[0].mac
+      args['nics'] = [(ip, bridge, mac)]
     env = _BuildInstanceHookEnvByObject(self.instance, override=args)
     nl = [self.sstore.GetMasterNode(),
           self.instance.primary_node] + list(self.instance.secondary_nodes)
@@ -3969,8 +4106,20 @@ class LUSetInstanceParms(LogicalUnit):
     self.mem = getattr(self.op, "mem", None)
     self.vcpus = getattr(self.op, "vcpus", None)
     self.ip = getattr(self.op, "ip", None)
+    self.mac = getattr(self.op, "mac", None)
     self.bridge = getattr(self.op, "bridge", None)
-    if [self.mem, self.vcpus, self.ip, self.bridge].count(None) == 4:
+    self.kernel_path = getattr(self.op, "kernel_path", None)
+    self.initrd_path = getattr(self.op, "initrd_path", None)
+    self.hvm_boot_order = getattr(self.op, "hvm_boot_order", None)
+    self.hvm_acpi = getattr(self.op, "hvm_acpi", None)
+    self.hvm_pae = getattr(self.op, "hvm_pae", None)
+    self.hvm_cdrom_image_path = getattr(self.op, "hvm_cdrom_image_path", None)
+    self.vnc_bind_address = getattr(self.op, "vnc_bind_address", None)
+    all_parms = [self.mem, self.vcpus, self.ip, self.bridge, self.mac,
+                 self.kernel_path, self.initrd_path, self.hvm_boot_order,
+                 self.hvm_acpi, self.hvm_pae, self.hvm_cdrom_image_path,
+                 self.vnc_bind_address]
+    if all_parms.count(None) == len(all_parms):
       raise errors.OpPrereqError("No changes submitted")
     if self.mem is not None:
       try:
@@ -3992,6 +4141,61 @@ class LUSetInstanceParms(LogicalUnit):
     else:
       self.do_ip = False
     self.do_bridge = (self.bridge is not None)
+    if self.mac is not None:
+      if self.cfg.IsMacInUse(self.mac):
+        raise errors.OpPrereqError('MAC address %s already in use in cluster' %
+                                   self.mac)
+      if not utils.IsValidMac(self.mac):
+        raise errors.OpPrereqError('Invalid MAC address %s' % self.mac)
+
+    if self.kernel_path is not None:
+      self.do_kernel_path = True
+      if self.kernel_path == constants.VALUE_NONE:
+        raise errors.OpPrereqError("Can't set instance to no kernel")
+
+      if self.kernel_path != constants.VALUE_DEFAULT:
+        if not os.path.isabs(self.kernel_path):
+          raise errors.OpPrereqError("The kernel path must be an absolute"
+                                     " filename")
+    else:
+      self.do_kernel_path = False
+
+    if self.initrd_path is not None:
+      self.do_initrd_path = True
+      if self.initrd_path not in (constants.VALUE_NONE,
+                                  constants.VALUE_DEFAULT):
+        if not os.path.isabs(self.initrd_path):
+          raise errors.OpPrereqError("The initrd path must be an absolute"
+                                    " filename")
+                                     " filename")
+      self.do_initrd_path = False
+
+    # boot order verification
+    if self.hvm_boot_order is not None:
+      if self.hvm_boot_order != constants.VALUE_DEFAULT:
+        if len(self.hvm_boot_order.strip("acdn")) != 0:
+          raise errors.OpPrereqError("invalid boot order specified,"
+                                     " must be one or more of [acdn]"
+                                     " or 'default'")
+
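The strip-based test works because str.strip("acdn") peels any of those four characters off both ends, so a string built only from them strips down to nothing, while anything else leaves a residue:

for order in ("dca", "n", "xda", "default"):
  leftover = order.strip("acdn")
  print "%-8s -> %-8r valid: %s" % (order, leftover, len(leftover) == 0)
# dca      -> ''       valid: True
# n        -> ''       valid: True
# xda      -> 'x'      valid: False
# default  -> 'efault' valid: False  (caught earlier via VALUE_DEFAULT)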
+    # hvm_cdrom_image_path verification
+    if self.op.hvm_cdrom_image_path is not None:
+      if not os.path.isabs(self.op.hvm_cdrom_image_path):
+        raise errors.OpPrereqError("The path to the HVM CDROM image must"
+                                   " be an absolute path or None, not %s" %
+                                   self.op.hvm_cdrom_image_path)
+      if not os.path.isfile(self.op.hvm_cdrom_image_path):
+        raise errors.OpPrereqError("The HVM CDROM image must either be a"
+                                   " regular file or a symlink pointing to"
+                                   " an existing regular file, not %s" %
+                                   self.op.hvm_cdrom_image_path)
+
+    # vnc_bind_address verification
+    if self.op.vnc_bind_address is not None:
+      if not utils.IsValidIP(self.op.vnc_bind_address):
+        raise errors.OpPrereqError("given VNC bind address '%s' doesn't look"
+                                   " like a valid IP address" %
+                                   self.op.vnc_bind_address)
 
     instance = self.cfg.GetInstanceInfo(
       self.cfg.ExpandInstanceName(self.op.instance_name))
 
     if self.bridge:
       instance.nics[0].bridge = self.bridge
       result.append(("bridge", self.bridge))
     if self.bridge:
       instance.nics[0].bridge = self.bridge
       result.append(("bridge", self.bridge))
+    if self.mac:
+      instance.nics[0].mac = self.mac
+      result.append(("mac", self.mac))
+    if self.do_kernel_path:
+      instance.kernel_path = self.kernel_path
+      result.append(("kernel_path", self.kernel_path))
+    if self.do_initrd_path:
+      instance.initrd_path = self.initrd_path
+      result.append(("initrd_path", self.initrd_path))
+    if self.hvm_boot_order:
+      if self.hvm_boot_order == constants.VALUE_DEFAULT:
+        instance.hvm_boot_order = None
+      else:
+        instance.hvm_boot_order = self.hvm_boot_order
+      result.append(("hvm_boot_order", self.hvm_boot_order))
+    if self.hvm_acpi:
+      instance.hvm_acpi = self.hvm_acpi
+      result.append(("hvm_acpi", self.hvm_acpi))
+    if self.hvm_pae:
+      instance.hvm_pae = self.hvm_pae
+      result.append(("hvm_pae", self.hvm_pae))
+    if self.hvm_cdrom_image_path:
+      instance.hvm_cdrom_image_path = self.hvm_cdrom_image_path
+      result.append(("hvm_cdrom_image_path", self.hvm_cdrom_image_path))
+    if self.vnc_bind_address:
+      instance.vnc_bind_address = self.vnc_bind_address
+      result.append(("vnc_bind_address", self.vnc_bind_address))
 
     self.cfg.AddInstance(instance)
 
@@ -4077,7 +4308,7 @@ class LUExportInstance(LogicalUnit):
   def CheckPrereq(self):
     """Check prerequisites.
 
-    This checks that the instance name is a valid one.
+    This checks that the instance and node names are valid.
 
     """
     instance_name = self.cfg.ExpandInstanceName(self.op.instance_name)
@@ -4095,6 +4326,12 @@ class LUExportInstance(LogicalUnit):
                                  self.op.target_node)
     self.op.target_node = self.dst_node.name
 
+    # instance disk type verification
+    for disk in self.instance.disks:
+      if disk.dev_type == constants.LD_FILE:
+        raise errors.OpPrereqError("Export not supported for instances with"
+                                   " file-based disks")
+
   def Exec(self, feedback_fn):
     """Export an instance to an image in the cluster.
 
@@ -4102,10 +4339,11 @@ class LUExportInstance(LogicalUnit):
     instance = self.instance
     dst_node = self.dst_node
     src_node = instance.primary_node
-    # shutdown the instance, unless requested not to do so
     if self.op.shutdown:
-      op = opcodes.OpShutdownInstance(instance_name=instance.name)
-      self.proc.ChainOpCode(op)
+      # shutdown the instance, but not the disks
+      if not rpc.call_instance_shutdown(src_node, instance):
+        raise errors.OpExecError("Could not shutdown instance %s on node %s" %
+                                 (instance.name, src_node))
 
     vgname = self.cfg.GetVGName()
 
@@ -4128,22 +4366,20 @@ class LUExportInstance(LogicalUnit):
             snap_disks.append(new_dev)
 
     finally:
-      if self.op.shutdown:
-        op = opcodes.OpStartupInstance(instance_name=instance.name,
-                                       force=False)
-        self.proc.ChainOpCode(op)
+      if self.op.shutdown and instance.status == "up":
+        if not rpc.call_instance_start(src_node, instance, None):
+          _ShutdownInstanceDisks(instance, self.cfg)
+          raise errors.OpExecError("Could not start instance")
 
     # TODO: check for size
 
     for dev in snap_disks:
-      if not rpc.call_snapshot_export(src_node, dev, dst_node.name,
-                                           instance):
-        logger.Error("could not export block device %s from node"
-                     " %s to node %s" %
-                     (dev.logical_id[1], src_node, dst_node.name))
+      if not rpc.call_snapshot_export(src_node, dev, dst_node.name, instance):
+        logger.Error("could not export block device %s from node %s to node %s"
+                     % (dev.logical_id[1], src_node, dst_node.name))
       if not rpc.call_blockdev_remove(src_node, dev):
-        logger.Error("could not remove snapshot block device %s from"
-                     " node %s" % (dev.logical_id[1], src_node))
+        logger.Error("could not remove snapshot block device %s from node %s" %
+                     (dev.logical_id[1], src_node))
 
     if not rpc.call_finalize_export(dst_node.name, instance, snap_disks):
       logger.Error("could not finalize export for instance %s on node %s" %
@@ -4165,6 +4401,45 @@ class LUExportInstance(LogicalUnit):
                          " on node %s" % (instance.name, node))
 
 
+class LURemoveExport(NoHooksLU):
+  """Remove exports related to the named instance.
+
+  """
+  _OP_REQP = ["instance_name"]
+
+  def CheckPrereq(self):
+    """Check prerequisites.
+
+    """
+    pass
+
+  def Exec(self, feedback_fn):
+    """Remove any export.
+
+    """
+    instance_name = self.cfg.ExpandInstanceName(self.op.instance_name)
+    # If the instance was not found we'll try with the name that was passed in.
+    # This will only work if it was an FQDN, though.
+    fqdn_warn = False
+    if not instance_name:
+      fqdn_warn = True
+      instance_name = self.op.instance_name
+
+    op = opcodes.OpQueryExports(nodes=[])
+    exportlist = self.proc.ChainOpCode(op)
+    found = False
+    for node in exportlist:
+      if instance_name in exportlist[node]:
+        found = True
+        if not rpc.call_export_remove(node, instance_name):
+          logger.Error("could not remove export for instance %s"
+                       " on node %s" % (instance_name, node))
+
+    if fqdn_warn and not found:
+      feedback_fn("Export not found. If trying to remove an export belonging"
+                  " to a deleted instance please use its Fully Qualified"
+                  " Domain Name.")
+
+
 class TagsLU(NoHooksLU):
   """Generic tags LU.
 
@@ -4314,3 +4589,417 @@ class LUDelTags(TagsLU):
       raise errors.OpRetryError("There has been a modification to the"
                                 " config file and the operation has been"
                                 " aborted. Please retry.")
+
+
+class LUTestDelay(NoHooksLU):
+  """Sleep for a specified amount of time.
+
+  This LU sleeps on the master and/or nodes for a specified amount of
+  time.
+
+  """
+  _OP_REQP = ["duration", "on_master", "on_nodes"]
+  REQ_BGL = False
+
+  def ExpandNames(self):
+    """Expand names and set required locks.
+
+    This expands the node list, if any.
+
+    """
+    self.needed_locks = {}
+    if self.op.on_nodes:
+      # _GetWantedNodes can be used here, but is not always appropriate to use
+      # this way in ExpandNames. Check LogicalUnit.ExpandNames docstring for
+      # more information.
+      self.op.on_nodes = _GetWantedNodes(self, self.op.on_nodes)
+      self.needed_locks[locking.LEVEL_NODE] = self.op.on_nodes
+
+  def CheckPrereq(self):
+    """Check prerequisites.
+
+    """
+
+  def Exec(self, feedback_fn):
+    """Do the actual sleep.
+
+    """
+    if self.op.on_master:
+      if not utils.TestDelay(self.op.duration):
+        raise errors.OpExecError("Error during master delay test")
+    if self.op.on_nodes:
+      result = rpc.call_test_delay(self.op.on_nodes, self.op.duration)
+      if not result:
+        raise errors.OpExecError("Complete failure from rpc call")
+      for node, node_result in result.items():
+        if not node_result:
+          raise errors.OpExecError("Failure during rpc call to node %s,"
+                                   " result: %s" % (node, node_result))
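A test invocation, assuming the opcode is named OpTestDelay to match the _OP_REQP fields above (the opcode definition is not part of this patch):

from ganeti import opcodes

# sleep five seconds on the master and on two nodes via the RPC layer
op = opcodes.OpTestDelay(duration=5.0, on_master=True,
                         on_nodes=["node1.example.com",
                                   "node2.example.com"])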
+
+
+class IAllocator(object):
+  """IAllocator framework.
+
+  An IAllocator instance has four sets of attributes:
+    - cfg/sstore that are needed to query the cluster
+    - input data (all members of the _KEYS class attribute are required)
+    - four buffer attributes (in|out_data|text), that represent the
+      input (to the external script) in text and data structure format,
+      and the output from it, again in two formats
+    - the result variables from the script (success, info, nodes) for
+      easy usage
+
+  """
+  _ALLO_KEYS = [
+    "mem_size", "disks", "disk_template",
+    "os", "tags", "nics", "vcpus",
+    ]
+  _RELO_KEYS = [
+    "relocate_from",
+    ]
+
+  def __init__(self, cfg, sstore, mode, name, **kwargs):
+    self.cfg = cfg
+    self.sstore = sstore
+    # init buffer variables
+    self.in_text = self.out_text = self.in_data = self.out_data = None
+    # init all input fields so that pylint is happy
+    self.mode = mode
+    self.name = name
+    self.mem_size = self.disks = self.disk_template = None
+    self.os = self.tags = self.nics = self.vcpus = None
+    self.relocate_from = None
+    # computed fields
+    self.required_nodes = None
+    # init result fields
+    self.success = self.info = self.nodes = None
+    if self.mode == constants.IALLOCATOR_MODE_ALLOC:
+      keyset = self._ALLO_KEYS
+    elif self.mode == constants.IALLOCATOR_MODE_RELOC:
+      keyset = self._RELO_KEYS
+    else:
+      raise errors.ProgrammerError("Unknown mode '%s' passed to the"
+                                   " IAllocator" % self.mode)
+    for key in kwargs:
+      if key not in keyset:
+        raise errors.ProgrammerError("Invalid input parameter '%s' to"
+                                     " IAllocator" % key)
+      setattr(self, key, kwargs[key])
+    for key in keyset:
+      if key not in kwargs:
+        raise errors.ProgrammerError("Missing input parameter '%s' to"
+                                     " IAllocator" % key)
+    self._BuildInputData()
+
+  def _ComputeClusterData(self):
+    """Compute the generic allocator input data.
+
+    This is the data that is independent of the actual operation.
+
+    """
+    cfg = self.cfg
+    # cluster data
+    data = {
+      "version": 1,
+      "cluster_name": self.sstore.GetClusterName(),
+      "cluster_tags": list(cfg.GetClusterInfo().GetTags()),
+      "hypervisor_type": self.sstore.GetHypervisorType(),
+      # we don't have job IDs
+      }
+
+    i_list = [cfg.GetInstanceInfo(iname) for iname in cfg.GetInstanceList()]
+
+    # node data
+    node_results = {}
+    node_list = cfg.GetNodeList()
+    node_data = rpc.call_node_info(node_list, cfg.GetVGName())
+    for nname in node_list:
+      ninfo = cfg.GetNodeInfo(nname)
+      if nname not in node_data or not isinstance(node_data[nname], dict):
+        raise errors.OpExecError("Can't get data for node %s" % nname)
+      remote_info = node_data[nname]
+      for attr in ['memory_total', 'memory_free', 'memory_dom0',
+                   'vg_size', 'vg_free', 'cpu_total']:
+        if attr not in remote_info:
+          raise errors.OpExecError("Node '%s' didn't return attribute '%s'" %
+                                   (nname, attr))
+        try:
+          remote_info[attr] = int(remote_info[attr])
+        except ValueError, err:
+          raise errors.OpExecError("Node '%s' returned invalid value for '%s':"
+                                   " %s" % (nname, attr, str(err)))
+      # compute memory used by primary instances
+      i_p_mem = i_p_up_mem = 0
+      for iinfo in i_list:
+        if iinfo.primary_node == nname:
+          i_p_mem += iinfo.memory
+          if iinfo.status == "up":
+            i_p_up_mem += iinfo.memory
+
+      # assemble the per-node result for the allocator input
+      pnr = {
+        "tags": list(ninfo.GetTags()),
+        "total_memory": remote_info['memory_total'],
+        "reserved_memory": remote_info['memory_dom0'],
+        "free_memory": remote_info['memory_free'],
+        "i_pri_memory": i_p_mem,
+        "i_pri_up_memory": i_p_up_mem,
+        "total_disk": remote_info['vg_size'],
+        "free_disk": remote_info['vg_free'],
+        "primary_ip": ninfo.primary_ip,
+        "secondary_ip": ninfo.secondary_ip,
+        "total_cpus": remote_info['cpu_total'],
+        }
+      node_results[nname] = pnr
+    data["nodes"] = node_results
+
+    # instance data
+    instance_data = {}
+    for iinfo in i_list:
+      nic_data = [{"mac": n.mac, "ip": n.ip, "bridge": n.bridge}
+                  for n in iinfo.nics]
+      pir = {
+        "tags": list(iinfo.GetTags()),
+        "should_run": iinfo.status == "up",
+        "vcpus": iinfo.vcpus,
+        "memory": iinfo.memory,
+        "os": iinfo.os,
+        "nodes": [iinfo.primary_node] + list(iinfo.secondary_nodes),
+        "nics": nic_data,
+        "disks": [{"size": dsk.size, "mode": "w"} for dsk in iinfo.disks],
+        "disk_template": iinfo.disk_template,
+        }
+      instance_data[iinfo.name] = pir
+
+    data["instances"] = instance_data
+
+    self.in_data = data
+
+  def _AddNewInstance(self):
+    """Add new instance data to allocator structure.
+
+    This in combination with _ComputeClusterData will create the
+    correct structure needed as input for the allocator.
+
+    The checks for the completeness of the opcode must have already been
+    done.
+
+    """
+    data = self.in_data
+    if len(self.disks) != 2:
+      raise errors.OpExecError("Only two-disk configurations supported")
+
+    disk_space = _ComputeDiskSize(self.disk_template,
+                                  self.disks[0]["size"], self.disks[1]["size"])
+
+    if self.disk_template in constants.DTS_NET_MIRROR:
+      self.required_nodes = 2
+    else:
+      self.required_nodes = 1
+    request = {
+      "type": "allocate",
+      "name": self.name,
+      "disk_template": self.disk_template,
+      "tags": self.tags,
+      "os": self.os,
+      "vcpus": self.vcpus,
+      "memory": self.mem_size,
+      "disks": self.disks,
+      "disk_space_total": disk_space,
+      "nics": self.nics,
+      "required_nodes": self.required_nodes,
+      }
+    data["request"] = request
+
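Put together, the request member of the serialized allocator input looks roughly like this (all values invented; disk_space_total comes from _ComputeDiskSize, which is not shown in this hunk):

request_sample = {
  "type": "allocate",
  "name": "instance1.example.com",
  "disk_template": "drbd",
  "tags": [],
  "os": "debian-etch",
  "vcpus": 1,
  "memory": 256,
  "disks": [{"size": 1024, "mode": "w"}, {"size": 512, "mode": "w"}],
  "disk_space_total": 1792,        # assumed _ComputeDiskSize output
  "nics": [{"mac": "auto", "ip": None, "bridge": "xen-br0"}],
  "required_nodes": 2,             # drbd is in DTS_NET_MIRROR
}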
+  def _AddRelocateInstance(self):
+    """Add relocate instance data to allocator structure.
+
+    This in combination with _ComputeClusterData will create the
+    correct structure needed as input for the allocator.
+
+    The checks for the completeness of the opcode must have already been
+    done.
+
+    """
+    instance = self.cfg.GetInstanceInfo(self.name)
+    if instance is None:
+      raise errors.ProgrammerError("Unknown instance '%s' passed to"
+                                   " IAllocator" % self.name)
+
+    if instance.disk_template not in constants.DTS_NET_MIRROR:
+      raise errors.OpPrereqError("Can't relocate non-mirrored instances")
+
+    if len(instance.secondary_nodes) != 1:
+      raise errors.OpPrereqError("Instance has not exactly one secondary node")
+
+    self.required_nodes = 1
+
+    disk_space = _ComputeDiskSize(instance.disk_template,
+                                  instance.disks[0].size,
+                                  instance.disks[1].size)
+
+    request = {
+      "type": "relocate",
+      "name": self.name,
+      "disk_space_total": disk_space,
+      "required_nodes": self.required_nodes,
+      "relocate_from": self.relocate_from,
+      }
+    self.in_data["request"] = request
+
+  def _BuildInputData(self):
+    """Build input data structures.
+
+    """
+    self._ComputeClusterData()
+
+    if self.mode == constants.IALLOCATOR_MODE_ALLOC:
+      self._AddNewInstance()
+    else:
+      self._AddRelocateInstance()
+
+    self.in_text = serializer.Dump(self.in_data)
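+    # in_text is the serialized form (JSON via Ganeti's serializer module)
+    # that Run() below hands verbatim to the external allocator script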
+
+  def Run(self, name, validate=True, call_fn=rpc.call_iallocator_runner):
+    """Run an instance allocator and return the results.
+
+    """
+    result = call_fn(self.sstore.GetMasterNode(), name, self.in_text)
+
+    if not isinstance(result, tuple) or len(result) != 4:
+      raise errors.OpExecError("Invalid result from master iallocator runner")
+
+    rcode, stdout, stderr, fail = result
+
+    if rcode == constants.IARUN_NOTFOUND:
+      raise errors.OpExecError("Can't find allocator '%s'" % name)
+    elif rcode == constants.IARUN_FAILURE:
+        raise errors.OpExecError("Instance allocator call failed: %s,"
+                                 " output: %s" %
+                                 (fail, stdout+stderr))
+    self.out_text = stdout
+    if validate:
+      self._ValidateResult()
+
+  def _ValidateResult(self):
+    """Process the allocator results.
+
+    This will process the allocator output and, if successful, save the
+    result in self.out_data and in the success/info/nodes attributes.
+
+    """
+    try:
+      rdict = serializer.Load(self.out_text)
+    except Exception, err:
+      raise errors.OpExecError("Can't parse iallocator results: %s" % str(err))
+
+    if not isinstance(rdict, dict):
+      raise errors.OpExecError("Can't parse iallocator results: not a dict")
+
+    for key in "success", "info", "nodes":
+      if key not in rdict:
+        raise errors.OpExecError("Can't parse iallocator results:"
+                                 " missing key '%s'" % key)
+      setattr(self, key, rdict[key])
+
+    if not isinstance(rdict["nodes"], list):
+      raise errors.OpExecError("Can't parse iallocator results: 'nodes' key"
+                               " is not a list")
+    self.out_data = rdict
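+    # a well-formed reply is assumed to look roughly like:
+    #   {"success": true, "info": "allocation successful",
+    #    "nodes": ["node1.example.com", "node2.example.com"]}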
+
+
+class LUTestAllocator(NoHooksLU):
+  """Run allocator tests.
+
+  This LU runs the allocator tests.
+
+  """
+  _OP_REQP = ["direction", "mode", "name"]
+
+  def CheckPrereq(self):
+    """Check prerequisites.
+
+    This checks the opcode parameters depending on the direction and mode
+    of the test.
+
+    """
+    if self.op.mode == constants.IALLOCATOR_MODE_ALLOC:
+      for attr in ["name", "mem_size", "disks", "disk_template",
+                   "os", "tags", "nics", "vcpus"]:
+        if not hasattr(self.op, attr):
+          raise errors.OpPrereqError("Missing attribute '%s' on opcode input" %
+                                     attr)
+      iname = self.cfg.ExpandInstanceName(self.op.name)
+      if iname is not None:
+        raise errors.OpPrereqError("Instance '%s' already in the cluster" %
+                                   iname)
+      if not isinstance(self.op.nics, list):
+        raise errors.OpPrereqError("Invalid parameter 'nics'")
+      for row in self.op.nics:
+        if (not isinstance(row, dict) or
+            "mac" not in row or
+            "ip" not in row or
+            "bridge" not in row):
+          raise errors.OpPrereqError("Invalid contents of the"
+                                     " 'nics' parameter")
+      if not isinstance(self.op.disks, list):
+        raise errors.OpPrereqError("Invalid parameter 'disks'")
+      if len(self.op.disks) != 2:
+        raise errors.OpPrereqError("Only two-disk configurations supported")
+      for row in self.op.disks:
+        if (not isinstance(row, dict) or
+            "size" not in row or
+            not isinstance(row["size"], int) or
+            "mode" not in row or
+            row["mode"] not in ['r', 'w']):
+          raise errors.OpPrereqError("Invalid contents of the"
+                                     " 'disks' parameter")
+    elif self.op.mode == constants.IALLOCATOR_MODE_RELOC:
+      if not hasattr(self.op, "name"):
+        raise errors.OpPrereqError("Missing attribute 'name' on opcode input")
+      fname = self.cfg.ExpandInstanceName(self.op.name)
+      if fname is None:
+        raise errors.OpPrereqError("Instance '%s' not found for relocation" %
+                                   self.op.name)
+      self.op.name = fname
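+      # the instance will be relocated away from its current secondary
+      # node(s)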
+      self.relocate_from = self.cfg.GetInstanceInfo(fname).secondary_nodes
+    else:
+      raise errors.OpPrereqError("Invalid test allocator mode '%s'" %
+                                 self.op.mode)
+
+    if self.op.direction == constants.IALLOCATOR_DIR_OUT:
+      if not hasattr(self.op, "allocator") or self.op.allocator is None:
+        raise errors.OpPrereqError("Missing allocator name")
+    elif self.op.direction != constants.IALLOCATOR_DIR_IN:
+      raise errors.OpPrereqError("Wrong allocator test '%s'" %
+                                 self.op.direction)
+
+  def Exec(self, feedback_fn):
+    """Run the allocator test.
+
+    """
+    if self.op.mode == constants.IALLOCATOR_MODE_ALLOC:
+      ial = IAllocator(self.cfg, self.sstore,
+                       mode=self.op.mode,
+                       name=self.op.name,
+                       mem_size=self.op.mem_size,
+                       disks=self.op.disks,
+                       disk_template=self.op.disk_template,
+                       os=self.op.os,
+                       tags=self.op.tags,
+                       nics=self.op.nics,
+                       vcpus=self.op.vcpus,
+                       )
+    else:
+      ial = IAllocator(self.cfg, self.sstore,
+                       mode=self.op.mode,
+                       name=self.op.name,
+                       relocate_from=list(self.relocate_from),
+                       )
+
+    if self.op.direction == constants.IALLOCATOR_DIR_IN:
+      result = ial.in_text
+    else:
+      ial.Run(self.op.allocator, validate=False)
+      result = ial.out_text
+    return result