utils.KillProcess: Use waitpid() to wait for child processes
[ganeti-local] / qa / qa_instance.py
index b6bd59b..fe5dfb5 100644 (file)
@@ -1,3 +1,6 @@
+#
+#
+
 # Copyright (C) 2007 Google Inc.
 #
 # This program is free software; you can redistribute it and/or modify
 
 """
 
+import re
+import time
+
 from ganeti import utils
 from ganeti import constants
 
 import qa_config
 import qa_utils
+import qa_error
 
-from qa_utils import AssertEqual, StartSSH
+from qa_utils import AssertEqual, AssertNotEqual, StartSSH
+
+
+def _GetDiskStatePath(disk):
+  """Return the sysfs path of the device state file for block device disk."""
+  state_path_template = "/sys/block/%s/device/state"
+  return state_path_template % disk
 
 
 def _GetGenericAddParameters():
-  return ['--os-size=%s' % qa_config.get('os-size'),
-          '--swap-size=%s' % qa_config.get('swap-size'),
-          '--memory=%s' % qa_config.get('mem')]
+  """Build the "-B" memory option and one "--disk" option per QA disk."""
+  params = ['-B', '%s=%s' % (constants.BE_MEMORY, qa_config.get('mem'))]
+  for idx, size in enumerate(qa_config.get('disk')):
+    params.extend(["--disk", "%s:size=%s" % (idx, size)])
+  return params
 
 
-def _DiskTest(node, args):
+def _DiskTest(node, disk_template):
   master = qa_config.GetMasterNode()
 
   instance = qa_config.AcquireInstance()
   try:
     cmd = (['gnt-instance', 'add',
             '--os-type=%s' % qa_config.get('os'),
-            '--node=%s' % node['primary']] +
+            '--disk-template=%s' % disk_template,
+            '--node=%s' % node] +
            _GetGenericAddParameters())
-    if args:
-      cmd += args
     cmd.append(instance['name'])
 
     AssertEqual(StartSSH(master['primary'],
@@ -58,19 +69,13 @@ def _DiskTest(node, args):
 
 def TestInstanceAddWithPlainDisk(node):
   """gnt-instance add -t plain"""
-  return _DiskTest(node, ['--disk-template=plain'])
-
-
-def TestInstanceAddWithLocalMirrorDisk(node):
-  """gnt-instance add -t local_raid1"""
-  return _DiskTest(node, ['--disk-template=local_raid1'])
+  return _DiskTest(node['primary'], 'plain')
 
 
-def TestInstanceAddWithRemoteRaidDisk(node, node2):
-  """gnt-instance add -t remote_raid1"""
-  return _DiskTest(node,
-                   ['--disk-template=remote_raid1',
-                    '--secondary-node=%s' % node2['primary']])
+def TestInstanceAddWithDrbdDisk(node, node2):
+  """gnt-instance add -t drbd"""
+  # The node argument is passed as "<primary>:<secondary>"
+  node_spec = "%s:%s" % (node['primary'], node2['primary'])
+  return _DiskTest(node_spec, 'drbd')
 
 
 def TestInstanceRemove(instance):
@@ -102,6 +107,17 @@ def TestInstanceShutdown(instance):
                        utils.ShellQuoteArgs(cmd)).wait(), 0)
 
 
+def TestInstanceReboot(instance):
+  """gnt-instance reboot
+
+  Reboots the instance once for each reboot type (soft, hard, full) and
+  asserts that every command exits with status 0.
+
+  """
+  master = qa_config.GetMasterNode()
+  reboot_types = ("soft", "hard", "full")
+
+  for kind in reboot_types:
+    type_opt = '--type=%s' % kind
+    argv = ['gnt-instance', 'reboot', type_opt, instance['name']]
+    ssh = StartSSH(master['primary'], utils.ShellQuoteArgs(argv))
+    AssertEqual(ssh.wait(), 0)
+
+
 def TestInstanceReinstall(instance):
   """gnt-instance reinstall"""
   master = qa_config.GetMasterNode()
@@ -119,6 +135,11 @@ def TestInstanceFailover(instance):
   AssertEqual(StartSSH(master['primary'],
                        utils.ShellQuoteArgs(cmd)).wait(), 0)
 
+  # ... and back
+  cmd = ['gnt-instance', 'failover', '--force', instance['name']]
+  AssertEqual(StartSSH(master['primary'],
+                       utils.ShellQuoteArgs(cmd)).wait(), 0)
+
 
 def TestInstanceInfo(instance):
   """gnt-instance info"""
@@ -129,6 +150,48 @@ def TestInstanceInfo(instance):
                        utils.ShellQuoteArgs(cmd)).wait(), 0)
 
 
+def TestInstanceModify(instance):
+  """gnt-instance modify
+
+  Applies a sequence of backend ("-B") and hypervisor ("-H") parameter
+  changes, each of which must exit with status 0, and then checks that
+  calling modify without any option exits with a non-zero status.
+
+  """
+  master = qa_config.GetMasterNode()
+
+  # Assume /sbin/init exists on all systems
+  test_kernel = "/sbin/init"
+  test_initrd = test_kernel
+
+  orig_memory = qa_config.get('mem')
+  orig_bridge = qa_config.get('bridge', 'xen-br0')
+
+  # (parameter, value) pairs, applied in exactly this order
+  backend_values = [
+    (constants.BE_MEMORY, "128"),
+    (constants.BE_MEMORY, orig_memory),
+    (constants.BE_VCPUS, "2"),
+    (constants.BE_VCPUS, "1"),
+    (constants.BE_VCPUS, constants.VALUE_DEFAULT),
+    ]
+  hypervisor_values = [
+    (constants.HV_KERNEL_PATH, test_kernel),
+    (constants.HV_KERNEL_PATH, constants.VALUE_DEFAULT),
+    (constants.HV_INITRD_PATH, test_initrd),
+    (constants.HV_INITRD_PATH, constants.VALUE_NONE),
+    (constants.HV_INITRD_PATH, constants.VALUE_DEFAULT),
+    ]
+
+  changes = [["-B", "%s=%s" % pair] for pair in backend_values]
+  changes += [["-H", "%s=%s" % pair] for pair in hypervisor_values]
+
+  # TODO: bridge tests
+  #["--bridge", "xen-br1"],
+  #["--bridge", orig_bridge],
+
+  # TODO: Do these tests only with xen-hvm
+  #["-H", "%s=acn" % constants.HV_BOOT_ORDER],
+  #["-H", "%s=%s" % (constants.HV_BOOT_ORDER, constants.VALUE_DEFAULT)],
+
+  for change in changes:
+    argv = ['gnt-instance', 'modify']
+    argv.extend(change)
+    argv.append(instance['name'])
+    ssh = StartSSH(master['primary'], utils.ShellQuoteArgs(argv))
+    AssertEqual(ssh.wait(), 0)
+
+  # check no-modify
+  argv = ['gnt-instance', 'modify', instance['name']]
+  ssh = StartSSH(master['primary'], utils.ShellQuoteArgs(argv))
+  AssertNotEqual(ssh.wait(), 0)
+
+
 def TestInstanceList():
   """gnt-instance list"""
   master = qa_config.GetMasterNode()
@@ -138,6 +201,43 @@ def TestInstanceList():
                        utils.ShellQuoteArgs(cmd)).wait(), 0)
 
 
+def TestInstanceConsole(instance):
+  """gnt-instance console
+
+  Runs the console command with --show-cmd and asserts exit status 0.
+
+  """
+  master = qa_config.GetMasterNode()
+
+  argv = ['gnt-instance', 'console', '--show-cmd']
+  argv.append(instance['name'])
+  ssh = StartSSH(master['primary'], utils.ShellQuoteArgs(argv))
+  AssertEqual(ssh.wait(), 0)
+
+
+def TestReplaceDisks(instance, pnode, snode, othernode):
+  """gnt-instance replace-disks
+
+  Runs replace-disks with "-p", then "-s", then with othernode as the new
+  secondary, and finally with snode as the new secondary again. Every
+  command must exit with status 0.
+
+  """
+  master = qa_config.GetMasterNode()
+
+  def _RunReplace(opts):
+    # Run one replace-disks invocation on the master and check it succeeded
+    argv = ['gnt-instance', 'replace-disks'] + opts + [instance["name"]]
+    ssh = StartSSH(master['primary'], utils.ShellQuoteArgs(argv))
+    AssertEqual(ssh.wait(), 0)
+
+  _RunReplace(["-p"])
+  _RunReplace(["-s"])
+  _RunReplace(["--new-secondary=%s" % othernode["primary"]])
+
+  # Restore
+  _RunReplace(["--new-secondary=%s" % snode["primary"]])
+
+
 def TestInstanceExport(instance, node):
   """gnt-backup export"""
   master = qa_config.GetMasterNode()
@@ -169,6 +269,145 @@ def TestBackupList(expnode):
   """gnt-backup list"""
   master = qa_config.GetMasterNode()
 
-  cmd = ['gnt-backup', 'list', '--nodes=%s' % expnode['primary']]
+  cmd = ['gnt-backup', 'list', '--node=%s' % expnode['primary']]
   AssertEqual(StartSSH(master['primary'],
                        utils.ShellQuoteArgs(cmd)).wait(), 0)
+
+
+def _TestInstanceDiskFailure(instance, node, node2, onmaster):
+  """Testing disk failure.
+
+  Sets the physical disks backing the instance to "offline" through
+  sysfs on one node, writes to the instance's devices so the failure is
+  noticed, sets the disks back to "running", and then runs replace-disks,
+  an instance restart and a cluster verify.
+
+  @param instance: instance dictionary (its 'name' entry is used)
+  @param node: first node dictionary (its 'primary' entry is used); the
+      write test and drbdsetup show/detach are run on this node
+  @param node2: second node dictionary (its 'primary' entry is used)
+  @param onmaster: if true the disks of C{node} are taken offline,
+      otherwise those of C{node2}
+  @raise qa_error.Error: if a physical volume name cannot be parsed or
+      no physical disks were found on the node to be failed
+
+  """
+  master = qa_config.GetMasterNode()
+  sq = utils.ShellQuoteArgs
+
+  instance_full = qa_utils.ResolveInstanceName(instance)
+  node_full = qa_utils.ResolveNodeName(node)
+  node2_full = qa_utils.ResolveNodeName(node2)
+
+  print qa_utils.FormatInfo("Getting physical disk names")
+  cmd = ['gnt-node', 'volumes', '--separator=|', '--no-headers',
+         '--output=node,phys,instance',
+         node['primary'], node2['primary']]
+  output = qa_utils.GetCommandOutput(master['primary'], sq(cmd))
+
+  # Get physical disk names
+  re_disk = re.compile(r'^/dev/([a-z]+)\d+$')
+  node2disk = {}
+  for line in output.splitlines():
+    (node_name, phys, inst) = line.split('|')
+    if inst == instance_full:
+      if node_name not in node2disk:
+        node2disk[node_name] = []
+
+      m = re_disk.match(phys)
+      if not m:
+        # Report the value that failed to parse; "disk" is not bound yet
+        # at this point and would hide the real error
+        raise qa_error.Error("Unknown disk name format: %s" % phys)
+
+      # Strip the partition number, keeping only the whole-disk name
+      name = m.group(1)
+      if name not in node2disk[node_name]:
+        node2disk[node_name].append(name)
+
+  # int(onmaster) selects index 1 (node) when true, index 0 (node2) otherwise
+  if [node2_full, node_full][int(onmaster)] not in node2disk:
+    raise qa_error.Error("Couldn't find physical disks used on"
+                         " %s node" % ["secondary", "master"][int(onmaster)])
+
+  print qa_utils.FormatInfo("Checking whether nodes have ability to stop"
+                            " disks")
+  for node_name, disks in node2disk.iteritems():
+    cmds = []
+    for disk in disks:
+      cmds.append(sq(["test", "-f", _GetDiskStatePath(disk)]))
+    AssertEqual(StartSSH(node_name, ' && '.join(cmds)).wait(), 0)
+
+  print qa_utils.FormatInfo("Getting device paths")
+  cmd = ['gnt-instance', 'activate-disks', instance['name']]
+  output = qa_utils.GetCommandOutput(master['primary'], sq(cmd))
+  devpath = []
+  for line in output.splitlines():
+    # Each line is split into three ":"-separated fields; the last one is
+    # used as the device path
+    (_, _, tmpdevpath) = line.split(':')
+    devpath.append(tmpdevpath)
+  print devpath
+
+  print qa_utils.FormatInfo("Getting drbd device paths")
+  cmd = ['gnt-instance', 'info', instance['name']]
+  output = qa_utils.GetCommandOutput(master['primary'], sq(cmd))
+  pattern = (r'\s+-\s+sd[a-z]+,\s+type:\s+drbd8?,\s+.*$'
+             r'\s+primary:\s+(/dev/drbd\d+)\s+')
+  drbddevs = re.findall(pattern, output, re.M)
+  print drbddevs
+
+  # Record every disk we try to take offline so the "finally" clause can
+  # set it back to running even if a later step fails
+  halted_disks = []
+  try:
+    print qa_utils.FormatInfo("Deactivating disks")
+    cmds = []
+    for name in node2disk[[node2_full, node_full][int(onmaster)]]:
+      halted_disks.append(name)
+      cmds.append(sq(["echo", "offline"]) + " >%s" % _GetDiskStatePath(name))
+    AssertEqual(StartSSH([node2, node][int(onmaster)]['primary'],
+                         ' && '.join(cmds)).wait(), 0)
+
+    print qa_utils.FormatInfo("Write to disks and give some time to notice"
+                              " the problem")
+    cmds = []
+    for disk in devpath:
+      # Copy the first 512-byte block of each device onto itself
+      cmds.append(sq(["dd", "count=1", "bs=512", "conv=notrunc",
+                      "if=%s" % disk, "of=%s" % disk]))
+    for _ in (0, 1, 2):
+      AssertEqual(StartSSH(node['primary'], ' && '.join(cmds)).wait(), 0)
+      time.sleep(3)
+
+    print qa_utils.FormatInfo("Debugging info")
+    for name in drbddevs:
+      cmd = ['drbdsetup', name, 'show']
+      AssertEqual(StartSSH(node['primary'], sq(cmd)).wait(), 0)
+
+    cmd = ['gnt-instance', 'info', instance['name']]
+    AssertEqual(StartSSH(master['primary'], sq(cmd)).wait(), 0)
+
+  finally:
+    print qa_utils.FormatInfo("Activating disks again")
+    cmds = []
+    for name in halted_disks:
+      cmds.append(sq(["echo", "running"]) + " >%s" % _GetDiskStatePath(name))
+    # Joined with ";" rather than "&&" so every disk is attempted even if
+    # one of the writes fails
+    AssertEqual(StartSSH([node2, node][int(onmaster)]['primary'],
+                         '; '.join(cmds)).wait(), 0)
+
+  if onmaster:
+    for name in drbddevs:
+      cmd = ['drbdsetup', name, 'detach']
+      AssertEqual(StartSSH(node['primary'], sq(cmd)).wait(), 0)
+  else:
+    for name in drbddevs:
+      cmd = ['drbdsetup', name, 'disconnect']
+      AssertEqual(StartSSH(node2['primary'], sq(cmd)).wait(), 0)
+
+  # TODO
+  #cmd = ['vgs']
+  #AssertEqual(StartSSH([node2, node][int(onmaster)]['primary'],
+  #                     sq(cmd)).wait(), 0)
+
+  print qa_utils.FormatInfo("Making sure disks are up again")
+  cmd = ['gnt-instance', 'replace-disks', instance['name']]
+  AssertEqual(StartSSH(master['primary'], sq(cmd)).wait(), 0)
+
+  print qa_utils.FormatInfo("Restarting instance")
+  cmd = ['gnt-instance', 'shutdown', instance['name']]
+  AssertEqual(StartSSH(master['primary'], sq(cmd)).wait(), 0)
+
+  cmd = ['gnt-instance', 'startup', instance['name']]
+  AssertEqual(StartSSH(master['primary'], sq(cmd)).wait(), 0)
+
+  cmd = ['gnt-cluster', 'verify']
+  AssertEqual(StartSSH(master['primary'], sq(cmd)).wait(), 0)
+
+
+def TestInstanceMasterDiskFailure(instance, node, node2):
+  """Testing disk failure on master node.
+
+  Currently only prints a notice; the actual test is disabled.
+
+  """
+  # The following can cause crashes, thus it's disabled until fixed
+  #return _TestInstanceDiskFailure(instance, node, node2, True)
+  notice = ("Disk failure on primary node cannot be"
+            " tested due to potential crashes.")
+  print qa_utils.FormatError(notice)
+
+
+def TestInstanceSecondaryDiskFailure(instance, node, node2):
+  """Testing disk failure on secondary node."""
+  # onmaster=False makes the shared helper fail the disks of node2
+  result = _TestInstanceDiskFailure(instance, node, node2, False)
+  return result