4 # Copyright (C) 2007, 2008, 2009, 2010, 2011, 2012, 2013 Google Inc.
6 # This program is free software; you can redistribute it and/or modify
7 # it under the terms of the GNU General Public License as published by
8 # the Free Software Foundation; either version 2 of the License, or
9 # (at your option) any later version.
11 # This program is distributed in the hope that it will be useful, but
12 # WITHOUT ANY WARRANTY; without even the implied warranty of
13 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 # General Public License for more details.
16 # You should have received a copy of the GNU General Public License
17 # along with this program; if not, write to the Free Software
18 # Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
22 """Script for doing QA on Ganeti.
26 # pylint: disable=C0103
47 from ganeti import utils
48 from ganeti import rapi # pylint: disable=W0611
49 from ganeti import constants
51 import ganeti.rapi.client # pylint: disable=W0611
52 from ganeti.rapi.client import UsesRapiClient
55 def _FormatHeader(line, end=72):
56 """Fill a line up to the end column.
59 line = "---- " + line + " "
60 line += "-" * (end - len(line))
65 def _DescriptionOf(fn):
66 """Computes the description of an item.
70 desc = fn.__doc__.splitlines()[0].strip()
74 return desc.rstrip(".")
def RunTest(fn, *args, **kwargs):
  """Runs a test after printing a header.

  A footer with the elapsed time is printed once the test is done, whether
  it succeeded or raised.

  @param fn: test function to call
  @param args: positional arguments passed on to C{fn}
  @param kwargs: keyword arguments passed on to C{fn}
  @return: whatever C{fn} returns

  """
  tstart = datetime.datetime.now()
  desc = _DescriptionOf(fn)

  print(_FormatHeader("%s start %s" % (tstart, desc)))

  try:
    # Callers use the result, e.g. the instance created by an "add" test
    return fn(*args, **kwargs)
  finally:
    # Report the timing even for failed tests
    tstop = datetime.datetime.now()
    tdelta = tstop - tstart
    print(_FormatHeader("%s time=%s %s" % (tstop, tdelta, desc)))
def RunTestIf(testnames, fn, *args, **kwargs):
  """Runs a test conditionally.

  @param testnames: either a single test name in the configuration
      file, or a list of testnames (which will be AND-ed together)
  @param fn: test function, run through L{RunTest} if enabled
  @param args: positional arguments passed on to C{fn}
  @param kwargs: keyword arguments passed on to C{fn}
  @return: result of the test, or None if it was skipped

  """
  if qa_config.TestEnabled(testnames):
    return RunTest(fn, *args, **kwargs)

  # Disabled: only leave a trace in the output so the skip is visible
  tstart = datetime.datetime.now()
  desc = _DescriptionOf(fn)
  print(_FormatHeader("%s skipping %s, test(s) %s disabled" %
                      (tstart, desc, testnames)))
  return None
115 """Run several environment tests.
118 RunTestIf("env", qa_env.TestSshConnection)
119 RunTestIf("env", qa_env.TestIcmpPing)
120 RunTestIf("env", qa_env.TestGanetiCommands)
def SetupCluster(rapi_user, rapi_secret):
  """Initializes the cluster.

  @param rapi_user: Login user for RAPI
  @param rapi_secret: Login secret for RAPI

  """
  RunTestIf("create-cluster", qa_cluster.TestClusterInit,
            rapi_user, rapi_secret)

  # Listings are exercised once while the cluster is still empty
  RunTestIf("node-list", qa_node.TestNodeList)
  RunTestIf("instance-list", qa_instance.TestInstanceList)
  RunTestIf("job-list", qa_job.TestJobList)

  RunTestIf("create-cluster", qa_node.TestNodeAddAll)
  if not qa_config.TestEnabled("create-cluster"):
    # Nodes were not added by this run, so consider them already there
    qa_node.MarkNodeAddedAll()

  RunTestIf("test-jobqueue", qa_cluster.TestJobqueue)

  # The watcher is enabled no matter which tests are configured
  RunTest(qa_daemon.TestResumeWatcher)

  RunTestIf("node-list", qa_node.TestNodeList)

  # Listing of fields
  RunTestIf("node-list", qa_node.TestNodeListFields)
  RunTestIf("instance-list", qa_instance.TestInstanceListFields)
  RunTestIf("job-list", qa_job.TestJobListFields)
  RunTestIf("instance-export", qa_instance.TestBackupListFields)

  RunTestIf("node-info", qa_node.TestNodeInfo)
def RunClusterTests():
  """Runs tests related to gnt-cluster.

  Each entry pairs the name of a test in the configuration with the function
  implementing it; entries are run in order, each only if enabled.

  """
  cluster_tests = [
    ("create-cluster", qa_cluster.TestClusterInitDisk),
    ("cluster-renew-crypto", qa_cluster.TestClusterRenewCrypto),
    ("cluster-verify", qa_cluster.TestClusterVerify),
    ("cluster-reserved-lvs", qa_cluster.TestClusterReservedLvs),
    # TODO: add more cluster modify tests
    ("cluster-modify", qa_cluster.TestClusterModifyEmpty),
    ("cluster-modify", qa_cluster.TestClusterModifyBe),
    ("cluster-modify", qa_cluster.TestClusterModifyDisk),
    ("cluster-rename", qa_cluster.TestClusterRename),
    ("cluster-info", qa_cluster.TestClusterVersion),
    ("cluster-info", qa_cluster.TestClusterInfo),
    ("cluster-info", qa_cluster.TestClusterGetmaster),
    ("cluster-redist-conf", qa_cluster.TestClusterRedistConf),
    ("cluster-copyfile", qa_cluster.TestClusterCopyfile),
    ("cluster-command", qa_cluster.TestClusterCommand),
    ("cluster-burnin", qa_cluster.TestClusterBurnin),
    ("cluster-master-failover", qa_cluster.TestClusterMasterFailover),
    ("cluster-master-failover",
     qa_cluster.TestClusterMasterFailoverWithDrainedQueue),
    ("cluster-oob", qa_cluster.TestClusterOob),
    ("rapi", qa_rapi.TestVersion),
    ("rapi", qa_rapi.TestEmptyCluster),
    ("rapi", qa_rapi.TestRapiQuery),
    ]

  for (testname, testfn) in cluster_tests:
    RunTestIf(testname, testfn)
def RunRepairDiskSizes():
  """Run the repair disk-sizes test.

  The test only runs if "cluster-repair-disk-sizes" is enabled.

  """
  repair_test = qa_cluster.TestClusterRepairDiskSizes
  RunTestIf("cluster-repair-disk-sizes", repair_test)
199 """Runs all tests related to gnt-os.
202 if qa_config.TestEnabled("rapi"):
203 rapi_getos = qa_rapi.GetOperatingSystems
209 qa_os.TestOsDiagnose,
216 qa_os.TestOsPartiallyValid,
218 RunTestIf("os", fn, rapi_getos)
221 qa_os.TestOsModifyValid,
222 qa_os.TestOsModifyInvalid,
223 qa_os.TestOsStatesNonExisting,
def RunCommonInstanceTests(instance):
  """Runs a few tests that are common to all disk types.

  @param instance: instance to run the tests on; its C{"name"} entry is
      used for the rename tests

  """
  RunTestIf("instance-shutdown", qa_instance.TestInstanceShutdown, instance)
  RunTestIf(["instance-shutdown", "instance-console", "rapi"],
            qa_rapi.TestRapiStoppedInstanceConsole, instance)
  RunTestIf(["instance-shutdown", "instance-modify"],
            qa_instance.TestInstanceStoppedModify, instance)
  RunTestIf("instance-shutdown", qa_instance.TestInstanceStartup, instance)

  # Same shutdown/startup cycle, this time through RAPI
  RunTestIf(["instance-shutdown", "rapi"],
            qa_rapi.TestRapiInstanceShutdown, instance)
  RunTestIf(["instance-shutdown", "rapi"],
            qa_rapi.TestRapiInstanceStartup, instance)

  RunTestIf("instance-list", qa_instance.TestInstanceList)

  RunTestIf("instance-info", qa_instance.TestInstanceInfo, instance)

  RunTestIf("instance-modify", qa_instance.TestInstanceModify, instance)
  RunTestIf(["instance-modify", "rapi"],
            qa_rapi.TestRapiInstanceModify, instance)

  RunTestIf("instance-console", qa_instance.TestInstanceConsole, instance)
  RunTestIf(["instance-console", "rapi"],
            qa_rapi.TestRapiInstanceConsole, instance)

  # NOTE(review): the "instance-rename" entry is inferred from the rename
  # tests being run between the shutdown and startup below -- confirm
  down_tests = qa_config.Either([
    "instance-reinstall",
    "instance-rename",
    "instance-grow-disk",
    ])

  # The instance has to be stopped if any of the 'down' tests is enabled
  RunTestIf(down_tests, qa_instance.TestInstanceShutdown, instance)

  # Tests requiring a stopped instance
  RunTestIf("instance-reinstall", qa_instance.TestInstanceReinstall, instance)
  RunTestIf(["instance-reinstall", "rapi"],
            qa_rapi.TestRapiInstanceReinstall, instance)

  if qa_config.TestEnabled("instance-rename"):
    spare_instance = qa_config.AcquireInstance()
    try:
      old_name = instance["name"]
      new_name = spare_instance["name"]

      # Renaming to the very same name is always tested; renaming to a
      # different name only if one is configured
      targets = [old_name]
      if new_name is not None:
        targets.append(new_name)

      for target in targets:
        RunTest(qa_instance.TestInstanceRenameAndBack,
                old_name, target)
        RunTestIf("rapi", qa_rapi.TestRapiInstanceRenameAndBack,
                  old_name, target)
    finally:
      qa_config.ReleaseInstance(spare_instance)

  RunTestIf(["instance-grow-disk"], qa_instance.TestInstanceGrowDisk, instance)

  # Bring the instance back up after the 'down' tests
  RunTestIf(down_tests, qa_instance.TestInstanceStartup, instance)

  RunTestIf("instance-reboot", qa_instance.TestInstanceReboot, instance)

  RunTestIf("tags", qa_tags.TestInstanceTags, instance)

  RunTestIf("cluster-verify", qa_cluster.TestClusterVerify)

  RunTestIf("rapi", qa_rapi.TestInstance, instance)

  # The node list includes instances as well
  RunTestIf("node-list", qa_node.TestNodeList)

  # By now some jobs have been run, so listing them is meaningful
  RunTestIf("job-list", qa_job.TestJobList)
def RunCommonNodeTests():
  """Run a few common node tests.

  """
  node_tests = [
    ("node-volumes", qa_node.TestNodeVolumes),
    ("node-storage", qa_node.TestNodeStorage),
    ("node-oob", qa_node.TestOutOfBand),
    ]

  for (testname, testfn) in node_tests:
    RunTestIf(testname, testfn)
def RunGroupListTests():
  """Run tests for listing node groups.

  """
  for testfn in (qa_group.TestGroupList, qa_group.TestGroupListFields):
    RunTestIf("group-list", testfn)
def RunGroupRwTests():
  """Run tests for adding/removing/renaming groups.

  """
  rw_tests = (
    qa_group.TestGroupAddRemoveRename,
    qa_group.TestGroupAddWithOptions,
    qa_group.TestGroupModify,
    )
  for testfn in rw_tests:
    RunTestIf("group-rwops", testfn)

  RunTestIf(["group-rwops", "rapi"], qa_rapi.TestRapiNodeGroups)

  # The default group is looked up even if the tag test ends up skipped
  default_group = qa_group.GetDefaultGroup()
  RunTestIf(["group-rwops", "tags"], qa_tags.TestGroupTags, default_group)
def RunExportImportTests(instance, pnode, snode):
  """Tries to export and import the instance.

  @param instance: instance to export
  @param pnode: current primary node of the instance
  @param snode: current secondary node of the instance, if any,
      otherwise None

  """
  if qa_config.TestEnabled("instance-export"):
    RunTest(qa_instance.TestInstanceExportNoTarget, instance)

    expnode = qa_config.AcquireNode(exclude=pnode)
    try:
      export_name = RunTest(qa_instance.TestInstanceExport, instance, expnode)

      RunTest(qa_instance.TestBackupList, expnode)

      if qa_config.TestEnabled("instance-import"):
        imported = qa_config.AcquireInstance()
        try:
          # NOTE(review): trailing arguments reconstructed from the export
          # node and export name obtained above -- confirm against
          # qa_instance.TestInstanceImport
          RunTest(qa_instance.TestInstanceImport, imported, pnode,
                  expnode, export_name)
          # The imported instance must be able to start before removal
          RunTest(qa_instance.TestInstanceStartup, imported)
          RunTest(qa_instance.TestInstanceRemove, imported)
        finally:
          qa_config.ReleaseInstance(imported)
    finally:
      qa_config.ReleaseNode(expnode)

  if qa_config.TestEnabled(["rapi", "inter-cluster-instance-move"]):
    moved = qa_config.AcquireInstance()
    try:
      # The target node must differ from the nodes currently in use
      excluded = [pnode]
      if snode is not None:
        excluded.append(snode)
      tnode = qa_config.AcquireNode(exclude=excluded)
      try:
        # NOTE(review): trailing arguments reconstructed -- confirm against
        # qa_rapi.TestInterClusterInstanceMove
        RunTest(qa_rapi.TestInterClusterInstanceMove, instance, moved,
                pnode, snode, tnode)
      finally:
        qa_config.ReleaseNode(tnode)
    finally:
      qa_config.ReleaseInstance(moved)
def RunDaemonTests(instance):
  """Test the ganeti-watcher script.

  The watcher is paused before the tests and resumed after them.

  @param instance: instance passed to the restart/failure tests

  """
  RunTest(qa_daemon.TestPauseWatcher)

  watcher_tests = [
    ("instance-automatic-restart",
     qa_daemon.TestInstanceAutomaticRestart),
    ("instance-consecutive-failures",
     qa_daemon.TestInstanceConsecutiveFailures),
    ]
  for (testname, testfn) in watcher_tests:
    RunTestIf(testname, testfn, instance)

  RunTest(qa_daemon.TestResumeWatcher)
def RunSingleHomedHardwareFailureTests(instance, pnode):
  """Test hardware failure recovery for single-homed instances.

  @param instance: instance whose disks are recreated
  @param pnode: node to keep out of the choice of the other node

  """
  if not qa_config.TestEnabled("instance-recreate-disks"):
    return

  spare_node = qa_config.AcquireNode(exclude=[pnode])
  try:
    RunTest(qa_instance.TestRecreateDisks,
            instance, pnode, None, [spare_node])
  finally:
    qa_config.ReleaseNode(spare_node)
def RunHardwareFailureTests(instance, pnode, snode):
  """Test cluster internal hardware failure recovery.

  @param instance: instance to run the tests on
  @param pnode: node passed to the tests as the instance's primary
  @param snode: node passed to the tests as the instance's secondary

  """
  RunTestIf("instance-failover", qa_instance.TestInstanceFailover, instance)
  RunTestIf(["instance-failover", "rapi"],
            qa_rapi.TestRapiInstanceFailover, instance)

  RunTestIf("instance-migrate", qa_instance.TestInstanceMigrate, instance)
  RunTestIf(["instance-migrate", "rapi"],
            qa_rapi.TestRapiInstanceMigrate, instance)

  if qa_config.TestEnabled("instance-replace-disks"):
    othernode = qa_config.AcquireNode(exclude=[pnode, snode])
    try:
      RunTestIf("rapi", qa_rapi.TestRapiInstanceReplaceDisks, instance)
      RunTest(qa_instance.TestReplaceDisks,
              instance, pnode, snode, othernode)
    finally:
      qa_config.ReleaseNode(othernode)

  if qa_config.TestEnabled("instance-recreate-disks"):
    othernode1 = qa_config.AcquireNode(exclude=[pnode, snode])
    othernode2 = None
    # From here on othernode1 is held, so everything else, including the
    # second acquisition, is covered by the cleanup below
    try:
      try:
        othernode2 = qa_config.AcquireNode(exclude=[pnode, snode, othernode1])
      except qa_error.OutOfNodesError:
        # Let's reuse one of the nodes if the cluster is not big enough
        othernode2 = pnode

      RunTest(qa_instance.TestRecreateDisks,
              instance, pnode, snode, [othernode1, othernode2])
    finally:
      qa_config.ReleaseNode(othernode1)
      # pnode was merely reused, and None means nothing was acquired
      if othernode2 is not None and othernode2 != pnode:
        qa_config.ReleaseNode(othernode2)

  RunTestIf("node-evacuate", qa_node.TestNodeEvacuate, pnode, snode)

  RunTestIf("node-failover", qa_node.TestNodeFailover, pnode, snode)
def RunExclusiveStorageTests():
  """Test exclusive storage.

  Does nothing unless "cluster-exclusive-storage" is enabled. The value
  returned by the first call to C{TestSetExclStorCluster} is passed back to
  it once the tests are done.

  """
  if not qa_config.TestEnabled("cluster-exclusive-storage"):
    return

  node = qa_config.AcquireNode()
  try:
    saved_es = qa_cluster.TestSetExclStorCluster(False)
    qa_cluster.TestExclStorSingleNode(node)

    qa_cluster.TestSetExclStorCluster(True)
    qa_cluster.TestExclStorSharedPv(node)

    if qa_config.TestEnabled("instance-add-plain-disk"):
      # Rule out problems that existed before any instance was added
      qa_cluster.AssertClusterVerify()
      plain_instances = [
        qa_instance.TestInstanceAddWithPlainDisk(node),
        qa_instance.TestInstanceAddWithPlainDisk(node),
        ]
      # cluster-verify checks that disks are allocated correctly
      qa_cluster.AssertClusterVerify()
      for plain_instance in plain_instances:
        qa_instance.TestInstanceRemove(plain_instance)

    if qa_config.TestEnabled("instance-add-drbd-disk"):
      snode = qa_config.AcquireNode()
      try:
        # The instance is added with the flag off; verification is then
        # expected to fail once the flag is switched back on
        qa_cluster.TestSetExclStorCluster(False)
        drbd_instance = qa_instance.TestInstanceAddWithDrbdDisk(node, snode)
        qa_cluster.TestSetExclStorCluster(True)
        expected = [constants.CV_EINSTANCEUNSUITABLENODE]
        qa_cluster.AssertClusterVerify(fail=True, errors=expected)
        qa_instance.TestInstanceRemove(drbd_instance)
      finally:
        qa_config.ReleaseNode(snode)

    qa_cluster.TestSetExclStorCluster(saved_es)
  finally:
    qa_config.ReleaseNode(node)
496 rapi_user = "ganeti-qa"
497 rapi_secret = utils.GenerateSecret()
500 SetupCluster(rapi_user, rapi_secret)
502 # Load RAPI certificate
503 qa_rapi.Setup(rapi_user, rapi_secret)
508 RunTestIf("tags", qa_tags.TestClusterTags)
514 # The master shouldn't be readded or put offline; "delay" needs a non-master
516 pnode = qa_config.AcquireNode(exclude=qa_config.GetMasterNode())
518 RunTestIf("node-readd", qa_node.TestNodeReadd, pnode)
519 RunTestIf("node-modify", qa_node.TestNodeModify, pnode)
520 RunTestIf("delay", qa_cluster.TestDelay, pnode)
522 qa_config.ReleaseNode(pnode)
524 pnode = qa_config.AcquireNode()
526 RunTestIf("tags", qa_tags.TestNodeTags, pnode)
528 if qa_rapi.Enabled():
529 RunTest(qa_rapi.TestNode, pnode)
531 if qa_config.TestEnabled("instance-add-plain-disk"):
532 for use_client in [True, False]:
533 rapi_instance = RunTest(qa_rapi.TestRapiInstanceAdd, pnode,
535 if qa_config.TestEnabled("instance-plain-rapi-common-tests"):
536 RunCommonInstanceTests(rapi_instance)
537 RunTest(qa_rapi.TestRapiInstanceRemove, rapi_instance, use_client)
540 if qa_config.TestEnabled("instance-add-plain-disk"):
541 instance = RunTest(qa_instance.TestInstanceAddWithPlainDisk, pnode)
542 RunCommonInstanceTests(instance)
544 RunTestIf("cluster-epo", qa_cluster.TestClusterEpo)
545 RunExportImportTests(instance, pnode, None)
546 RunDaemonTests(instance)
548 RunSingleHomedHardwareFailureTests(instance, pnode)
549 RunTest(qa_instance.TestInstanceRemove, instance)
553 ("instance-add-drbd-disk",
554 qa_instance.TestInstanceAddWithDrbdDisk),
557 for name, func in multinode_tests:
558 if qa_config.TestEnabled(name):
559 snode = qa_config.AcquireNode(exclude=pnode)
561 instance = RunTest(func, pnode, snode)
562 RunTestIf("haskell-confd", qa_node.TestNodeListDrbd, pnode)
563 RunTestIf("haskell-confd", qa_node.TestNodeListDrbd, snode)
564 RunCommonInstanceTests(instance)
566 RunTestIf("group-rwops", qa_group.TestAssignNodesIncludingSplit,
567 constants.INITIAL_NODE_GROUP_NAME,
568 pnode["primary"], snode["primary"])
569 if qa_config.TestEnabled("instance-convert-disk"):
570 RunTest(qa_instance.TestInstanceShutdown, instance)
571 RunTest(qa_instance.TestInstanceConvertDisk, instance, snode)
572 RunTest(qa_instance.TestInstanceStartup, instance)
573 RunExportImportTests(instance, pnode, snode)
574 RunHardwareFailureTests(instance, pnode, snode)
576 RunTest(qa_instance.TestInstanceRemove, instance)
579 qa_config.ReleaseNode(snode)
582 qa_config.ReleaseNode(pnode)
584 # Test removing instance with offline drbd secondary
585 if qa_config.TestEnabled("instance-remove-drbd-offline"):
586 # Make sure the master is not put offline
587 snode = qa_config.AcquireNode(exclude=qa_config.GetMasterNode())
589 pnode = qa_config.AcquireNode(exclude=snode)
591 instance = qa_instance.TestInstanceAddWithDrbdDisk(pnode, snode)
592 qa_node.MakeNodeOffline(snode, "yes")
594 RunTest(qa_instance.TestInstanceRemove, instance)
596 qa_node.MakeNodeOffline(snode, "no")
598 qa_config.ReleaseNode(pnode)
600 qa_config.ReleaseNode(snode)
602 pnode = qa_config.AcquireNode()
604 if qa_config.TestEnabled(["instance-add-plain-disk", "instance-export"]):
605 for shutdown in [False, True]:
606 instance = RunTest(qa_instance.TestInstanceAddWithPlainDisk, pnode)
607 expnode = qa_config.AcquireNode(exclude=pnode)
610 # Stop instance before exporting and removing it
611 RunTest(qa_instance.TestInstanceShutdown, instance)
612 RunTest(qa_instance.TestInstanceExportWithRemove, instance, expnode)
613 RunTest(qa_instance.TestBackupList, expnode)
615 qa_config.ReleaseNode(expnode)
620 qa_config.ReleaseNode(pnode)
622 RunExclusiveStorageTests()
624 RunTestIf("create-cluster", qa_node.TestNodeRemoveAll)
626 RunTestIf("cluster-destroy", qa_cluster.TestClusterDestroy)
634 parser = optparse.OptionParser(usage="%prog [options] <config-file>")
635 parser.add_option("--yes-do-it", dest="yes_do_it",
637 help="Really execute the tests")
638 (qa_config.options, args) = parser.parse_args()
641 (config_file, ) = args
643 parser.error("Wrong number of arguments.")
645 if not qa_config.options.yes_do_it:
646 print ("Executing this script irreversibly destroys any Ganeti\n"
647 "configuration on all nodes involved. If you really want\n"
648 "to start testing, supply the --yes-do-it option.")
651 qa_config.Load(config_file)
653 primary = qa_config.GetMasterNode()["primary"]
654 qa_utils.StartMultiplexer(primary)
655 print ("SSH command for primary node: %s" %
656 utils.ShellQuoteArgs(qa_utils.GetSSHCommand(primary, "")))
657 print ("SSH command for other nodes: %s" %
658 utils.ShellQuoteArgs(qa_utils.GetSSHCommand("NODE", "")))
662 qa_utils.CloseMultiplexers()
664 if __name__ == "__main__":