X-Git-Url: https://code.grnet.gr/git/ganeti-local/blobdiff_plain/246e180a111750fc3316062bba262152dd6718b4..cbfc468166d63c9f02f21018140df2558770ff9f:/lib/opcodes.py diff --git a/lib/opcodes.py b/lib/opcodes.py index c53504a..958ee42 100644 --- a/lib/opcodes.py +++ b/lib/opcodes.py @@ -1,4 +1,4 @@ -#!/usr/bin/python +# # # Copyright (C) 2006, 2007 Google Inc. @@ -24,11 +24,8 @@ This module implements the data structures which define the cluster operations - the so-called opcodes. - -This module implements the logic for doing operations in the cluster. There -are two kinds of classes defined: - - opcodes, which are small classes only holding data for the task at hand - - logical units, which know how to deal with their specific opcode only +Every operation which modifies the cluster state is expressed via +opcodes. """ @@ -36,28 +33,151 @@ are two kinds of classes defined: # few public methods: # pylint: disable-msg=R0903 -class OpCode(object): - """Abstract OpCode""" - OP_ID = "OP_ABSTRACT" + +class BaseOpCode(object): + """A simple serializable object. + + This object serves as a parent class for OpCode without any custom + field handling. + + """ __slots__ = [] def __init__(self, **kwargs): + """Constructor for BaseOpCode. + + The constructor takes only keyword arguments and will set + attributes on this object based on the passed arguments. As such, + it means that you should not pass arguments which are not in the + __slots__ attribute for this class. + + """ for key in kwargs: if key not in self.__slots__: - raise TypeError("OpCode %s doesn't support the parameter '%s'" % + raise TypeError("Object %s doesn't support the parameter '%s'" % (self.__class__.__name__, key)) setattr(self, key, kwargs[key]) + def __getstate__(self): + """Generic serializer. + + This method just returns the contents of the instance as a + dictionary. 
+ + @rtype: C{dict} + @return: the instance attributes and their values + + """ + state = {} + for name in self.__slots__: + if hasattr(self, name): + state[name] = getattr(self, name) + return state + + def __setstate__(self, state): + """Generic unserializer. + + This method just restores from the serialized state the attributes + of the current instance. + + @param state: the serialized opcode data + @type state: C{dict} + + """ + if not isinstance(state, dict): + raise ValueError("Invalid data to __setstate__: expected dict, got %s" % + type(state)) + + for name in self.__slots__: + if name not in state: + delattr(self, name) + + for name in state: + setattr(self, name, state[name]) + + +class OpCode(BaseOpCode): + """Abstract OpCode. -class OpInitCluster(OpCode): - """Initialise the cluster.""" - OP_ID = "OP_CLUSTER_INIT" - __slots__ = ["cluster_name", "secondary_ip", "hypervisor_type", - "vg_name", "mac_prefix", "def_bridge", "master_netdev"] + This is the root of the actual OpCode hierarchy. All classes derived + from this class should override OP_ID. + + @cvar OP_ID: The ID of this opcode. This should be unique amongst all + children of this class. + + """ + OP_ID = "OP_ABSTRACT" + __slots__ = [] + + def __getstate__(self): + """Specialized getstate for opcodes. + + This method adds to the state dictionary the OP_ID of the class, + so that on unload we can identify the correct class for + instantiating the opcode. + + @rtype: C{dict} + @return: the state as a dictionary + + """ + data = BaseOpCode.__getstate__(self) + data["OP_ID"] = self.OP_ID + return data + + @classmethod + def LoadOpCode(cls, data): + """Generic load opcode method. + + The method identifies the correct opcode class from the dict-form + by looking for an OP_ID key, if this is not found, or its value is + not available in this module as a child of this class, we fail. 
+ + @type data: C{dict} + @param data: the serialized opcode + + """ + if not isinstance(data, dict): + raise ValueError("Invalid data to LoadOpCode (%s)" % type(data)) + if "OP_ID" not in data: + raise ValueError("Invalid data to LoadOpcode, missing OP_ID") + op_id = data["OP_ID"] + op_class = None + for item in globals().values(): + if (isinstance(item, type) and + issubclass(item, cls) and + hasattr(item, "OP_ID") and + getattr(item, "OP_ID") == op_id): + op_class = item + break + if op_class is None: + raise ValueError("Invalid data to LoadOpCode: OP_ID %s unsupported" % + op_id) + op = op_class() + new_data = data.copy() + del new_data["OP_ID"] + op.__setstate__(new_data) + return op + + def Summary(self): + """Generates a summary description of this opcode. + + """ + # all OP_ID start with OP_, we remove that + txt = self.OP_ID[3:] + field_name = getattr(self, "OP_DSC_FIELD", None) + if field_name: + field_value = getattr(self, field_name, None) + txt = "%s(%s)" % (txt, field_value) + return txt class OpDestroyCluster(OpCode): - """Destroy the cluster.""" + """Destroy the cluster. + + This opcode has no other parameters. All the state is irreversibly + lost after the execution of this opcode. + + """ OP_ID = "OP_CLUSTER_DESTROY" __slots__ = [] @@ -68,46 +188,122 @@ class OpQueryClusterInfo(OpCode): __slots__ = [] -class OpClusterCopyFile(OpCode): - """Copy a file to multiple nodes.""" - OP_ID = "OP_CLUSTER_COPYFILE" - __slots__ = ["nodes", "filename"] +class OpVerifyCluster(OpCode): + """Verify the cluster state. 
+ @type skip_checks: C{list} + @ivar skip_checks: steps to be skipped from the verify process; this + needs to be a subset of + L{constants.VERIFY_OPTIONAL_CHECKS}; currently + only L{constants.VERIFY_NPLUSONE_MEM} can be passed -class OpRunClusterCommand(OpCode): - """Run a command on multiple nodes.""" - OP_ID = "OP_CLUSTER_RUNCOMMAND" - __slots__ = ["nodes", "command"] + """ + OP_ID = "OP_CLUSTER_VERIFY" + __slots__ = ["skip_checks"] -class OpVerifyCluster(OpCode): - """Verify the cluster state.""" - OP_ID = "OP_CLUSTER_VERIFY" - __slots__ = [] +class OpVerifyDisks(OpCode): + """Verify the cluster disks. + Parameters: none -class OpMasterFailover(OpCode): - """Do a master failover.""" - OP_ID = "OP_CLUSTER_MASTERFAILOVER" - __slots__ = [] + Result: a tuple of four elements: + - list of node names with bad data returned (unreachable, etc.) + - dict of node names with broken volume groups (values: error msg) + - list of instances with degraded disks (that should be activated) + - dict of instances with missing logical volumes (values: (node, vol) + pairs with details about the missing volumes) + In normal operation, all lists should be empty. A non-empty instance + list (3rd element of the result) is still ok (errors were fixed) but + non-empty node list means some node is down, and probably there are + unfixable drbd errors. -class OpDumpClusterConfig(OpCode): - """Dump the cluster configuration.""" - OP_ID = "OP_CLUSTER_DUMPCONFIG" + Note that only instances that are drbd-based are taken into + consideration. This might need to be revisited in the future. + + """ + OP_ID = "OP_CLUSTER_VERIFY_DISKS" __slots__ = [] +class OpQueryConfigValues(OpCode): + """Query cluster configuration values.""" + OP_ID = "OP_CLUSTER_CONFIG_QUERY" + __slots__ = ["output_fields"] + + +class OpRenameCluster(OpCode): + """Rename the cluster. + + @type name: C{str} + @ivar name: The new name of the cluster. 
The name and/or the master IP + address will be changed to match the new name and its IP + address. + + """ + OP_ID = "OP_CLUSTER_RENAME" + OP_DSC_FIELD = "name" + __slots__ = ["name"] + + +class OpSetClusterParams(OpCode): + """Change the parameters of the cluster. + + @type vg_name: C{str} or C{None} + @ivar vg_name: The new volume group name or None to disable LVM usage. + + """ + OP_ID = "OP_CLUSTER_SET_PARAMS" + __slots__ = [ + "vg_name", + "enabled_hypervisors", + "hvparams", + "beparams", + "candidate_pool_size", + ] + + +# node opcodes + class OpRemoveNode(OpCode): - """Remove a node.""" + """Remove a node. + + @type node_name: C{str} + @ivar node_name: The name of the node to remove. If the node still has + instances on it, the operation will fail. + + """ OP_ID = "OP_NODE_REMOVE" + OP_DSC_FIELD = "node_name" __slots__ = ["node_name"] class OpAddNode(OpCode): - """Add a node.""" + """Add a node to the cluster. + + @type node_name: C{str} + @ivar node_name: The name of the node to add. This can be a short name, + but it will be expanded to the FQDN. + @type primary_ip: IP address + @ivar primary_ip: The primary IP of the node. This will be ignored when the + opcode is submitted, but will be filled during the node + add (so it will be visible in the job query). + @type secondary_ip: IP address + @ivar secondary_ip: The secondary IP of the node. This needs to be passed + if the cluster has been initialized in 'dual-network' + mode, otherwise it must not be given. + @type readd: C{bool} + @ivar readd: Whether to re-add an existing node to the cluster. If + this is not passed, then the operation will abort if the node + name is already in the cluster; use this parameter to 'repair' + a node that had its configuration broken, or was reinstalled + without removal from the cluster. 
+ + """ OP_ID = "OP_NODE_ADD" - __slots__ = ["node_name", "primary_ip", "secondary_ip"] + OP_DSC_FIELD = "node_name" + __slots__ = ["node_name", "primary_ip", "secondary_ip", "readd"] class OpQueryNodes(OpCode): @@ -122,80 +318,108 @@ class OpQueryNodeVolumes(OpCode): __slots__ = ["nodes", "output_fields"] +class OpSetNodeParams(OpCode): + """Change the parameters of a node.""" + OP_ID = "OP_NODE_SET_PARAMS" + OP_DSC_FIELD = "node_name" + __slots__ = [ + "node_name", + "force", + "master_candidate", + ] + # instance opcodes class OpCreateInstance(OpCode): """Create an instance.""" OP_ID = "OP_INSTANCE_CREATE" - __slots__ = ["instance_name", "mem_size", "disk_size", "os_type", "pnode", - "disk_template", "snode", "swap_size", "mode", - "vcpus", "ip", "bridge", "src_node", "src_path", "start", - "wait_for_sync"] + OP_DSC_FIELD = "instance_name" + __slots__ = [ + "instance_name", "os_type", "pnode", + "disk_template", "snode", "mode", + "disks", "nics", + "src_node", "src_path", "start", + "wait_for_sync", "ip_check", + "file_storage_dir", "file_driver", + "iallocator", + "hypervisor", "hvparams", "beparams", + ] class OpReinstallInstance(OpCode): """Reinstall an instance's OS.""" OP_ID = "OP_INSTANCE_REINSTALL" + OP_DSC_FIELD = "instance_name" __slots__ = ["instance_name", "os_type"] class OpRemoveInstance(OpCode): """Remove an instance.""" OP_ID = "OP_INSTANCE_REMOVE" - __slots__ = ["instance_name"] + OP_DSC_FIELD = "instance_name" + __slots__ = ["instance_name", "ignore_failures"] + + +class OpRenameInstance(OpCode): + """Rename an instance.""" + OP_ID = "OP_INSTANCE_RENAME" + __slots__ = ["instance_name", "ignore_ip", "new_name"] class OpStartupInstance(OpCode): """Startup an instance.""" OP_ID = "OP_INSTANCE_STARTUP" + OP_DSC_FIELD = "instance_name" __slots__ = ["instance_name", "force", "extra_args"] class OpShutdownInstance(OpCode): """Shutdown an instance.""" OP_ID = "OP_INSTANCE_SHUTDOWN" + OP_DSC_FIELD = "instance_name" __slots__ = ["instance_name"] -class 
OpAddMDDRBDComponent(OpCode): - """Add a MD-DRBD component.""" - OP_ID = "OP_INSTANCE_ADD_MDDRBD" - __slots__ = ["instance_name", "remote_node", "disk_name"] - - -class OpRemoveMDDRBDComponent(OpCode): - """Remove a MD-DRBD component.""" - OP_ID = "OP_INSTANCE_REMOVE_MDDRBD" - __slots__ = ["instance_name", "disk_name", "disk_id"] +class OpRebootInstance(OpCode): + """Reboot an instance.""" + OP_ID = "OP_INSTANCE_REBOOT" + OP_DSC_FIELD = "instance_name" + __slots__ = ["instance_name", "reboot_type", "extra_args", + "ignore_secondaries" ] class OpReplaceDisks(OpCode): """Replace the disks of an instance.""" OP_ID = "OP_INSTANCE_REPLACE_DISKS" - __slots__ = ["instance_name", "remote_node"] + OP_DSC_FIELD = "instance_name" + __slots__ = ["instance_name", "remote_node", "mode", "disks", "iallocator"] class OpFailoverInstance(OpCode): """Failover an instance.""" OP_ID = "OP_INSTANCE_FAILOVER" + OP_DSC_FIELD = "instance_name" __slots__ = ["instance_name", "ignore_consistency"] class OpConnectConsole(OpCode): """Connect to an instance's console.""" OP_ID = "OP_INSTANCE_CONSOLE" + OP_DSC_FIELD = "instance_name" __slots__ = ["instance_name"] class OpActivateInstanceDisks(OpCode): """Activate an instance's disks.""" OP_ID = "OP_INSTANCE_ACTIVATE_DISKS" + OP_DSC_FIELD = "instance_name" __slots__ = ["instance_name"] class OpDeactivateInstanceDisks(OpCode): """Deactivate an instance's disks.""" OP_ID = "OP_INSTANCE_DEACTIVATE_DISKS" + OP_DSC_FIELD = "instance_name" __slots__ = ["instance_name"] @@ -208,20 +432,33 @@ class OpQueryInstances(OpCode): class OpQueryInstanceData(OpCode): """Compute the run-time status of instances.""" OP_ID = "OP_INSTANCE_QUERY_DATA" - __slots__ = ["instances"] + __slots__ = ["instances", "static"] -class OpSetInstanceParms(OpCode): +class OpSetInstanceParams(OpCode): """Change the parameters of an instance.""" - OP_ID = "OP_INSTANCE_SET_PARMS" - __slots__ = ["instance_name", "mem", "vcpus", "ip", "bridge"] + OP_ID = "OP_INSTANCE_SET_PARAMS" + 
OP_DSC_FIELD = "instance_name" + __slots__ = [ + "instance_name", + "hvparams", "beparams", "force", + "nics", "disks", + ] + + +class OpGrowDisk(OpCode): + """Grow a disk of an instance.""" + OP_ID = "OP_INSTANCE_GROW_DISK" + OP_DSC_FIELD = "instance_name" + __slots__ = ["instance_name", "disk", "amount", "wait_for_sync"] # OS opcodes class OpDiagnoseOS(OpCode): """Compute the list of guest operating systems.""" OP_ID = "OP_OS_DIAGNOSE" - __slots__ = [] + __slots__ = ["output_fields", "names"] + # Exports opcodes class OpQueryExports(OpCode): @@ -229,26 +466,90 @@ class OpQueryExports(OpCode): OP_ID = "OP_BACKUP_QUERY" __slots__ = ["nodes"] + class OpExportInstance(OpCode): """Export an instance.""" OP_ID = "OP_BACKUP_EXPORT" + OP_DSC_FIELD = "instance_name" __slots__ = ["instance_name", "target_node", "shutdown"] +class OpRemoveExport(OpCode): + """Remove an instance's export.""" + OP_ID = "OP_BACKUP_REMOVE" + OP_DSC_FIELD = "instance_name" + __slots__ = ["instance_name"] + + # Tags opcodes class OpGetTags(OpCode): """Returns the tags of the given object.""" OP_ID = "OP_TAGS_GET" + OP_DSC_FIELD = "name" __slots__ = ["kind", "name"] -class OpSetTag(OpCode): - """Sets the value of a tag on a given object.""" +class OpSearchTags(OpCode): + """Searches the tags in the cluster for a given pattern.""" + OP_ID = "OP_TAGS_SEARCH" + OP_DSC_FIELD = "pattern" + __slots__ = ["pattern"] + + +class OpAddTags(OpCode): + """Add a list of tags on a given object.""" OP_ID = "OP_TAGS_SET" - __slots__ = ["kind", "name", "tag"] + __slots__ = ["kind", "name", "tags"] -class OpDelTag(OpCode): - """Remove a tag from a given object.""" +class OpDelTags(OpCode): + """Remove a list of tags from a given object.""" OP_ID = "OP_TAGS_DEL" - __slots__ = ["kind", "name", "tag"] + __slots__ = ["kind", "name", "tags"] + + +# Test opcodes +class OpTestDelay(OpCode): + """Sleeps for a configured amount of time. + + This is used just for debugging and testing. 
+ + Parameters: + - duration: the time to sleep + - on_master: if true, sleep on the master + - on_nodes: list of nodes in which to sleep + + If the on_master parameter is true, it will execute a sleep on the + master (before any node sleep). + + If the on_nodes list is not empty, it will sleep on those nodes + (after the sleep on the master, if that is enabled). + + As an additional feature, the case of duration < 0 will be reported + as an execution error, so this opcode can be used as a failure + generator. The case of duration == 0 will not be treated specially. + + """ + OP_ID = "OP_TEST_DELAY" + OP_DSC_FIELD = "duration" + __slots__ = ["duration", "on_master", "on_nodes"] + + +class OpTestAllocator(OpCode): + """Allocator framework testing. + + This opcode has two modes: + - gather and return allocator input for a given mode (allocate new + or replace secondary) and a given instance definition (direction + 'in') + - run a selected allocator for a given operation (as above) and + return the allocator output (direction 'out') + + """ + OP_ID = "OP_TEST_ALLOCATOR" + OP_DSC_FIELD = "allocator" + __slots__ = [ + "direction", "mode", "allocator", "name", + "mem_size", "disks", "disk_template", + "os", "tags", "nics", "vcpus", "hypervisor", + ]