#
#
-# Copyright (C) 2006, 2007, 2008 Google Inc.
+# Copyright (C) 2006, 2007, 2008, 2010 Google Inc.
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
import sys
import re
+import os
+import errno
from ganeti import errors
from ganeti import constants
from ganeti import utils
from ganeti import serializer
+from ganeti import objects
+from ganeti import netutils
SSCONF_LOCK_TIMEOUT = 10
"""
self._file_name = file_name
- self.Reload()
+ self._last_inode = None
+ self._last_mtime = None
+ self._last_size = None
- def Reload(self):
- """Reloads the config file.
+ self._config_data = None
+ self._inst_ips_by_link = None
+ self._ip_to_inst_by_link = None
+ self._instances_ips = None
+ self._mc_primary_ips = None
+ self._nodes_primary_ips = None
+
+ # we need a forced reload at class init time, to initialize _last_*
+ self._Load(force=True)
+
+ def _Load(self, force=False):
+ """Loads (or reloads) the config file.
+
+ @type force: boolean
+ @param force: whether to force the reload without checking the mtime
+ @rtype: boolean
+ @return: boolean value that says whether we reloaded the configuration or
+ not (because we decided it was already up-to-date)
"""
try:
+ cfg_stat = os.stat(self._file_name)
+ except EnvironmentError, err:
+ raise errors.ConfigurationError("Cannot stat config file %s: %s" %
+ (self._file_name, err))
+ inode = cfg_stat.st_ino
+ mtime = cfg_stat.st_mtime
+ size = cfg_stat.st_size
+
+ if (force or inode != self._last_inode or
+ mtime > self._last_mtime or
+ size != self._last_size):
+ self._last_inode = inode
+ self._last_mtime = mtime
+ self._last_size = size
+ else:
+ # Don't reload
+ return False
+
+ try:
self._config_data = serializer.Load(utils.ReadFile(self._file_name))
- except IOError, err:
+ except EnvironmentError, err:
raise errors.ConfigurationError("Cannot read config file %s: %s" %
(self._file_name, err))
except ValueError, err:
raise errors.ConfigurationError("Cannot load config file %s: %s" %
(self._file_name, err))
+ self._ip_to_inst_by_link = {}
+ self._instances_ips = []
+ self._inst_ips_by_link = {}
+ c_nparams = self._config_data['cluster']['nicparams'][constants.PP_DEFAULT]
+ for iname in self._config_data['instances']:
+ instance = self._config_data['instances'][iname]
+ for nic in instance['nics']:
+ if 'ip' in nic and nic['ip']:
+ params = objects.FillDict(c_nparams, nic['nicparams'])
+ if not params['link'] in self._inst_ips_by_link:
+ self._inst_ips_by_link[params['link']] = []
+ self._ip_to_inst_by_link[params['link']] = {}
+ self._ip_to_inst_by_link[params['link']][nic['ip']] = iname
+ self._inst_ips_by_link[params['link']].append(nic['ip'])
+
+ self._nodes_primary_ips = []
+ self._mc_primary_ips = []
+ for node_name in self._config_data["nodes"]:
+ node = self._config_data["nodes"][node_name]
+ self._nodes_primary_ips.append(node["primary_ip"])
+ if node["master_candidate"]:
+ self._mc_primary_ips.append(node["primary_ip"])
+
+ return True
+
+ # Clients can request a reload of the config file, so we export our internal
+ # _Load function as Reload.
+ Reload = _Load
+
def GetClusterName(self):
return self._config_data["cluster"]["cluster_name"]
def GetFileStorageDir(self):
return self._config_data["cluster"]["file_storage_dir"]
- def GetHypervisorType(self):
- return self._config_data["cluster"]["hypervisor"]
+ def GetSharedFileStorageDir(self):
+ return self._config_data["cluster"]["shared_file_storage_dir"]
def GetNodeList(self):
return self._config_data["nodes"].keys()
+ def GetConfigSerialNo(self):
+ return self._config_data["serial_no"]
+
+ def GetClusterSerialNo(self):
+ return self._config_data["cluster"]["serial_no"]
+
+ def GetDefaultNicParams(self):
+ return self._config_data["cluster"]["nicparams"][constants.PP_DEFAULT]
+
+ def GetDefaultNicLink(self):
+ return self.GetDefaultNicParams()[constants.NIC_LINK]
+
+ def GetNodeStatusFlags(self, node):
+ """Get a node's status flags
+
+ @type node: string
+ @param node: node name
+ @rtype: (bool, bool, bool)
+ @return: (master_candidate, drained, offline) (or None if no such node)
+
+ """
+ if node not in self._config_data["nodes"]:
+ return None
+
+ master_candidate = self._config_data["nodes"][node]["master_candidate"]
+ drained = self._config_data["nodes"][node]["drained"]
+ offline = self._config_data["nodes"][node]["offline"]
+ return master_candidate, drained, offline
+
+ def GetInstanceByLinkIp(self, ip, link):
+ """Get instance name from its link and ip address.
+
+ @type ip: string
+ @param ip: ip address
+ @type link: string
+ @param link: nic link
+ @rtype: string
+ @return: instance name
+
+ """
+ if not link:
+ link = self.GetDefaultNicLink()
+ if not link in self._ip_to_inst_by_link:
+ return None
+ if not ip in self._ip_to_inst_by_link[link]:
+ return None
+ return self._ip_to_inst_by_link[link][ip]
+
+ def GetNodePrimaryIp(self, node):
+ """Get a node's primary ip
+
+ @type node: string
+ @param node: node name
+ @rtype: string, or None
+ @return: node's primary ip, or None if no such node
+
+ """
+ if node not in self._config_data["nodes"]:
+ return None
+ return self._config_data["nodes"][node]["primary_ip"]
+
+ def GetInstancePrimaryNode(self, instance):
+ """Get an instance's primary node
+
+ @type instance: string
+ @param instance: instance name
+ @rtype: string, or None
+ @return: primary node, or None if no such instance
+
+ """
+ if instance not in self._config_data["instances"]:
+ return None
+ return self._config_data["instances"][instance]["primary_node"]
+
+ def GetNodesPrimaryIps(self):
+ return self._nodes_primary_ips
+
+ def GetMasterCandidatesPrimaryIps(self):
+ return self._mc_primary_ips
+
+ def GetInstancesIps(self, link):
+ """Get list of nic ips connected to a certain link.
+
+ @type link: string
+ @param link: nic link
+ @rtype: list
+ @return: list of ips connected to that link
+
+ """
+ if not link:
+ link = self.GetDefaultNicLink()
+
+ if link in self._inst_ips_by_link:
+ return self._inst_ips_by_link[link]
+ else:
+ return []
+
class SimpleStore(object):
"""Interface to static cluster data.
constants.SS_CLUSTER_NAME,
constants.SS_CLUSTER_TAGS,
constants.SS_FILE_STORAGE_DIR,
+ constants.SS_SHARED_FILE_STORAGE_DIR,
constants.SS_MASTER_CANDIDATES,
constants.SS_MASTER_CANDIDATES_IPS,
constants.SS_MASTER_IP,
constants.SS_NODE_SECONDARY_IPS,
constants.SS_OFFLINE_NODES,
constants.SS_ONLINE_NODES,
+ constants.SS_PRIMARY_IP_FAMILY,
constants.SS_INSTANCE_LIST,
constants.SS_RELEASE_VERSION,
+ constants.SS_HYPERVISOR_LIST,
+ constants.SS_MAINTAIN_NODE_HEALTH,
+ constants.SS_UID_POOL,
+ constants.SS_NODEGROUPS,
)
_MAX_SIZE = 131072
filename = self._cfg_dir + '/' + self._SS_FILEPREFIX + key
return filename
- def _ReadFile(self, key):
+ def _ReadFile(self, key, default=None):
"""Generic routine to read keys.
This will read the file which holds the value requested. Errors
try:
data = utils.ReadFile(filename, size=self._MAX_SIZE)
except EnvironmentError, err:
+ if err.errno == errno.ENOENT and default is not None:
+ return default
raise errors.ConfigurationError("Can't read from the ssconf file:"
" '%s'" % str(err))
data = data.rstrip('\n')
@param values: Dictionary of (name, value)
"""
- ssconf_lock = utils.FileLock(constants.SSCONF_LOCK_FILE)
+ ssconf_lock = utils.FileLock.Open(constants.SSCONF_LOCK_FILE)
# Get lock while writing files
ssconf_lock.Exclusive(blocking=True, timeout=SSCONF_LOCK_TIMEOUT)
for name, value in values.iteritems():
if value and not value.endswith("\n"):
value += "\n"
+ if len(value) > self._MAX_SIZE:
+ raise errors.ConfigurationError("ssconf file %s above maximum size" %
+ name)
utils.WriteFile(self.KeyToFilename(name), data=value, mode=0444)
finally:
ssconf_lock.Unlock()
"""
return self._ReadFile(constants.SS_FILE_STORAGE_DIR)
+ def GetSharedFileStorageDir(self):
+ """Get the shared file storage dir.
+
+ """
+ return self._ReadFile(constants.SS_SHARED_FILE_STORAGE_DIR)
+
def GetMasterCandidates(self):
"""Return the list of master candidates.
nl = data.splitlines(False)
return nl
+ def GetNodegroupList(self):
+ """Return the list of nodegroups.
+
+ """
+ data = self._ReadFile(constants.SS_NODEGROUPS)
+ nl = data.splitlines(False)
+ return nl
+
def GetClusterTags(self):
"""Return the cluster tags.
nl = data.splitlines(False)
return nl
+ def GetHypervisorList(self):
+ """Return the list of enabled hypervisors.
+
+ """
+ data = self._ReadFile(constants.SS_HYPERVISOR_LIST)
+ nl = data.splitlines(False)
+ return nl
+
+ def GetMaintainNodeHealth(self):
+ """Return the value of the maintain_node_health option.
+
+ """
+ data = self._ReadFile(constants.SS_MAINTAIN_NODE_HEALTH)
+ # we rely on the bool serialization here
+ return data == "True"
+
+ def GetUidPool(self):
+ """Return the user-id pool definition string.
+
+ The separator character is a newline.
+
+ The return value can be parsed using uidpool.ParseUidPool()::
+
+ ss = ssconf.SimpleStore()
+ uid_pool = uidpool.ParseUidPool(ss.GetUidPool(), separator="\\n")
+
+ """
+ data = self._ReadFile(constants.SS_UID_POOL)
+ return data
+
+ def GetPrimaryIPFamily(self):
+ """Return the cluster-wide primary address family.
+
+ """
+ try:
+ return int(self._ReadFile(constants.SS_PRIMARY_IP_FAMILY,
+ default=netutils.IP4Address.family))
+ except (ValueError, TypeError), err:
+ raise errors.ConfigurationError("Error while trying to parse primary ip"
+ " family: %s" % err)
+
def GetMasterAndMyself(ss=None):
"""Get the master node and my own hostname.
"""
if ss is None:
ss = SimpleStore()
- return ss.GetMasterNode(), utils.HostInfo().name
+ return ss.GetMasterNode(), netutils.Hostname.GetSysName()
def CheckMaster(debug, ss=None):
if debug:
sys.stderr.write("Not master, exiting.\n")
sys.exit(constants.EXIT_NOTMASTER)
-
-
-def CheckMasterCandidate(debug, ss=None):
- """Checks the node setup.
-
- If this is a master candidate, the function will return. Otherwise it will
- exit with an exit code based on the node status.
-
- """
- try:
- if ss is None:
- ss = SimpleStore()
- myself = utils.HostInfo().name
- candidates = ss.GetMasterCandidates()
- except errors.ConfigurationError, err:
- print "Cluster configuration incomplete: '%s'" % str(err)
- sys.exit(constants.EXIT_NODESETUP_ERROR)
- except errors.ResolverError, err:
- sys.stderr.write("Cannot resolve my own name (%s)\n" % err.args[0])
- sys.exit(constants.EXIT_NODESETUP_ERROR)
-
- if myself not in candidates:
- if debug:
- sys.stderr.write("Not master candidate, exiting.\n")
- sys.exit(constants.EXIT_NOTCANDIDATE)
-