code.grnet.gr Git - ganeti-local/blob - lib/utils.py

   1 #
   2 #
   3
   4 # Copyright (C) 2006, 2007 Google Inc.
   5 #
   6 # This program is free software; you can redistribute it and/or modify
   7 # it under the terms of the GNU General Public License as published by
   8 # the Free Software Foundation; either version 2 of the License, or
   9 # (at your option) any later version.
  10 #
  11 # This program is distributed in the hope that it will be useful, but
  12 # WITHOUT ANY WARRANTY; without even the implied warranty of
  13 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  14 # General Public License for more details.
  15 #
  16 # You should have received a copy of the GNU General Public License
  17 # along with this program; if not, write to the Free Software
  18 # Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
  19 # 02110-1301, USA.
  20
  21
  22 """Ganeti utility module.
  23
  24 This module holds functions that can be used in both daemons (all) and
  25 the command line scripts.
  26
  27 """
  28
  29
  30 import os
  31 import time
  32 import subprocess
  33 import re
  34 import socket
  35 import tempfile
  36 import shutil
  37 import errno
  38 import pwd
  39 import itertools
  40 import select
  41 import fcntl
  42 import resource
  43 import logging
  44 import signal
  45
  46 from cStringIO import StringIO
  47
  48 try:
  49   from hashlib import sha1
  50 except ImportError:
  51   import sha
  52   sha1 = sha.new
  53
  54 from ganeti import errors
  55 from ganeti import constants
  56
  57
  58 _locksheld = []
  59 _re_shell_unquoted = re.compile('^[-.,=:/_+@A-Za-z0-9]+$')
  60
  61 debug_locks = False
  62
  63 #: when set to True, L{RunCmd} is disabled
  64 no_fork = False
  65
  66
  67 class RunResult(object):
  68   """Holds the result of running external programs.
  69
  70   @type exit_code: int
  71   @ivar exit_code: the exit code of the program, or None (if the program
  72       didn't exit())
  73   @type signal: int or None
  74   @ivar signal: the signal that caused the program to finish, or None
  75       (if the program wasn't terminated by a signal)
  76   @type stdout: str
  77   @ivar stdout: the standard output of the program
  78   @type stderr: str
  79   @ivar stderr: the standard error of the program
  80   @type failed: boolean
  81   @ivar failed: True in case the program was
  82       terminated by a signal or exited with a non-zero exit code
  83   @ivar fail_reason: a string detailing the termination reason
  84
  85   """
  86   __slots__ = ["exit_code", "signal", "stdout", "stderr",
  87                "failed", "fail_reason", "cmd"]
  88
  89
  90   def __init__(self, exit_code, signal_, stdout, stderr, cmd):
  91     self.cmd = cmd
  92     self.exit_code = exit_code
  93     self.signal = signal_
  94     self.stdout = stdout
  95     self.stderr = stderr
  96     self.failed = (signal_ is not None or exit_code != 0)
  97
  98     if self.signal is not None:
  99       self.fail_reason = "terminated by signal %s" % self.signal
 100     elif self.exit_code is not None:
 101       self.fail_reason = "exited with exit code %s" % self.exit_code
 102     else:
 103       self.fail_reason = "unable to determine termination reason"
 104
 105     if self.failed:
 106       logging.debug("Command '%s' failed (%s); output: %s",
 107                     self.cmd, self.fail_reason, self.output)
 108
 109   def _GetOutput(self):
 110     """Returns the combined stdout and stderr for easier usage.
 111
 112     """
 113     return self.stdout + self.stderr
 114
 115   output = property(_GetOutput, None, None, "Return full output")
 116
 117
 118 def RunCmd(cmd, env=None, output=None, cwd='/'):
 119   """Execute a (shell) command.
 120
 121   The command should not read from its standard input, as it will be
 122   closed.
 123
 124   @type  cmd: string or list
 125   @param cmd: Command to run
 126   @type env: dict
 127   @param env: Additional environment
 128   @type output: str
 129   @param output: if desired, the output of the command can be
 130       saved in a file instead of the RunResult instance; this
 131       parameter denotes the file name (if not None)
 132   @type cwd: string
 133   @param cwd: if specified, will be used as the working
 134       directory for the command; the default will be /
 135   @rtype: L{RunResult}
 136   @return: RunResult instance
 137   @raise errors.ProgrammerError: if we call this when forks are disabled
 138
 139   """
 140   if no_fork:
 141     raise errors.ProgrammerError("utils.RunCmd() called with fork() disabled")
 142
 143   if isinstance(cmd, list):
 144     cmd = [str(val) for val in cmd]
 145     strcmd = " ".join(cmd)
 146     shell = False
 147   else:
 148     strcmd = cmd
 149     shell = True
 150   logging.debug("RunCmd '%s'", strcmd)
 151
 152   cmd_env = os.environ.copy()
 153   cmd_env["LC_ALL"] = "C"
 154   if env is not None:
 155     cmd_env.update(env)
 156
 157   try:
 158     if output is None:
 159       out, err, status = _RunCmdPipe(cmd, cmd_env, shell, cwd)
 160     else:
 161       status = _RunCmdFile(cmd, cmd_env, shell, output, cwd)
 162       out = err = ""
 163   except OSError, err:
 164     if err.errno == errno.ENOENT:
 165       raise errors.OpExecError("Can't execute '%s': not found (%s)" %
 166                                (strcmd, err))
 167     else:
 168       raise
 169
 170   if status >= 0:
 171     exitcode = status
 172     signal_ = None
 173   else:
 174     exitcode = None
 175     signal_ = -status
 176
 177   return RunResult(exitcode, signal_, out, err, strcmd)
 178
 179
def _RunCmdPipe(cmd, env, via_shell, cwd):
  """Run a command and return its output.

  The child's stdout and stderr are read through non-blocking pipes
  multiplexed with poll(), so both streams are drained concurrently;
  its stdin is closed immediately.

  @type  cmd: string or list
  @param cmd: Command to run
  @type env: dict
  @param env: The environment to use
  @type via_shell: bool
  @param via_shell: if we should run via the shell
  @type cwd: string
  @param cwd: the working directory for the program
  @rtype: tuple
  @return: (out, err, status), where status is the value returned by
      the child's wait()

  """
  poller = select.poll()
  child = subprocess.Popen(cmd, shell=via_shell,
                           stderr=subprocess.PIPE,
                           stdout=subprocess.PIPE,
                           stdin=subprocess.PIPE,
                           close_fds=True, env=env,
                           cwd=cwd)

  # the command is not supposed to read anything from us
  child.stdin.close()
  poller.register(child.stdout, select.POLLIN)
  poller.register(child.stderr, select.POLLIN)
  out = StringIO()
  err = StringIO()
  # maps each pipe's file descriptor to (collecting buffer, file object);
  # entries are dropped once the corresponding pipe is finished
  fdmap = {
    child.stdout.fileno(): (out, child.stdout),
    child.stderr.fileno(): (err, child.stderr),
    }
  for fd in fdmap:
    # 'status' holds the descriptor flags here; it is reused for the exit
    # status at the end of the function
    status = fcntl.fcntl(fd, fcntl.F_GETFL)
    fcntl.fcntl(fd, fcntl.F_SETFL, status | os.O_NONBLOCK)

  # loop until both pipes have been unregistered
  while fdmap:
    try:
      pollresult = poller.poll()
    except EnvironmentError, eerr:
      # an interrupted poll is simply retried
      if eerr.errno == errno.EINTR:
        continue
      raise
    except select.error, serr:
      if serr[0] == errno.EINTR:
        continue
      raise

    for fd, event in pollresult:
      if event & select.POLLIN or event & select.POLLPRI:
        data = fdmap[fd][1].read()
        # no data from read signifies EOF (the same as POLLHUP)
        if not data:
          poller.unregister(fd)
          del fdmap[fd]
          continue
        fdmap[fd][0].write(data)
      # error/hangup conditions end the handling of this descriptor
      if (event & select.POLLNVAL or event & select.POLLHUP or
          event & select.POLLERR):
        poller.unregister(fd)
        del fdmap[fd]

  out = out.getvalue()
  err = err.getvalue()

  status = child.wait()
  return out, err, status
 247
 248
 249 def _RunCmdFile(cmd, env, via_shell, output, cwd):
 250   """Run a command and save its output to a file.
 251
 252   @type  cmd: string or list
 253   @param cmd: Command to run
 254   @type env: dict
 255   @param env: The environment to use
 256   @type via_shell: bool
 257   @param via_shell: if we should run via the shell
 258   @type output: str
 259   @param output: the filename in which to save the output
 260   @type cwd: string
 261   @param cwd: the working directory for the program
 262   @rtype: int
 263   @return: the exit status
 264
 265   """
 266   fh = open(output, "a")
 267   try:
 268     child = subprocess.Popen(cmd, shell=via_shell,
 269                              stderr=subprocess.STDOUT,
 270                              stdout=fh,
 271                              stdin=subprocess.PIPE,
 272                              close_fds=True, env=env,
 273                              cwd=cwd)
 274
 275     child.stdin.close()
 276     status = child.wait()
 277   finally:
 278     fh.close()
 279   return status
 280
 281
 282 def RemoveFile(filename):
 283   """Remove a file ignoring some errors.
 284
 285   Remove a file, ignoring non-existing ones or directories. Other
 286   errors are passed.
 287
 288   @type filename: str
 289   @param filename: the file to be removed
 290
 291   """
 292   try:
 293     os.unlink(filename)
 294   except OSError, err:
 295     if err.errno not in (errno.ENOENT, errno.EISDIR):
 296       raise
 297
 298
 299 def RenameFile(old, new, mkdir=False, mkdir_mode=0750):
 300   """Renames a file.
 301
 302   @type old: string
 303   @param old: Original path
 304   @type new: string
 305   @param new: New path
 306   @type mkdir: bool
 307   @param mkdir: Whether to create target directory if it doesn't exist
 308   @type mkdir_mode: int
 309   @param mkdir_mode: Mode for newly created directories
 310
 311   """
 312   try:
 313     return os.rename(old, new)
 314   except OSError, err:
 315     # In at least one use case of this function, the job queue, directory
 316     # creation is very rare. Checking for the directory before renaming is not
 317     # as efficient.
 318     if mkdir and err.errno == errno.ENOENT:
 319       # Create directory and try again
 320       os.makedirs(os.path.dirname(new), mkdir_mode)
 321       return os.rename(old, new)
 322     raise
 323
 324
 325 def _FingerprintFile(filename):
 326   """Compute the fingerprint of a file.
 327
 328   If the file does not exist, a None will be returned
 329   instead.
 330
 331   @type filename: str
 332   @param filename: the filename to checksum
 333   @rtype: str
 334   @return: the hex digest of the sha checksum of the contents
 335       of the file
 336
 337   """
 338   if not (os.path.exists(filename) and os.path.isfile(filename)):
 339     return None
 340
 341   f = open(filename)
 342
 343   fp = sha1()
 344   while True:
 345     data = f.read(4096)
 346     if not data:
 347       break
 348
 349     fp.update(data)
 350
 351   return fp.hexdigest()
 352
 353
 354 def FingerprintFiles(files):
 355   """Compute fingerprints for a list of files.
 356
 357   @type files: list
 358   @param files: the list of filename to fingerprint
 359   @rtype: dict
 360   @return: a dictionary filename: fingerprint, holding only
 361       existing files
 362
 363   """
 364   ret = {}
 365
 366   for filename in files:
 367     cksum = _FingerprintFile(filename)
 368     if cksum:
 369       ret[filename] = cksum
 370
 371   return ret
 372
 373
 374 def ForceDictType(target, key_types, allowed_values=None):
 375   """Force the values of a dict to have certain types.
 376
 377   @type target: dict
 378   @param target: the dict to update
 379   @type key_types: dict
 380   @param key_types: dict mapping target dict keys to types
 381                     in constants.ENFORCEABLE_TYPES
 382   @type allowed_values: list
 383   @keyword allowed_values: list of specially allowed values
 384
 385   """
 386   if allowed_values is None:
 387     allowed_values = []
 388
 389   if not isinstance(target, dict):
 390     msg = "Expected dictionary, got '%s'" % target
 391     raise errors.TypeEnforcementError(msg)
 392
 393   for key in target:
 394     if key not in key_types:
 395       msg = "Unknown key '%s'" % key
 396       raise errors.TypeEnforcementError(msg)
 397
 398     if target[key] in allowed_values:
 399       continue
 400
 401     ktype = key_types[key]
 402     if ktype not in constants.ENFORCEABLE_TYPES:
 403       msg = "'%s' has non-enforceable type %s" % (key, ktype)
 404       raise errors.ProgrammerError(msg)
 405
 406     if ktype == constants.VTYPE_STRING:
 407       if not isinstance(target[key], basestring):
 408         if isinstance(target[key], bool) and not target[key]:
 409           target[key] = ''
 410         else:
 411           msg = "'%s' (value %s) is not a valid string" % (key, target[key])
 412           raise errors.TypeEnforcementError(msg)
 413     elif ktype == constants.VTYPE_BOOL:
 414       if isinstance(target[key], basestring) and target[key]:
 415         if target[key].lower() == constants.VALUE_FALSE:
 416           target[key] = False
 417         elif target[key].lower() == constants.VALUE_TRUE:
 418           target[key] = True
 419         else:
 420           msg = "'%s' (value %s) is not a valid boolean" % (key, target[key])
 421           raise errors.TypeEnforcementError(msg)
 422       elif target[key]:
 423         target[key] = True
 424       else:
 425         target[key] = False
 426     elif ktype == constants.VTYPE_SIZE:
 427       try:
 428         target[key] = ParseUnit(target[key])
 429       except errors.UnitParseError, err:
 430         msg = "'%s' (value %s) is not a valid size. error: %s" % \
 431               (key, target[key], err)
 432         raise errors.TypeEnforcementError(msg)
 433     elif ktype == constants.VTYPE_INT:
 434       try:
 435         target[key] = int(target[key])
 436       except (ValueError, TypeError):
 437         msg = "'%s' (value %s) is not a valid integer" % (key, target[key])
 438         raise errors.TypeEnforcementError(msg)
 439
 440
 441 def IsProcessAlive(pid):
 442   """Check if a given pid exists on the system.
 443
 444   @note: zombie status is not handled, so zombie processes
 445       will be returned as alive
 446   @type pid: int
 447   @param pid: the process ID to check
 448   @rtype: boolean
 449   @return: True if the process exists
 450
 451   """
 452   if pid <= 0:
 453     return False
 454
 455   try:
 456     os.stat("/proc/%d/status" % pid)
 457     return True
 458   except EnvironmentError, err:
 459     if err.errno in (errno.ENOENT, errno.ENOTDIR):
 460       return False
 461     raise
 462
 463
 464 def ReadPidFile(pidfile):
 465   """Read a pid from a file.
 466
 467   @type  pidfile: string
 468   @param pidfile: path to the file containing the pid
 469   @rtype: int
 470   @return: The process id, if the file exists and contains a valid PID,
 471            otherwise 0
 472
 473   """
 474   try:
 475     pf = open(pidfile, 'r')
 476   except EnvironmentError, err:
 477     if err.errno != errno.ENOENT:
 478       logging.exception("Can't read pid file?!")
 479     return 0
 480
 481   try:
 482     pid = int(pf.read())
 483   except ValueError, err:
 484     logging.info("Can't parse pid file contents", exc_info=True)
 485     return 0
 486
 487   return pid
 488
 489
 490 def MatchNameComponent(key, name_list):
 491   """Try to match a name against a list.
 492
 493   This function will try to match a name like test1 against a list
 494   like C{['test1.example.com', 'test2.example.com', ...]}. Against
 495   this list, I{'test1'} as well as I{'test1.example'} will match, but
 496   not I{'test1.ex'}. A multiple match will be considered as no match
 497   at all (e.g. I{'test1'} against C{['test1.example.com',
 498   'test1.example.org']}).
 499
 500   @type key: str
 501   @param key: the name to be searched
 502   @type name_list: list
 503   @param name_list: the list of strings against which to search the key
 504
 505   @rtype: None or str
 506   @return: None if there is no match I{or} if there are multiple matches,
 507       otherwise the element from the list which matches
 508
 509   """
 510   mo = re.compile("^%s(\..*)?$" % re.escape(key))
 511   names_filtered = [name for name in name_list if mo.match(name) is not None]
 512   if len(names_filtered) != 1:
 513     return None
 514   return names_filtered[0]
 515
 516
 517 class HostInfo:
 518   """Class implementing resolver and hostname functionality
 519
 520   """
 521   def __init__(self, name=None):
 522     """Initialize the host name object.
 523
 524     If the name argument is not passed, it will use this system's
 525     name.
 526
 527     """
 528     if name is None:
 529       name = self.SysName()
 530
 531     self.query = name
 532     self.name, self.aliases, self.ipaddrs = self.LookupHostname(name)
 533     self.ip = self.ipaddrs[0]
 534
 535   def ShortName(self):
 536     """Returns the hostname without domain.
 537
 538     """
 539     return self.name.split('.')[0]
 540
 541   @staticmethod
 542   def SysName():
 543     """Return the current system's name.
 544
 545     This is simply a wrapper over C{socket.gethostname()}.
 546
 547     """
 548     return socket.gethostname()
 549
 550   @staticmethod
 551   def LookupHostname(hostname):
 552     """Look up hostname
 553
 554     @type hostname: str
 555     @param hostname: hostname to look up
 556
 557     @rtype: tuple
 558     @return: a tuple (name, aliases, ipaddrs) as returned by
 559         C{socket.gethostbyname_ex}
 560     @raise errors.ResolverError: in case of errors in resolving
 561
 562     """
 563     try:
 564       result = socket.gethostbyname_ex(hostname)
 565     except socket.gaierror, err:
 566       # hostname not found in DNS
 567       raise errors.ResolverError(hostname, err.args[0], err.args[1])
 568
 569     return result
 570
 571
 572 def ListVolumeGroups():
 573   """List volume groups and their size
 574
 575   @rtype: dict
 576   @return:
 577        Dictionary with keys volume name and values
 578        the size of the volume
 579
 580   """
 581   command = "vgs --noheadings --units m --nosuffix -o name,size"
 582   result = RunCmd(command)
 583   retval = {}
 584   if result.failed:
 585     return retval
 586
 587   for line in result.stdout.splitlines():
 588     try:
 589       name, size = line.split()
 590       size = int(float(size))
 591     except (IndexError, ValueError), err:
 592       logging.error("Invalid output from vgs (%s): %s", err, line)
 593       continue
 594
 595     retval[name] = size
 596
 597   return retval
 598
 599
 600 def BridgeExists(bridge):
 601   """Check whether the given bridge exists in the system
 602
 603   @type bridge: str
 604   @param bridge: the bridge name to check
 605   @rtype: boolean
 606   @return: True if it does
 607
 608   """
 609   return os.path.isdir("/sys/class/net/%s/bridge" % bridge)
 610
 611
 612 def NiceSort(name_list):
 613   """Sort a list of strings based on digit and non-digit groupings.
 614
 615   Given a list of names C{['a1', 'a10', 'a11', 'a2']} this function
 616   will sort the list in the logical order C{['a1', 'a2', 'a10',
 617   'a11']}.
 618
 619   The sort algorithm breaks each name in groups of either only-digits
 620   or no-digits. Only the first eight such groups are considered, and
 621   after that we just use what's left of the string.
 622
 623   @type name_list: list
 624   @param name_list: the names to be sorted
 625   @rtype: list
 626   @return: a copy of the name list sorted with our algorithm
 627
 628   """
 629   _SORTER_BASE = "(\D+|\d+)"
 630   _SORTER_FULL = "^%s%s?%s?%s?%s?%s?%s?%s?.*$" % (_SORTER_BASE, _SORTER_BASE,
 631                                                   _SORTER_BASE, _SORTER_BASE,
 632                                                   _SORTER_BASE, _SORTER_BASE,
 633                                                   _SORTER_BASE, _SORTER_BASE)
 634   _SORTER_RE = re.compile(_SORTER_FULL)
 635   _SORTER_NODIGIT = re.compile("^\D*$")
 636   def _TryInt(val):
 637     """Attempts to convert a variable to integer."""
 638     if val is None or _SORTER_NODIGIT.match(val):
 639       return val
 640     rval = int(val)
 641     return rval
 642
 643   to_sort = [([_TryInt(grp) for grp in _SORTER_RE.match(name).groups()], name)
 644              for name in name_list]
 645   to_sort.sort()
 646   return [tup[1] for tup in to_sort]
 647
 648
 649 def TryConvert(fn, val):
 650   """Try to convert a value ignoring errors.
 651
 652   This function tries to apply function I{fn} to I{val}. If no
 653   C{ValueError} or C{TypeError} exceptions are raised, it will return
 654   the result, else it will return the original value. Any other
 655   exceptions are propagated to the caller.
 656
 657   @type fn: callable
 658   @param fn: function to apply to the value
 659   @param val: the value to be converted
 660   @return: The converted value if the conversion was successful,
 661       otherwise the original value.
 662
 663   """
 664   try:
 665     nv = fn(val)
 666   except (ValueError, TypeError):
 667     nv = val
 668   return nv
 669
 670
 671 def IsValidIP(ip):
 672   """Verifies the syntax of an IPv4 address.
 673
 674   This function checks if the IPv4 address passes is valid or not based
 675   on syntax (not IP range, class calculations, etc.).
 676
 677   @type ip: str
 678   @param ip: the address to be checked
 679   @rtype: a regular expression match object
 680   @return: a regular expression match object, or None if the
 681       address is not valid
 682
 683   """
 684   unit = "(0|[1-9]\d{0,2})"
 685   #TODO: convert and return only boolean
 686   return re.match("^%s\.%s\.%s\.%s$" % (unit, unit, unit, unit), ip)
 687
 688
 689 def IsValidShellParam(word):
 690   """Verifies is the given word is safe from the shell's p.o.v.
 691
 692   This means that we can pass this to a command via the shell and be
 693   sure that it doesn't alter the command line and is passed as such to
 694   the actual command.
 695
 696   Note that we are overly restrictive here, in order to be on the safe
 697   side.
 698
 699   @type word: str
 700   @param word: the word to check
 701   @rtype: boolean
 702   @return: True if the word is 'safe'
 703
 704   """
 705   return bool(re.match("^[-a-zA-Z0-9._+/:%@]+$", word))
 706
 707
 708 def BuildShellCmd(template, *args):
 709   """Build a safe shell command line from the given arguments.
 710
 711   This function will check all arguments in the args list so that they
 712   are valid shell parameters (i.e. they don't contain shell
 713   metacharacters). If everything is ok, it will return the result of
 714   template % args.
 715
 716   @type template: str
 717   @param template: the string holding the template for the
 718       string formatting
 719   @rtype: str
 720   @return: the expanded command line
 721
 722   """
 723   for word in args:
 724     if not IsValidShellParam(word):
 725       raise errors.ProgrammerError("Shell argument '%s' contains"
 726                                    " invalid characters" % word)
 727   return template % args
 728
 729
 730 def FormatUnit(value, units):
 731   """Formats an incoming number of MiB with the appropriate unit.
 732
 733   @type value: int
 734   @param value: integer representing the value in MiB (1048576)
 735   @type units: char
 736   @param units: the type of formatting we should do:
 737       - 'h' for automatic scaling
 738       - 'm' for MiBs
 739       - 'g' for GiBs
 740       - 't' for TiBs
 741   @rtype: str
 742   @return: the formatted value (with suffix)
 743
 744   """
 745   if units not in ('m', 'g', 't', 'h'):
 746     raise errors.ProgrammerError("Invalid unit specified '%s'" % str(units))
 747
 748   suffix = ''
 749
 750   if units == 'm' or (units == 'h' and value < 1024):
 751     if units == 'h':
 752       suffix = 'M'
 753     return "%d%s" % (round(value, 0), suffix)
 754
 755   elif units == 'g' or (units == 'h' and value < (1024 * 1024)):
 756     if units == 'h':
 757       suffix = 'G'
 758     return "%0.1f%s" % (round(float(value) / 1024, 1), suffix)
 759
 760   else:
 761     if units == 'h':
 762       suffix = 'T'
 763     return "%0.1f%s" % (round(float(value) / 1024 / 1024, 1), suffix)
 764
 765
 766 def ParseUnit(input_string):
 767   """Tries to extract number and scale from the given string.
 768
 769   Input must be in the format C{NUMBER+ [DOT NUMBER+] SPACE*
 770   [UNIT]}. If no unit is specified, it defaults to MiB. Return value
 771   is always an int in MiB.
 772
 773   """
 774   m = re.match('^([.\d]+)\s*([a-zA-Z]+)?$', str(input_string))
 775   if not m:
 776     raise errors.UnitParseError("Invalid format")
 777
 778   value = float(m.groups()[0])
 779
 780   unit = m.groups()[1]
 781   if unit:
 782     lcunit = unit.lower()
 783   else:
 784     lcunit = 'm'
 785
 786   if lcunit in ('m', 'mb', 'mib'):
 787     # Value already in MiB
 788     pass
 789
 790   elif lcunit in ('g', 'gb', 'gib'):
 791     value *= 1024
 792
 793   elif lcunit in ('t', 'tb', 'tib'):
 794     value *= 1024 * 1024
 795
 796   else:
 797     raise errors.UnitParseError("Unknown unit: %s" % unit)
 798
 799   # Make sure we round up
 800   if int(value) < value:
 801     value += 1
 802
 803   # Round up to the next multiple of 4
 804   value = int(value)
 805   if value % 4:
 806     value += 4 - value % 4
 807
 808   return value
 809
 810
 811 def AddAuthorizedKey(file_name, key):
 812   """Adds an SSH public key to an authorized_keys file.
 813
 814   @type file_name: str
 815   @param file_name: path to authorized_keys file
 816   @type key: str
 817   @param key: string containing key
 818
 819   """
 820   key_fields = key.split()
 821
 822   f = open(file_name, 'a+')
 823   try:
 824     nl = True
 825     for line in f:
 826       # Ignore whitespace changes
 827       if line.split() == key_fields:
 828         break
 829       nl = line.endswith('\n')
 830     else:
 831       if not nl:
 832         f.write("\n")
 833       f.write(key.rstrip('\r\n'))
 834       f.write("\n")
 835       f.flush()
 836   finally:
 837     f.close()
 838
 839
 840 def RemoveAuthorizedKey(file_name, key):
 841   """Removes an SSH public key from an authorized_keys file.
 842
 843   @type file_name: str
 844   @param file_name: path to authorized_keys file
 845   @type key: str
 846   @param key: string containing key
 847
 848   """
 849   key_fields = key.split()
 850
 851   fd, tmpname = tempfile.mkstemp(dir=os.path.dirname(file_name))
 852   try:
 853     out = os.fdopen(fd, 'w')
 854     try:
 855       f = open(file_name, 'r')
 856       try:
 857         for line in f:
 858           # Ignore whitespace changes while comparing lines
 859           if line.split() != key_fields:
 860             out.write(line)
 861
 862         out.flush()
 863         os.rename(tmpname, file_name)
 864       finally:
 865         f.close()
 866     finally:
 867       out.close()
 868   except:
 869     RemoveFile(tmpname)
 870     raise
 871
 872
 873 def SetEtcHostsEntry(file_name, ip, hostname, aliases):
 874   """Sets the name of an IP address and hostname in /etc/hosts.
 875
 876   @type file_name: str
 877   @param file_name: path to the file to modify (usually C{/etc/hosts})
 878   @type ip: str
 879   @param ip: the IP address
 880   @type hostname: str
 881   @param hostname: the hostname to be added
 882   @type aliases: list
 883   @param aliases: the list of aliases to add for the hostname
 884
 885   """
 886   # FIXME: use WriteFile + fn rather than duplicating its efforts
 887   # Ensure aliases are unique
 888   aliases = UniqueSequence([hostname] + aliases)[1:]
 889
 890   fd, tmpname = tempfile.mkstemp(dir=os.path.dirname(file_name))
 891   try:
 892     out = os.fdopen(fd, 'w')
 893     try:
 894       f = open(file_name, 'r')
 895       try:
 896         for line in f:
 897           fields = line.split()
 898           if fields and not fields[0].startswith('#') and ip == fields[0]:
 899             continue
 900           out.write(line)
 901
 902         out.write("%s\t%s" % (ip, hostname))
 903         if aliases:
 904           out.write(" %s" % ' '.join(aliases))
 905         out.write('\n')
 906
 907         out.flush()
 908         os.fsync(out)
 909         os.chmod(tmpname, 0644)
 910         os.rename(tmpname, file_name)
 911       finally:
 912         f.close()
 913     finally:
 914       out.close()
 915   except:
 916     RemoveFile(tmpname)
 917     raise
 918
 919
 920 def AddHostToEtcHosts(hostname):
 921   """Wrapper around SetEtcHostsEntry.
 922
 923   @type hostname: str
 924   @param hostname: a hostname that will be resolved and added to
 925       L{constants.ETC_HOSTS}
 926
 927   """
 928   hi = HostInfo(name=hostname)
 929   SetEtcHostsEntry(constants.ETC_HOSTS, hi.ip, hi.name, [hi.ShortName()])
 930
 931
 932 def RemoveEtcHostsEntry(file_name, hostname):
 933   """Removes a hostname from /etc/hosts.
 934
 935   IP addresses without names are removed from the file.
 936
 937   @type file_name: str
 938   @param file_name: path to the file to modify (usually C{/etc/hosts})
 939   @type hostname: str
 940   @param hostname: the hostname to be removed
 941
 942   """
 943   # FIXME: use WriteFile + fn rather than duplicating its efforts
 944   fd, tmpname = tempfile.mkstemp(dir=os.path.dirname(file_name))
 945   try:
 946     out = os.fdopen(fd, 'w')
 947     try:
 948       f = open(file_name, 'r')
 949       try:
 950         for line in f:
 951           fields = line.split()
 952           if len(fields) > 1 and not fields[0].startswith('#'):
 953             names = fields[1:]
 954             if hostname in names:
 955               while hostname in names:
 956                 names.remove(hostname)
 957               if names:
 958                 out.write("%s %s\n" % (fields[0], ' '.join(names)))
 959               continue
 960
 961           out.write(line)
 962
 963         out.flush()
 964         os.fsync(out)
 965         os.chmod(tmpname, 0644)
 966         os.rename(tmpname, file_name)
 967       finally:
 968         f.close()
 969     finally:
 970       out.close()
 971   except:
 972     RemoveFile(tmpname)
 973     raise
 974
 975
 976 def RemoveHostFromEtcHosts(hostname):
 977   """Wrapper around RemoveEtcHostsEntry.
 978
 979   @type hostname: str
 980   @param hostname: hostname that will be resolved and its
 981       full and shot name will be removed from
 982       L{constants.ETC_HOSTS}
 983
 984   """
 985   hi = HostInfo(name=hostname)
 986   RemoveEtcHostsEntry(constants.ETC_HOSTS, hi.name)
 987   RemoveEtcHostsEntry(constants.ETC_HOSTS, hi.ShortName())
 988
 989
 990 def CreateBackup(file_name):
 991   """Creates a backup of a file.
 992
 993   @type file_name: str
 994   @param file_name: file to be backed up
 995   @rtype: str
 996   @return: the path to the newly created backup
 997   @raise errors.ProgrammerError: for invalid file names
 998
 999   """
1000   if not os.path.isfile(file_name):
1001     raise errors.ProgrammerError("Can't make a backup of a non-file '%s'" %
1002                                 file_name)
1003
1004   prefix = '%s.backup-%d.' % (os.path.basename(file_name), int(time.time()))
1005   dir_name = os.path.dirname(file_name)
1006
1007   fsrc = open(file_name, 'rb')
1008   try:
1009     (fd, backup_name) = tempfile.mkstemp(prefix=prefix, dir=dir_name)
1010     fdst = os.fdopen(fd, 'wb')
1011     try:
1012       shutil.copyfileobj(fsrc, fdst)
1013     finally:
1014       fdst.close()
1015   finally:
1016     fsrc.close()
1017
1018   return backup_name
1019
1020
def ShellQuote(value):
  """Quotes shell argument according to POSIX.

  Values accepted by the module-level C{_re_shell_unquoted} pattern
  are returned unchanged; everything else is wrapped in single quotes,
  with embedded single quotes escaped.

  @type value: str
  @param value: the argument to be quoted
  @rtype: str
  @return: the quoted value

  """
  if not _re_shell_unquoted.match(value):
    return "'%s'" % value.replace("'", "'\\''")
  return value
1034
1035
def ShellQuoteArgs(args):
  """Quotes each argument for the shell and joins the results.

  @type args: list
  @param args: list of arguments to be quoted
  @rtype: str
  @return: the individually quoted arguments, separated by single spaces

  """
  quoted = []
  for arg in args:
    quoted.append(ShellQuote(arg))
  return ' '.join(quoted)
1046
1047
1048 def TcpPing(target, port, timeout=10, live_port_needed=False, source=None):
1049   """Simple ping implementation using TCP connect(2).
1050
1051   Check if the given IP is reachable by doing attempting a TCP connect
1052   to it.
1053
1054   @type target: str
1055   @param target: the IP or hostname to ping
1056   @type port: int
1057   @param port: the port to connect to
1058   @type timeout: int
1059   @param timeout: the timeout on the connection attempt
1060   @type live_port_needed: boolean
1061   @param live_port_needed: whether a closed port will cause the
1062       function to return failure, as if there was a timeout
1063   @type source: str or None
1064   @param source: if specified, will cause the connect to be made
1065       from this specific source address; failures to bind other
1066       than C{EADDRNOTAVAIL} will be ignored
1067
1068   """
1069   sock = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
1070
1071   success = False
1072
1073   if source is not None:
1074     try:
1075       sock.bind((source, 0))
1076     except socket.error, (errcode, _):
1077       if errcode == errno.EADDRNOTAVAIL:
1078         success = False
1079
1080   sock.settimeout(timeout)
1081
1082   try:
1083     sock.connect((target, port))
1084     sock.close()
1085     success = True
1086   except socket.timeout:
1087     success = False
1088   except socket.error, (errcode, errstring):
1089     success = (not live_port_needed) and (errcode == errno.ECONNREFUSED)
1090
1091   return success
1092
1093
def OwnIpAddress(address):
  """Check if the current host has the given IP address.

  Currently this is done by TCP-pinging the address (on the default
  node daemon port) from the loopback address.

  @type address: string
  @param address: the address to check
  @rtype: bool
  @return: True if we own the address

  """
  loopback = constants.LOCALHOST_IP_ADDRESS
  noded_port = constants.DEFAULT_NODED_PORT
  return TcpPing(address, noded_port, source=loopback)
1108
1109
def ListVisibleFiles(path):
  """Returns the sorted names of the visible entries of a directory.

  @type path: str
  @param path: the directory to enumerate
  @rtype: list
  @return: the sorted list of all entries not starting with a dot

  """
  visible = []
  for entry in os.listdir(path):
    if entry.startswith("."):
      continue
    visible.append(entry)
  visible.sort()
  return visible
1122
1123
def GetHomeDir(user, default=None):
  """Try to get the homedir of the given user.

  The user can be passed either as a string (denoting the name) or as
  an integer (denoting the user id). If the user is not found, the
  'default' argument is returned, which defaults to None.

  @param user: user name (string) or user id (integer)
  @param default: value returned when the user doesn't exist
  @return: the home directory from the password database, or default
  @raise errors.ProgrammerError: if user is neither a string nor an
      integer

  """
  # Choose the password database lookup matching the argument type
  if isinstance(user, basestring):
    lookup = pwd.getpwnam
  elif isinstance(user, (int, long)):
    lookup = pwd.getpwuid
  else:
    raise errors.ProgrammerError("Invalid type passed to GetHomeDir (%s)" %
                                 type(user))

  try:
    entry = lookup(user)
  except KeyError:
    return default
  return entry.pw_dir
1143
1144
def NewUUID():
  """Returns a random UUID.

  @note: This is a Linux-specific method as it uses the /proc
      filesystem.
  @rtype: str
  @return: the content read from C{/proc/sys/kernel/random/uuid},
      without trailing newlines

  """
  uuid_file = open("/proc/sys/kernel/random/uuid", "r")
  try:
    raw = uuid_file.read(128)
  finally:
    uuid_file.close()
  return raw.rstrip("\n")
1158
1159
def GenerateSecret():
  """Generates a random secret.

  The secret is the sha1 digest of a block of random bytes, returned
  in hexadecimal form so that it can be used where an ASCII string is
  needed.

  @rtype: str
  @return: a sha1 hexdigest of a block of 64 random bytes

  """
  random_block = os.urandom(64)
  digest = sha1(random_block)
  return digest.hexdigest()
1171
1172
1173 def EnsureDirs(dirs):
1174   """Make required directories, if they don't exist.
1175
1176   @param dirs: list of tuples (dir_name, dir_mode)
1177   @type dirs: list of (string, integer)
1178
1179   """
1180   for dir_name, dir_mode in dirs:
1181     try:
1182       os.mkdir(dir_name, dir_mode)
1183     except EnvironmentError, err:
1184       if err.errno != errno.EEXIST:
1185         raise errors.GenericError("Cannot create needed directory"
1186                                   " '%s': %s" % (dir_name, err))
1187     if not os.path.isdir(dir_name):
1188       raise errors.GenericError("%s is not a directory" % dir_name)
1189
1190
def ReadFile(file_name, size=None):
  """Reads a file and returns its content.

  @type file_name: str
  @param file_name: path of the file to read
  @type size: None or int
  @param size: Read at most size bytes; None means the whole file
  @rtype: str
  @return: the (possibly partial) content of the file

  """
  handle = open(file_name, "r")
  try:
    if size is not None:
      return handle.read(size)
    return handle.read()
  finally:
    handle.close()
1208
1209
def WriteFile(file_name, fn=None, data=None,
              mode=None, uid=-1, gid=-1,
              atime=None, mtime=None, close=True,
              dry_run=False, backup=False,
              prewrite=None, postwrite=None):
  """(Over)write a file atomically.

  The file_name and either fn (a function taking one argument, the
  file descriptor, and which should write the data to it) or data (the
  contents of the file) must be passed. The other arguments are
  optional and allow setting the file mode, owner and group, and the
  mtime/atime of the file.

  The content is first written to a temporary file in the same
  directory, which is then renamed over the target.

  If the function doesn't raise an exception, it has succeeded and the
  target file has the new contents. If the function has raised an
  exception, an existing target file should be unmodified and the
  temporary file should be removed; in that case the file descriptor
  is always closed, even if C{close} is false, as the caller has no
  way of getting hold of it.

  @type file_name: str
  @param file_name: the target filename
  @type fn: callable
  @param fn: content writing function, called with
      file descriptor as parameter
  @type data: str
  @param data: contents of the file
  @type mode: int
  @param mode: file mode
  @type uid: int
  @param uid: the owner of the file
  @type gid: int
  @param gid: the group of the file
  @type atime: int
  @param atime: a custom access time to be set on the file
  @type mtime: int
  @param mtime: a custom modification time to be set on the file
  @type close: boolean
  @param close: whether to close file after writing it
  @type dry_run: boolean
  @param dry_run: if true, the temporary file is written but then
      removed instead of being renamed over the target, and no
      backup is made
  @type backup: boolean
  @param backup: if true, an already existing target file is backed
      up (see L{CreateBackup}) before anything is written
  @type prewrite: callable
  @param prewrite: function to be called before writing content
  @type postwrite: callable
  @param postwrite: function to be called after writing content

  @rtype: None or int
  @return: None if the 'close' parameter evaluates to True,
      otherwise the file descriptor

  @raise errors.ProgrammerError: if any of the arguments are not valid

  """
  if not os.path.isabs(file_name):
    raise errors.ProgrammerError("Path passed to WriteFile is not"
                                 " absolute: '%s'" % file_name)

  if [fn, data].count(None) != 1:
    raise errors.ProgrammerError("fn or data required")

  if [atime, mtime].count(None) == 1:
    raise errors.ProgrammerError("Both atime and mtime must be either"
                                 " set or None")

  if backup and not dry_run and os.path.isfile(file_name):
    CreateBackup(file_name)

  dir_name, base_name = os.path.split(file_name)
  fd, new_name = tempfile.mkstemp('.new', base_name, dir_name)
  do_remove = True
  succeeded = False
  # here we need to make sure we remove the temp file, if any error
  # leaves it in place
  try:
    if uid != -1 or gid != -1:
      os.chown(new_name, uid, gid)
    if mode:
      os.chmod(new_name, mode)
    if callable(prewrite):
      prewrite(fd)
    if data is not None:
      os.write(fd, data)
    else:
      fn(fd)
    if callable(postwrite):
      postwrite(fd)
    os.fsync(fd)
    if atime is not None and mtime is not None:
      os.utime(new_name, (atime, mtime))
    if not dry_run:
      os.rename(new_name, file_name)
      do_remove = False
    succeeded = True
  finally:
    # On failure the descriptor is never handed to the caller, so it
    # must be closed here or it would be leaked
    if close or not succeeded:
      os.close(fd)
      result = None
    else:
      result = fd
    if do_remove:
      RemoveFile(new_name)

  return result
1307
1308
def FirstFree(seq, base=0):
  """Returns the first non-existing integer from seq.

  The seq argument should be a sorted list of positive integers. The
  first time the index of an element (plus base) is smaller than the
  element value, that index (plus base) will be returned.

  The base argument is used to start at a different offset,
  i.e. C{[3, 4, 6]} with I{base=3} will return 5.

  Example: C{[0, 1, 3]} will return I{2}.

  @type seq: sequence
  @param seq: the sequence to be analyzed.
  @type base: int
  @param base: use this value as the base index of the sequence
  @rtype: int or None
  @return: the first non-used index in the sequence, or None if the
      sequence has no gap

  """
  for idx, elem in enumerate(seq):
    assert elem >= base, "Passed element is lower than base offset"
    if elem > idx + base:
      # idx is not used
      return idx + base
  return None
1335
1336
def all(seq, pred=bool):
  """Returns True if pred(x) is True for every element in the iterable.

  Evaluation stops at the first element for which the predicate is
  false; an empty iterable yields True.

  """
  if pred is None:
    # no predicate means testing the truth value of the elements
    pred = bool
  for elem in seq:
    if not pred(elem):
      return False
  return True
1342
1343
def any(seq, pred=bool):
  """Returns True if pred(x) is True for at least one element in the iterable.

  Evaluation stops at the first element for which the predicate is
  true; an empty iterable yields False.

  """
  if pred is None:
    # no predicate means testing the truth value of the elements
    pred = bool
  for elem in seq:
    if pred(elem):
      return True
  return False
1349
1350
def UniqueSequence(seq):
  """Returns a list with unique elements.

  Only the first occurrence of each element is kept, so element order
  is preserved.

  @type seq: sequence
  @param seq: the sequence with the source elements
  @rtype: list
  @return: list of unique elements from seq

  """
  seen = set()
  unique = []
  for item in seq:
    if item in seen:
      continue
    seen.add(item)
    unique.append(item)
  return unique
1364
1365
def IsValidMac(mac):
  """Predicate to check if a MAC address is valid.

  Checks whether the supplied MAC address is formally correct: exactly
  six groups of two lowercase hexadecimal digits, separated by colons,
  with nothing before or after them.

  @type mac: str
  @param mac: the MAC to be validated
  @rtype: boolean
  @return: True if the MAC seems valid

  """
  # \Z instead of $ so that a trailing newline is rejected as well
  mac_check = re.compile(r"^([0-9a-f]{2}:){5}[0-9a-f]{2}\Z")
  return mac_check.match(mac) is not None
1380
1381
def TestDelay(duration):
  """Sleep for a fixed amount of time.

  @type duration: float
  @param duration: the sleep duration
  @rtype: tuple
  @return: C{(False, error message)} for a negative duration (no
      sleep is done), C{(True, None)} otherwise

  """
  negative = duration < 0
  if negative:
    result = (False, "Invalid sleep duration")
  else:
    time.sleep(duration)
    result = (True, None)
  return result
1395
1396
1397 def _CloseFDNoErr(fd, retries=5):
1398   """Close a file descriptor ignoring errors.
1399
1400   @type fd: int
1401   @param fd: the file descriptor
1402   @type retries: int
1403   @param retries: how many retries to make, in case we get any
1404       other error than EBADF
1405
1406   """
1407   try:
1408     os.close(fd)
1409   except OSError, err:
1410     if err.errno != errno.EBADF:
1411       if retries > 0:
1412         _CloseFDNoErr(fd, retries - 1)
1413     # else either it's closed already or we're out of retries, so we
1414     # ignore this and go on
1415
1416
def CloseFDs(noclose_fds=None):
  """Close file descriptors.

  This closes all file descriptors above 2 (i.e. except
  stdin/out/err), up to the hard limit on the number of open files.

  @type noclose_fds: list or None
  @param noclose_fds: if given, it denotes a list of file descriptor
      that should not be closed

  """
  # Limit to fall back to if the hard limit turns out to be unlimited;
  # taken from sysconf if possible, otherwise a fixed default is used
  fallback_limit = 1024
  if 'SC_OPEN_MAX' in os.sysconf_names:
    try:
      sysconf_limit = os.sysconf('SC_OPEN_MAX')
    except OSError:
      pass
    else:
      if sysconf_limit >= 0:
        fallback_limit = sysconf_limit

  (_, hard_limit) = resource.getrlimit(resource.RLIMIT_NOFILE)
  if hard_limit == resource.RLIM_INFINITY:
    hard_limit = fallback_limit

  # Close everything except the standard descriptors and the ones we
  # were asked to keep
  for fd in range(3, hard_limit):
    if not (noclose_fds and fd in noclose_fds):
      _CloseFDNoErr(fd)
1447
1448
1449 def Daemonize(logfile):
1450   """Daemonize the current process.
1451
1452   This detaches the current process from the controlling terminal and
1453   runs it in the background as a daemon.
1454
1455   @type logfile: str
1456   @param logfile: the logfile to which we should redirect stdout/stderr
1457   @rtype: int
1458   @return: the value zero
1459
1460   """
1461   UMASK = 077
1462   WORKDIR = "/"
1463
1464   # this might fail
1465   pid = os.fork()
1466   if (pid == 0):  # The first child.
1467     os.setsid()
1468     # this might fail
1469     pid = os.fork() # Fork a second child.
1470     if (pid == 0):  # The second child.
1471       os.chdir(WORKDIR)
1472       os.umask(UMASK)
1473     else:
1474       # exit() or _exit()?  See below.
1475       os._exit(0) # Exit parent (the first child) of the second child.
1476   else:
1477     os._exit(0) # Exit parent of the first child.
1478
1479   for fd in range(3):
1480     _CloseFDNoErr(fd)
1481   i = os.open("/dev/null", os.O_RDONLY) # stdin
1482   assert i == 0, "Can't close/reopen stdin"
1483   i = os.open(logfile, os.O_WRONLY|os.O_CREAT|os.O_APPEND, 0600) # stdout
1484   assert i == 1, "Can't close/reopen stdout"
1485   # Duplicate standard output to standard error.
1486   os.dup2(1, 2)
1487   return 0
1488
1489
def DaemonPidFileName(name):
  """Compute a ganeti pid file absolute path.

  @type name: str
  @param name: the daemon name
  @rtype: str
  @return: the full path to the pidfile corresponding to the given
      daemon name, i.e. I{name.pid} in L{constants.RUN_GANETI_DIR}

  """
  run_dir = constants.RUN_GANETI_DIR
  pidfile = "%s.pid" % name
  return os.path.join(run_dir, pidfile)
1501
1502
def WritePidFile(name):
  """Write the current process pidfile.

  The file will be written to L{constants.RUN_GANETI_DIR}I{/name.pid}
  and contains the pid of the current process followed by a newline.

  @type name: str
  @param name: the daemon name to use
  @raise errors.GenericError: if the pid file already exists and
      points to a live process

  """
  pidfilename = DaemonPidFileName(name)

  old_pid = ReadPidFile(pidfilename)
  if IsProcessAlive(old_pid):
    raise errors.GenericError("%s contains a live process" % pidfilename)

  WriteFile(pidfilename, data="%d\n" % os.getpid())
1520
1521
def RemovePidFile(name):
  """Remove the current process pidfile.

  Any errors while removing the file are ignored.

  @type name: str
  @param name: the daemon name used to derive the pidfile name

  """
  pid_path = DaemonPidFileName(name)
  # TODO: we could check here that the file contains our pid
  try:
    RemoveFile(pid_path)
  except:
    # removal is best-effort only
    pass
1537
1538
def KillProcess(pid, signal_=signal.SIGTERM, timeout=30,
                waitpid=False):
  """Kill a process given by its pid.

  The given signal is sent first; if a positive timeout was given and
  the process is still alive once it has expired, SIGKILL is sent too.

  @type pid: int
  @param pid: The PID to terminate.
  @type signal_: int
  @param signal_: The signal to send, by default SIGTERM
  @type timeout: int
  @param timeout: The timeout after which, if the process is still alive,
                  a SIGKILL will be sent. If not positive, no such checking
                  will be done
  @type waitpid: boolean
  @param waitpid: If true, we should waitpid on this process after
      sending signals, since it's our own child and otherwise it
      would remain as zombie
  @raise errors.ProgrammerError: if the pid is not positive

  """
  def _SendSignal(target, signum, reap):
    """Send a signal and, if requested, try to reap the process"""
    os.kill(target, signum)
    if not reap:
      return
    try:
      os.waitpid(target, os.WNOHANG)
    except OSError:
      pass

  if pid <= 0:
    # kill with pid=0 == suicide
    raise errors.ProgrammerError("Invalid pid given '%s'" % pid)

  if not IsProcessAlive(pid):
    return

  _SendSignal(pid, signal_, waitpid)

  if timeout <= 0:
    return

  # Wait up to $timeout seconds
  deadline = time.time() + timeout
  delay = 0.01
  while time.time() < deadline and IsProcessAlive(pid):
    try:
      (reaped_pid, _) = os.waitpid(pid, os.WNOHANG)
    except OSError:
      pass
    else:
      if reaped_pid > 0:
        break
    time.sleep(delay)
    # Make wait time longer for next try
    if delay < 0.1:
      delay *= 1.5

  if IsProcessAlive(pid):
    # Kill process if it's still alive
    _SendSignal(pid, signal.SIGKILL, waitpid)
1594
1595
def FindFile(name, search_path, test=os.path.exists):
  """Look for a filesystem object in a given path.

  This is an abstract method to search for filesystem object (files,
  dirs) under a given search path; the directories are tried in
  order and the first match wins.

  @type name: str
  @param name: the name to look for
  @type search_path: list
  @param search_path: the directories to look into
  @type test: callable
  @param test: a function taking one argument (the candidate path)
      that should return True if the given object is valid; the
      default value is os.path.exists, causing only existing files
      to be returned
  @rtype: str or None
  @return: full path to the object if found, None otherwise

  """
  separator = os.path.sep
  for directory in search_path:
    candidate = separator.join((directory, name))
    if not test(candidate):
      continue
    return candidate
  return None
1619
1620
def CheckVolumeGroupSize(vglist, vgname, minsize):
  """Checks if the volume group list is valid.

  The function will check if a given volume group is in the list of
  volume groups and has a minimum size.

  @type vglist: dict
  @param vglist: dictionary of volume group names and their size
  @type vgname: str
  @param vgname: the volume group we should check
  @type minsize: int
  @param minsize: the minimum size we accept
  @rtype: None or str
  @return: None for success, otherwise the error message

  """
  found_size = vglist.get(vgname)
  if found_size is None:
    return "volume group '%s' missing" % vgname
  if found_size < minsize:
    return ("volume group '%s' too small (%s MiB required, %d MiB found)" %
            (vgname, minsize, found_size))
  return None
1644
1645
def SplitTime(value):
  """Splits time as floating point number into a tuple.

  The value is converted to an integer number of microseconds (any
  remaining fraction is cut off) before being split.

  @param value: Time in seconds
  @type value: int or float
  @return: Tuple containing (seconds, microseconds)

  """
  total_microseconds = int(value * 1000000)
  seconds = total_microseconds // 1000000
  microseconds = total_microseconds % 1000000

  assert 0 <= seconds, \
    "Seconds must be larger than or equal to 0, but are %s" % seconds
  assert 0 <= microseconds <= 999999, \
    "Microseconds must be 0-999999, but are %s" % microseconds

  return (int(seconds), int(microseconds))
1662
1663
def MergeTime(timetuple):
  """Merges a tuple into time as a floating point number.

  This is the reverse operation of L{SplitTime}.

  @param timetuple: Time as tuple, (seconds, microseconds)
  @type timetuple: tuple
  @return: Time as a floating point number expressed in seconds

  """
  (secs, usecs) = timetuple

  assert 0 <= secs, \
    "Seconds must be larger than or equal to 0, but are %s" % secs
  assert 0 <= usecs <= 999999, \
    "Microseconds must be 0-999999, but are %s" % usecs

  fraction = float(usecs) * 0.000001
  return float(secs) + fraction
1680
1681
def GetNodeDaemonPort():
  """Get the node daemon port for this cluster.

  Note that this routine does not read a ganeti-specific file, but
  instead uses C{socket.getservbyname} to allow pre-customization of
  this parameter outside of Ganeti. If the C{ganeti-noded} TCP service
  can't be looked up, L{constants.DEFAULT_NODED_PORT} is used.

  @rtype: int

  """
  try:
    return socket.getservbyname("ganeti-noded", "tcp")
  except socket.error:
    return constants.DEFAULT_NODED_PORT
1698
1699
def SetupLogging(logfile, debug=False, stderr_logging=False, program="",
                 multithreaded=False):
  """Configures the logging module.

  All handlers previously attached to the root logger are closed and
  removed; afterwards a handler for the log file and, if requested,
  one for the standard error are installed.

  @type logfile: str
  @param logfile: the filename to which we should log
  @type debug: boolean
  @param debug: whether to enable debug messages too or
      only those at C{INFO} and above level
  @type stderr_logging: boolean
  @param stderr_logging: whether we should also log to the standard error
  @type program: str
  @param program: the name under which we should log messages
  @type multithreaded: boolean
  @param multithreaded: if True, will add the thread name to the log file
  @raise EnvironmentError: if we can't open the log file and
      stderr logging is disabled

  """
  fmt = "%(asctime)s: " + program + " pid=%(process)d"
  if multithreaded:
    fmt += "/%(threadName)s"
  if debug:
    fmt += " %(module)s:%(lineno)s"
  fmt += " %(levelname)s %(message)s"
  formatter = logging.Formatter(fmt)

  root_logger = logging.getLogger("")
  root_logger.setLevel(logging.NOTSET)

  # Remove all previously setup handlers; we iterate over a copy, as
  # removing entries from the list being iterated over would make the
  # loop skip every other handler
  for handler in root_logger.handlers[:]:
    handler.close()
    root_logger.removeHandler(handler)

  if stderr_logging:
    stderr_handler = logging.StreamHandler()
    stderr_handler.setFormatter(formatter)
    # without debugging only critical messages go to stderr
    if debug:
      stderr_handler.setLevel(logging.NOTSET)
    else:
      stderr_handler.setLevel(logging.CRITICAL)
    root_logger.addHandler(stderr_handler)

  # this can fail, if the logging directories are not setup or we have
  # a permission problem; in this case, it's best to log but ignore
  # the error if stderr_logging is True, and if false we re-raise the
  # exception since otherwise we could run but without any logs at all
  try:
    logfile_handler = logging.FileHandler(logfile)
    logfile_handler.setFormatter(formatter)
    if debug:
      logfile_handler.setLevel(logging.DEBUG)
    else:
      logfile_handler.setLevel(logging.INFO)
    root_logger.addHandler(logfile_handler)
  except EnvironmentError:
    if stderr_logging:
      logging.exception("Failed to enable logging to file '%s'", logfile)
    else:
      # we need to re-raise the exception
      raise

1762
def IsNormAbsPath(path):
  """Check whether a path is absolute and also normalized.

  This avoids things like /dir/../../other/path to be valid.

  @type path: str
  @param path: the path to check
  @rtype: boolean
  @return: True if the path is absolute and not changed by
      C{os.path.normpath}

  """
  if not os.path.isabs(path):
    return False
  return os.path.normpath(path) == path
1770
def TailFile(fname, lines=20):
  """Return the last lines from a file.

  @note: this function will only read and parse the last 4KB of
      the file; if the lines are very long, it could be that less
      than the requested number of lines are returned

  @param fname: the file name
  @type lines: int
  @param lines: the (maximum) number of lines to return; if not
      positive, an empty list is returned
  @rtype: list
  @return: the last lines of the file, without line terminators

  """
  fd = open(fname, "r")
  try:
    fd.seek(0, 2)
    pos = fd.tell()
    pos = max(0, pos-4096)
    fd.seek(pos, 0)
    raw_data = fd.read()
  finally:
    fd.close()

  if lines <= 0:
    # rows[-0:] would be the whole list instead of an empty one
    return []

  rows = raw_data.splitlines()
  return rows[-lines:]
1795
1796
def SafeEncode(text):
  """Return a 'safe' version of a source string.

  This function mangles the input string and returns a version that
  should be safe to display/encode as ASCII. To this end, we first
  convert it to ASCII using the 'backslashreplace' encoding which
  should get rid of any non-ASCII chars, and then we process it
  through a loop copied from the string repr sources in the python; we
  don't use string_escape anymore since that escape single quotes and
  backslashes too, and that is too much; and that escaping is not
  stable, i.e. string_escape(string_escape(x)) != string_escape(x).

  Tabs, newlines and carriage returns are written as C{\\t}, C{\\n}
  and C{\\r}; all other non-printable characters are written as
  C{\\xNN}.

  @type text: str or unicode
  @param text: input data
  @rtype: str
  @return: a safe version of text

  """
  if isinstance(text, unicode):
    # only if unicode; if str already, we handle it below
    text = text.encode('ascii', 'backslashreplace')
  pieces = []
  for char in text:
    c = ord(char)
    if char == '\t':
      pieces.append(r'\t')
    elif char == '\n':
      pieces.append(r'\n')
    elif char == '\r':
      pieces.append(r'\r')
    elif c < 32 or c >= 127: # non-printable
      pieces.append("\\x%02x" % (c & 0xff))
    else:
      pieces.append(char)
  return "".join(pieces)
1832
1833
def CommaJoin(names):
  """Nicely join a set of identifiers.

  Each identifier is put between single quotes and the results are
  separated by a comma and a space.

  @param names: set, list or tuple
  @return: a string with the formatted results

  """
  quoted = []
  for val in names:
    quoted.append("'%s'" % val)
  return ", ".join(quoted)
1842
1843
def LockedMethod(fn):
  """Synchronized object access decorator.

  This decorator is intended to protect access to an object using the
  object's own lock which is hardcoded to '_lock'. The lock is
  acquired before the decorated method is called and released
  afterwards, no matter whether the method returned or raised.

  @type fn: callable
  @param fn: the method to be wrapped
  @return: the wrapping function

  """
  def _LockDebug(*args, **kwargs):
    # lock operations are only logged if the module-level switch is set
    if debug_locks:
      logging.debug(*args, **kwargs)

  def wrapper(self, *args, **kwargs):
    assert hasattr(self, '_lock')
    lock = self._lock
    _LockDebug("Waiting for %s", lock)
    lock.acquire()
    try:
      _LockDebug("Acquired %s", lock)
      return fn(self, *args, **kwargs)
    finally:
      _LockDebug("Releasing %s", lock)
      lock.release()
      _LockDebug("Released %s", lock)

  return wrapper
1869
1870
1871 def LockFile(fd):
1872   """Locks a file using POSIX locks.
1873
1874   @type fd: int
1875   @param fd: the file descriptor we need to lock
1876
1877   """
1878   try:
1879     fcntl.flock(fd, fcntl.LOCK_EX | fcntl.LOCK_NB)
1880   except IOError, err:
1881     if err.errno == errno.EAGAIN:
1882       raise errors.LockError("File already locked")
1883     raise
1884
1885
1886 class FileLock(object):
1887   """Utility class for file locks.
1888
1889   """
1890   def __init__(self, filename):
1891     """Constructor for FileLock.
1892
1893     This will open the file denoted by the I{filename} argument.
1894
1895     @type filename: str
1896     @param filename: path to the file to be locked
1897
1898     """
1899     self.filename = filename
1900     self.fd = open(self.filename, "w")
1901
1902   def __del__(self):
1903     self.Close()
1904
1905   def Close(self):
1906     """Close the file and release the lock.
1907
1908     """
1909     if self.fd:
1910       self.fd.close()
1911       self.fd = None
1912
1913   def _flock(self, flag, blocking, timeout, errmsg):
1914     """Wrapper for fcntl.flock.
1915
1916     @type flag: int
1917     @param flag: operation flag
1918     @type blocking: bool
1919     @param blocking: whether the operation should be done in blocking mode.
1920     @type timeout: None or float
1921     @param timeout: for how long the operation should be retried (implies
1922                     non-blocking mode).
1923     @type errmsg: string
1924     @param errmsg: error message in case operation fails.
1925
1926     """
1927     assert self.fd, "Lock was closed"
1928     assert timeout is None or timeout >= 0, \
1929       "If specified, timeout must be positive"
1930
1931     if timeout is not None:
1932       flag |= fcntl.LOCK_NB
1933       timeout_end = time.time() + timeout
1934
1935     # Blocking doesn't have effect with timeout
1936     elif not blocking:
1937       flag |= fcntl.LOCK_NB
1938       timeout_end = None
1939
1940     retry = True
1941     while retry:
1942       try:
1943         fcntl.flock(self.fd, flag)
1944         retry = False
1945       except IOError, err:
1946         if err.errno in (errno.EAGAIN, ):
1947           if timeout_end is not None and time.time() < timeout_end:
1948             # Wait before trying again
1949             time.sleep(max(0.1, min(1.0, timeout)))
1950           else:
1951             raise errors.LockError(errmsg)
1952         else:
1953           logging.exception("fcntl.flock failed")
1954           raise
1955
1956   def Exclusive(self, blocking=False, timeout=None):
1957     """Locks the file in exclusive mode.
1958
1959     @type blocking: boolean
1960     @param blocking: whether to block and wait until we
1961         can lock the file or return immediately
1962     @type timeout: int or None
1963     @param timeout: if not None, the duration to wait for the lock
1964         (in blocking mode)
1965
1966     """
1967     self._flock(fcntl.LOCK_EX, blocking, timeout,
1968                 "Failed to lock %s in exclusive mode" % self.filename)
1969
1970   def Shared(self, blocking=False, timeout=None):
1971     """Locks the file in shared mode.
1972
1973     @type blocking: boolean
1974     @param blocking: whether to block and wait until we
1975         can lock the file or return immediately
1976     @type timeout: int or None
1977     @param timeout: if not None, the duration to wait for the lock
1978         (in blocking mode)
1979
1980     """
1981     self._flock(fcntl.LOCK_SH, blocking, timeout,
1982                 "Failed to lock %s in shared mode" % self.filename)
1983
1984   def Unlock(self, blocking=True, timeout=None):
1985     """Unlocks the file.
1986
1987     According to C{flock(2)}, unlocking can also be a nonblocking
1988     operation::
1989
1990       To make a non-blocking request, include LOCK_NB with any of the above
1991       operations.
1992
1993     @type blocking: boolean
1994     @param blocking: whether to block and wait until we
1995         can lock the file or return immediately
1996     @type timeout: int or None
1997     @param timeout: if not None, the duration to wait for the lock
1998         (in blocking mode)
1999
2000     """
2001     self._flock(fcntl.LOCK_UN, blocking, timeout,
2002                 "Failed to unlock %s" % self.filename)
2003
2004
class SignalHandler(object):
  """Generic signal handler class.

  It automatically restores the original handler when deconstructed or
  when L{Reset} is called. The handler installed by this class only
  records that a signal arrived; query the L{called} attribute to
  detect whether the signal was sent.

  @type signum: set
  @ivar signum: the signals we handle
  @type called: boolean
  @ivar called: tracks whether any of the signals have been raised

  """
  def __init__(self, signum):
    """Constructs a new SignalHandler instance.

    The handlers are installed right away; should that fail, the ones
    already installed are reset before the error is passed on.

    @type signum: int or list of ints
    @param signum: Single signal number or set of signal numbers

    """
    if isinstance(signum, (int, long)):
      signals = [signum]
    else:
      signals = signum
    self.signum = set(signals)

    self.called = False

    # Maps signal numbers to the handlers we have replaced
    self._previous = {}
    try:
      for signo in self.signum:
        # Setup handler
        old_handler = signal.signal(signo, self._HandleSignal)
        try:
          self._previous[signo] = old_handler
        except:
          # Restore previous handler
          signal.signal(signo, old_handler)
          raise
    except:
      # Reset all handlers
      self.Reset()
      # Here we have a race condition: a handler may have already been called,
      # but there's not much we can do about it at this point.
      raise

  def __del__(self):
    self.Reset()

  def Reset(self):
    """Restore previous handler.

    This will reset all the signals to their previous handlers.

    """
    # Work on a copy, as entries are removed while we go
    for (signo, old_handler) in list(self._previous.items()):
      signal.signal(signo, old_handler)
      # If successful, remove from dict
      del self._previous[signo]

  def Clear(self):
    """Unsets the L{called} flag.

    This function can be used in case a signal may arrive several times.

    """
    self.called = False

  def _HandleSignal(self, signum, frame):
    """Actual signal handling function.

    It only sets the L{called} flag; both arguments are ignored.

    """
    # This is not nice and not absolutely atomic, but it appears to be the only
    # solution in Python -- there are no atomic types.
    self.called = True
2080
2081
class FieldSet(object):
  """A simple field set.

  Among the features are:
    - checking if a string matches one of a list of patterns (plain
      strings or regular expression source strings)
    - checking if a whole list of string matches
    - returning the matching groups from a regex match

  Internally, all fields are held as regular expression objects that
  must match the whole field.

  """
  def __init__(self, *items):
    """Compiles the given patterns.

    @param items: pattern strings; each one has to match a field
        completely

    """
    # Wrap the pattern in a non-capturing group before anchoring it;
    # otherwise a top-level alternation such as "a|b" would turn into
    # "^a|b$" and match any field merely starting with "a". The group is
    # non-capturing, hence the numbering of the caller's groups is kept.
    self.items = [re.compile("^(?:%s)$" % value) for value in items]

  def Extend(self, other_set):
    """Extend the field set with the items from another one"""
    self.items.extend(other_set.items)

  def Matches(self, field):
    """Checks if a field matches the current set

    @type field: str
    @param field: the string to match
    @return: either False or a regular expression match object (the one
        of the first matching pattern)

    """
    for pattern in self.items:
      m = pattern.match(field)
      if m:
        return m
    return False

  def NonMatching(self, items):
    """Returns the list of fields not matching the current set

    @type items: list
    @param items: the list of fields to check
    @rtype: list
    @return: list of non-matching fields

    """
    return [val for val in items if not self.Matches(val)]