Statistics
| Branch: | Tag: | Revision:

root / lib / hypervisor / hv_kvm.py @ 4d2cdb5a

History | View | Annotate | Download (59.7 kB)

1
#
2
#
3

    
4
# Copyright (C) 2008, 2009, 2010, 2011 Google Inc.
5
#
6
# This program is free software; you can redistribute it and/or modify
7
# it under the terms of the GNU General Public License as published by
8
# the Free Software Foundation; either version 2 of the License, or
9
# (at your option) any later version.
10
#
11
# This program is distributed in the hope that it will be useful, but
12
# WITHOUT ANY WARRANTY; without even the implied warranty of
13
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
14
# General Public License for more details.
15
#
16
# You should have received a copy of the GNU General Public License
17
# along with this program; if not, write to the Free Software
18
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
19
# 02110-1301, USA.
20

    
21

    
22
"""KVM hypervisor
23

24
"""
25

    
26
import errno
27
import os
28
import os.path
29
import re
30
import tempfile
31
import time
32
import logging
33
import pwd
34
import struct
35
import fcntl
36
import shutil
37
import socket
38
import StringIO
39

    
40
from ganeti import utils
41
from ganeti import constants
42
from ganeti import errors
43
from ganeti import serializer
44
from ganeti import objects
45
from ganeti import uidpool
46
from ganeti import ssconf
47
from ganeti.hypervisor import hv_base
48
from ganeti import netutils
49
from ganeti.utils import wrapper as utils_wrapper
50

    
51

    
52
_KVM_NETWORK_SCRIPT = constants.SYSCONFDIR + "/ganeti/kvm-vif-bridge"
53

    
54
# TUN/TAP driver constants, taken from <linux/if_tun.h>
55
# They are architecture-independent and already hardcoded in qemu-kvm source,
56
# so we can safely include them here.
57
TUNSETIFF = 0x400454ca
58
TUNGETIFF = 0x800454d2
59
TUNGETFEATURES = 0x800454cf
60
IFF_TAP = 0x0002
61
IFF_NO_PI = 0x1000
62
IFF_VNET_HDR = 0x4000
63

    
64

    
65
def _ProbeTapVnetHdr(fd):
  """Decide whether the IFF_VNET_HDR flag can be enabled on a tap device.

  The flag is only enabled when _all_ of the following hold:
   1. the TUNGETFEATURES ioctl() is implemented
   2. the TUNGETFEATURES ioctl() result contains the IFF_VNET_HDR flag
   3. the TUNGETIFF ioctl() is implemented; this cannot be tested before the
      tap device has been created with TUNSETIFF, and IFF_VNET_HDR cannot be
      changed once the interface exists. Since both TUNGETIFF and
      TUNGETFEATURES were introduced in kernel version 2.6.27, TUNGETIFF is
      expected to be present whenever TUNGETFEATURES is.

   @type fd: int
   @param fd: the file descriptor of /dev/net/tun
   @rtype: boolean
   @return: True if IFF_VNET_HDR should be enabled, False otherwise

  """
  request = struct.pack("I", 0)
  try:
    reply = fcntl.ioctl(fd, TUNGETFEATURES, request)
  except EnvironmentError:
    logging.warning("TUNGETFEATURES ioctl() not implemented")
    return False

  # The ioctl fills the buffer with a single unsigned int of feature flags
  (features, ) = struct.unpack("I", reply)
  if not (features & IFF_VNET_HDR):
    logging.warning("Host does not support IFF_VNET_HDR, not enabling")
    return False

  return True
95

    
96

    
97
def _OpenTap(vnet_hdr=True):
  """Open a new tap device and return its file descriptor.

  This is intended to be used by a qemu-type hypervisor together with the -net
  tap,fd=<fd> command line parameter.

  @type vnet_hdr: boolean
  @param vnet_hdr: Enable the VNET Header
  @return: (ifname, tapfd)
  @rtype: tuple
  @raise errors.HypervisorError: if /dev/net/tun cannot be opened or the tap
      device cannot be allocated

  """
  try:
    tapfd = os.open("/dev/net/tun", os.O_RDWR)
  except EnvironmentError:
    raise errors.HypervisorError("Failed to open /dev/net/tun")

  flags = IFF_TAP | IFF_NO_PI

  if vnet_hdr and _ProbeTapVnetHdr(tapfd):
    flags |= IFF_VNET_HDR

  # The struct ifreq ioctl request (see netdevice(7)); an empty name lets the
  # kernel pick the interface name
  ifr = struct.pack("16sh", "", flags)

  try:
    res = fcntl.ioctl(tapfd, TUNSETIFF, ifr)
  except EnvironmentError:
    # Nobody else knows about the descriptor at this point, so it must be
    # closed here or it would leak for the lifetime of the process
    try:
      os.close(tapfd)
    except EnvironmentError:
      logging.warning("Failed to close /dev/net/tun after TUNSETIFF error",
                      exc_info=True)
    raise errors.HypervisorError("Failed to allocate a new TAP device")

  # Get the interface name from the ioctl
  ifname = struct.unpack("16sh", res)[0].strip("\x00")
  return (ifname, tapfd)
130

    
131

    
132
class QmpMessage:
  """QEMU Messaging Protocol (QMP) message.

  Thin wrapper around the dict representing a single QMP JSON object; the
  dict itself is available as the C{data} attribute.

  """

  def __init__(self, data):
    """Creates a new QMP message based on the passed data.

    @type data: dict
    @param data: the content of the message
    @raise TypeError: if data is not a dict

    """
    if not isinstance(data, dict):
      raise TypeError("QmpMessage must be initialized with a dict")

    self.data = data

  def __getitem__(self, field_name):
    """Get the value of the required field if present, or None.

    Overrides the [] operator to provide access to the message data,
    returning None if the required item is not in the message
    @return: the value of the field_name field, or None if field_name
             is not contained in the message

    """
    return self.data.get(field_name, None)

  def __setitem__(self, field_name, field_value):
    """Set the value of the required field_name to field_value.

    """
    self.data[field_name] = field_value

  @staticmethod
  def BuildFromJsonString(json_string):
    """Build a QmpMessage from a JSON encoded string.

    @type json_string: str
    @param json_string: JSON string representing the message
    @rtype: L{QmpMessage}
    @return: a L{QmpMessage} built from json_string

    """
    # Parse the string
    data = serializer.LoadJson(json_string)
    return QmpMessage(data)

  def __str__(self):
    # The protocol expects the JSON object to be sent as a single
    # line, hence the need for indent=False.
    return serializer.DumpJson(self.data, indent=False)

  def __eq__(self, other):
    # When comparing two QmpMessages, we are interested in comparing
    # their internal representation of the message data. Anything that is
    # not a QmpMessage is left to the interpreter's default handling instead
    # of failing on the missing "data" attribute.
    if not isinstance(other, QmpMessage):
      return NotImplemented
    return self.data == other.data

  def __ne__(self, other):
    # Python 2 does not derive "!=" from "==", so keep them consistent
    # explicitly
    result = self.__eq__(other)
    if result is NotImplemented:
      return result
    return not result
190

    
191

    
192
class QmpConnection:
193
  """Connection to the QEMU Monitor using the QEMU Monitor Protocol (QMP).
194

195
  """
196
  _FIRST_MESSAGE_KEY = "QMP"
197
  _EVENT_KEY = "event"
198
  _ERROR_KEY = "error"
199
  _ERROR_CLASS_KEY = "class"
200
  _ERROR_DATA_KEY = "data"
201
  _ERROR_DESC_KEY = "desc"
202
  _EXECUTE_KEY = "execute"
203
  _ARGUMENTS_KEY = "arguments"
204
  _CAPABILITIES_COMMAND = "qmp_capabilities"
205
  _MESSAGE_END_TOKEN = "\r\n"
206
  _SOCKET_TIMEOUT = 5
207

    
208
  def __init__(self, monitor_filename):
209
    """Instantiates the QmpConnection object.
210

211
    @type monitor_filename: string
212
    @param monitor_filename: the filename of the UNIX raw socket on which the
213
                             QMP monitor is listening
214

215
    """
216
    self.monitor_filename = monitor_filename
217
    self.sock = socket.socket(socket.AF_UNIX, socket.SOCK_STREAM)
218
    # We want to fail if the server doesn't send a complete message
219
    # in a reasonable amount of time
220
    self.sock.settimeout(self._SOCKET_TIMEOUT)
221
    self._connected = False
222
    self._buf = ""
223

    
224
  def _check_connection(self):
225
    """Make sure that the connection is established.
226

227
    """
228
    if not self._connected:
229
      raise errors.ProgrammerError("To use a QmpConnection you need to first"
230
                                   " invoke connect() on it")
231

    
232
  def connect(self):
233
    """Connects to the QMP monitor.
234

235
    Connects to the UNIX socket and makes sure that we can actually send and
236
    receive data to the kvm instance via QMP.
237

238
    @raise errors.HypervisorError: when there are communication errors
239
    @raise errors.ProgrammerError: when there are data serialization errors
240

241
    """
242
    self.sock.connect(self.monitor_filename)
243
    self._connected = True
244

    
245
    # Check if we receive a correct greeting message from the server
246
    # (As per the QEMU Protocol Specification 0.1 - section 2.2)
247
    greeting = self._Recv()
248
    if not greeting[self._FIRST_MESSAGE_KEY]:
249
      self._connected = False
250
      raise errors.HypervisorError("kvm: qmp communication error (wrong"
251
                                   " server greeting")
252

    
253
    # Let's put the monitor in command mode using the qmp_capabilities
254
    # command, or else no command will be executable.
255
    # (As per the QEMU Protocol Specification 0.1 - section 4)
256
    self.Execute(self._CAPABILITIES_COMMAND)
257

    
258
  def _ParseMessage(self, buf):
259
    """Extract and parse a QMP message from the given buffer.
260

261
    Seeks for a QMP message in the given buf. If found, it parses it and
262
    returns it together with the rest of the characters in the buf.
263
    If no message is found, returns None and the whole buffer.
264

265
    @raise errors.ProgrammerError: when there are data serialization errors
266

267
    """
268
    message = None
269
    # Check if we got the message end token (CRLF, as per the QEMU Protocol
270
    # Specification 0.1 - Section 2.1.1)
271
    pos = buf.find(self._MESSAGE_END_TOKEN)
272
    if pos >= 0:
273
      try:
274
        message = QmpMessage.BuildFromJsonString(buf[:pos + 1])
275
      except Exception, err:
276
        raise errors.ProgrammerError("QMP data serialization error: %s" % err)
277
      buf = buf[pos + 1:]
278

    
279
    return (message, buf)
280

    
281
  def _Recv(self):
282
    """Receives a message from QMP and decodes the received JSON object.
283

284
    @rtype: QmpMessage
285
    @return: the received message
286
    @raise errors.HypervisorError: when there are communication errors
287
    @raise errors.ProgrammerError: when there are data serialization errors
288

289
    """
290
    self._check_connection()
291

    
292
    # Check if there is already a message in the buffer
293
    (message, self._buf) = self._ParseMessage(self._buf)
294
    if message:
295
      return message
296

    
297
    recv_buffer = StringIO.StringIO(self._buf)
298
    recv_buffer.seek(len(self._buf))
299
    try:
300
      while True:
301
        data = self.sock.recv(4096)
302
        if not data:
303
          break
304
        recv_buffer.write(data)
305

    
306
        (message, self._buf) = self._ParseMessage(recv_buffer.getvalue())
307
        if message:
308
          return message
309

    
310
    except socket.timeout, err:
311
      raise errors.HypervisorError("Timeout while receiving a QMP message: "
312
                                   "%s" % (err))
313
    except socket.error, err:
314
      raise errors.HypervisorError("Unable to receive data from KVM using the"
315
                                   " QMP protocol: %s" % err)
316

    
317
  def _Send(self, message):
318
    """Encodes and sends a message to KVM using QMP.
319

320
    @type message: QmpMessage
321
    @param message: message to send to KVM
322
    @raise errors.HypervisorError: when there are communication errors
323
    @raise errors.ProgrammerError: when there are data serialization errors
324

325
    """
326
    self._check_connection()
327
    try:
328
      message_str = str(message)
329
    except Exception, err:
330
      raise errors.ProgrammerError("QMP data deserialization error: %s" % err)
331

    
332
    try:
333
      self.sock.sendall(message_str)
334
    except socket.timeout, err:
335
      raise errors.HypervisorError("Timeout while sending a QMP message: "
336
                                   "%s (%s)" % (err.string, err.errno))
337
    except socket.error, err:
338
      raise errors.HypervisorError("Unable to send data from KVM using the"
339
                                   " QMP protocol: %s" % err)
340

    
341
  def Execute(self, command, arguments=None):
342
    """Executes a QMP command and returns the response of the server.
343

344
    @type command: str
345
    @param command: the command to execute
346
    @type arguments: dict
347
    @param arguments: dictionary of arguments to be passed to the command
348
    @rtype: dict
349
    @return: dictionary representing the received JSON object
350
    @raise errors.HypervisorError: when there are communication errors
351
    @raise errors.ProgrammerError: when there are data serialization errors
352

353
    """
354
    self._check_connection()
355
    message = QmpMessage({self._EXECUTE_KEY: command})
356
    if arguments:
357
      message[self._ARGUMENTS_KEY] = arguments
358
    self._Send(message)
359

    
360
    # Events can occur between the sending of the command and the reception
361
    # of the response, so we need to filter out messages with the event key.
362
    while True:
363
      response = self._Recv()
364
      err = response[self._ERROR_KEY]
365
      if err:
366
        raise errors.HypervisorError("kvm: error executing the %s"
367
                                     " command: %s (%s, %s):" %
368
                                     (command,
369
                                      err[self._ERROR_DESC_KEY],
370
                                      err[self._ERROR_CLASS_KEY],
371
                                      err[self._ERROR_DATA_KEY]))
372

    
373
      elif not response[self._EVENT_KEY]:
374
        return response
375

    
376

    
377
class KVMHypervisor(hv_base.BaseHypervisor):
378
  """KVM hypervisor interface"""
379
  CAN_MIGRATE = True
380

    
381
  # Runtime directory layout; every directory listed in _DIRS is (re)created
  # when the hypervisor object is instantiated
  _ROOT_DIR = constants.RUN_GANETI_DIR + "/kvm-hypervisor"
  _PIDS_DIR = _ROOT_DIR + "/pid" # contains live instances pids
  _UIDS_DIR = _ROOT_DIR + "/uid" # contains instances reserved uids
  _CTRL_DIR = _ROOT_DIR + "/ctrl" # contains instances control sockets
  _CONF_DIR = _ROOT_DIR + "/conf" # contains instances startup data
  _NICS_DIR = _ROOT_DIR + "/nic" # contains instances nic <-> tap associations
  _KEYMAP_DIR = _ROOT_DIR + "/keymap" # contains instances keymaps
  # KVM instances with chroot enabled are started in empty chroot directories.
  _CHROOT_DIR = _ROOT_DIR + "/chroot" # for empty chroot directories
  # After an instance is stopped, its chroot directory is removed.
  # If the chroot directory is not empty, it can't be removed.
  # A non-empty chroot directory indicates a possible security incident.
  # To support forensics, the non-empty chroot directory is quarantined in
  # a separate directory, called 'chroot-quarantine'.
  _CHROOT_QUARANTINE_DIR = _ROOT_DIR + "/chroot-quarantine"
  # _KEYMAP_DIR must be listed as well, otherwise it is never created
  _DIRS = [_ROOT_DIR, _PIDS_DIR, _UIDS_DIR, _CTRL_DIR, _CONF_DIR, _NICS_DIR,
           _KEYMAP_DIR, _CHROOT_DIR, _CHROOT_QUARANTINE_DIR]
398

    
399
  # Maps every hypervisor parameter accepted by KVM to its validation
  # descriptor: either one of the predefined hv_base checks, a set-membership
  # check built by hv_base.ParamInSet, or an explicit tuple.
  # NOTE(review): the explicit tuples look like (required, check function,
  # error message, ...) -- confirm the exact layout against hv_base.
  PARAMETERS = {
    constants.HV_KERNEL_PATH: hv_base.OPT_FILE_CHECK,
    constants.HV_INITRD_PATH: hv_base.OPT_FILE_CHECK,
    constants.HV_ROOT_PATH: hv_base.NO_CHECK,
    constants.HV_KERNEL_ARGS: hv_base.NO_CHECK,
    constants.HV_ACPI: hv_base.NO_CHECK,
    constants.HV_SERIAL_CONSOLE: hv_base.NO_CHECK,
    # Accepts either an IPv4 address or a normalized absolute path
    constants.HV_VNC_BIND_ADDRESS:
      (False, lambda x: (netutils.IP4Address.IsValid(x) or
                         utils.IsNormAbsPath(x)),
       "the VNC bind address must be either a valid IP address or an absolute"
       " pathname", None, None),
    constants.HV_VNC_TLS: hv_base.NO_CHECK,
    constants.HV_VNC_X509: hv_base.OPT_DIR_CHECK,
    constants.HV_VNC_X509_VERIFY: hv_base.NO_CHECK,
    constants.HV_VNC_PASSWORD_FILE: hv_base.OPT_FILE_CHECK,
    constants.HV_KVM_SPICE_BIND: hv_base.NO_CHECK, # will be checked later
    # Accepts the "no version specified" marker or any valid IP version
    constants.HV_KVM_SPICE_IP_VERSION:
      (False, lambda x: (x == constants.IFACE_NO_IP_VERSION_SPECIFIED or
                         x in constants.VALID_IP_VERSIONS),
       "the SPICE IP version should be 4 or 6",
       None, None),
    constants.HV_KVM_SPICE_PASSWORD_FILE: hv_base.OPT_FILE_CHECK,
    constants.HV_KVM_FLOPPY_IMAGE_PATH: hv_base.OPT_FILE_CHECK,
    constants.HV_CDROM_IMAGE_PATH: hv_base.OPT_FILE_CHECK,
    constants.HV_KVM_CDROM2_IMAGE_PATH: hv_base.OPT_FILE_CHECK,
    constants.HV_BOOT_ORDER:
      hv_base.ParamInSet(True, constants.HT_KVM_VALID_BO_TYPES),
    constants.HV_NIC_TYPE:
      hv_base.ParamInSet(True, constants.HT_KVM_VALID_NIC_TYPES),
    constants.HV_DISK_TYPE:
      hv_base.ParamInSet(True, constants.HT_KVM_VALID_DISK_TYPES),
    constants.HV_KVM_CDROM_DISK_TYPE:
      hv_base.ParamInSet(False, constants.HT_KVM_VALID_DISK_TYPES),
    constants.HV_USB_MOUSE:
      hv_base.ParamInSet(False, constants.HT_KVM_VALID_MOUSE_TYPES),
    constants.HV_KEYMAP: hv_base.NO_CHECK,
    constants.HV_MIGRATION_PORT: hv_base.REQ_NET_PORT_CHECK,
    constants.HV_MIGRATION_BANDWIDTH: hv_base.NO_CHECK,
    constants.HV_MIGRATION_DOWNTIME: hv_base.NO_CHECK,
    constants.HV_MIGRATION_MODE: hv_base.MIGRATION_MODE_CHECK,
    constants.HV_USE_LOCALTIME: hv_base.NO_CHECK,
    constants.HV_DISK_CACHE:
      hv_base.ParamInSet(True, constants.HT_VALID_CACHE_TYPES),
    constants.HV_SECURITY_MODEL:
      hv_base.ParamInSet(True, constants.HT_KVM_VALID_SM_TYPES),
    constants.HV_SECURITY_DOMAIN: hv_base.NO_CHECK,
    constants.HV_KVM_FLAG:
      hv_base.ParamInSet(False, constants.HT_KVM_FLAG_VALUES),
    constants.HV_VHOST_NET: hv_base.NO_CHECK,
    constants.HV_KVM_USE_CHROOT: hv_base.NO_CHECK,
    constants.HV_MEM_PATH: hv_base.OPT_DIR_CHECK,
    constants.HV_REBOOT_BEHAVIOR:
      hv_base.ParamInSet(True, constants.REBOOT_BEHAVIORS)
    }
454

    
455
  _MIGRATION_STATUS_RE = re.compile("Migration\s+status:\s+(\w+)",
456
                                    re.M | re.I)
457
  _MIGRATION_INFO_MAX_BAD_ANSWERS = 5
458
  _MIGRATION_INFO_RETRY_DELAY = 2
459

    
460
  _VERSION_RE = re.compile(r"\b(\d+)\.(\d+)\.(\d+)\b")
461

    
462
  ANCILLARY_FILES = [
463
    _KVM_NETWORK_SCRIPT,
464
    ]
465

    
466
  def __init__(self):
    """Initialise the base hypervisor and ensure the runtime dirs exist.

    The directories are (re)created on every instantiation because the run
    directory may live on a tmpfs filesystem or may have been otherwise
    wiped out.

    """
    hv_base.BaseHypervisor.__init__(self)
    utils.EnsureDirs([(path, constants.RUN_DIRS_MODE)
                      for path in self._DIRS])
472

    
473
  @classmethod
  def _InstancePidFile(cls, instance_name):
    """Returns the path of the pidfile of the given instance.

    @type instance_name: string
    @param instance_name: instance name

    """
    pid_dir = cls._PIDS_DIR
    return utils.PathJoin(pid_dir, instance_name)
479

    
480
  @classmethod
  def _InstanceUidFile(cls, instance_name):
    """Returns the path of the uidfile of the given instance.

    @type instance_name: string
    @param instance_name: instance name

    """
    uid_dir = cls._UIDS_DIR
    return utils.PathJoin(uid_dir, instance_name)
486

    
487
  @classmethod
488
  def _InstancePidInfo(cls, pid):
489
    """Check pid file for instance information.
490

491
    Check that a pid file is associated with an instance, and retrieve
492
    information from its command line.
493

494
    @type pid: string or int
495
    @param pid: process id of the instance to check
496
    @rtype: tuple
497
    @return: (instance_name, memory, vcpus)
498
    @raise errors.HypervisorError: when an instance cannot be found
499

500
    """
501
    alive = utils.IsProcessAlive(pid)
502
    if not alive:
503
      raise errors.HypervisorError("Cannot get info for pid %s" % pid)
504

    
505
    cmdline_file = utils.PathJoin("/proc", str(pid), "cmdline")
506
    try:
507
      cmdline = utils.ReadFile(cmdline_file)
508
    except EnvironmentError, err:
509
      raise errors.HypervisorError("Can't open cmdline file for pid %s: %s" %
510
                                   (pid, err))
511

    
512
    instance = None
513
    memory = 0
514
    vcpus = 0
515

    
516
    arg_list = cmdline.split("\x00")
517
    while arg_list:
518
      arg = arg_list.pop(0)
519
      if arg == "-name":
520
        instance = arg_list.pop(0)
521
      elif arg == "-m":
522
        memory = int(arg_list.pop(0))
523
      elif arg == "-smp":
524
        vcpus = int(arg_list.pop(0))
525

    
526
    if instance is None:
527
      raise errors.HypervisorError("Pid %s doesn't contain a ganeti kvm"
528
                                   " instance" % pid)
529

    
530
    return (instance, memory, vcpus)
531

    
532
  def _InstancePidAlive(self, instance_name):
    """Returns the instance pidfile, pid, and liveness.

    The instance is considered alive only if the process recorded in its
    pidfile can be inspected and was started with the same instance name.

    @type instance_name: string
    @param instance_name: instance name
    @rtype: tuple
    @return: (pid file name, pid, liveness)

    """
    pidfile = self._InstancePidFile(instance_name)
    pid = utils.ReadPidFile(pidfile)

    try:
      running_name = self._InstancePidInfo(pid)[0]
    except errors.HypervisorError:
      # No usable process information: the instance is not running
      alive = False
    else:
      alive = (running_name == instance_name)

    return (pidfile, pid, alive)
552

    
553
  def _CheckDown(self, instance_name):
    """Raises an error unless the given instance is down.

    @type instance_name: string
    @param instance_name: instance name
    @raise errors.HypervisorError: if the instance is alive

    """
    (_, _, alive) = self._InstancePidAlive(instance_name)
    if not alive:
      return

    raise errors.HypervisorError("Failed to start instance %s: %s" %
                                 (instance_name, "already running"))
561

    
562
  @classmethod
  def _InstanceMonitor(cls, instance_name):
    """Returns the name of the monitor socket of the given instance.

    """
    basename = "%s.monitor" % instance_name
    return utils.PathJoin(cls._CTRL_DIR, basename)
568

    
569
  @classmethod
  def _InstanceSerial(cls, instance_name):
    """Returns the name of the serial socket of the given instance.

    """
    basename = "%s.serial" % instance_name
    return utils.PathJoin(cls._CTRL_DIR, basename)
575

    
576
  @classmethod
  def _InstanceQmpMonitor(cls, instance_name):
    """Returns the name of the QMP socket of the given instance.

    """
    basename = "%s.qmp" % instance_name
    return utils.PathJoin(cls._CTRL_DIR, basename)
582

    
583
  @staticmethod
  def _SocatUnixConsoleParams():
    """Returns the terminal parameters to pass to socat.

    When constants.SOCAT_USE_ESCAPE is set (socat is new enough), raw mode
    with an escape character is used; otherwise a plain non-canonical mode
    without echo is used.

    """
    if not constants.SOCAT_USE_ESCAPE:
      return "echo=0,icanon=0"

    return "raw,echo=0,escape=%s" % constants.SOCAT_ESCAPE_CODE
594

    
595
  @classmethod
  def _InstanceKVMRuntime(cls, instance_name):
    """Returns the name of the KVM runtime file of the given instance.

    """
    basename = "%s.runtime" % instance_name
    return utils.PathJoin(cls._CONF_DIR, basename)
601

    
602
  @classmethod
  def _InstanceChrootDir(cls, instance_name):
    """Returns the name of the KVM chroot directory of the given instance.

    """
    chroot_root = cls._CHROOT_DIR
    return utils.PathJoin(chroot_root, instance_name)
608

    
609
  @classmethod
  def _InstanceNICDir(cls, instance_name):
    """Returns the name of the directory holding the tap device files of the
    given instance.

    """
    nics_root = cls._NICS_DIR
    return utils.PathJoin(nics_root, instance_name)
616

    
617
  @classmethod
  def _InstanceNICFile(cls, instance_name, seq):
    """Returns the name of the file containing the tap device for a given NIC

    The file is named after the NIC sequence number and lives in the NIC
    directory of the instance.

    """
    nic_dir = cls._InstanceNICDir(instance_name)
    return utils.PathJoin(nic_dir, str(seq))
623

    
624
  @classmethod
  def _InstanceKeymapFile(cls, instance_name):
    """Returns the name of the file containing the keymap of the given
    instance.

    """
    keymap_root = cls._KEYMAP_DIR
    return utils.PathJoin(keymap_root, instance_name)
630

    
631
  @classmethod
  def _TryReadUidFile(cls, uid_file):
    """Try to read a uid file

    @param uid_file: path of the uid file
    @return: the uid stored in the file as an integer, or None if the file
        does not exist, cannot be read or does not contain an integer

    """
    if not os.path.exists(uid_file):
      return None

    try:
      return int(utils.ReadOneLineFile(uid_file))
    except EnvironmentError:
      logging.warning("Can't read uid file", exc_info=True)
    except (TypeError, ValueError):
      logging.warning("Can't parse uid file contents", exc_info=True)

    # Reached only after one of the failures logged above
    return None
645

    
646
  @classmethod
647
  def _RemoveInstanceRuntimeFiles(cls, pidfile, instance_name):
648
    """Removes an instance's rutime sockets/files/dirs.
649

650
    """
651
    utils.RemoveFile(pidfile)
652
    utils.RemoveFile(cls._InstanceMonitor(instance_name))
653
    utils.RemoveFile(cls._InstanceSerial(instance_name))
654
    utils.RemoveFile(cls._InstanceQmpMonitor(instance_name))
655
    utils.RemoveFile(cls._InstanceKVMRuntime(instance_name))
656
    utils.RemoveFile(cls._InstanceKeymapFile(instance_name))
657
    uid_file = cls._InstanceUidFile(instance_name)
658
    uid = cls._TryReadUidFile(uid_file)
659
    utils.RemoveFile(uid_file)
660
    if uid is not None:
661
      uidpool.ReleaseUid(uid)
662
    try:
663
      shutil.rmtree(cls._InstanceNICDir(instance_name))
664
    except OSError, err:
665
      if err.errno != errno.ENOENT:
666
        raise
667
    try:
668
      chroot_dir = cls._InstanceChrootDir(instance_name)
669
      utils.RemoveDir(chroot_dir)
670
    except OSError, err:
671
      if err.errno == errno.ENOTEMPTY:
672
        # The chroot directory is expected to be empty, but it isn't.
673
        new_chroot_dir = tempfile.mkdtemp(dir=cls._CHROOT_QUARANTINE_DIR,
674
                                          prefix="%s-%s-" %
675
                                          (instance_name,
676
                                           utils.TimestampForFilename()))
677
        logging.warning("The chroot directory of instance %s can not be"
678
                        " removed as it is not empty. Moving it to the"
679
                        " quarantine instead. Please investigate the"
680
                        " contents (%s) and clean up manually",
681
                        instance_name, new_chroot_dir)
682
        utils.RenameFile(chroot_dir, new_chroot_dir)
683
      else:
684
        raise
685

    
686
  @staticmethod
  def _ConfigureNIC(instance, seq, nic, tap):
    """Run the network configuration script for a specified NIC

    The NIC details are handed over to the script through its environment.

    @param instance: instance we're acting on
    @type instance: instance object
    @param seq: nic sequence number
    @type seq: int
    @param nic: nic we're acting on
    @type nic: nic object
    @param tap: the host's tap interface this NIC corresponds to
    @type tap: str
    @raise errors.HypervisorError: if the script fails

    """
    tags = ""
    if instance.tags:
      tags = " ".join(instance.tags)

    env = {
      "PATH": "%s:/sbin:/usr/sbin" % os.environ["PATH"],
      "INSTANCE": instance.name,
      "MAC": nic.mac,
      "MODE": nic.nicparams[constants.NIC_MODE],
      "INTERFACE": tap,
      "INTERFACE_INDEX": str(seq),
      "TAGS": tags,
    }

    # Optional variables, exported only when they carry a value
    if nic.ip:
      env["IP"] = nic.ip

    link = nic.nicparams[constants.NIC_LINK]
    if link:
      env["LINK"] = link

    # In bridged mode the link is exported as the bridge too
    if env["MODE"] == constants.NIC_MODE_BRIDGED:
      env["BRIDGE"] = link

    result = utils.RunCmd([constants.KVM_IFUP, tap], env=env)
    if not result.failed:
      return

    raise errors.HypervisorError("Failed to configure interface %s: %s."
                                 " Network configuration script output: %s" %
                                 (tap, result.fail_reason, result.output))
730

    
731
  def ListInstances(self):
    """Get the list of running instances.

    Every entry of the pid directory is taken as an instance name and kept
    only if the associated kvm process is still alive.

    @rtype: list
    @return: names of the running instances

    """
    return [name for name in os.listdir(self._PIDS_DIR)
            if self._InstancePidAlive(name)[2]]
743

    
744
  def GetInstanceInfo(self, instance_name):
    """Get instance properties.

    @type instance_name: string
    @param instance_name: the instance name
    @rtype: tuple of strings
    @return: (name, id, memory, vcpus, stat, times), or None if the instance
        is not alive

    """
    (_, pid, alive) = self._InstancePidAlive(instance_name)
    if not alive:
      return None

    (_, memory, vcpus) = self._InstancePidInfo(pid)

    # State and cpu time are reported as fixed placeholder values
    return (instance_name, pid, memory, vcpus, "---b-", "0")
762

    
763
  def GetAllInstancesInfo(self):
    """Get properties of all instances.

    Instances whose information cannot be retrieved, or which are not
    alive, are left out of the result.

    @return: list of tuples (name, id, memory, vcpus, stat, times)

    """
    infos = []
    for name in os.listdir(self._PIDS_DIR):
      try:
        info = self.GetInstanceInfo(name)
      except errors.HypervisorError:
        info = None
      if info:
        infos.append(info)
    return infos
778

    
779
  def _GenerateKVMRuntime(self, instance, block_devices, startup_paused):
780
    """Generate KVM information to start an instance.
781

782
    """
783
    _, v_major, v_min, _ = self._GetKVMVersion()
784

    
785
    pidfile = self._InstancePidFile(instance.name)
786
    kvm = constants.KVM_PATH
787
    kvm_cmd = [kvm]
788
    # used just by the vnc server, if enabled
789
    kvm_cmd.extend(["-name", instance.name])
790
    kvm_cmd.extend(["-m", instance.beparams[constants.BE_MEMORY]])
791
    kvm_cmd.extend(["-smp", instance.beparams[constants.BE_VCPUS]])
792
    kvm_cmd.extend(["-pidfile", pidfile])
793
    kvm_cmd.extend(["-daemonize"])
794
    if not instance.hvparams[constants.HV_ACPI]:
795
      kvm_cmd.extend(["-no-acpi"])
796
    if startup_paused:
797
      kvm_cmd.extend(["-S"])
798
    if instance.hvparams[constants.HV_REBOOT_BEHAVIOR] == \
799
        constants.INSTANCE_REBOOT_EXIT:
800
      kvm_cmd.extend(["-no-reboot"])
801

    
802
    hvp = instance.hvparams
803
    boot_disk = hvp[constants.HV_BOOT_ORDER] == constants.HT_BO_DISK
804
    boot_cdrom = hvp[constants.HV_BOOT_ORDER] == constants.HT_BO_CDROM
805
    boot_floppy = hvp[constants.HV_BOOT_ORDER] == constants.HT_BO_FLOPPY
806
    boot_network = hvp[constants.HV_BOOT_ORDER] == constants.HT_BO_NETWORK
807

    
808
    self.ValidateParameters(hvp)
809

    
810
    if hvp[constants.HV_KVM_FLAG] == constants.HT_KVM_ENABLED:
811
      kvm_cmd.extend(["-enable-kvm"])
812
    elif hvp[constants.HV_KVM_FLAG] == constants.HT_KVM_DISABLED:
813
      kvm_cmd.extend(["-disable-kvm"])
814

    
815
    if boot_network:
816
      kvm_cmd.extend(["-boot", "n"])
817

    
818
    disk_type = hvp[constants.HV_DISK_TYPE]
819
    if disk_type == constants.HT_DISK_PARAVIRTUAL:
820
      if_val = ",if=virtio"
821
    else:
822
      if_val = ",if=%s" % disk_type
823
    # Cache mode
824
    disk_cache = hvp[constants.HV_DISK_CACHE]
825
    if instance.disk_template in constants.DTS_EXT_MIRROR:
826
      if disk_cache != "none":
827
        # TODO: make this a hard error, instead of a silent overwrite
828
        logging.warning("KVM: overriding disk_cache setting '%s' with 'none'"
829
                        " to prevent shared storage corruption on migration",
830
                        disk_cache)
831
      cache_val = ",cache=none"
832
    elif disk_cache != constants.HT_CACHE_DEFAULT:
833
      cache_val = ",cache=%s" % disk_cache
834
    else:
835
      cache_val = ""
836
    for cfdev, dev_path in block_devices:
837
      if cfdev.mode != constants.DISK_RDWR:
838
        raise errors.HypervisorError("Instance has read-only disks which"
839
                                     " are not supported by KVM")
840
      # TODO: handle FD_LOOP and FD_BLKTAP (?)
841
      boot_val = ""
842
      if boot_disk:
843
        kvm_cmd.extend(["-boot", "c"])
844
        boot_disk = False
845
        if (v_major, v_min) < (0, 14) and disk_type != constants.HT_DISK_IDE:
846
          boot_val = ",boot=on"
847

    
848
      drive_val = "file=%s,format=raw%s%s%s" % (dev_path, if_val, boot_val,
849
                                                cache_val)
850
      kvm_cmd.extend(["-drive", drive_val])
851

    
852
    #Now we can specify a different device type for CDROM devices.
853
    cdrom_disk_type = hvp[constants.HV_KVM_CDROM_DISK_TYPE]
854
    if not cdrom_disk_type:
855
      cdrom_disk_type = disk_type
856

    
857
    iso_image = hvp[constants.HV_CDROM_IMAGE_PATH]
858
    if iso_image:
859
      options = ",format=raw,media=cdrom"
860
      if boot_cdrom:
861
        kvm_cmd.extend(["-boot", "d"])
862
        if cdrom_disk_type != constants.HT_DISK_IDE:
863
          options = "%s,boot=on,if=%s" % (options, constants.HT_DISK_IDE)
864
        else:
865
          options = "%s,boot=on" % options
866
      else:
867
        if cdrom_disk_type == constants.HT_DISK_PARAVIRTUAL:
868
          if_val = ",if=virtio"
869
        else:
870
          if_val = ",if=%s" % cdrom_disk_type
871
        options = "%s%s" % (options, if_val)
872
      drive_val = "file=%s%s" % (iso_image, options)
873
      kvm_cmd.extend(["-drive", drive_val])
874

    
875
    iso_image2 = hvp[constants.HV_KVM_CDROM2_IMAGE_PATH]
876
    if iso_image2:
877
      options = ",format=raw,media=cdrom"
878
      if cdrom_disk_type == constants.HT_DISK_PARAVIRTUAL:
879
        if_val = ",if=virtio"
880
      else:
881
        if_val = ",if=%s" % cdrom_disk_type
882
      options = "%s%s" % (options, if_val)
883
      drive_val = "file=%s%s" % (iso_image2, options)
884
      kvm_cmd.extend(["-drive", drive_val])
885

    
886
    floppy_image = hvp[constants.HV_KVM_FLOPPY_IMAGE_PATH]
887
    if floppy_image:
888
      options = ",format=raw,media=disk"
889
      if boot_floppy:
890
        kvm_cmd.extend(["-boot", "a"])
891
        options = "%s,boot=on" % options
892
      if_val = ",if=floppy"
893
      options = "%s%s" % (options, if_val)
894
      drive_val = "file=%s%s" % (floppy_image, options)
895
      kvm_cmd.extend(["-drive", drive_val])
896

    
897
    kernel_path = hvp[constants.HV_KERNEL_PATH]
898
    if kernel_path:
899
      kvm_cmd.extend(["-kernel", kernel_path])
900
      initrd_path = hvp[constants.HV_INITRD_PATH]
901
      if initrd_path:
902
        kvm_cmd.extend(["-initrd", initrd_path])
903
      root_append = ["root=%s" % hvp[constants.HV_ROOT_PATH],
904
                     hvp[constants.HV_KERNEL_ARGS]]
905
      if hvp[constants.HV_SERIAL_CONSOLE]:
906
        root_append.append("console=ttyS0,38400")
907
      kvm_cmd.extend(["-append", " ".join(root_append)])
908

    
909
    mem_path = hvp[constants.HV_MEM_PATH]
910
    if mem_path:
911
      kvm_cmd.extend(["-mem-path", mem_path, "-mem-prealloc"])
912

    
913
    mouse_type = hvp[constants.HV_USB_MOUSE]
914
    vnc_bind_address = hvp[constants.HV_VNC_BIND_ADDRESS]
915

    
916
    if mouse_type:
917
      kvm_cmd.extend(["-usb"])
918
      kvm_cmd.extend(["-usbdevice", mouse_type])
919
    elif vnc_bind_address:
920
      kvm_cmd.extend(["-usbdevice", constants.HT_MOUSE_TABLET])
921

    
922
    keymap = hvp[constants.HV_KEYMAP]
923
    if keymap:
924
      keymap_path = self._InstanceKeymapFile(instance.name)
925
      # If a keymap file is specified, KVM won't use its internal defaults. By
926
      # first including the "en-us" layout, an error on loading the actual
927
      # layout (e.g. because it can't be found) won't lead to a non-functional
928
      # keyboard. A keyboard with incorrect keys is still better than none.
929
      utils.WriteFile(keymap_path, data="include en-us\ninclude %s\n" % keymap)
930
      kvm_cmd.extend(["-k", keymap_path])
931

    
932
    if vnc_bind_address:
933
      if netutils.IP4Address.IsValid(vnc_bind_address):
934
        if instance.network_port > constants.VNC_BASE_PORT:
935
          display = instance.network_port - constants.VNC_BASE_PORT
936
          if vnc_bind_address == constants.IP4_ADDRESS_ANY:
937
            vnc_arg = ":%d" % (display)
938
          else:
939
            vnc_arg = "%s:%d" % (vnc_bind_address, display)
940
        else:
941
          logging.error("Network port is not a valid VNC display (%d < %d)."
942
                        " Not starting VNC", instance.network_port,
943
                        constants.VNC_BASE_PORT)
944
          vnc_arg = "none"
945

    
946
        # Only allow tls and other option when not binding to a file, for now.
947
        # kvm/qemu gets confused otherwise about the filename to use.
948
        vnc_append = ""
949
        if hvp[constants.HV_VNC_TLS]:
950
          vnc_append = "%s,tls" % vnc_append
951
          if hvp[constants.HV_VNC_X509_VERIFY]:
952
            vnc_append = "%s,x509verify=%s" % (vnc_append,
953
                                               hvp[constants.HV_VNC_X509])
954
          elif hvp[constants.HV_VNC_X509]:
955
            vnc_append = "%s,x509=%s" % (vnc_append,
956
                                         hvp[constants.HV_VNC_X509])
957
        if hvp[constants.HV_VNC_PASSWORD_FILE]:
958
          vnc_append = "%s,password" % vnc_append
959

    
960
        vnc_arg = "%s%s" % (vnc_arg, vnc_append)
961

    
962
      else:
963
        vnc_arg = "unix:%s/%s.vnc" % (vnc_bind_address, instance.name)
964

    
965
      kvm_cmd.extend(["-vnc", vnc_arg])
966
    else:
967
      kvm_cmd.extend(["-nographic"])
968

    
969
    monitor_dev = ("unix:%s,server,nowait" %
970
                   self._InstanceMonitor(instance.name))
971
    kvm_cmd.extend(["-monitor", monitor_dev])
972
    if hvp[constants.HV_SERIAL_CONSOLE]:
973
      serial_dev = ("unix:%s,server,nowait" %
974
                    self._InstanceSerial(instance.name))
975
      kvm_cmd.extend(["-serial", serial_dev])
976
    else:
977
      kvm_cmd.extend(["-serial", "none"])
978

    
979
    spice_bind = hvp[constants.HV_KVM_SPICE_BIND]
980
    spice_ip_version = None
981
    if spice_bind:
982
      if netutils.IsValidInterface(spice_bind):
983
        # The user specified a network interface, we have to figure out the IP
984
        # address.
985
        addresses = netutils.GetInterfaceIpAddresses(spice_bind)
986
        spice_ip_version = hvp[constants.HV_KVM_SPICE_IP_VERSION]
987

    
988
        # if the user specified an IP version and the interface does not
989
        # have that kind of IP addresses, throw an exception
990
        if spice_ip_version != constants.IFACE_NO_IP_VERSION_SPECIFIED:
991
          if not addresses[spice_ip_version]:
992
            raise errors.HypervisorError("spice: unable to get an IPv%s address"
993
                                         " for %s" % (spice_ip_version,
994
                                                      spice_bind))
995

    
996
        # the user did not specify an IP version, we have to figure it out
997
        elif (addresses[constants.IP4_VERSION] and
998
              addresses[constants.IP6_VERSION]):
999
          # we have both ipv4 and ipv6, let's use the cluster default IP
1000
          # version
1001
          cluster_family = ssconf.SimpleStore().GetPrimaryIPFamily()
1002
          spice_ip_version = netutils.IPAddress.GetVersionFromAddressFamily(
1003
              cluster_family)
1004
        elif addresses[constants.IP4_VERSION]:
1005
          spice_ip_version = constants.IP4_VERSION
1006
        elif addresses[constants.IP6_VERSION]:
1007
          spice_ip_version = constants.IP6_VERSION
1008
        else:
1009
          raise errors.HypervisorError("spice: unable to get an IP address"
1010
                                       " for %s" % (spice_bind))
1011

    
1012
        spice_address = addresses[spice_ip_version][0]
1013

    
1014
      else:
1015
        # spice_bind is known to be a valid IP address, because
1016
        # ValidateParameters checked it.
1017
        spice_address = spice_bind
1018

    
1019
      spice_arg = "addr=%s,port=%s" % (spice_address, instance.network_port)
1020
      if not hvp[constants.HV_KVM_SPICE_PASSWORD_FILE]:
1021
        spice_arg = "%s,disable-ticketing" % spice_arg
1022

    
1023
      if spice_ip_version:
1024
        spice_arg = "%s,ipv%s" % (spice_arg, spice_ip_version)
1025

    
1026
      logging.info("KVM: SPICE will listen on port %s", instance.network_port)
1027
      kvm_cmd.extend(["-spice", spice_arg])
1028

    
1029
      # Tell kvm to use the paravirtualized graphic card, optimized for SPICE
1030
      kvm_cmd.extend(["-vga", "qxl"])
1031

    
1032
    if hvp[constants.HV_USE_LOCALTIME]:
1033
      kvm_cmd.extend(["-localtime"])
1034

    
1035
    if hvp[constants.HV_KVM_USE_CHROOT]:
1036
      kvm_cmd.extend(["-chroot", self._InstanceChrootDir(instance.name)])
1037

    
1038
    # Save the current instance nics, but defer their expansion as parameters,
1039
    # as we'll need to generate executable temp files for them.
1040
    kvm_nics = instance.nics
1041
    hvparams = hvp
1042

    
1043
    return (kvm_cmd, kvm_nics, hvparams)
1044

    
1045
  def _WriteKVMRuntime(self, instance_name, data):
1046
    """Write an instance's KVM runtime
1047

1048
    """
1049
    try:
1050
      utils.WriteFile(self._InstanceKVMRuntime(instance_name),
1051
                      data=data)
1052
    except EnvironmentError, err:
1053
      raise errors.HypervisorError("Failed to save KVM runtime file: %s" % err)
1054

    
1055
  def _ReadKVMRuntime(self, instance_name):
1056
    """Read an instance's KVM runtime
1057

1058
    """
1059
    try:
1060
      file_content = utils.ReadFile(self._InstanceKVMRuntime(instance_name))
1061
    except EnvironmentError, err:
1062
      raise errors.HypervisorError("Failed to load KVM runtime file: %s" % err)
1063
    return file_content
1064

    
1065
  def _SaveKVMRuntime(self, instance, kvm_runtime):
    """Serialize a KVM runtime and store it for the given instance.

    @param instance: instance the runtime belongs to; only its name is used
    @type kvm_runtime: tuple
    @param kvm_runtime: (kvm_cmd, kvm_nics, hvparams) triple; each NIC is
        converted through its C{ToDict} method before being dumped

    """
    (command, nics, runtime_hvp) = kvm_runtime

    nic_dicts = []
    for nic in nics:
      nic_dicts.append(nic.ToDict())

    payload = serializer.Dump((command, nic_dicts, runtime_hvp))
    self._WriteKVMRuntime(instance.name, payload)
1073

    
1074
  def _LoadKVMRuntime(self, instance, serialized_runtime=None):
    """Deserialize the KVM runtime of an instance.

    @param instance: instance the runtime belongs to; its name is used to
        locate the runtime file when no serialized data is passed
    @param serialized_runtime: serialized runtime to decode; if empty or
        None, the runtime file of the instance is read instead
    @rtype: tuple
    @return: (kvm_cmd, kvm_nics, hvparams), with the NICs rebuilt through
        C{objects.NIC.FromDict}

    """
    if serialized_runtime:
      raw_runtime = serialized_runtime
    else:
      raw_runtime = self._ReadKVMRuntime(instance.name)

    (command, nic_dicts, runtime_hvp) = serializer.Load(raw_runtime)

    nics = []
    for nic_dict in nic_dicts:
      nics.append(objects.NIC.FromDict(nic_dict))

    return (command, nics, runtime_hvp)
1084

    
1085
  def _RunKVMCmd(self, name, kvm_cmd, tap_fds=None):
    """Run the KVM cmd and check for errors

    @type name: string
    @param name: instance name
    @type kvm_cmd: list of strings
    @param kvm_cmd: runcmd input for kvm
    @type tap_fds: list of int
    @param tap_fds: fds of tap devices opened by Ganeti; they are always
        closed in this process after the command has been run, whether it
        succeeded or not. May be None or empty when there are no tap devices.
    @raise errors.HypervisorError: if the command failed, or if the instance
        is not reported alive after the command returned

    """
    try:
      result = utils.RunCmd(kvm_cmd, noclose_fds=tap_fds)
    finally:
      # tap_fds defaults to None; iterating over None would raise a TypeError
      # here and hide the real outcome of the command.
      for fd in (tap_fds or []):
        utils_wrapper.CloseFdNoError(fd)

    if result.failed:
      raise errors.HypervisorError("Failed to start instance %s: %s (%s)" %
                                   (name, result.fail_reason, result.output))
    if not self._InstancePidAlive(name)[2]:
      raise errors.HypervisorError("Failed to start instance %s" % name)
1107

    
1108
  def _ExecuteKVMRuntime(self, instance, kvm_runtime, incoming=None):
1109
    """Execute a KVM cmd, after completing it with some last minute data
1110

1111
    @type incoming: tuple of strings
1112
    @param incoming: (target_host_ip, port)
1113

1114
    """
1115
    # Small _ExecuteKVMRuntime hv parameters programming howto:
1116
    #  - conf_hvp contains the parameters as configured on ganeti. they might
1117
    #    have changed since the instance started; only use them if the change
1118
    #    won't affect the inside of the instance (which hasn't been rebooted).
1119
    #  - up_hvp contains the parameters as they were when the instance was
1120
    #    started, plus any new parameter which has been added between ganeti
1121
    #    versions: it is paramount that those default to a value which won't
1122
    #    affect the inside of the instance as well.
1123
    conf_hvp = instance.hvparams
1124
    name = instance.name
1125
    self._CheckDown(name)
1126

    
1127
    temp_files = []
1128

    
1129
    kvm_cmd, kvm_nics, up_hvp = kvm_runtime
1130
    up_hvp = objects.FillDict(conf_hvp, up_hvp)
1131

    
1132
    _, v_major, v_min, _ = self._GetKVMVersion()
1133

    
1134
    # We know it's safe to run as a different user upon migration, so we'll use
1135
    # the latest conf, from conf_hvp.
1136
    security_model = conf_hvp[constants.HV_SECURITY_MODEL]
1137
    if security_model == constants.HT_SM_USER:
1138
      kvm_cmd.extend(["-runas", conf_hvp[constants.HV_SECURITY_DOMAIN]])
1139

    
1140
    # We have reasons to believe changing something like the nic driver/type
1141
    # upon migration won't exactly fly with the instance kernel, so for nic
1142
    # related parameters we'll use up_hvp
1143
    tapfds = []
1144
    taps = []
1145
    if not kvm_nics:
1146
      kvm_cmd.extend(["-net", "none"])
1147
    else:
1148
      vnet_hdr = False
1149
      tap_extra = ""
1150
      nic_type = up_hvp[constants.HV_NIC_TYPE]
1151
      if nic_type == constants.HT_NIC_PARAVIRTUAL:
1152
        # From version 0.12.0, kvm uses a new sintax for network configuration.
1153
        if (v_major, v_min) >= (0, 12):
1154
          nic_model = "virtio-net-pci"
1155
          vnet_hdr = True
1156
        else:
1157
          nic_model = "virtio"
1158

    
1159
        if up_hvp[constants.HV_VHOST_NET]:
1160
          # vhost_net is only available from version 0.13.0 or newer
1161
          if (v_major, v_min) >= (0, 13):
1162
            tap_extra = ",vhost=on"
1163
          else:
1164
            raise errors.HypervisorError("vhost_net is configured"
1165
                                        " but it is not available")
1166
      else:
1167
        nic_model = nic_type
1168

    
1169
      for nic_seq, nic in enumerate(kvm_nics):
1170
        tapname, tapfd = _OpenTap(vnet_hdr)
1171
        tapfds.append(tapfd)
1172
        taps.append(tapname)
1173
        if (v_major, v_min) >= (0, 12):
1174
          nic_val = "%s,mac=%s,netdev=netdev%s" % (nic_model, nic.mac, nic_seq)
1175
          tap_val = "type=tap,id=netdev%s,fd=%d%s" % (nic_seq, tapfd, tap_extra)
1176
          kvm_cmd.extend(["-netdev", tap_val, "-device", nic_val])
1177
        else:
1178
          nic_val = "nic,vlan=%s,macaddr=%s,model=%s" % (nic_seq,
1179
                                                         nic.mac, nic_model)
1180
          tap_val = "tap,vlan=%s,fd=%d" % (nic_seq, tapfd)
1181
          kvm_cmd.extend(["-net", tap_val, "-net", nic_val])
1182

    
1183
    if incoming:
1184
      target, port = incoming
1185
      kvm_cmd.extend(["-incoming", "tcp:%s:%s" % (target, port)])
1186

    
1187
    # Changing the vnc password doesn't bother the guest that much. At most it
1188
    # will surprise people who connect to it. Whether positively or negatively
1189
    # it's debatable.
1190
    vnc_pwd_file = conf_hvp[constants.HV_VNC_PASSWORD_FILE]
1191
    vnc_pwd = None
1192
    if vnc_pwd_file:
1193
      try:
1194
        vnc_pwd = utils.ReadOneLineFile(vnc_pwd_file, strict=True)
1195
      except EnvironmentError, err:
1196
        raise errors.HypervisorError("Failed to open VNC password file %s: %s"
1197
                                     % (vnc_pwd_file, err))
1198

    
1199
    if conf_hvp[constants.HV_KVM_USE_CHROOT]:
1200
      utils.EnsureDirs([(self._InstanceChrootDir(name),
1201
                         constants.SECURE_DIR_MODE)])
1202

    
1203
    # Automatically enable QMP if version is >= 0.14
1204
    if (v_major, v_min) >= (0, 14):
1205
      logging.debug("Enabling QMP")
1206
      kvm_cmd.extend(["-qmp", "unix:%s,server,nowait" %
1207
                    self._InstanceQmpMonitor(instance.name)])
1208

    
1209
    # Configure the network now for starting instances and bridged interfaces,
1210
    # during FinalizeMigration for incoming instances' routed interfaces
1211
    for nic_seq, nic in enumerate(kvm_nics):
1212
      if (incoming and
1213
          nic.nicparams[constants.NIC_MODE] != constants.NIC_MODE_BRIDGED):
1214
        continue
1215
      self._ConfigureNIC(instance, nic_seq, nic, taps[nic_seq])
1216

    
1217
    if security_model == constants.HT_SM_POOL:
1218
      ss = ssconf.SimpleStore()
1219
      uid_pool = uidpool.ParseUidPool(ss.GetUidPool(), separator="\n")
1220
      all_uids = set(uidpool.ExpandUidPool(uid_pool))
1221
      uid = uidpool.RequestUnusedUid(all_uids)
1222
      try:
1223
        username = pwd.getpwuid(uid.GetUid()).pw_name
1224
        kvm_cmd.extend(["-runas", username])
1225
        self._RunKVMCmd(name, kvm_cmd, tapfds)
1226
      except:
1227
        uidpool.ReleaseUid(uid)
1228
        raise
1229
      else:
1230
        uid.Unlock()
1231
        utils.WriteFile(self._InstanceUidFile(name), data=uid.AsStr())
1232
    else:
1233
      self._RunKVMCmd(name, kvm_cmd, tapfds)
1234

    
1235
    utils.EnsureDirs([(self._InstanceNICDir(instance.name),
1236
                     constants.RUN_DIRS_MODE)])
1237
    for nic_seq, tap in enumerate(taps):
1238
      utils.WriteFile(self._InstanceNICFile(instance.name, nic_seq),
1239
                      data=tap)
1240

    
1241
    if vnc_pwd:
1242
      change_cmd = "change vnc password %s" % vnc_pwd
1243
      self._CallMonitorCommand(instance.name, change_cmd)
1244

    
1245
    # Setting SPICE password. We are not vulnerable to malicious passwordless
1246
    # connection attempts because SPICE by default does not allow connections
1247
    # if neither a password nor the "disable_ticketing" options are specified.
1248
    # As soon as we send the password via QMP, that password is a valid ticket
1249
    # for connection.
1250
    spice_password_file = conf_hvp[constants.HV_KVM_SPICE_PASSWORD_FILE]
1251
    if spice_password_file:
1252
      try:
1253
        spice_pwd = utils.ReadOneLineFile(spice_password_file, strict=True)
1254
        qmp = QmpConnection(self._InstanceQmpMonitor(instance.name))
1255
        qmp.connect()
1256
        arguments = {
1257
            "protocol": "spice",
1258
            "password": spice_pwd,
1259
        }
1260
        qmp.Execute("set_password", arguments)
1261
      except EnvironmentError, err:
1262
        raise errors.HypervisorError("Failed to open SPICE password file %s: %s"
1263
                                     % (spice_password_file, err))
1264

    
1265
    for filename in temp_files:
1266
      utils.RemoveFile(filename)
1267

    
1268
  def StartInstance(self, instance, block_devices, startup_paused):
    """Start an instance.

    After checking that the instance is down, a fresh KVM runtime is
    generated, saved and then executed.

    @param instance: instance to be started
    @param block_devices: block devices passed on to the runtime generation
    @param startup_paused: passed on to the runtime generation

    """
    self._CheckDown(instance.name)

    runtime = self._GenerateKVMRuntime(instance, block_devices, startup_paused)
    self._SaveKVMRuntime(instance, runtime)
    self._ExecuteKVMRuntime(instance, runtime)
1277

    
1278
  def _CallMonitorCommand(self, instance_name, command):
    """Send a command to the monitor socket of an instance.

    The shell-quoted command is echoed into socat, which is connected to the
    instance's monitor unix socket.

    @type instance_name: string
    @param instance_name: name of the instance whose monitor is addressed
    @type command: string
    @param command: monitor command to be sent
    @return: the result object of C{utils.RunCmd} for the socat invocation
    @raise errors.HypervisorError: if the invocation is reported as failed

    """
    quoted_command = utils.ShellQuote(command)
    quoted_socket = utils.ShellQuote(self._InstanceMonitor(instance_name))
    shell_cmd = "echo %s | %s STDIO UNIX-CONNECT:%s" % (
      quoted_command, constants.SOCAT_PATH, quoted_socket)

    result = utils.RunCmd(shell_cmd)
    if not result.failed:
      return result

    details = (command, instance_name,
               result.stdout, result.stderr, result.fail_reason)
    raise errors.HypervisorError("Failed to send command '%s' to instance %s."
                                 " output: %s, error: %s, fail_reason: %s" %
                                 details)
1295

    
1296
  @classmethod
  def _GetKVMVersion(cls):
    """Return the installed KVM version.

    The version is parsed, using C{cls._VERSION_RE}, from the first line
    printed by running the KVM binary with C{--help}.

    @return: (version, v_maj, v_min, v_rev)
    @raise L{errors.HypervisorError}: when the KVM version cannot be retrieved

    """
    result = utils.RunCmd([constants.KVM_PATH, "--help"])
    if result.failed:
      raise errors.HypervisorError("Unable to get KVM version")

    # An empty output has no first line; report it like any other unparseable
    # output instead of failing with an IndexError.
    output_lines = result.output.splitlines()
    if not output_lines:
      raise errors.HypervisorError("Unable to get KVM version")

    match = cls._VERSION_RE.search(output_lines[0])
    if not match:
      raise errors.HypervisorError("Unable to get KVM version")

    return (match.group(0), int(match.group(1)), int(match.group(2)),
            int(match.group(3)))
1313

    
1314
  def StopInstance(self, instance, force=False, retry=False, name=None):
    """Stop an instance.

    A running instance is either killed or, when ACPI is enabled and no
    forced stop was requested, asked to power down through the monitor.
    Nothing is done if the instance process is not alive.

    @param instance: instance to stop; used for its name and hvparams when
        C{name} is not given
    @type force: boolean
    @param force: kill the KVM process instead of asking for a power down
    @param retry: not used by this implementation
    @param name: if not None, stop the instance with this name; this is only
        allowed together with C{force}
    @raise errors.HypervisorError: if a name is given without C{force}

    """
    by_name = name is not None
    if by_name and not force:
      raise errors.HypervisorError("Cannot shutdown cleanly by name only")

    if by_name:
      # No instance parameters are consulted in this case
      acpi = False
    else:
      name = instance.name
      acpi = instance.hvparams[constants.HV_ACPI]

    (_, pid, alive) = self._InstancePidAlive(name)
    if not (pid > 0 and alive):
      return

    if acpi and not force:
      self._CallMonitorCommand(name, "system_powerdown")
    else:
      utils.KillProcess(pid)
1331

    
1332
  def CleanupInstance(self, instance_name):
    """Remove the runtime files left behind by a stopped instance.

    @type instance_name: string
    @param instance_name: name of the instance to clean up after
    @raise errors.HypervisorError: if the instance process is still alive

    """
    (pidfile, pid, alive) = self._InstancePidAlive(instance_name)

    still_running = pid > 0 and alive
    if still_running:
      raise errors.HypervisorError("Cannot cleanup a live instance")

    self._RemoveInstanceRuntimeFiles(pidfile, instance_name)
1340

    
1341
  def RebootInstance(self, instance):
    """Reboot an instance.

    The reboot is implemented as a stop followed by a start which reuses the
    KVM runtime the instance was running with.

    @param instance: instance to be rebooted
    @raise errors.HypervisorError: if the instance is not running

    """
    # Sending 'send-key ctrl-alt-delete' to the control socket makes the
    # instance stop without powering up again (for reasons unknown), hence
    # the explicit shutdown and restart below.
    alive = self._InstancePidAlive(instance.name)[2]
    if not alive:
      raise errors.HypervisorError("Failed to reboot instance %s:"
                                   " not running" % instance.name)

    # The saved runtime has to be loaded before stopping the instance, as
    # stopping it will delete the runtime file.
    saved_runtime = self._LoadKVMRuntime(instance)

    # NOTE: StopInstance as defined in this class has no return value, so
    # the forced stop is always issued after the regular one.
    if not self.StopInstance(instance):
      self.StopInstance(instance, force=True)

    # Put the runtime back in place and start the instance from it
    self._SaveKVMRuntime(instance, saved_runtime)
    self._ExecuteKVMRuntime(instance, saved_runtime)
1361

    
1362
  def MigrationInfo(self, instance):
    """Collect the data needed to migrate an instance.

    @type instance: L{objects.Instance}
    @param instance: instance to be migrated
    @rtype: string
    @return: content of the KVM runtime file

    """
    runtime_content = self._ReadKVMRuntime(instance.name)
    return runtime_content
1372

    
1373
  def AcceptInstance(self, instance, info, target):
    """Start KVM in incoming mode, ready to receive a migrating instance.

    @type instance: L{objects.Instance}
    @param instance: instance to be accepted
    @type info: string
    @param info: content of the KVM runtime file on the source node
    @type target: string
    @param target: target host (usually ip), on this node

    """
    runtime = self._LoadKVMRuntime(instance, serialized_runtime=info)
    migration_port = instance.hvparams[constants.HV_MIGRATION_PORT]
    self._ExecuteKVMRuntime(instance, runtime,
                            incoming=(target, migration_port))
1387

    
1388
  def FinalizeMigration(self, instance, info, success):
1389
    """Finalize an instance migration.
1390

1391
    Stop the incoming mode KVM.
1392

1393
    @type instance: L{objects.Instance}
1394
    @param instance: instance whose migration is being finalized
1395

1396
    """
1397
    if success:
1398
      kvm_runtime = self._LoadKVMRuntime(instance, serialized_runtime=info)
1399
      kvm_nics = kvm_runtime[1]
1400

    
1401
      for nic_seq, nic in enumerate(kvm_nics):
1402
        if nic.nicparams[constants.NIC_MODE] == constants.NIC_MODE_BRIDGED:
1403
          # Bridged interfaces have already been configured
1404
          continue
1405
        try:
1406
          tap = utils.ReadFile(self._InstanceNICFile(instance.name, nic_seq))
1407
        except EnvironmentError, err:
1408
          logging.warning("Failed to find host interface for %s NIC #%d: %s",
1409
                          instance.name, nic_seq, str(err))
1410
          continue
1411
        try:
1412
          self._ConfigureNIC(instance, nic_seq, nic, tap)
1413
        except errors.HypervisorError, err:
1414
          logging.warning(str(err))
1415

    
1416
      self._WriteKVMRuntime(instance.name, info)
1417
    else:
1418
      self.StopInstance(instance, force=True)
1419

    
1420
  def MigrateInstance(self, instance, target, live):
    """Migrate an instance to a target node.

    The migration will not be attempted if the instance is not
    currently running. Once started, its status is polled through the
    monitor until it completes or fails; after a completed migration the
    local KVM process is killed and its runtime files are removed.

    @type instance: L{objects.Instance}
    @param instance: the instance to be migrated
    @type target: string
    @param target: ip address of the target node
    @type live: boolean
    @param live: perform a live migration
    @raise errors.HypervisorError: if the instance is not running, if KVM
        reports the migration as failed or cancelled, or if too many
        consecutive status queries cannot be understood

    """
    instance_name = instance.name
    port = instance.hvparams[constants.HV_MIGRATION_PORT]
    (pidfile, pid, alive) = self._InstancePidAlive(instance_name)
    if not alive:
      raise errors.HypervisorError("Instance not running, cannot migrate")

    # A non-live migration pauses the instance first
    if not live:
      self._CallMonitorCommand(instance_name, "stop")

    bandwidth = instance.hvparams[constants.HV_MIGRATION_BANDWIDTH]
    self._CallMonitorCommand(instance_name, "migrate_set_speed %dm" % bandwidth)

    downtime = instance.hvparams[constants.HV_MIGRATION_DOWNTIME]
    self._CallMonitorCommand(instance_name,
                             "migrate_set_downtime %dms" % downtime)

    self._CallMonitorCommand(instance_name,
                             "migrate -d tcp:%s:%s" % (target, port))

    finished = False
    bad_replies = 0
    while not finished:
      reply = self._CallMonitorCommand(instance_name, "info migrate")
      found = self._MIGRATION_STATUS_RE.search(reply.stdout)
      if found:
        status = found.group(1)
        if status == "completed":
          finished = True
        elif status == "active":
          # a good answer resets the count of broken ones
          bad_replies = 0
          time.sleep(self._MIGRATION_INFO_RETRY_DELAY)
        elif status in ("failed", "cancelled"):
          # resume the instance that was paused for the non-live migration
          if not live:
            self._CallMonitorCommand(instance_name, 'cont')
          raise errors.HypervisorError("Migration %s at the kvm level" %
                                       status)
        else:
          logging.warning("KVM: unknown migration status '%s'", status)
          bad_replies += 1
          time.sleep(self._MIGRATION_INFO_RETRY_DELAY)
      else:
        bad_replies += 1
        if reply.stdout:
          logging.warning("KVM: unknown 'info migrate' result: %s",
                          reply.stdout)
        else:
          logging.info("KVM: empty 'info migrate' result")
        time.sleep(self._MIGRATION_INFO_RETRY_DELAY)

      if bad_replies >= self._MIGRATION_INFO_MAX_BAD_ANSWERS:
        raise errors.HypervisorError("Too many 'info migrate' broken answers")

    utils.KillProcess(pid)
    self._RemoveInstanceRuntimeFiles(pidfile, instance_name)
1490

    
1491
  def GetNodeInfo(self):
    """Return information about the node.

    All the work is delegated to the GetLinuxNodeInfo method.

    @return: a dict with the following keys (values in MiB):
          - memory_total: the total memory size on the node
          - memory_free: the available memory on the node for instances
          - memory_dom0: the memory used by the node itself, if available

    """
    node_info = self.GetLinuxNodeInfo()
    return node_info
1503

    
1504
  @classmethod
  def GetInstanceConsole(cls, instance, hvparams, beparams):
    """Describe how to connect to the console of an instance.

    The serial console is preferred, followed by VNC and then SPICE; if
    none of them is usable a console carrying only a message is returned.

    @param instance: instance whose console is requested
    @type hvparams: dict
    @param hvparams: hypervisor parameters used to pick the console type
    @param beparams: not used by this implementation
    @return: an L{objects.InstanceConsole} object

    """
    inst_name = instance.name

    if hvparams[constants.HV_SERIAL_CONSOLE]:
      # socat is run through the console wrapper, attached to the unix
      # socket of the instance's serial port
      wrapper_cmd = [
        constants.KVM_CONSOLE_WRAPPER,
        constants.SOCAT_PATH,
        utils.ShellQuote(inst_name),
        utils.ShellQuote(cls._InstanceMonitor(inst_name)),
        "STDIO,%s" % cls._SocatUnixConsoleParams(),
        "UNIX-CONNECT:%s" % cls._InstanceSerial(inst_name),
        ]
      return objects.InstanceConsole(instance=inst_name,
                                     kind=constants.CONS_SSH,
                                     host=instance.primary_node,
                                     user=constants.GANETI_RUNAS,
                                     command=wrapper_cmd)

    vnc_address = hvparams[constants.HV_VNC_BIND_ADDRESS]
    if vnc_address and instance.network_port > constants.VNC_BASE_PORT:
      vnc_display = instance.network_port - constants.VNC_BASE_PORT
      return objects.InstanceConsole(instance=inst_name,
                                     kind=constants.CONS_VNC,
                                     host=vnc_address,
                                     port=instance.network_port,
                                     display=vnc_display)

    spice_address = hvparams[constants.HV_KVM_SPICE_BIND]
    if spice_address:
      return objects.InstanceConsole(instance=inst_name,
                                     kind=constants.CONS_SPICE,
                                     host=spice_address,
                                     port=instance.network_port)

    fallback_msg = "No serial shell for instance %s" % inst_name
    return objects.InstanceConsole(instance=inst_name,
                                   kind=constants.CONS_MESSAGE,
                                   message=fallback_msg)
1541

    
1542
  def Verify(self):
    """Verify the hypervisor.

    Check that the kvm and socat binaries exist.

    @return: a message describing the first missing binary, or None if both
        are present

    """
    required_binaries = [
      (constants.KVM_PATH, "The kvm binary ('%s') does not exist."),
      (constants.SOCAT_PATH, "The socat binary ('%s') does not exist."),
      ]

    for (path, problem) in required_binaries:
      if not os.path.exists(path):
        return problem % path
1552

    
1553
  @classmethod
  def CheckParameterSyntax(cls, hvparams):
    """Check the mutual consistency of the KVM hypervisor parameters.

    The parent class checks run first; afterwards the relations between
    individual parameters (kernel/root path, VNC x509 settings, boot
    order, security model and SPICE settings) are verified. The first
    violated rule raises.

    @type hvparams:  dict
    @param hvparams: dictionary with parameter names/value
    @raise errors.HypervisorError: when a parameter is not valid

    """
    super(KVMHypervisor, cls).CheckParameterSyntax(hvparams)

    # a kernel path is only accepted together with a root path
    if (hvparams[constants.HV_KERNEL_PATH] and
        not hvparams[constants.HV_ROOT_PATH]):
      raise errors.HypervisorError("Need a root partition for the instance,"
                                   " if a kernel is defined")

    # x509 verification cannot be requested without the x509 setting itself
    if hvparams[constants.HV_VNC_X509_VERIFY]:
      if not hvparams[constants.HV_VNC_X509]:
        raise errors.HypervisorError("%s must be defined, if %s is" %
                                     (constants.HV_VNC_X509,
                                      constants.HV_VNC_X509_VERIFY))

    # booting from cdrom needs an image to boot from
    if hvparams[constants.HV_BOOT_ORDER] == constants.HT_BO_CDROM:
      if not hvparams[constants.HV_CDROM_IMAGE_PATH]:
        raise errors.HypervisorError("Cannot boot from cdrom without an"
                                     " ISO path")

    # the 'user' model requires a security domain, 'none' and 'pool'
    # forbid one; any other model is not checked here
    sec_model = hvparams[constants.HV_SECURITY_MODEL]
    if sec_model == constants.HT_SM_USER:
      if not hvparams[constants.HV_SECURITY_DOMAIN]:
        raise errors.HypervisorError("A security domain (user to run kvm as)"
                                     " must be specified")
    elif sec_model in (constants.HT_SM_NONE, constants.HT_SM_POOL):
      if hvparams[constants.HV_SECURITY_DOMAIN]:
        raise errors.HypervisorError("Cannot have a security domain when the"
                                     " security model is 'none' or 'pool'")

    bind = hvparams[constants.HV_KVM_SPICE_BIND]
    ip_version = hvparams[constants.HV_KVM_SPICE_IP_VERSION]
    if not bind:
      # All the other SPICE parameters depend on the bind parameter being
      # set. Raise an error if any of them is set without it.
      dependent_params = frozenset([
        constants.HV_KVM_SPICE_IP_VERSION,
        constants.HV_KVM_SPICE_PASSWORD_FILE,
        ])
      for name in dependent_params:
        if hvparams[name]:
          raise errors.HypervisorError("spice: %s requires %s to be set" %
                                       (name, constants.HV_KVM_SPICE_BIND))
    elif ip_version != constants.IFACE_NO_IP_VERSION_SPECIFIED:
      # if an IP version is specified and the bind parameter is an IP
      # address, the address must belong to that family
      family_checks = [
        (netutils.IP4Address, constants.IP4_VERSION,
         "spice: got an IPv4 address (%s), but"
         " the specified IP version is %s"),
        (netutils.IP6Address, constants.IP6_VERSION,
         "spice: got an IPv6 address (%s), but"
         " the specified IP version is %s"),
        ]
      for (family, version, message) in family_checks:
        if family.IsValid(bind) and ip_version != version:
          raise errors.HypervisorError(message % (bind, ip_version))
1621

    
1622
  @classmethod
  def ValidateParameters(cls, hvparams):
    """Validate the KVM hypervisor parameters.

    Runs the parent class validation, then checks that the security
    domain user can be looked up via the pwd module and, if SPICE is
    configured, that VNC is not configured as well, that the KVM version
    is at least 0.14 and that the bind parameter is an IP address or a
    valid interface name.

    @type hvparams:  dict
    @param hvparams: dictionary with parameter names/value
    @raise errors.HypervisorError: when a parameter is not valid

    """
    super(KVMHypervisor, cls).ValidateParameters(hvparams)

    if hvparams[constants.HV_SECURITY_MODEL] == constants.HT_SM_USER:
      sec_user = hvparams[constants.HV_SECURITY_DOMAIN]
      try:
        # getpwnam signals an unknown user name with KeyError
        pwd.getpwnam(sec_user)
      except KeyError:
        raise errors.HypervisorError("Unknown security domain user %s"
                                     % sec_user)

    bind = hvparams[constants.HV_KVM_SPICE_BIND]
    if not bind:
      # all remaining checks only apply when SPICE is configured
      return

    # only one of VNC and SPICE can be used currently.
    if hvparams[constants.HV_VNC_BIND_ADDRESS]:
      raise errors.HypervisorError("both SPICE and VNC are configured, but"
                                   " only one of them can be used at a"
                                   " given time.")

    # KVM version should be >= 0.14.0; only the second and third fields of
    # the version tuple are compared
    (_, major, minor, _) = cls._GetKVMVersion()
    if (major, minor) < (0, 14):
      raise errors.HypervisorError("spice is configured, but it is not"
                                   " available in versions of KVM < 0.14")

    # the bind parameter has to be an IPv4 address, an IPv6 address or a
    # valid interface name; the checks short-circuit in that order
    if not (netutils.IP4Address.IsValid(bind) or
            netutils.IP6Address.IsValid(bind) or
            netutils.IsValidInterface(bind)):
      raise errors.HypervisorError("spice: the %s parameter must be either"
                                   " a valid IP address or interface name" %
                                   constants.HV_KVM_SPICE_BIND)
1663

    
1664
  @classmethod
  def PowercycleNode(cls):
    """Powercycle the node.

    KVM needs no special handling here, so this simply delegates to the
    class's LinuxPowercycle method.

    """
    cls.LinuxPowercycle()