Statistics
| Branch: | Tag: | Revision:

root / lib / hypervisor / hv_kvm.py @ b74de5e8

History | View | Annotate | Download (93.8 kB)

1
#
2
#
3

    
4
# Copyright (C) 2008, 2009, 2010, 2011, 2012, 2013 Google Inc.
5
#
6
# This program is free software; you can redistribute it and/or modify
7
# it under the terms of the GNU General Public License as published by
8
# the Free Software Foundation; either version 2 of the License, or
9
# (at your option) any later version.
10
#
11
# This program is distributed in the hope that it will be useful, but
12
# WITHOUT ANY WARRANTY; without even the implied warranty of
13
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
14
# General Public License for more details.
15
#
16
# You should have received a copy of the GNU General Public License
17
# along with this program; if not, write to the Free Software
18
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
19
# 02110-1301, USA.
20

    
21

    
22
"""KVM hypervisor
23

24
"""
25

    
26
import errno
27
import os
28
import os.path
29
import re
30
import tempfile
31
import time
32
import logging
33
import pwd
34
import struct
35
import fcntl
36
import shutil
37
import socket
38
import stat
39
import StringIO
40
from bitarray import bitarray
41
try:
42
  import affinity   # pylint: disable=F0401
43
except ImportError:
44
  affinity = None
45
try:
46
  import fdsend   # pylint: disable=F0401
47
except ImportError:
48
  fdsend = None
49

    
50
from ganeti import utils
51
from ganeti import constants
52
from ganeti import errors
53
from ganeti import serializer
54
from ganeti import objects
55
from ganeti import uidpool
56
from ganeti import ssconf
57
from ganeti import netutils
58
from ganeti import pathutils
59
from ganeti.hypervisor import hv_base
60
from ganeti.utils import wrapper as utils_wrapper
61

    
62

    
63
_KVM_NETWORK_SCRIPT = pathutils.CONF_DIR + "/kvm-vif-bridge"
64
_KVM_START_PAUSED_FLAG = "-S"
65

    
66
# TUN/TAP driver constants, taken from <linux/if_tun.h>
67
# They are architecture-independent and already hardcoded in qemu-kvm source,
68
# so we can safely include them here.
69
TUNSETIFF = 0x400454ca
70
TUNGETIFF = 0x800454d2
71
TUNGETFEATURES = 0x800454cf
72
IFF_TAP = 0x0002
73
IFF_NO_PI = 0x1000
74
IFF_VNET_HDR = 0x4000
75

    
76
#: SPICE parameters which depend on L{constants.HV_KVM_SPICE_BIND}
77
_SPICE_ADDITIONAL_PARAMS = frozenset([
78
  constants.HV_KVM_SPICE_IP_VERSION,
79
  constants.HV_KVM_SPICE_PASSWORD_FILE,
80
  constants.HV_KVM_SPICE_LOSSLESS_IMG_COMPR,
81
  constants.HV_KVM_SPICE_JPEG_IMG_COMPR,
82
  constants.HV_KVM_SPICE_ZLIB_GLZ_IMG_COMPR,
83
  constants.HV_KVM_SPICE_STREAMING_VIDEO_DETECTION,
84
  constants.HV_KVM_SPICE_USE_TLS,
85
  ])
86

    
87
# Constant bitarray that reflects to a free pci slot
88
# Use it with bitarray.search()
89
_AVAILABLE_PCI_SLOT = bitarray("0")
90

    
91
# below constants show the format of runtime file
92
# the nics are in second possition, while the disks in 4th (last)
93
# moreover disk entries are stored in tupples of L{objects.Disk}, dev_path
94
_KVM_NICS_RUNTIME_INDEX = 1
95
_KVM_DISKS_RUNTIME_INDEX = 3
96
_DEVICE_RUNTIME_INDEX = {
97
  constants.HOTPLUG_TARGET_DISK: _KVM_DISKS_RUNTIME_INDEX,
98
  constants.HOTPLUG_TARGET_NIC: _KVM_NICS_RUNTIME_INDEX
99
  }
100
_FIND_RUNTIME_ENTRY = {
101
  constants.HOTPLUG_TARGET_NIC:
102
    lambda nic, kvm_nics: [n for n in kvm_nics if n.uuid == nic.uuid],
103
  constants.HOTPLUG_TARGET_DISK:
104
    lambda disk, kvm_disks: [(d, l) for (d, l) in kvm_disks
105
                             if d.uuid == disk.uuid]
106
  }
107
_RUNTIME_DEVICE = {
108
  constants.HOTPLUG_TARGET_NIC: lambda d: d,
109
  constants.HOTPLUG_TARGET_DISK: lambda (d, e): d
110
  }
111
_RUNTIME_ENTRY = {
112
  constants.HOTPLUG_TARGET_NIC: lambda d, e: d,
113
  constants.HOTPLUG_TARGET_DISK: lambda d, e: (d, e)
114
  }
115

    
116

    
117
def _GenerateDeviceKVMId(dev_type, dev):
118
  """Helper function to generate a unique device name used by KVM
119

120
  QEMU monitor commands use names to identify devices. Here we use their pci
121
  slot and a part of their UUID to name them. dev.pci might be None for old
122
  devices in the cluster.
123

124
  @type dev_type: sting
125
  @param dev_type: device type of param dev
126
  @type dev: L{objects.Disk} or L{objects.NIC}
127
  @param dev: the device object for which we generate a kvm name
128
  @raise errors.HotplugError: in case a device has no pci slot (old devices)
129

130
  """
131

    
132
  if not dev.pci:
133
    raise errors.HotplugError("Hotplug is not supported for %s with UUID %s" %
134
                              (dev_type, dev.uuid))
135

    
136
  return "%s-%s-pci-%d" % (dev_type.lower(), dev.uuid.split("-")[0], dev.pci)
137

    
138

    
139
def _UpdatePCISlots(dev, pci_reservations):
140
  """Update pci configuration for a stopped instance
141

142
  If dev has a pci slot the reserve it, else find first available
143
  in pci_reservations bitarray. It acts on the same objects passed
144
  as params so there is no need to return anything.
145

146
  @type dev: L{objects.Disk} or L{objects.NIC}
147
  @param dev: the device object for which we update its pci slot
148
  @type pci_reservations: bitarray
149
  @param pci_reservations: existing pci reservations for an instance
150
  @raise errors.HotplugError: in case an instance has all its slot occupied
151

152
  """
153
  if dev.pci:
154
    free = dev.pci
155
  else: # pylint: disable=E1103
156
    [free] = pci_reservations.search(_AVAILABLE_PCI_SLOT, 1)
157
    if not free:
158
      raise errors.HypervisorError("All PCI slots occupied")
159
    dev.pci = int(free)
160

    
161
  pci_reservations[free] = True
162

    
163

    
164
def _GetExistingDeviceInfo(dev_type, device, runtime):
165
  """Helper function to get an existing device inside the runtime file
166

167
  Used when an instance is running. Load kvm runtime file and search
168
  for a device based on its type and uuid.
169

170
  @type dev_type: sting
171
  @param dev_type: device type of param dev
172
  @type device: L{objects.Disk} or L{objects.NIC}
173
  @param device: the device object for which we generate a kvm name
174
  @type runtime: tuple (cmd, nics, hvparams, disks)
175
  @param runtime: the runtime data to search for the device
176
  @raise errors.HotplugError: in case the requested device does not
177
    exist (e.g. device has been added without --hotplug option) or
178
    device info has not pci slot (e.g. old devices in the cluster)
179

180
  """
181
  index = _DEVICE_RUNTIME_INDEX[dev_type]
182
  found = _FIND_RUNTIME_ENTRY[dev_type](device, runtime[index])
183
  if not found:
184
    raise errors.HotplugError("Cannot find runtime info for %s with UUID %s" %
185
                              (dev_type, device.uuid))
186

    
187
  return found[0]
188

    
189

    
190
def _GetTunFeatures(fd, _ioctl=fcntl.ioctl):
191
  """Retrieves supported TUN features from file descriptor.
192

193
  @see: L{_ProbeTapVnetHdr}
194

195
  """
196
  req = struct.pack("I", 0)
197
  try:
198
    buf = _ioctl(fd, TUNGETFEATURES, req)
199
  except EnvironmentError, err:
200
    logging.warning("ioctl(TUNGETFEATURES) failed: %s", err)
201
    return None
202
  else:
203
    (flags, ) = struct.unpack("I", buf)
204
    return flags
205

    
206

    
207
def _ProbeTapVnetHdr(fd, _features_fn=_GetTunFeatures):
208
  """Check whether to enable the IFF_VNET_HDR flag.
209

210
  To do this, _all_ of the following conditions must be met:
211
   1. TUNGETFEATURES ioctl() *must* be implemented
212
   2. TUNGETFEATURES ioctl() result *must* contain the IFF_VNET_HDR flag
213
   3. TUNGETIFF ioctl() *must* be implemented; reading the kernel code in
214
      drivers/net/tun.c there is no way to test this until after the tap device
215
      has been created using TUNSETIFF, and there is no way to change the
216
      IFF_VNET_HDR flag after creating the interface, catch-22! However both
217
      TUNGETIFF and TUNGETFEATURES were introduced in kernel version 2.6.27,
218
      thus we can expect TUNGETIFF to be present if TUNGETFEATURES is.
219

220
   @type fd: int
221
   @param fd: the file descriptor of /dev/net/tun
222

223
  """
224
  flags = _features_fn(fd)
225

    
226
  if flags is None:
227
    # Not supported
228
    return False
229

    
230
  result = bool(flags & IFF_VNET_HDR)
231

    
232
  if not result:
233
    logging.warning("Kernel does not support IFF_VNET_HDR, not enabling")
234

    
235
  return result
236

    
237

    
238
def _OpenTap(vnet_hdr=True):
239
  """Open a new tap device and return its file descriptor.
240

241
  This is intended to be used by a qemu-type hypervisor together with the -net
242
  tap,fd=<fd> command line parameter.
243

244
  @type vnet_hdr: boolean
245
  @param vnet_hdr: Enable the VNET Header
246
  @return: (ifname, tapfd)
247
  @rtype: tuple
248

249
  """
250
  try:
251
    tapfd = os.open("/dev/net/tun", os.O_RDWR)
252
  except EnvironmentError:
253
    raise errors.HypervisorError("Failed to open /dev/net/tun")
254

    
255
  flags = IFF_TAP | IFF_NO_PI
256

    
257
  if vnet_hdr and _ProbeTapVnetHdr(tapfd):
258
    flags |= IFF_VNET_HDR
259

    
260
  # The struct ifreq ioctl request (see netdevice(7))
261
  ifr = struct.pack("16sh", "", flags)
262

    
263
  try:
264
    res = fcntl.ioctl(tapfd, TUNSETIFF, ifr)
265
  except EnvironmentError, err:
266
    raise errors.HypervisorError("Failed to allocate a new TAP device: %s" %
267
                                 err)
268

    
269
  # Get the interface name from the ioctl
270
  ifname = struct.unpack("16sh", res)[0].strip("\x00")
271
  return (ifname, tapfd)
272

    
273

    
274
class QmpMessage:
275
  """QEMU Messaging Protocol (QMP) message.
276

277
  """
278
  def __init__(self, data):
279
    """Creates a new QMP message based on the passed data.
280

281
    """
282
    if not isinstance(data, dict):
283
      raise TypeError("QmpMessage must be initialized with a dict")
284

    
285
    self.data = data
286

    
287
  def __getitem__(self, field_name):
288
    """Get the value of the required field if present, or None.
289

290
    Overrides the [] operator to provide access to the message data,
291
    returning None if the required item is not in the message
292
    @return: the value of the field_name field, or None if field_name
293
             is not contained in the message
294

295
    """
296
    return self.data.get(field_name, None)
297

    
298
  def __setitem__(self, field_name, field_value):
299
    """Set the value of the required field_name to field_value.
300

301
    """
302
    self.data[field_name] = field_value
303

    
304
  @staticmethod
305
  def BuildFromJsonString(json_string):
306
    """Build a QmpMessage from a JSON encoded string.
307

308
    @type json_string: str
309
    @param json_string: JSON string representing the message
310
    @rtype: L{QmpMessage}
311
    @return: a L{QmpMessage} built from json_string
312

313
    """
314
    # Parse the string
315
    data = serializer.LoadJson(json_string)
316
    return QmpMessage(data)
317

    
318
  def __str__(self):
319
    # The protocol expects the JSON object to be sent as a single line.
320
    return serializer.DumpJson(self.data)
321

    
322
  def __eq__(self, other):
323
    # When comparing two QmpMessages, we are interested in comparing
324
    # their internal representation of the message data
325
    return self.data == other.data
326

    
327

    
328
class MonitorSocket(object):
329
  _SOCKET_TIMEOUT = 5
330

    
331
  def __init__(self, monitor_filename):
332
    """Instantiates the MonitorSocket object.
333

334
    @type monitor_filename: string
335
    @param monitor_filename: the filename of the UNIX raw socket on which the
336
                             monitor (QMP or simple one) is listening
337

338
    """
339
    self.monitor_filename = monitor_filename
340
    self.sock = socket.socket(socket.AF_UNIX, socket.SOCK_STREAM)
341
    # We want to fail if the server doesn't send a complete message
342
    # in a reasonable amount of time
343
    self.sock.settimeout(self._SOCKET_TIMEOUT)
344
    self._connected = False
345

    
346
  def _check_socket(self):
347
    sock_stat = None
348
    try:
349
      sock_stat = os.stat(self.monitor_filename)
350
    except EnvironmentError, err:
351
      if err.errno == errno.ENOENT:
352
        raise errors.HypervisorError("No monitor socket found")
353
      else:
354
        raise errors.HypervisorError("Error checking monitor socket: %s",
355
                                     utils.ErrnoOrStr(err))
356
    if not stat.S_ISSOCK(sock_stat.st_mode):
357
      raise errors.HypervisorError("Monitor socket is not a socket")
358

    
359
  def _check_connection(self):
360
    """Make sure that the connection is established.
361

362
    """
363
    if not self._connected:
364
      raise errors.ProgrammerError("To use a MonitorSocket you need to first"
365
                                   " invoke connect() on it")
366

    
367
  def connect(self):
368
    """Connects to the monitor.
369

370
    Connects to the UNIX socket
371

372
    @raise errors.HypervisorError: when there are communication errors
373

374
    """
375
    if self._connected:
376
      raise errors.ProgrammerError("Cannot connect twice")
377

    
378
    self._check_socket()
379

    
380
    # Check file existance/stuff
381
    try:
382
      self.sock.connect(self.monitor_filename)
383
    except EnvironmentError:
384
      raise errors.HypervisorError("Can't connect to qmp socket")
385
    self._connected = True
386

    
387
  def close(self):
388
    """Closes the socket
389

390
    It cannot be used after this call.
391

392
    """
393
    self.sock.close()
394

    
395

    
396
class QmpConnection(MonitorSocket):
397
  """Connection to the QEMU Monitor using the QEMU Monitor Protocol (QMP).
398

399
  """
400
  _FIRST_MESSAGE_KEY = "QMP"
401
  _EVENT_KEY = "event"
402
  _ERROR_KEY = "error"
403
  _RETURN_KEY = RETURN_KEY = "return"
404
  _ACTUAL_KEY = ACTUAL_KEY = "actual"
405
  _ERROR_CLASS_KEY = "class"
406
  _ERROR_DATA_KEY = "data"
407
  _ERROR_DESC_KEY = "desc"
408
  _EXECUTE_KEY = "execute"
409
  _ARGUMENTS_KEY = "arguments"
410
  _CAPABILITIES_COMMAND = "qmp_capabilities"
411
  _MESSAGE_END_TOKEN = "\r\n"
412

    
413
  def __init__(self, monitor_filename):
414
    super(QmpConnection, self).__init__(monitor_filename)
415
    self._buf = ""
416

    
417
  def connect(self):
418
    """Connects to the QMP monitor.
419

420
    Connects to the UNIX socket and makes sure that we can actually send and
421
    receive data to the kvm instance via QMP.
422

423
    @raise errors.HypervisorError: when there are communication errors
424
    @raise errors.ProgrammerError: when there are data serialization errors
425

426
    """
427
    super(QmpConnection, self).connect()
428
    # Check if we receive a correct greeting message from the server
429
    # (As per the QEMU Protocol Specification 0.1 - section 2.2)
430
    greeting = self._Recv()
431
    if not greeting[self._FIRST_MESSAGE_KEY]:
432
      self._connected = False
433
      raise errors.HypervisorError("kvm: QMP communication error (wrong"
434
                                   " server greeting")
435

    
436
    # Let's put the monitor in command mode using the qmp_capabilities
437
    # command, or else no command will be executable.
438
    # (As per the QEMU Protocol Specification 0.1 - section 4)
439
    self.Execute(self._CAPABILITIES_COMMAND)
440

    
441
  def _ParseMessage(self, buf):
442
    """Extract and parse a QMP message from the given buffer.
443

444
    Seeks for a QMP message in the given buf. If found, it parses it and
445
    returns it together with the rest of the characters in the buf.
446
    If no message is found, returns None and the whole buffer.
447

448
    @raise errors.ProgrammerError: when there are data serialization errors
449

450
    """
451
    message = None
452
    # Check if we got the message end token (CRLF, as per the QEMU Protocol
453
    # Specification 0.1 - Section 2.1.1)
454
    pos = buf.find(self._MESSAGE_END_TOKEN)
455
    if pos >= 0:
456
      try:
457
        message = QmpMessage.BuildFromJsonString(buf[:pos + 1])
458
      except Exception, err:
459
        raise errors.ProgrammerError("QMP data serialization error: %s" % err)
460
      buf = buf[pos + 1:]
461

    
462
    return (message, buf)
463

    
464
  def _Recv(self):
465
    """Receives a message from QMP and decodes the received JSON object.
466

467
    @rtype: QmpMessage
468
    @return: the received message
469
    @raise errors.HypervisorError: when there are communication errors
470
    @raise errors.ProgrammerError: when there are data serialization errors
471

472
    """
473
    self._check_connection()
474

    
475
    # Check if there is already a message in the buffer
476
    (message, self._buf) = self._ParseMessage(self._buf)
477
    if message:
478
      return message
479

    
480
    recv_buffer = StringIO.StringIO(self._buf)
481
    recv_buffer.seek(len(self._buf))
482
    try:
483
      while True:
484
        data = self.sock.recv(4096)
485
        if not data:
486
          break
487
        recv_buffer.write(data)
488

    
489
        (message, self._buf) = self._ParseMessage(recv_buffer.getvalue())
490
        if message:
491
          return message
492

    
493
    except socket.timeout, err:
494
      raise errors.HypervisorError("Timeout while receiving a QMP message: "
495
                                   "%s" % (err))
496
    except socket.error, err:
497
      raise errors.HypervisorError("Unable to receive data from KVM using the"
498
                                   " QMP protocol: %s" % err)
499

    
500
  def _Send(self, message):
501
    """Encodes and sends a message to KVM using QMP.
502

503
    @type message: QmpMessage
504
    @param message: message to send to KVM
505
    @raise errors.HypervisorError: when there are communication errors
506
    @raise errors.ProgrammerError: when there are data serialization errors
507

508
    """
509
    self._check_connection()
510
    try:
511
      message_str = str(message)
512
    except Exception, err:
513
      raise errors.ProgrammerError("QMP data deserialization error: %s" % err)
514

    
515
    try:
516
      self.sock.sendall(message_str)
517
    except socket.timeout, err:
518
      raise errors.HypervisorError("Timeout while sending a QMP message: "
519
                                   "%s (%s)" % (err.string, err.errno))
520
    except socket.error, err:
521
      raise errors.HypervisorError("Unable to send data from KVM using the"
522
                                   " QMP protocol: %s" % err)
523

    
524
  def Execute(self, command, arguments=None):
525
    """Executes a QMP command and returns the response of the server.
526

527
    @type command: str
528
    @param command: the command to execute
529
    @type arguments: dict
530
    @param arguments: dictionary of arguments to be passed to the command
531
    @rtype: dict
532
    @return: dictionary representing the received JSON object
533
    @raise errors.HypervisorError: when there are communication errors
534
    @raise errors.ProgrammerError: when there are data serialization errors
535

536
    """
537
    self._check_connection()
538
    message = QmpMessage({self._EXECUTE_KEY: command})
539
    if arguments:
540
      message[self._ARGUMENTS_KEY] = arguments
541
    self._Send(message)
542

    
543
    # Events can occur between the sending of the command and the reception
544
    # of the response, so we need to filter out messages with the event key.
545
    while True:
546
      response = self._Recv()
547
      err = response[self._ERROR_KEY]
548
      if err:
549
        raise errors.HypervisorError("kvm: error executing the %s"
550
                                     " command: %s (%s, %s):" %
551
                                     (command,
552
                                      err[self._ERROR_DESC_KEY],
553
                                      err[self._ERROR_CLASS_KEY],
554
                                      err[self._ERROR_DATA_KEY]))
555

    
556
      elif not response[self._EVENT_KEY]:
557
        return response
558

    
559

    
560
class KVMHypervisor(hv_base.BaseHypervisor):
561
  """KVM hypervisor interface
562

563
  """
564
  CAN_MIGRATE = True
565

    
566
  _ROOT_DIR = pathutils.RUN_DIR + "/kvm-hypervisor"
567
  _PIDS_DIR = _ROOT_DIR + "/pid" # contains live instances pids
568
  _UIDS_DIR = _ROOT_DIR + "/uid" # contains instances reserved uids
569
  _CTRL_DIR = _ROOT_DIR + "/ctrl" # contains instances control sockets
570
  _CONF_DIR = _ROOT_DIR + "/conf" # contains instances startup data
571
  _NICS_DIR = _ROOT_DIR + "/nic" # contains instances nic <-> tap associations
572
  _KEYMAP_DIR = _ROOT_DIR + "/keymap" # contains instances keymaps
573
  # KVM instances with chroot enabled are started in empty chroot directories.
574
  _CHROOT_DIR = _ROOT_DIR + "/chroot" # for empty chroot directories
575
  # After an instance is stopped, its chroot directory is removed.
576
  # If the chroot directory is not empty, it can't be removed.
577
  # A non-empty chroot directory indicates a possible security incident.
578
  # To support forensics, the non-empty chroot directory is quarantined in
579
  # a separate directory, called 'chroot-quarantine'.
580
  _CHROOT_QUARANTINE_DIR = _ROOT_DIR + "/chroot-quarantine"
581
  _DIRS = [_ROOT_DIR, _PIDS_DIR, _UIDS_DIR, _CTRL_DIR, _CONF_DIR, _NICS_DIR,
582
           _CHROOT_DIR, _CHROOT_QUARANTINE_DIR, _KEYMAP_DIR]
583

    
584
  PARAMETERS = {
585
    constants.HV_KVM_PATH: hv_base.REQ_FILE_CHECK,
586
    constants.HV_KERNEL_PATH: hv_base.OPT_FILE_CHECK,
587
    constants.HV_INITRD_PATH: hv_base.OPT_FILE_CHECK,
588
    constants.HV_ROOT_PATH: hv_base.NO_CHECK,
589
    constants.HV_KERNEL_ARGS: hv_base.NO_CHECK,
590
    constants.HV_ACPI: hv_base.NO_CHECK,
591
    constants.HV_SERIAL_CONSOLE: hv_base.NO_CHECK,
592
    constants.HV_SERIAL_SPEED: hv_base.NO_CHECK,
593
    constants.HV_VNC_BIND_ADDRESS:
594
      (False, lambda x: (netutils.IP4Address.IsValid(x) or
595
                         utils.IsNormAbsPath(x)),
596
       "The VNC bind address must be either a valid IP address or an absolute"
597
       " pathname", None, None),
598
    constants.HV_VNC_TLS: hv_base.NO_CHECK,
599
    constants.HV_VNC_X509: hv_base.OPT_DIR_CHECK,
600
    constants.HV_VNC_X509_VERIFY: hv_base.NO_CHECK,
601
    constants.HV_VNC_PASSWORD_FILE: hv_base.OPT_FILE_CHECK,
602
    constants.HV_KVM_SPICE_BIND: hv_base.NO_CHECK, # will be checked later
603
    constants.HV_KVM_SPICE_IP_VERSION:
604
      (False, lambda x: (x == constants.IFACE_NO_IP_VERSION_SPECIFIED or
605
                         x in constants.VALID_IP_VERSIONS),
606
       "The SPICE IP version should be 4 or 6",
607
       None, None),
608
    constants.HV_KVM_SPICE_PASSWORD_FILE: hv_base.OPT_FILE_CHECK,
609
    constants.HV_KVM_SPICE_LOSSLESS_IMG_COMPR:
610
      hv_base.ParamInSet(
611
        False, constants.HT_KVM_SPICE_VALID_LOSSLESS_IMG_COMPR_OPTIONS),
612
    constants.HV_KVM_SPICE_JPEG_IMG_COMPR:
613
      hv_base.ParamInSet(
614
        False, constants.HT_KVM_SPICE_VALID_LOSSY_IMG_COMPR_OPTIONS),
615
    constants.HV_KVM_SPICE_ZLIB_GLZ_IMG_COMPR:
616
      hv_base.ParamInSet(
617
        False, constants.HT_KVM_SPICE_VALID_LOSSY_IMG_COMPR_OPTIONS),
618
    constants.HV_KVM_SPICE_STREAMING_VIDEO_DETECTION:
619
      hv_base.ParamInSet(
620
        False, constants.HT_KVM_SPICE_VALID_VIDEO_STREAM_DETECTION_OPTIONS),
621
    constants.HV_KVM_SPICE_AUDIO_COMPR: hv_base.NO_CHECK,
622
    constants.HV_KVM_SPICE_USE_TLS: hv_base.NO_CHECK,
623
    constants.HV_KVM_SPICE_TLS_CIPHERS: hv_base.NO_CHECK,
624
    constants.HV_KVM_SPICE_USE_VDAGENT: hv_base.NO_CHECK,
625
    constants.HV_KVM_FLOPPY_IMAGE_PATH: hv_base.OPT_FILE_CHECK,
626
    constants.HV_CDROM_IMAGE_PATH: hv_base.OPT_FILE_CHECK,
627
    constants.HV_KVM_CDROM2_IMAGE_PATH: hv_base.OPT_FILE_CHECK,
628
    constants.HV_BOOT_ORDER:
629
      hv_base.ParamInSet(True, constants.HT_KVM_VALID_BO_TYPES),
630
    constants.HV_NIC_TYPE:
631
      hv_base.ParamInSet(True, constants.HT_KVM_VALID_NIC_TYPES),
632
    constants.HV_DISK_TYPE:
633
      hv_base.ParamInSet(True, constants.HT_KVM_VALID_DISK_TYPES),
634
    constants.HV_KVM_CDROM_DISK_TYPE:
635
      hv_base.ParamInSet(False, constants.HT_KVM_VALID_DISK_TYPES),
636
    constants.HV_USB_MOUSE:
637
      hv_base.ParamInSet(False, constants.HT_KVM_VALID_MOUSE_TYPES),
638
    constants.HV_KEYMAP: hv_base.NO_CHECK,
639
    constants.HV_MIGRATION_PORT: hv_base.REQ_NET_PORT_CHECK,
640
    constants.HV_MIGRATION_BANDWIDTH: hv_base.REQ_NONNEGATIVE_INT_CHECK,
641
    constants.HV_MIGRATION_DOWNTIME: hv_base.REQ_NONNEGATIVE_INT_CHECK,
642
    constants.HV_MIGRATION_MODE: hv_base.MIGRATION_MODE_CHECK,
643
    constants.HV_USE_LOCALTIME: hv_base.NO_CHECK,
644
    constants.HV_DISK_CACHE:
645
      hv_base.ParamInSet(True, constants.HT_VALID_CACHE_TYPES),
646
    constants.HV_SECURITY_MODEL:
647
      hv_base.ParamInSet(True, constants.HT_KVM_VALID_SM_TYPES),
648
    constants.HV_SECURITY_DOMAIN: hv_base.NO_CHECK,
649
    constants.HV_KVM_FLAG:
650
      hv_base.ParamInSet(False, constants.HT_KVM_FLAG_VALUES),
651
    constants.HV_VHOST_NET: hv_base.NO_CHECK,
652
    constants.HV_KVM_USE_CHROOT: hv_base.NO_CHECK,
653
    constants.HV_MEM_PATH: hv_base.OPT_DIR_CHECK,
654
    constants.HV_REBOOT_BEHAVIOR:
655
      hv_base.ParamInSet(True, constants.REBOOT_BEHAVIORS),
656
    constants.HV_CPU_MASK: hv_base.OPT_MULTI_CPU_MASK_CHECK,
657
    constants.HV_CPU_TYPE: hv_base.NO_CHECK,
658
    constants.HV_CPU_CORES: hv_base.OPT_NONNEGATIVE_INT_CHECK,
659
    constants.HV_CPU_THREADS: hv_base.OPT_NONNEGATIVE_INT_CHECK,
660
    constants.HV_CPU_SOCKETS: hv_base.OPT_NONNEGATIVE_INT_CHECK,
661
    constants.HV_SOUNDHW: hv_base.NO_CHECK,
662
    constants.HV_USB_DEVICES: hv_base.NO_CHECK,
663
    constants.HV_VGA: hv_base.NO_CHECK,
664
    constants.HV_KVM_EXTRA: hv_base.NO_CHECK,
665
    constants.HV_KVM_MACHINE_VERSION: hv_base.NO_CHECK,
666
    constants.HV_VNET_HDR: hv_base.NO_CHECK,
667
    }
668

    
669
  _VIRTIO = "virtio"
670
  _VIRTIO_NET_PCI = "virtio-net-pci"
671
  _VIRTIO_BLK_PCI = "virtio-blk-pci"
672

    
673
  _MIGRATION_STATUS_RE = re.compile("Migration\s+status:\s+(\w+)",
674
                                    re.M | re.I)
675
  _MIGRATION_PROGRESS_RE = \
676
    re.compile(r"\s*transferred\s+ram:\s+(?P<transferred>\d+)\s+kbytes\s*\n"
677
               r"\s*remaining\s+ram:\s+(?P<remaining>\d+)\s+kbytes\s*\n"
678
               r"\s*total\s+ram:\s+(?P<total>\d+)\s+kbytes\s*\n", re.I)
679

    
680
  _MIGRATION_INFO_MAX_BAD_ANSWERS = 5
681
  _MIGRATION_INFO_RETRY_DELAY = 2
682

    
683
  _VERSION_RE = re.compile(r"\b(\d+)\.(\d+)(\.(\d+))?\b")
684

    
685
  _CPU_INFO_RE = re.compile(r"cpu\s+\#(\d+).*thread_id\s*=\s*(\d+)", re.I)
686
  _CPU_INFO_CMD = "info cpus"
687
  _CONT_CMD = "cont"
688

    
689
  _DEFAULT_MACHINE_VERSION_RE = re.compile(r"^(\S+).*\(default\)", re.M)
690
  _CHECK_MACHINE_VERSION_RE = \
691
    staticmethod(lambda x: re.compile(r"^(%s)[ ]+.*PC" % x, re.M))
692

    
693
  _QMP_RE = re.compile(r"^-qmp\s", re.M)
694
  _SPICE_RE = re.compile(r"^-spice\s", re.M)
695
  _VHOST_RE = re.compile(r"^-net\s.*,vhost=on|off", re.M)
696
  _ENABLE_KVM_RE = re.compile(r"^-enable-kvm\s", re.M)
697
  _DISABLE_KVM_RE = re.compile(r"^-disable-kvm\s", re.M)
698
  _NETDEV_RE = re.compile(r"^-netdev\s", re.M)
699
  _DISPLAY_RE = re.compile(r"^-display\s", re.M)
700
  _MACHINE_RE = re.compile(r"^-machine\s", re.M)
701
  _VIRTIO_NET_RE = re.compile(r"^name \"%s\"" % _VIRTIO_NET_PCI, re.M)
702
  _VIRTIO_BLK_RE = re.compile(r"^name \"%s\"" % _VIRTIO_BLK_PCI, re.M)
703
  # match  -drive.*boot=on|off on different lines, but in between accept only
704
  # dashes not preceeded by a new line (which would mean another option
705
  # different than -drive is starting)
706
  _BOOT_RE = re.compile(r"^-drive\s([^-]|(?<!^)-)*,boot=on\|off", re.M | re.S)
707

    
708
  _INFO_PCI_RE = re.compile(r'Bus.*device[ ]*(\d+).*')
709
  _INFO_PCI_CMD = "info pci"
710
  _INFO_VERSION_RE = \
711
    re.compile(r'^QEMU (\d+)\.(\d+)(\.(\d+))?.*monitor.*', re.M)
712
  _INFO_VERSION_CMD = "info version"
713

    
714
  _DEFAULT_PCI_RESERVATIONS = "11110000000000000000000000000000"
715

    
716
  ANCILLARY_FILES = [
717
    _KVM_NETWORK_SCRIPT,
718
    ]
719
  ANCILLARY_FILES_OPT = [
720
    _KVM_NETWORK_SCRIPT,
721
    ]
722

    
723
  # Supported kvm options to get output from
724
  _KVMOPT_HELP = "help"
725
  _KVMOPT_MLIST = "mlist"
726
  _KVMOPT_DEVICELIST = "devicelist"
727

    
728
  # Command to execute to get the output from kvm, and whether to
729
  # accept the output even on failure.
730
  _KVMOPTS_CMDS = {
731
    _KVMOPT_HELP: (["--help"], False),
732
    _KVMOPT_MLIST: (["-M", "?"], False),
733
    _KVMOPT_DEVICELIST: (["-device", "?"], True),
734
  }
735

    
736
  def __init__(self):
737
    hv_base.BaseHypervisor.__init__(self)
738
    # Let's make sure the directories we need exist, even if the RUN_DIR lives
739
    # in a tmpfs filesystem or has been otherwise wiped out.
740
    dirs = [(dname, constants.RUN_DIRS_MODE) for dname in self._DIRS]
741
    utils.EnsureDirs(dirs)
742

    
743
  @classmethod
744
  def _InstancePidFile(cls, instance_name):
745
    """Returns the instance pidfile.
746

747
    """
748
    return utils.PathJoin(cls._PIDS_DIR, instance_name)
749

    
750
  @classmethod
751
  def _InstanceUidFile(cls, instance_name):
752
    """Returns the instance uidfile.
753

754
    """
755
    return utils.PathJoin(cls._UIDS_DIR, instance_name)
756

    
757
  @classmethod
758
  def _InstancePidInfo(cls, pid):
759
    """Check pid file for instance information.
760

761
    Check that a pid file is associated with an instance, and retrieve
762
    information from its command line.
763

764
    @type pid: string or int
765
    @param pid: process id of the instance to check
766
    @rtype: tuple
767
    @return: (instance_name, memory, vcpus)
768
    @raise errors.HypervisorError: when an instance cannot be found
769

770
    """
771
    alive = utils.IsProcessAlive(pid)
772
    if not alive:
773
      raise errors.HypervisorError("Cannot get info for pid %s" % pid)
774

    
775
    cmdline_file = utils.PathJoin("/proc", str(pid), "cmdline")
776
    try:
777
      cmdline = utils.ReadFile(cmdline_file)
778
    except EnvironmentError, err:
779
      raise errors.HypervisorError("Can't open cmdline file for pid %s: %s" %
780
                                   (pid, err))
781

    
782
    instance = None
783
    memory = 0
784
    vcpus = 0
785

    
786
    arg_list = cmdline.split("\x00")
787
    while arg_list:
788
      arg = arg_list.pop(0)
789
      if arg == "-name":
790
        instance = arg_list.pop(0)
791
      elif arg == "-m":
792
        memory = int(arg_list.pop(0))
793
      elif arg == "-smp":
794
        vcpus = int(arg_list.pop(0).split(",")[0])
795

    
796
    if instance is None:
797
      raise errors.HypervisorError("Pid %s doesn't contain a ganeti kvm"
798
                                   " instance" % pid)
799

    
800
    return (instance, memory, vcpus)
801

    
802
  def _InstancePidAlive(self, instance_name):
803
    """Returns the instance pidfile, pid, and liveness.
804

805
    @type instance_name: string
806
    @param instance_name: instance name
807
    @rtype: tuple
808
    @return: (pid file name, pid, liveness)
809

810
    """
811
    pidfile = self._InstancePidFile(instance_name)
812
    pid = utils.ReadPidFile(pidfile)
813

    
814
    alive = False
815
    try:
816
      cmd_instance = self._InstancePidInfo(pid)[0]
817
      alive = (cmd_instance == instance_name)
818
    except errors.HypervisorError:
819
      pass
820

    
821
    return (pidfile, pid, alive)
822

    
823
  def _CheckDown(self, instance_name):
824
    """Raises an error unless the given instance is down.
825

826
    """
827
    alive = self._InstancePidAlive(instance_name)[2]
828
    if alive:
829
      raise errors.HypervisorError("Failed to start instance %s: %s" %
830
                                   (instance_name, "already running"))
831

    
832
  @classmethod
833
  def _InstanceMonitor(cls, instance_name):
834
    """Returns the instance monitor socket name
835

836
    """
837
    return utils.PathJoin(cls._CTRL_DIR, "%s.monitor" % instance_name)
838

    
839
  @classmethod
840
  def _InstanceSerial(cls, instance_name):
841
    """Returns the instance serial socket name
842

843
    """
844
    return utils.PathJoin(cls._CTRL_DIR, "%s.serial" % instance_name)
845

    
846
  @classmethod
847
  def _InstanceQmpMonitor(cls, instance_name):
848
    """Returns the instance serial QMP socket name
849

850
    """
851
    return utils.PathJoin(cls._CTRL_DIR, "%s.qmp" % instance_name)
852

    
853
  @staticmethod
854
  def _SocatUnixConsoleParams():
855
    """Returns the correct parameters for socat
856

857
    If we have a new-enough socat we can use raw mode with an escape character.
858

859
    """
860
    if constants.SOCAT_USE_ESCAPE:
861
      return "raw,echo=0,escape=%s" % constants.SOCAT_ESCAPE_CODE
862
    else:
863
      return "echo=0,icanon=0"
864

    
865
  @classmethod
866
  def _InstanceKVMRuntime(cls, instance_name):
867
    """Returns the instance KVM runtime filename
868

869
    """
870
    return utils.PathJoin(cls._CONF_DIR, "%s.runtime" % instance_name)
871

    
872
  @classmethod
873
  def _InstanceChrootDir(cls, instance_name):
874
    """Returns the name of the KVM chroot dir of the instance
875

876
    """
877
    return utils.PathJoin(cls._CHROOT_DIR, instance_name)
878

    
879
  @classmethod
880
  def _InstanceNICDir(cls, instance_name):
881
    """Returns the name of the directory holding the tap device files for a
882
    given instance.
883

884
    """
885
    return utils.PathJoin(cls._NICS_DIR, instance_name)
886

    
887
  @classmethod
888
  def _InstanceNICFile(cls, instance_name, seq):
889
    """Returns the name of the file containing the tap device for a given NIC
890

891
    """
892
    return utils.PathJoin(cls._InstanceNICDir(instance_name), str(seq))
893

    
894
  @classmethod
895
  def _InstanceKeymapFile(cls, instance_name):
896
    """Returns the name of the file containing the keymap for a given instance
897

898
    """
899
    return utils.PathJoin(cls._KEYMAP_DIR, instance_name)
900

    
901
  @classmethod
902
  def _TryReadUidFile(cls, uid_file):
903
    """Try to read a uid file
904

905
    """
906
    if os.path.exists(uid_file):
907
      try:
908
        uid = int(utils.ReadOneLineFile(uid_file))
909
        return uid
910
      except EnvironmentError:
911
        logging.warning("Can't read uid file", exc_info=True)
912
      except (TypeError, ValueError):
913
        logging.warning("Can't parse uid file contents", exc_info=True)
914
    return None
915

    
916
  @classmethod
917
  def _RemoveInstanceRuntimeFiles(cls, pidfile, instance_name):
918
    """Removes an instance's rutime sockets/files/dirs.
919

920
    """
921
    utils.RemoveFile(pidfile)
922
    utils.RemoveFile(cls._InstanceMonitor(instance_name))
923
    utils.RemoveFile(cls._InstanceSerial(instance_name))
924
    utils.RemoveFile(cls._InstanceQmpMonitor(instance_name))
925
    utils.RemoveFile(cls._InstanceKVMRuntime(instance_name))
926
    utils.RemoveFile(cls._InstanceKeymapFile(instance_name))
927
    uid_file = cls._InstanceUidFile(instance_name)
928
    uid = cls._TryReadUidFile(uid_file)
929
    utils.RemoveFile(uid_file)
930
    if uid is not None:
931
      uidpool.ReleaseUid(uid)
932
    try:
933
      shutil.rmtree(cls._InstanceNICDir(instance_name))
934
    except OSError, err:
935
      if err.errno != errno.ENOENT:
936
        raise
937
    try:
938
      chroot_dir = cls._InstanceChrootDir(instance_name)
939
      utils.RemoveDir(chroot_dir)
940
    except OSError, err:
941
      if err.errno == errno.ENOTEMPTY:
942
        # The chroot directory is expected to be empty, but it isn't.
943
        new_chroot_dir = tempfile.mkdtemp(dir=cls._CHROOT_QUARANTINE_DIR,
944
                                          prefix="%s-%s-" %
945
                                          (instance_name,
946
                                           utils.TimestampForFilename()))
947
        logging.warning("The chroot directory of instance %s can not be"
948
                        " removed as it is not empty. Moving it to the"
949
                        " quarantine instead. Please investigate the"
950
                        " contents (%s) and clean up manually",
951
                        instance_name, new_chroot_dir)
952
        utils.RenameFile(chroot_dir, new_chroot_dir)
953
      else:
954
        raise
955

    
956
  @staticmethod
957
  def _ConfigureNIC(instance, seq, nic, tap):
958
    """Run the network configuration script for a specified NIC
959

960
    @param instance: instance we're acting on
961
    @type instance: instance object
962
    @param seq: nic sequence number
963
    @type seq: int
964
    @param nic: nic we're acting on
965
    @type nic: nic object
966
    @param tap: the host's tap interface this NIC corresponds to
967
    @type tap: str
968

969
    """
970
    if instance.tags:
971
      tags = " ".join(instance.tags)
972
    else:
973
      tags = ""
974

    
975
    env = {
976
      "PATH": "%s:/sbin:/usr/sbin" % os.environ["PATH"],
977
      "INSTANCE": instance.name,
978
      "MAC": nic.mac,
979
      "MODE": nic.nicparams[constants.NIC_MODE],
980
      "INTERFACE": tap,
981
      "INTERFACE_INDEX": str(seq),
982
      "TAGS": tags,
983
    }
984

    
985
    if nic.ip:
986
      env["IP"] = nic.ip
987

    
988
    if nic.nicparams[constants.NIC_LINK]:
989
      env["LINK"] = nic.nicparams[constants.NIC_LINK]
990

    
991
    if nic.network:
992
      n = objects.Network.FromDict(nic.netinfo)
993
      env.update(n.HooksDict())
994

    
995
    if nic.nicparams[constants.NIC_MODE] == constants.NIC_MODE_BRIDGED:
996
      env["BRIDGE"] = nic.nicparams[constants.NIC_LINK]
997

    
998
    result = utils.RunCmd([pathutils.KVM_IFUP, tap], env=env)
999
    if result.failed:
1000
      raise errors.HypervisorError("Failed to configure interface %s: %s;"
1001
                                   " network configuration script output: %s" %
1002
                                   (tap, result.fail_reason, result.output))
1003

    
1004
  @staticmethod
1005
  def _VerifyAffinityPackage():
1006
    if affinity is None:
1007
      raise errors.HypervisorError("affinity Python package not"
1008
                                   " found; cannot use CPU pinning under KVM")
1009

    
1010
  @staticmethod
1011
  def _BuildAffinityCpuMask(cpu_list):
1012
    """Create a CPU mask suitable for sched_setaffinity from a list of
1013
    CPUs.
1014

1015
    See man taskset for more info on sched_setaffinity masks.
1016
    For example: [ 0, 2, 5, 6 ] will return 101 (0x65, 0..01100101).
1017

1018
    @type cpu_list: list of int
1019
    @param cpu_list: list of physical CPU numbers to map to vCPUs in order
1020
    @rtype: int
1021
    @return: a bit mask of CPU affinities
1022

1023
    """
1024
    if cpu_list == constants.CPU_PINNING_OFF:
1025
      return constants.CPU_PINNING_ALL_KVM
1026
    else:
1027
      return sum(2 ** cpu for cpu in cpu_list)
1028

    
1029
  @classmethod
1030
  def _AssignCpuAffinity(cls, cpu_mask, process_id, thread_dict):
1031
    """Change CPU affinity for running VM according to given CPU mask.
1032

1033
    @param cpu_mask: CPU mask as given by the user. e.g. "0-2,4:all:1,3"
1034
    @type cpu_mask: string
1035
    @param process_id: process ID of KVM process. Used to pin entire VM
1036
                       to physical CPUs.
1037
    @type process_id: int
1038
    @param thread_dict: map of virtual CPUs to KVM thread IDs
1039
    @type thread_dict: dict int:int
1040

1041
    """
1042
    # Convert the string CPU mask to a list of list of int's
1043
    cpu_list = utils.ParseMultiCpuMask(cpu_mask)
1044

    
1045
    if len(cpu_list) == 1:
1046
      all_cpu_mapping = cpu_list[0]
1047
      if all_cpu_mapping == constants.CPU_PINNING_OFF:
1048
        # If CPU pinning has 1 entry that's "all", then do nothing
1049
        pass
1050
      else:
1051
        # If CPU pinning has one non-all entry, map the entire VM to
1052
        # one set of physical CPUs
1053
        cls._VerifyAffinityPackage()
1054
        affinity.set_process_affinity_mask(
1055
          process_id, cls._BuildAffinityCpuMask(all_cpu_mapping))
1056
    else:
1057
      # The number of vCPUs mapped should match the number of vCPUs
1058
      # reported by KVM. This was already verified earlier, so
1059
      # here only as a sanity check.
1060
      assert len(thread_dict) == len(cpu_list)
1061
      cls._VerifyAffinityPackage()
1062

    
1063
      # For each vCPU, map it to the proper list of physical CPUs
1064
      for vcpu, i in zip(cpu_list, range(len(cpu_list))):
1065
        affinity.set_process_affinity_mask(thread_dict[i],
1066
                                           cls._BuildAffinityCpuMask(vcpu))
1067

    
1068
  def _GetVcpuThreadIds(self, instance_name):
1069
    """Get a mapping of vCPU no. to thread IDs for the instance
1070

1071
    @type instance_name: string
1072
    @param instance_name: instance in question
1073
    @rtype: dictionary of int:int
1074
    @return: a dictionary mapping vCPU numbers to thread IDs
1075

1076
    """
1077
    result = {}
1078
    output = self._CallMonitorCommand(instance_name, self._CPU_INFO_CMD)
1079
    for line in output.stdout.splitlines():
1080
      match = self._CPU_INFO_RE.search(line)
1081
      if not match:
1082
        continue
1083
      grp = map(int, match.groups())
1084
      result[grp[0]] = grp[1]
1085

    
1086
    return result
1087

    
1088
  def _ExecuteCpuAffinity(self, instance_name, cpu_mask):
1089
    """Complete CPU pinning.
1090

1091
    @type instance_name: string
1092
    @param instance_name: name of instance
1093
    @type cpu_mask: string
1094
    @param cpu_mask: CPU pinning mask as entered by user
1095

1096
    """
1097
    # Get KVM process ID, to be used if need to pin entire VM
1098
    _, pid, _ = self._InstancePidAlive(instance_name)
1099
    # Get vCPU thread IDs, to be used if need to pin vCPUs separately
1100
    thread_dict = self._GetVcpuThreadIds(instance_name)
1101
    # Run CPU pinning, based on configured mask
1102
    self._AssignCpuAffinity(cpu_mask, pid, thread_dict)
1103

    
1104
  def ListInstances(self):
1105
    """Get the list of running instances.
1106

1107
    We can do this by listing our live instances directory and
1108
    checking whether the associated kvm process is still alive.
1109

1110
    """
1111
    result = []
1112
    for name in os.listdir(self._PIDS_DIR):
1113
      if self._InstancePidAlive(name)[2]:
1114
        result.append(name)
1115
    return result
1116

    
1117
  def GetInstanceInfo(self, instance_name):
1118
    """Get instance properties.
1119

1120
    @type instance_name: string
1121
    @param instance_name: the instance name
1122
    @rtype: tuple of strings
1123
    @return: (name, id, memory, vcpus, stat, times)
1124

1125
    """
1126
    _, pid, alive = self._InstancePidAlive(instance_name)
1127
    if not alive:
1128
      return None
1129

    
1130
    _, memory, vcpus = self._InstancePidInfo(pid)
1131
    istat = "---b-"
1132
    times = "0"
1133

    
1134
    try:
1135
      qmp = QmpConnection(self._InstanceQmpMonitor(instance_name))
1136
      qmp.connect()
1137
      vcpus = len(qmp.Execute("query-cpus")[qmp.RETURN_KEY])
1138
      # Will fail if ballooning is not enabled, but we can then just resort to
1139
      # the value above.
1140
      mem_bytes = qmp.Execute("query-balloon")[qmp.RETURN_KEY][qmp.ACTUAL_KEY]
1141
      memory = mem_bytes / 1048576
1142
    except errors.HypervisorError:
1143
      pass
1144

    
1145
    return (instance_name, pid, memory, vcpus, istat, times)
1146

    
1147
  def GetAllInstancesInfo(self):
1148
    """Get properties of all instances.
1149

1150
    @return: list of tuples (name, id, memory, vcpus, stat, times)
1151

1152
    """
1153
    data = []
1154
    for name in os.listdir(self._PIDS_DIR):
1155
      try:
1156
        info = self.GetInstanceInfo(name)
1157
      except errors.HypervisorError:
1158
        # Ignore exceptions due to instances being shut down
1159
        continue
1160
      if info:
1161
        data.append(info)
1162
    return data
1163

    
1164
  def _GenerateKVMBlockDevicesOptions(self, instance, block_devices,
1165
                                      kvmhelp, devlist):
1166
    """Generate KVM options regarding instance's block devices.
1167

1168
    @type instance: L{objects.Instance}
1169
    @param instance: the instance object
1170
    @type block_devices: list of tuples
1171
    @param block_devices: list of tuples [(disk, link_name)..]
1172
    @type kvmhelp: string
1173
    @param kvmhelp: output of kvm --help
1174
    @type devlist: string
1175
    @param devlist: output of kvm -device ?
1176
    @rtype: list
1177
    @return: list of command line options eventually used by kvm executable
1178

1179
    """
1180
    hvp = instance.hvparams
1181
    kernel_path = hvp[constants.HV_KERNEL_PATH]
1182
    if kernel_path:
1183
      boot_disk = False
1184
    else:
1185
      boot_disk = hvp[constants.HV_BOOT_ORDER] == constants.HT_BO_DISK
1186
    kvm_path = hvp[constants.HV_KVM_PATH]
1187

    
1188
    # whether this is an older KVM version that uses the boot=on flag
1189
    # on devices
1190
    needs_boot_flag = self._BOOT_RE.search(kvmhelp)
1191

    
1192
    dev_opts = []
1193
    device_driver = None
1194
    disk_type = hvp[constants.HV_DISK_TYPE]
1195
    if disk_type == constants.HT_DISK_PARAVIRTUAL:
1196
      if_val = ",if=%s" % self._VIRTIO
1197
      try:
1198
        if self._VIRTIO_BLK_RE.search(devlist):
1199
          if_val = ",if=none"
1200
          # will be passed in -device option as driver
1201
          device_driver = self._VIRTIO_BLK_PCI
1202
      except errors.HypervisorError, _:
1203
        pass
1204
    else:
1205
      if_val = ",if=%s" % disk_type
1206
    # Cache mode
1207
    disk_cache = hvp[constants.HV_DISK_CACHE]
1208
    if instance.disk_template in constants.DTS_EXT_MIRROR:
1209
      if disk_cache != "none":
1210
        # TODO: make this a hard error, instead of a silent overwrite
1211
        logging.warning("KVM: overriding disk_cache setting '%s' with 'none'"
1212
                        " to prevent shared storage corruption on migration",
1213
                        disk_cache)
1214
      cache_val = ",cache=none"
1215
    elif disk_cache != constants.HT_CACHE_DEFAULT:
1216
      cache_val = ",cache=%s" % disk_cache
1217
    else:
1218
      cache_val = ""
1219
    for cfdev, dev_path in block_devices:
1220
      if cfdev.mode != constants.DISK_RDWR:
1221
        raise errors.HypervisorError("Instance has read-only disks which"
1222
                                     " are not supported by KVM")
1223
      # TODO: handle FD_LOOP and FD_BLKTAP (?)
1224
      boot_val = ""
1225
      if boot_disk:
1226
        dev_opts.extend(["-boot", "c"])
1227
        boot_disk = False
1228
        if needs_boot_flag and disk_type != constants.HT_DISK_IDE:
1229
          boot_val = ",boot=on"
1230
      drive_val = "file=%s,format=raw%s%s%s" % \
1231
                  (dev_path, if_val, boot_val, cache_val)
1232

    
1233
      if device_driver:
1234
        # block_devices are the 4th entry of runtime file that did not exist in
1235
        # the past. That means that cfdev should always have pci slot and
1236
        # _GenerateDeviceKVMId() will not raise a exception.
1237
        kvm_devid = _GenerateDeviceKVMId(constants.HOTPLUG_TARGET_DISK, cfdev)
1238
        drive_val += (",id=%s" % kvm_devid)
1239
        drive_val += (",bus=0,unit=%d" % cfdev.pci)
1240
        dev_val = ("%s,drive=%s,id=%s" %
1241
                   (device_driver, kvm_devid, kvm_devid))
1242
        dev_val += ",bus=pci.0,addr=%s" % hex(cfdev.pci)
1243
        dev_opts.extend(["-device", dev_val])
1244

    
1245
      dev_opts.extend(["-drive", drive_val])
1246

    
1247
    return dev_opts
1248

    
1249
  def _GenerateKVMRuntime(self, instance, block_devices, startup_paused,
1250
                          kvmhelp):
1251
    """Generate KVM information to start an instance.
1252

1253
    @type kvmhelp: string
1254
    @param kvmhelp: output of kvm --help
1255
    @attention: this function must not have any side-effects; for
1256
        example, it must not write to the filesystem, or read values
1257
        from the current system the are expected to differ between
1258
        nodes, since it is only run once at instance startup;
1259
        actions/kvm arguments that can vary between systems should be
1260
        done in L{_ExecuteKVMRuntime}
1261

1262
    """
1263
    # pylint: disable=R0912,R0914,R0915
1264
    hvp = instance.hvparams
1265
    self.ValidateParameters(hvp)
1266

    
1267
    pidfile = self._InstancePidFile(instance.name)
1268
    kvm = hvp[constants.HV_KVM_PATH]
1269
    kvm_cmd = [kvm]
1270
    # used just by the vnc server, if enabled
1271
    kvm_cmd.extend(["-name", instance.name])
1272
    kvm_cmd.extend(["-m", instance.beparams[constants.BE_MAXMEM]])
1273

    
1274
    smp_list = ["%s" % instance.beparams[constants.BE_VCPUS]]
1275
    if hvp[constants.HV_CPU_CORES]:
1276
      smp_list.append("cores=%s" % hvp[constants.HV_CPU_CORES])
1277
    if hvp[constants.HV_CPU_THREADS]:
1278
      smp_list.append("threads=%s" % hvp[constants.HV_CPU_THREADS])
1279
    if hvp[constants.HV_CPU_SOCKETS]:
1280
      smp_list.append("sockets=%s" % hvp[constants.HV_CPU_SOCKETS])
1281

    
1282
    kvm_cmd.extend(["-smp", ",".join(smp_list)])
1283

    
1284
    kvm_cmd.extend(["-pidfile", pidfile])
1285
    kvm_cmd.extend(["-balloon", "virtio"])
1286
    kvm_cmd.extend(["-daemonize"])
1287
    if not instance.hvparams[constants.HV_ACPI]:
1288
      kvm_cmd.extend(["-no-acpi"])
1289
    if instance.hvparams[constants.HV_REBOOT_BEHAVIOR] == \
1290
        constants.INSTANCE_REBOOT_EXIT:
1291
      kvm_cmd.extend(["-no-reboot"])
1292

    
1293
    mversion = hvp[constants.HV_KVM_MACHINE_VERSION]
1294
    if not mversion:
1295
      mversion = self._GetDefaultMachineVersion(kvm)
1296
    if self._MACHINE_RE.search(kvmhelp):
1297
      # TODO (2.8): kernel_irqchip and kvm_shadow_mem machine properties, as
1298
      # extra hypervisor parameters. We should also investigate whether and how
1299
      # shadow_mem should be considered for the resource model.
1300
      if (hvp[constants.HV_KVM_FLAG] == constants.HT_KVM_ENABLED):
1301
        specprop = ",accel=kvm"
1302
      else:
1303
        specprop = ""
1304
      machinespec = "%s%s" % (mversion, specprop)
1305
      kvm_cmd.extend(["-machine", machinespec])
1306
    else:
1307
      kvm_cmd.extend(["-M", mversion])
1308
      if (hvp[constants.HV_KVM_FLAG] == constants.HT_KVM_ENABLED and
1309
          self._ENABLE_KVM_RE.search(kvmhelp)):
1310
        kvm_cmd.extend(["-enable-kvm"])
1311
      elif (hvp[constants.HV_KVM_FLAG] == constants.HT_KVM_DISABLED and
1312
            self._DISABLE_KVM_RE.search(kvmhelp)):
1313
        kvm_cmd.extend(["-disable-kvm"])
1314

    
1315
    kernel_path = hvp[constants.HV_KERNEL_PATH]
1316
    if kernel_path:
1317
      boot_cdrom = boot_floppy = boot_network = False
1318
    else:
1319
      boot_cdrom = hvp[constants.HV_BOOT_ORDER] == constants.HT_BO_CDROM
1320
      boot_floppy = hvp[constants.HV_BOOT_ORDER] == constants.HT_BO_FLOPPY
1321
      boot_network = hvp[constants.HV_BOOT_ORDER] == constants.HT_BO_NETWORK
1322

    
1323
    if startup_paused:
1324
      kvm_cmd.extend([_KVM_START_PAUSED_FLAG])
1325

    
1326
    if boot_network:
1327
      kvm_cmd.extend(["-boot", "n"])
1328

    
1329
    # whether this is an older KVM version that uses the boot=on flag
1330
    # on devices
1331
    needs_boot_flag = self._BOOT_RE.search(kvmhelp)
1332

    
1333
    disk_type = hvp[constants.HV_DISK_TYPE]
1334

    
1335
    #Now we can specify a different device type for CDROM devices.
1336
    cdrom_disk_type = hvp[constants.HV_KVM_CDROM_DISK_TYPE]
1337
    if not cdrom_disk_type:
1338
      cdrom_disk_type = disk_type
1339

    
1340
    iso_image = hvp[constants.HV_CDROM_IMAGE_PATH]
1341
    if iso_image:
1342
      options = ",format=raw,media=cdrom"
1343
      # set cdrom 'if' type
1344
      if boot_cdrom:
1345
        actual_cdrom_type = constants.HT_DISK_IDE
1346
      elif cdrom_disk_type == constants.HT_DISK_PARAVIRTUAL:
1347
        actual_cdrom_type = "virtio"
1348
      else:
1349
        actual_cdrom_type = cdrom_disk_type
1350
      if_val = ",if=%s" % actual_cdrom_type
1351
      # set boot flag, if needed
1352
      boot_val = ""
1353
      if boot_cdrom:
1354
        kvm_cmd.extend(["-boot", "d"])
1355
        if needs_boot_flag:
1356
          boot_val = ",boot=on"
1357
      # and finally build the entire '-drive' value
1358
      drive_val = "file=%s%s%s%s" % (iso_image, options, if_val, boot_val)
1359
      kvm_cmd.extend(["-drive", drive_val])
1360

    
1361
    iso_image2 = hvp[constants.HV_KVM_CDROM2_IMAGE_PATH]
1362
    if iso_image2:
1363
      options = ",format=raw,media=cdrom"
1364
      if cdrom_disk_type == constants.HT_DISK_PARAVIRTUAL:
1365
        if_val = ",if=virtio"
1366
      else:
1367
        if_val = ",if=%s" % cdrom_disk_type
1368
      drive_val = "file=%s%s%s" % (iso_image2, options, if_val)
1369
      kvm_cmd.extend(["-drive", drive_val])
1370

    
1371
    floppy_image = hvp[constants.HV_KVM_FLOPPY_IMAGE_PATH]
1372
    if floppy_image:
1373
      options = ",format=raw,media=disk"
1374
      if boot_floppy:
1375
        kvm_cmd.extend(["-boot", "a"])
1376
        options = "%s,boot=on" % options
1377
      if_val = ",if=floppy"
1378
      options = "%s%s" % (options, if_val)
1379
      drive_val = "file=%s%s" % (floppy_image, options)
1380
      kvm_cmd.extend(["-drive", drive_val])
1381

    
1382
    if kernel_path:
1383
      kvm_cmd.extend(["-kernel", kernel_path])
1384
      initrd_path = hvp[constants.HV_INITRD_PATH]
1385
      if initrd_path:
1386
        kvm_cmd.extend(["-initrd", initrd_path])
1387
      root_append = ["root=%s" % hvp[constants.HV_ROOT_PATH],
1388
                     hvp[constants.HV_KERNEL_ARGS]]
1389
      if hvp[constants.HV_SERIAL_CONSOLE]:
1390
        serial_speed = hvp[constants.HV_SERIAL_SPEED]
1391
        root_append.append("console=ttyS0,%s" % serial_speed)
1392
      kvm_cmd.extend(["-append", " ".join(root_append)])
1393

    
1394
    mem_path = hvp[constants.HV_MEM_PATH]
1395
    if mem_path:
1396
      kvm_cmd.extend(["-mem-path", mem_path, "-mem-prealloc"])
1397

    
1398
    monitor_dev = ("unix:%s,server,nowait" %
1399
                   self._InstanceMonitor(instance.name))
1400
    kvm_cmd.extend(["-monitor", monitor_dev])
1401
    if hvp[constants.HV_SERIAL_CONSOLE]:
1402
      serial_dev = ("unix:%s,server,nowait" %
1403
                    self._InstanceSerial(instance.name))
1404
      kvm_cmd.extend(["-serial", serial_dev])
1405
    else:
1406
      kvm_cmd.extend(["-serial", "none"])
1407

    
1408
    mouse_type = hvp[constants.HV_USB_MOUSE]
1409
    vnc_bind_address = hvp[constants.HV_VNC_BIND_ADDRESS]
1410
    spice_bind = hvp[constants.HV_KVM_SPICE_BIND]
1411
    spice_ip_version = None
1412

    
1413
    kvm_cmd.extend(["-usb"])
1414

    
1415
    if mouse_type:
1416
      kvm_cmd.extend(["-usbdevice", mouse_type])
1417
    elif vnc_bind_address:
1418
      kvm_cmd.extend(["-usbdevice", constants.HT_MOUSE_TABLET])
1419

    
1420
    if vnc_bind_address:
1421
      if netutils.IP4Address.IsValid(vnc_bind_address):
1422
        if instance.network_port > constants.VNC_BASE_PORT:
1423
          display = instance.network_port - constants.VNC_BASE_PORT
1424
          if vnc_bind_address == constants.IP4_ADDRESS_ANY:
1425
            vnc_arg = ":%d" % (display)
1426
          else:
1427
            vnc_arg = "%s:%d" % (vnc_bind_address, display)
1428
        else:
1429
          logging.error("Network port is not a valid VNC display (%d < %d),"
1430
                        " not starting VNC",
1431
                        instance.network_port, constants.VNC_BASE_PORT)
1432
          vnc_arg = "none"
1433

    
1434
        # Only allow tls and other option when not binding to a file, for now.
1435
        # kvm/qemu gets confused otherwise about the filename to use.
1436
        vnc_append = ""
1437
        if hvp[constants.HV_VNC_TLS]:
1438
          vnc_append = "%s,tls" % vnc_append
1439
          if hvp[constants.HV_VNC_X509_VERIFY]:
1440
            vnc_append = "%s,x509verify=%s" % (vnc_append,
1441
                                               hvp[constants.HV_VNC_X509])
1442
          elif hvp[constants.HV_VNC_X509]:
1443
            vnc_append = "%s,x509=%s" % (vnc_append,
1444
                                         hvp[constants.HV_VNC_X509])
1445
        if hvp[constants.HV_VNC_PASSWORD_FILE]:
1446
          vnc_append = "%s,password" % vnc_append
1447

    
1448
        vnc_arg = "%s%s" % (vnc_arg, vnc_append)
1449

    
1450
      else:
1451
        vnc_arg = "unix:%s/%s.vnc" % (vnc_bind_address, instance.name)
1452

    
1453
      kvm_cmd.extend(["-vnc", vnc_arg])
1454
    elif spice_bind:
1455
      # FIXME: this is wrong here; the iface ip address differs
1456
      # between systems, so it should be done in _ExecuteKVMRuntime
1457
      if netutils.IsValidInterface(spice_bind):
1458
        # The user specified a network interface, we have to figure out the IP
1459
        # address.
1460
        addresses = netutils.GetInterfaceIpAddresses(spice_bind)
1461
        spice_ip_version = hvp[constants.HV_KVM_SPICE_IP_VERSION]
1462

    
1463
        # if the user specified an IP version and the interface does not
1464
        # have that kind of IP addresses, throw an exception
1465
        if spice_ip_version != constants.IFACE_NO_IP_VERSION_SPECIFIED:
1466
          if not addresses[spice_ip_version]:
1467
            raise errors.HypervisorError("SPICE: Unable to get an IPv%s address"
1468
                                         " for %s" % (spice_ip_version,
1469
                                                      spice_bind))
1470

    
1471
        # the user did not specify an IP version, we have to figure it out
1472
        elif (addresses[constants.IP4_VERSION] and
1473
              addresses[constants.IP6_VERSION]):
1474
          # we have both ipv4 and ipv6, let's use the cluster default IP
1475
          # version
1476
          cluster_family = ssconf.SimpleStore().GetPrimaryIPFamily()
1477
          spice_ip_version = \
1478
            netutils.IPAddress.GetVersionFromAddressFamily(cluster_family)
1479
        elif addresses[constants.IP4_VERSION]:
1480
          spice_ip_version = constants.IP4_VERSION
1481
        elif addresses[constants.IP6_VERSION]:
1482
          spice_ip_version = constants.IP6_VERSION
1483
        else:
1484
          raise errors.HypervisorError("SPICE: Unable to get an IP address"
1485
                                       " for %s" % (spice_bind))
1486

    
1487
        spice_address = addresses[spice_ip_version][0]
1488

    
1489
      else:
1490
        # spice_bind is known to be a valid IP address, because
1491
        # ValidateParameters checked it.
1492
        spice_address = spice_bind
1493

    
1494
      spice_arg = "addr=%s" % spice_address
1495
      if hvp[constants.HV_KVM_SPICE_USE_TLS]:
1496
        spice_arg = ("%s,tls-port=%s,x509-cacert-file=%s" %
1497
                     (spice_arg, instance.network_port,
1498
                      pathutils.SPICE_CACERT_FILE))
1499
        spice_arg = ("%s,x509-key-file=%s,x509-cert-file=%s" %
1500
                     (spice_arg, pathutils.SPICE_CERT_FILE,
1501
                      pathutils.SPICE_CERT_FILE))
1502
        tls_ciphers = hvp[constants.HV_KVM_SPICE_TLS_CIPHERS]
1503
        if tls_ciphers:
1504
          spice_arg = "%s,tls-ciphers=%s" % (spice_arg, tls_ciphers)
1505
      else:
1506
        spice_arg = "%s,port=%s" % (spice_arg, instance.network_port)
1507

    
1508
      if not hvp[constants.HV_KVM_SPICE_PASSWORD_FILE]:
1509
        spice_arg = "%s,disable-ticketing" % spice_arg
1510

    
1511
      if spice_ip_version:
1512
        spice_arg = "%s,ipv%s" % (spice_arg, spice_ip_version)
1513

    
1514
      # Image compression options
1515
      img_lossless = hvp[constants.HV_KVM_SPICE_LOSSLESS_IMG_COMPR]
1516
      img_jpeg = hvp[constants.HV_KVM_SPICE_JPEG_IMG_COMPR]
1517
      img_zlib_glz = hvp[constants.HV_KVM_SPICE_ZLIB_GLZ_IMG_COMPR]
1518
      if img_lossless:
1519
        spice_arg = "%s,image-compression=%s" % (spice_arg, img_lossless)
1520
      if img_jpeg:
1521
        spice_arg = "%s,jpeg-wan-compression=%s" % (spice_arg, img_jpeg)
1522
      if img_zlib_glz:
1523
        spice_arg = "%s,zlib-glz-wan-compression=%s" % (spice_arg, img_zlib_glz)
1524

    
1525
      # Video stream detection
1526
      video_streaming = hvp[constants.HV_KVM_SPICE_STREAMING_VIDEO_DETECTION]
1527
      if video_streaming:
1528
        spice_arg = "%s,streaming-video=%s" % (spice_arg, video_streaming)
1529

    
1530
      # Audio compression, by default in qemu-kvm it is on
1531
      if not hvp[constants.HV_KVM_SPICE_AUDIO_COMPR]:
1532
        spice_arg = "%s,playback-compression=off" % spice_arg
1533
      if not hvp[constants.HV_KVM_SPICE_USE_VDAGENT]:
1534
        spice_arg = "%s,agent-mouse=off" % spice_arg
1535
      else:
1536
        # Enable the spice agent communication channel between the host and the
1537
        # agent.
1538
        kvm_cmd.extend(["-device", "virtio-serial-pci"])
1539
        kvm_cmd.extend([
1540
          "-device",
1541
          "virtserialport,chardev=spicechannel0,name=com.redhat.spice.0",
1542
          ])
1543
        kvm_cmd.extend(["-chardev", "spicevmc,id=spicechannel0,name=vdagent"])
1544

    
1545
      logging.info("KVM: SPICE will listen on port %s", instance.network_port)
1546
      kvm_cmd.extend(["-spice", spice_arg])
1547

    
1548
    else:
1549
      # From qemu 1.4 -nographic is incompatible with -daemonize. The new way
1550
      # also works in earlier versions though (tested with 1.1 and 1.3)
1551
      if self._DISPLAY_RE.search(kvmhelp):
1552
        kvm_cmd.extend(["-display", "none"])
1553
      else:
1554
        kvm_cmd.extend(["-nographic"])
1555

    
1556
    if hvp[constants.HV_USE_LOCALTIME]:
1557
      kvm_cmd.extend(["-localtime"])
1558

    
1559
    if hvp[constants.HV_KVM_USE_CHROOT]:
1560
      kvm_cmd.extend(["-chroot", self._InstanceChrootDir(instance.name)])
1561

    
1562
    # Add qemu-KVM -cpu param
1563
    if hvp[constants.HV_CPU_TYPE]:
1564
      kvm_cmd.extend(["-cpu", hvp[constants.HV_CPU_TYPE]])
1565

    
1566
    # As requested by music lovers
1567
    if hvp[constants.HV_SOUNDHW]:
1568
      kvm_cmd.extend(["-soundhw", hvp[constants.HV_SOUNDHW]])
1569

    
1570
    # Pass a -vga option if requested, or if spice is used, for backwards
1571
    # compatibility.
1572
    if hvp[constants.HV_VGA]:
1573
      kvm_cmd.extend(["-vga", hvp[constants.HV_VGA]])
1574
    elif spice_bind:
1575
      kvm_cmd.extend(["-vga", "qxl"])
1576

    
1577
    # Various types of usb devices, comma separated
1578
    if hvp[constants.HV_USB_DEVICES]:
1579
      for dev in hvp[constants.HV_USB_DEVICES].split(","):
1580
        kvm_cmd.extend(["-usbdevice", dev])
1581

    
1582
    if hvp[constants.HV_KVM_EXTRA]:
1583
      kvm_cmd.extend(hvp[constants.HV_KVM_EXTRA].split(" "))
1584

    
1585
    pci_reservations = bitarray(self._DEFAULT_PCI_RESERVATIONS)
1586
    kvm_disks = []
1587
    for disk, dev_path in block_devices:
1588
      _UpdatePCISlots(disk, pci_reservations)
1589
      kvm_disks.append((disk, dev_path))
1590

    
1591
    kvm_nics = []
1592
    for nic in instance.nics:
1593
      _UpdatePCISlots(nic, pci_reservations)
1594
      kvm_nics.append(nic)
1595

    
1596
    hvparams = hvp
1597

    
1598
    return (kvm_cmd, kvm_nics, hvparams, kvm_disks)
1599

    
1600
  def _WriteKVMRuntime(self, instance_name, data):
1601
    """Write an instance's KVM runtime
1602

1603
    """
1604
    try:
1605
      utils.WriteFile(self._InstanceKVMRuntime(instance_name),
1606
                      data=data)
1607
    except EnvironmentError, err:
1608
      raise errors.HypervisorError("Failed to save KVM runtime file: %s" % err)
1609

    
1610
  def _ReadKVMRuntime(self, instance_name):
1611
    """Read an instance's KVM runtime
1612

1613
    """
1614
    try:
1615
      file_content = utils.ReadFile(self._InstanceKVMRuntime(instance_name))
1616
    except EnvironmentError, err:
1617
      raise errors.HypervisorError("Failed to load KVM runtime file: %s" % err)
1618
    return file_content
1619

    
1620
  def _SaveKVMRuntime(self, instance, kvm_runtime):
1621
    """Save an instance's KVM runtime
1622

1623
    """
1624
    kvm_cmd, kvm_nics, hvparams, block_devices = kvm_runtime
1625

    
1626
    serialized_nics = [nic.ToDict() for nic in kvm_nics]
1627
    serialized_blockdevs = [(blk.ToDict(), link) for blk, link in block_devices]
1628
    serialized_form = serializer.Dump((kvm_cmd, serialized_nics, hvparams,
1629
                                      serialized_blockdevs))
1630

    
1631
    self._WriteKVMRuntime(instance.name, serialized_form)
1632

    
1633
  def _LoadKVMRuntime(self, instance, serialized_runtime=None):
1634
    """Load an instance's KVM runtime
1635

1636
    """
1637
    if not serialized_runtime:
1638
      serialized_runtime = self._ReadKVMRuntime(instance.name)
1639

    
1640
    loaded_runtime = serializer.Load(serialized_runtime)
1641
    if len(loaded_runtime) == 3:
1642
      serialized_blockdevs = []
1643
      kvm_cmd, serialized_nics, hvparams = loaded_runtime
1644
    else:
1645
      kvm_cmd, serialized_nics, hvparams, serialized_blockdevs = loaded_runtime
1646

    
1647
    kvm_nics = [objects.NIC.FromDict(snic) for snic in serialized_nics]
1648
    block_devices = [(objects.Disk.FromDict(sdisk), link)
1649
                     for sdisk, link in serialized_blockdevs]
1650

    
1651
    return (kvm_cmd, kvm_nics, hvparams, block_devices)
1652

    
1653
  def _RunKVMCmd(self, name, kvm_cmd, tap_fds=None):
1654
    """Run the KVM cmd and check for errors
1655

1656
    @type name: string
1657
    @param name: instance name
1658
    @type kvm_cmd: list of strings
1659
    @param kvm_cmd: runcmd input for kvm
1660
    @type tap_fds: list of int
1661
    @param tap_fds: fds of tap devices opened by Ganeti
1662

1663
    """
1664
    try:
1665
      result = utils.RunCmd(kvm_cmd, noclose_fds=tap_fds)
1666
    finally:
1667
      for fd in tap_fds:
1668
        utils_wrapper.CloseFdNoError(fd)
1669

    
1670
    if result.failed:
1671
      raise errors.HypervisorError("Failed to start instance %s: %s (%s)" %
1672
                                   (name, result.fail_reason, result.output))
1673
    if not self._InstancePidAlive(name)[2]:
1674
      raise errors.HypervisorError("Failed to start instance %s" % name)
1675

    
1676
  # 52/50 local variables
1677
  # pylint: disable=R0914
1678
  def _ExecuteKVMRuntime(self, instance, kvm_runtime, kvmhelp, incoming=None):
1679
    """Execute a KVM cmd, after completing it with some last minute data.
1680

1681
    @type incoming: tuple of strings
1682
    @param incoming: (target_host_ip, port)
1683
    @type kvmhelp: string
1684
    @param kvmhelp: output of kvm --help
1685

1686
    """
1687
    # Small _ExecuteKVMRuntime hv parameters programming howto:
1688
    #  - conf_hvp contains the parameters as configured on ganeti. they might
1689
    #    have changed since the instance started; only use them if the change
1690
    #    won't affect the inside of the instance (which hasn't been rebooted).
1691
    #  - up_hvp contains the parameters as they were when the instance was
1692
    #    started, plus any new parameter which has been added between ganeti
1693
    #    versions: it is paramount that those default to a value which won't
1694
    #    affect the inside of the instance as well.
1695
    conf_hvp = instance.hvparams
1696
    name = instance.name
1697
    self._CheckDown(name)
1698

    
1699
    temp_files = []
1700

    
1701
    kvm_cmd, kvm_nics, up_hvp, block_devices = kvm_runtime
1702
    # the first element of kvm_cmd is always the path to the kvm binary
1703
    kvm_path = kvm_cmd[0]
1704
    up_hvp = objects.FillDict(conf_hvp, up_hvp)
1705

    
1706
    # We know it's safe to run as a different user upon migration, so we'll use
1707
    # the latest conf, from conf_hvp.
1708
    security_model = conf_hvp[constants.HV_SECURITY_MODEL]
1709
    if security_model == constants.HT_SM_USER:
1710
      kvm_cmd.extend(["-runas", conf_hvp[constants.HV_SECURITY_DOMAIN]])
1711

    
1712
    keymap = conf_hvp[constants.HV_KEYMAP]
1713
    if keymap:
1714
      keymap_path = self._InstanceKeymapFile(name)
1715
      # If a keymap file is specified, KVM won't use its internal defaults. By
1716
      # first including the "en-us" layout, an error on loading the actual
1717
      # layout (e.g. because it can't be found) won't lead to a non-functional
1718
      # keyboard. A keyboard with incorrect keys is still better than none.
1719
      utils.WriteFile(keymap_path, data="include en-us\ninclude %s\n" % keymap)
1720
      kvm_cmd.extend(["-k", keymap_path])
1721

    
1722
    # We have reasons to believe changing something like the nic driver/type
1723
    # upon migration won't exactly fly with the instance kernel, so for nic
1724
    # related parameters we'll use up_hvp
1725
    tapfds = []
1726
    taps = []
1727
    devlist = self._GetKVMOutput(kvm_path, self._KVMOPT_DEVICELIST)
1728
    if not kvm_nics:
1729
      kvm_cmd.extend(["-net", "none"])
1730
    else:
1731
      vnet_hdr = False
1732
      tap_extra = ""
1733
      nic_type = up_hvp[constants.HV_NIC_TYPE]
1734
      if nic_type == constants.HT_NIC_PARAVIRTUAL:
1735
        nic_model = self._VIRTIO
1736
        try:
1737
          if self._VIRTIO_NET_RE.search(devlist):
1738
            nic_model = self._VIRTIO_NET_PCI
1739
            vnet_hdr = up_hvp[constants.HV_VNET_HDR]
1740
        except errors.HypervisorError, _:
1741
          # Older versions of kvm don't support DEVICE_LIST, but they don't
1742
          # have new virtio syntax either.
1743
          pass
1744

    
1745
        if up_hvp[constants.HV_VHOST_NET]:
1746
          # check for vhost_net support
1747
          if self._VHOST_RE.search(kvmhelp):
1748
            tap_extra = ",vhost=on"
1749
          else:
1750
            raise errors.HypervisorError("vhost_net is configured"
1751
                                         " but it is not available")
1752
      else:
1753
        nic_model = nic_type
1754

    
1755
      kvm_supports_netdev = self._NETDEV_RE.search(kvmhelp)
1756

    
1757
      for nic_seq, nic in enumerate(kvm_nics):
1758
        tapname, tapfd = _OpenTap(vnet_hdr=vnet_hdr)
1759
        tapfds.append(tapfd)
1760
        taps.append(tapname)
1761
        if kvm_supports_netdev:
1762
          nic_val = "%s,mac=%s" % (nic_model, nic.mac)
1763
          try:
1764
            # kvm_nics already exist in old runtime files and thus there might
1765
            # be some entries without pci slot (therefore try: except:)
1766
            kvm_devid = _GenerateDeviceKVMId(constants.HOTPLUG_TARGET_NIC, nic)
1767
            netdev = kvm_devid
1768
            nic_val += (",id=%s,bus=pci.0,addr=%s" % (kvm_devid, hex(nic.pci)))
1769
          except errors.HotplugError:
1770
            netdev = "netdev%d" % nic_seq
1771
          nic_val += (",netdev=%s" % netdev)
1772
          tap_val = ("type=tap,id=%s,fd=%d%s" %
1773
                     (netdev, tapfd, tap_extra))
1774
          kvm_cmd.extend(["-netdev", tap_val, "-device", nic_val])
1775
        else:
1776
          nic_val = "nic,vlan=%s,macaddr=%s,model=%s" % (nic_seq,
1777
                                                         nic.mac, nic_model)
1778
          tap_val = "tap,vlan=%s,fd=%d" % (nic_seq, tapfd)
1779
          kvm_cmd.extend(["-net", tap_val, "-net", nic_val])
1780

    
1781
    if incoming:
1782
      target, port = incoming
1783
      kvm_cmd.extend(["-incoming", "tcp:%s:%s" % (target, port)])
1784

    
1785
    # Changing the vnc password doesn't bother the guest that much. At most it
1786
    # will surprise people who connect to it. Whether positively or negatively
1787
    # it's debatable.
1788
    vnc_pwd_file = conf_hvp[constants.HV_VNC_PASSWORD_FILE]
1789
    vnc_pwd = None
1790
    if vnc_pwd_file:
1791
      try:
1792
        vnc_pwd = utils.ReadOneLineFile(vnc_pwd_file, strict=True)
1793
      except EnvironmentError, err:
1794
        raise errors.HypervisorError("Failed to open VNC password file %s: %s"
1795
                                     % (vnc_pwd_file, err))
1796

    
1797
    if conf_hvp[constants.HV_KVM_USE_CHROOT]:
1798
      utils.EnsureDirs([(self._InstanceChrootDir(name),
1799
                         constants.SECURE_DIR_MODE)])
1800

    
1801
    # Automatically enable QMP if version is >= 0.14
1802
    if self._QMP_RE.search(kvmhelp):
1803
      logging.debug("Enabling QMP")
1804
      kvm_cmd.extend(["-qmp", "unix:%s,server,nowait" %
1805
                      self._InstanceQmpMonitor(instance.name)])
1806

    
1807
    # Configure the network now for starting instances and bridged interfaces,
1808
    # during FinalizeMigration for incoming instances' routed interfaces
1809
    for nic_seq, nic in enumerate(kvm_nics):
1810
      if (incoming and
1811
          nic.nicparams[constants.NIC_MODE] != constants.NIC_MODE_BRIDGED):
1812
        continue
1813
      self._ConfigureNIC(instance, nic_seq, nic, taps[nic_seq])
1814

    
1815
    bdev_opts = self._GenerateKVMBlockDevicesOptions(instance,
1816
                                                     block_devices,
1817
                                                     kvmhelp,
1818
                                                     devlist)
1819
    kvm_cmd.extend(bdev_opts)
1820
    # CPU affinity requires kvm to start paused, so we set this flag if the
1821
    # instance is not already paused and if we are not going to accept a
1822
    # migrating instance. In the latter case, pausing is not needed.
1823
    start_kvm_paused = not (_KVM_START_PAUSED_FLAG in kvm_cmd) and not incoming
1824
    if start_kvm_paused:
1825
      kvm_cmd.extend([_KVM_START_PAUSED_FLAG])
1826

    
1827
    # Note: CPU pinning is using up_hvp since changes take effect
1828
    # during instance startup anyway, and to avoid problems when soft
1829
    # rebooting the instance.
1830
    cpu_pinning = False
1831
    if up_hvp.get(constants.HV_CPU_MASK, None):
1832
      cpu_pinning = True
1833

    
1834
    if security_model == constants.HT_SM_POOL:
1835
      ss = ssconf.SimpleStore()
1836
      uid_pool = uidpool.ParseUidPool(ss.GetUidPool(), separator="\n")
1837
      all_uids = set(uidpool.ExpandUidPool(uid_pool))
1838
      uid = uidpool.RequestUnusedUid(all_uids)
1839
      try:
1840
        username = pwd.getpwuid(uid.GetUid()).pw_name
1841
        kvm_cmd.extend(["-runas", username])
1842
        self._RunKVMCmd(name, kvm_cmd, tapfds)
1843
      except:
1844
        uidpool.ReleaseUid(uid)
1845
        raise
1846
      else:
1847
        uid.Unlock()
1848
        utils.WriteFile(self._InstanceUidFile(name), data=uid.AsStr())
1849
    else:
1850
      self._RunKVMCmd(name, kvm_cmd, tapfds)
1851

    
1852
    utils.EnsureDirs([(self._InstanceNICDir(instance.name),
1853
                     constants.RUN_DIRS_MODE)])
1854
    for nic_seq, tap in enumerate(taps):
1855
      utils.WriteFile(self._InstanceNICFile(instance.name, nic_seq),
1856
                      data=tap)
1857

    
1858
    if vnc_pwd:
1859
      change_cmd = "change vnc password %s" % vnc_pwd
1860
      self._CallMonitorCommand(instance.name, change_cmd)
1861

    
1862
    # Setting SPICE password. We are not vulnerable to malicious passwordless
1863
    # connection attempts because SPICE by default does not allow connections
1864
    # if neither a password nor the "disable_ticketing" options are specified.
1865
    # As soon as we send the password via QMP, that password is a valid ticket
1866
    # for connection.
1867
    spice_password_file = conf_hvp[constants.HV_KVM_SPICE_PASSWORD_FILE]
1868
    if spice_password_file:
1869
      spice_pwd = ""
1870
      try:
1871
        spice_pwd = utils.ReadOneLineFile(spice_password_file, strict=True)
1872
      except EnvironmentError, err:
1873
        raise errors.HypervisorError("Failed to open SPICE password file %s: %s"
1874
                                     % (spice_password_file, err))
1875

    
1876
      qmp = QmpConnection(self._InstanceQmpMonitor(instance.name))
1877
      qmp.connect()
1878
      arguments = {
1879
          "protocol": "spice",
1880
          "password": spice_pwd,
1881
      }
1882
      qmp.Execute("set_password", arguments)
1883

    
1884
    for filename in temp_files:
1885
      utils.RemoveFile(filename)
1886

    
1887
    # If requested, set CPU affinity and resume instance execution
1888
    if cpu_pinning:
1889
      self._ExecuteCpuAffinity(instance.name, up_hvp[constants.HV_CPU_MASK])
1890

    
1891
    start_memory = self._InstanceStartupMemory(instance)
1892
    if start_memory < instance.beparams[constants.BE_MAXMEM]:
1893
      self.BalloonInstanceMemory(instance, start_memory)
1894

    
1895
    if start_kvm_paused:
1896
      # To control CPU pinning, ballooning, and vnc/spice passwords
1897
      # the VM was started in a frozen state. If freezing was not
1898
      # explicitly requested resume the vm status.
1899
      self._CallMonitorCommand(instance.name, self._CONT_CMD)
1900

    
1901
  def StartInstance(self, instance, block_devices, startup_paused):
1902
    """Start an instance.
1903

1904
    """
1905
    self._CheckDown(instance.name)
1906
    kvmpath = instance.hvparams[constants.HV_KVM_PATH]
1907
    kvmhelp = self._GetKVMOutput(kvmpath, self._KVMOPT_HELP)
1908
    kvm_runtime = self._GenerateKVMRuntime(instance, block_devices,
1909
                                           startup_paused, kvmhelp)
1910
    self._SaveKVMRuntime(instance, kvm_runtime)
1911
    self._ExecuteKVMRuntime(instance, kvm_runtime, kvmhelp)
1912

    
1913
  def _CallMonitorCommand(self, instance_name, command):
1914
    """Invoke a command on the instance monitor.
1915

1916
    """
1917
    # TODO: Replace monitor calls with QMP once KVM >= 0.14 is the minimum
1918
    # version. The monitor protocol is designed for human consumption, whereas
1919
    # QMP is made for programmatic usage. In the worst case QMP can also
1920
    # execute monitor commands. As it is, all calls to socat take at least
1921
    # 500ms and likely more: socat can't detect the end of the reply and waits
1922
    # for 500ms of no data received before exiting (500 ms is the default for
1923
    # the "-t" parameter).
1924
    socat = ("echo %s | %s STDIO UNIX-CONNECT:%s" %
1925
             (utils.ShellQuote(command),
1926
              constants.SOCAT_PATH,
1927
              utils.ShellQuote(self._InstanceMonitor(instance_name))))
1928
    result = utils.RunCmd(socat)
1929
    if result.failed:
1930
      msg = ("Failed to send command '%s' to instance '%s', reason '%s',"
1931
             " output: %s" %
1932
             (command, instance_name, result.fail_reason, result.output))
1933
      raise errors.HypervisorError(msg)
1934

    
1935
    return result
1936

    
1937
  def _GetFreePCISlot(self, instance, dev):
1938
    """Get the first available pci slot of a runnung instance.
1939

1940
    """
1941
    slots = bitarray(32)
1942
    slots.setall(False) # pylint: disable=E1101
1943
    output = self._CallMonitorCommand(instance.name, self._INFO_PCI_CMD)
1944
    for line in output.stdout.splitlines():
1945
      match = self._INFO_PCI_RE.search(line)
1946
      if match:
1947
        slot = int(match.group(1))
1948
        slots[slot] = True
1949

    
1950
    [free] = slots.search(_AVAILABLE_PCI_SLOT, 1) # pylint: disable=E1101
1951
    if not free:
1952
      raise errors.HypervisorError("All PCI slots occupied")
1953

    
1954
    dev.pci = int(free)
1955

    
1956
  def VerifyHotplugSupport(self, instance, action, dev_type):
1957
    """Check if hotplug is supported.
1958

1959
    Hotplug is *not* supported in case of:
1960
     - security models and chroot (disk hotplug)
1961
     - fdsend module is missing (nic hot-add)
1962

1963
    @raise errors.HypervisorError: in previous cases
1964

1965
    """
1966
    if dev_type == constants.HOTPLUG_TARGET_DISK:
1967
      hvp = instance.hvparams
1968
      security_model = hvp[constants.HV_SECURITY_MODEL]
1969
      use_chroot = hvp[constants.HV_KVM_USE_CHROOT]
1970
      if use_chroot:
1971
        raise errors.HotplugError("Disk hotplug is not supported"
1972
                                  " in case of chroot.")
1973
      if security_model != constants.HT_SM_NONE:
1974
        raise errors.HotplugError("Disk Hotplug is not supported in case"
1975
                                  " security models are used.")
1976

    
1977
    if (dev_type == constants.HOTPLUG_TARGET_NIC and
1978
        action == constants.HOTPLUG_ACTION_ADD and not fdsend):
1979
      raise errors.HotplugError("Cannot hot-add NIC."
1980
                                " fdsend python module is missing.")
1981
    return True
1982

    
1983
  def HotplugSupported(self, instance):
1984
    """Checks if hotplug is generally supported.
1985

1986
    Hotplug is *not* supported in case of:
1987
     - qemu versions < 1.0
1988
     - for stopped instances
1989

1990
    @raise errors.HypervisorError: in one of the previous cases
1991

1992
    """
1993
    output = self._CallMonitorCommand(instance.name, self._INFO_VERSION_CMD)
1994
    # TODO: search for netdev_add, drive_add, device_add.....
1995
    match = self._INFO_VERSION_RE.search(output.stdout)
1996
    if not match:
1997
      raise errors.HotplugError("Try hotplug only in running instances.")
1998
    v_major, v_min, _, _ = match.groups()
1999
    if (int(v_major), int(v_min)) < (1, 0):
2000
      raise errors.HotplugError("Hotplug not supported for qemu versions < 1.0")
2001

    
2002
  def _CallHotplugCommand(self, name, cmd):
2003
    output = self._CallMonitorCommand(name, cmd)
2004
    # TODO: parse output and check if succeeded
2005
    for line in output.stdout.splitlines():
2006
      logging.info("%s", line)
2007

    
2008
  def HotAddDevice(self, instance, dev_type, device, extra, seq):
2009
    """ Helper method to hot-add a new device
2010

2011
    It gets free pci slot generates the device name and invokes the
2012
    device specific method.
2013

2014
    """
2015
    # in case of hot-mod this is given
2016
    if device.pci is None:
2017
      self._GetFreePCISlot(instance, device)
2018
    kvm_devid = _GenerateDeviceKVMId(dev_type, device)
2019
    runtime = self._LoadKVMRuntime(instance)
2020
    if dev_type == constants.HOTPLUG_TARGET_DISK:
2021
      command = "drive_add dummy file=%s,if=none,id=%s,format=raw\n" % \
2022
                 (extra, kvm_devid)
2023
      command += ("device_add virtio-blk-pci,bus=pci.0,addr=%s,drive=%s,id=%s" %
2024
                  (hex(device.pci), kvm_devid, kvm_devid))
2025
    elif dev_type == constants.HOTPLUG_TARGET_NIC:
2026
      (tap, fd) = _OpenTap()
2027
      self._ConfigureNIC(instance, seq, device, tap)
2028
      self._PassTapFd(instance, fd, device)
2029
      command = "netdev_add tap,id=%s,fd=%s\n" % (kvm_devid, kvm_devid)
2030
      args = "virtio-net-pci,bus=pci.0,addr=%s,mac=%s,netdev=%s,id=%s" % \
2031
               (hex(device.pci), device.mac, kvm_devid, kvm_devid)
2032
      command += "device_add %s" % args
2033
      utils.WriteFile(self._InstanceNICFile(instance.name, seq), data=tap)
2034

    
2035
    self._CallHotplugCommand(instance.name, command)
2036
    # update relevant entries in runtime file
2037
    index = _DEVICE_RUNTIME_INDEX[dev_type]
2038
    entry = _RUNTIME_ENTRY[dev_type](device, extra)
2039
    runtime[index].append(entry)
2040
    self._SaveKVMRuntime(instance, runtime)
2041

    
2042
  def HotDelDevice(self, instance, dev_type, device, _, seq):
2043
    """ Helper method for hot-del device
2044

2045
    It gets device info from runtime file, generates the device name and
2046
    invokes the device specific method.
2047

2048
    """
2049
    runtime = self._LoadKVMRuntime(instance)
2050
    entry = _GetExistingDeviceInfo(dev_type, device, runtime)
2051
    kvm_device = _RUNTIME_DEVICE[dev_type](entry)
2052
    kvm_devid = _GenerateDeviceKVMId(dev_type, kvm_device)
2053
    if dev_type == constants.HOTPLUG_TARGET_DISK:
2054
      command = "device_del %s\n" % kvm_devid
2055
      command += "drive_del %s" % kvm_devid
2056
    elif dev_type == constants.HOTPLUG_TARGET_NIC:
2057
      command = "device_del %s\n" % kvm_devid
2058
      command += "netdev_del %s" % kvm_devid
2059
      utils.RemoveFile(self._InstanceNICFile(instance.name, seq))
2060
    self._CallHotplugCommand(instance.name, command)
2061
    index = _DEVICE_RUNTIME_INDEX[dev_type]
2062
    runtime[index].remove(entry)
2063
    self._SaveKVMRuntime(instance, runtime)
2064

    
2065
    return kvm_device.pci
2066

    
2067
  def HotModDevice(self, instance, dev_type, device, _, seq):
2068
    """ Helper method for hot-mod device
2069

2070
    It gets device info from runtime file, generates the device name and
2071
    invokes the device specific method. Currently only NICs support hot-mod
2072

2073
    """
2074
    if dev_type == constants.HOTPLUG_TARGET_NIC:
2075
      # putting it back in the same pci slot
2076
      device.pci = self.HotDelDevice(instance, dev_type, device, _, seq)
2077
      # TODO: remove sleep when socat gets removed
2078
      time.sleep(2)
2079
      self.HotAddDevice(instance, dev_type, device, _, seq)
2080

    
2081
  def _PassTapFd(self, instance, fd, nic):
2082
    """Pass file descriptor to kvm process via monitor socket using SCM_RIGHTS
2083

2084
    """
2085
    # TODO: factor out code related to unix sockets.
2086
    #       squash common parts between monitor and qmp
2087
    kvm_devid = _GenerateDeviceKVMId(constants.HOTPLUG_TARGET_NIC, nic)
2088
    command = "getfd %s\n" % kvm_devid
2089
    fds = [fd]
2090
    logging.info("%s", fds)
2091
    try:
2092
      monsock = MonitorSocket(self._InstanceMonitor(instance.name))
2093
      monsock.connect()
2094
      fdsend.sendfds(monsock.sock, command, fds=fds)
2095
    finally:
2096
      monsock.close()
2097

    
2098
  @classmethod
2099
  def _ParseKVMVersion(cls, text):
2100
    """Parse the KVM version from the --help output.
2101

2102
    @type text: string
2103
    @param text: output of kvm --help
2104
    @return: (version, v_maj, v_min, v_rev)
2105
    @raise errors.HypervisorError: when the KVM version cannot be retrieved
2106

2107
    """
2108
    match = cls._VERSION_RE.search(text.splitlines()[0])
2109
    if not match:
2110
      raise errors.HypervisorError("Unable to get KVM version")
2111

    
2112
    v_all = match.group(0)
2113
    v_maj = int(match.group(1))
2114
    v_min = int(match.group(2))
2115
    if match.group(4):
2116
      v_rev = int(match.group(4))
2117
    else:
2118
      v_rev = 0
2119
    return (v_all, v_maj, v_min, v_rev)
2120

    
2121
  @classmethod
2122
  def _GetKVMOutput(cls, kvm_path, option):
2123
    """Return the output of a kvm invocation
2124

2125
    @type kvm_path: string
2126
    @param kvm_path: path to the kvm executable
2127
    @type option: a key of _KVMOPTS_CMDS
2128
    @param option: kvm option to fetch the output from
2129
    @return: output a supported kvm invocation
2130
    @raise errors.HypervisorError: when the KVM help output cannot be retrieved
2131

2132
    """
2133
    assert option in cls._KVMOPTS_CMDS, "Invalid output option"
2134

    
2135
    optlist, can_fail = cls._KVMOPTS_CMDS[option]
2136

    
2137
    result = utils.RunCmd([kvm_path] + optlist)
2138
    if result.failed and not can_fail:
2139
      raise errors.HypervisorError("Unable to get KVM %s output" %
2140
                                    " ".join(cls._KVMOPTS_CMDS[option]))
2141
    return result.output
2142

    
2143
  @classmethod
2144
  def _GetKVMVersion(cls, kvm_path):
2145
    """Return the installed KVM version.
2146

2147
    @return: (version, v_maj, v_min, v_rev)
2148
    @raise errors.HypervisorError: when the KVM version cannot be retrieved
2149

2150
    """
2151
    return cls._ParseKVMVersion(cls._GetKVMOutput(kvm_path, cls._KVMOPT_HELP))
2152

    
2153
  @classmethod
2154
  def _GetDefaultMachineVersion(cls, kvm_path):
2155
    """Return the default hardware revision (e.g. pc-1.1)
2156

2157
    """
2158
    output = cls._GetKVMOutput(kvm_path, cls._KVMOPT_MLIST)
2159
    match = cls._DEFAULT_MACHINE_VERSION_RE.search(output)
2160
    if match:
2161
      return match.group(1)
2162
    else:
2163
      return "pc"
2164

    
2165
  def StopInstance(self, instance, force=False, retry=False, name=None):
2166
    """Stop an instance.
2167

2168
    """
2169
    if name is not None and not force:
2170
      raise errors.HypervisorError("Cannot shutdown cleanly by name only")
2171
    if name is None:
2172
      name = instance.name
2173
      acpi = instance.hvparams[constants.HV_ACPI]
2174
    else:
2175
      acpi = False
2176
    _, pid, alive = self._InstancePidAlive(name)
2177
    if pid > 0 and alive:
2178
      if force or not acpi:
2179
        utils.KillProcess(pid)
2180
      else:
2181
        self._CallMonitorCommand(name, "system_powerdown")
2182

    
2183
  def CleanupInstance(self, instance_name):
2184
    """Cleanup after a stopped instance
2185

2186
    """
2187
    pidfile, pid, alive = self._InstancePidAlive(instance_name)
2188
    if pid > 0 and alive:
2189
      raise errors.HypervisorError("Cannot cleanup a live instance")
2190
    self._RemoveInstanceRuntimeFiles(pidfile, instance_name)
2191

    
2192
  def RebootInstance(self, instance):
2193
    """Reboot an instance.
2194

2195
    """
2196
    # For some reason if we do a 'send-key ctrl-alt-delete' to the control
2197
    # socket the instance will stop, but now power up again. So we'll resort
2198
    # to shutdown and restart.
2199
    _, _, alive = self._InstancePidAlive(instance.name)
2200
    if not alive:
2201
      raise errors.HypervisorError("Failed to reboot instance %s:"
2202
                                   " not running" % instance.name)
2203
    # StopInstance will delete the saved KVM runtime so:
2204
    # ...first load it...
2205
    kvm_runtime = self._LoadKVMRuntime(instance)
2206
    # ...now we can safely call StopInstance...
2207
    if not self.StopInstance(instance):
2208
      self.StopInstance(instance, force=True)
2209
    # ...and finally we can save it again, and execute it...
2210
    self._SaveKVMRuntime(instance, kvm_runtime)
2211
    kvmpath = instance.hvparams[constants.HV_KVM_PATH]
2212
    kvmhelp = self._GetKVMOutput(kvmpath, self._KVMOPT_HELP)
2213
    self._ExecuteKVMRuntime(instance, kvm_runtime, kvmhelp)
2214

    
2215
  def MigrationInfo(self, instance):
2216
    """Get instance information to perform a migration.
2217

2218
    @type instance: L{objects.Instance}
2219
    @param instance: instance to be migrated
2220
    @rtype: string
2221
    @return: content of the KVM runtime file
2222

2223
    """
2224
    return self._ReadKVMRuntime(instance.name)
2225

    
2226
  def AcceptInstance(self, instance, info, target):
2227
    """Prepare to accept an instance.
2228

2229
    @type instance: L{objects.Instance}
2230
    @param instance: instance to be accepted
2231
    @type info: string
2232
    @param info: content of the KVM runtime file on the source node
2233
    @type target: string
2234
    @param target: target host (usually ip), on this node
2235

2236
    """
2237
    kvm_runtime = self._LoadKVMRuntime(instance, serialized_runtime=info)
2238
    incoming_address = (target, instance.hvparams[constants.HV_MIGRATION_PORT])
2239
    kvmpath = instance.hvparams[constants.HV_KVM_PATH]
2240
    kvmhelp = self._GetKVMOutput(kvmpath, self._KVMOPT_HELP)
2241
    self._ExecuteKVMRuntime(instance, kvm_runtime, kvmhelp,
2242
                            incoming=incoming_address)
2243

    
2244
  def FinalizeMigrationDst(self, instance, info, success):
2245
    """Finalize the instance migration on the target node.
2246

2247
    Stop the incoming mode KVM.
2248

2249
    @type instance: L{objects.Instance}
2250
    @param instance: instance whose migration is being finalized
2251

2252
    """
2253
    if success:
2254
      kvm_runtime = self._LoadKVMRuntime(instance, serialized_runtime=info)
2255
      kvm_nics = kvm_runtime[1]
2256

    
2257
      for nic_seq, nic in enumerate(kvm_nics):
2258
        if nic.nicparams[constants.NIC_MODE] == constants.NIC_MODE_BRIDGED:
2259
          # Bridged interfaces have already been configured
2260
          continue
2261
        try:
2262
          tap = utils.ReadFile(self._InstanceNICFile(instance.name, nic_seq))
2263
        except EnvironmentError, err:
2264
          logging.warning("Failed to find host interface for %s NIC #%d: %s",
2265
                          instance.name, nic_seq, str(err))
2266
          continue
2267
        try:
2268
          self._ConfigureNIC(instance, nic_seq, nic, tap)
2269
        except errors.HypervisorError, err:
2270
          logging.warning(str(err))
2271

    
2272
      self._WriteKVMRuntime(instance.name, info)
2273
    else:
2274
      self.StopInstance(instance, force=True)
2275

    
2276
  def MigrateInstance(self, instance, target, live):
2277
    """Migrate an instance to a target node.
2278

2279
    The migration will not be attempted if the instance is not
2280
    currently running.
2281

2282
    @type instance: L{objects.Instance}
2283
    @param instance: the instance to be migrated
2284
    @type target: string
2285
    @param target: ip address of the target node
2286
    @type live: boolean
2287
    @param live: perform a live migration
2288

2289
    """
2290
    instance_name = instance.name
2291
    port = instance.hvparams[constants.HV_MIGRATION_PORT]
2292
    _, _, alive = self._InstancePidAlive(instance_name)
2293
    if not alive:
2294
      raise errors.HypervisorError("Instance not running, cannot migrate")
2295

    
2296
    if not live:
2297
      self._CallMonitorCommand(instance_name, "stop")
2298

    
2299
    migrate_command = ("migrate_set_speed %dm" %
2300
                       instance.hvparams[constants.HV_MIGRATION_BANDWIDTH])
2301
    self._CallMonitorCommand(instance_name, migrate_command)
2302

    
2303
    migrate_command = ("migrate_set_downtime %dms" %
2304
                       instance.hvparams[constants.HV_MIGRATION_DOWNTIME])
2305
    self._CallMonitorCommand(instance_name, migrate_command)
2306

    
2307
    migrate_command = "migrate -d tcp:%s:%s" % (target, port)
2308
    self._CallMonitorCommand(instance_name, migrate_command)
2309

    
2310
  def FinalizeMigrationSource(self, instance, success, live):
2311
    """Finalize the instance migration on the source node.
2312

2313
    @type instance: L{objects.Instance}
2314
    @param instance: the instance that was migrated
2315
    @type success: bool
2316
    @param success: whether the migration succeeded or not
2317
    @type live: bool
2318
    @param live: whether the user requested a live migration or not
2319

2320
    """
2321
    if success:
2322
      pidfile, pid, _ = self._InstancePidAlive(instance.name)
2323
      utils.KillProcess(pid)
2324
      self._RemoveInstanceRuntimeFiles(pidfile, instance.name)
2325
    elif live:
2326
      self._CallMonitorCommand(instance.name, self._CONT_CMD)
2327

    
2328
  def GetMigrationStatus(self, instance):
2329
    """Get the migration status
2330

2331
    @type instance: L{objects.Instance}
2332
    @param instance: the instance that is being migrated
2333
    @rtype: L{objects.MigrationStatus}
2334
    @return: the status of the current migration (one of
2335
             L{constants.HV_MIGRATION_VALID_STATUSES}), plus any additional
2336
             progress info that can be retrieved from the hypervisor
2337

2338
    """
2339
    info_command = "info migrate"
2340
    for _ in range(self._MIGRATION_INFO_MAX_BAD_ANSWERS):
2341
      result = self._CallMonitorCommand(instance.name, info_command)
2342
      match = self._MIGRATION_STATUS_RE.search(result.stdout)
2343
      if not match:
2344
        if not result.stdout:
2345
          logging.info("KVM: empty 'info migrate' result")
2346
        else:
2347
          logging.warning("KVM: unknown 'info migrate' result: %s",
2348
                          result.stdout)
2349
      else:
2350
        status = match.group(1)
2351
        if status in constants.HV_KVM_MIGRATION_VALID_STATUSES:
2352
          migration_status = objects.MigrationStatus(status=status)
2353
          match = self._MIGRATION_PROGRESS_RE.search(result.stdout)
2354
          if match:
2355
            migration_status.transferred_ram = match.group("transferred")
2356
            migration_status.total_ram = match.group("total")
2357

    
2358
          return migration_status
2359

    
2360
        logging.warning("KVM: unknown migration status '%s'", status)
2361

    
2362
      time.sleep(self._MIGRATION_INFO_RETRY_DELAY)
2363

    
2364
    return objects.MigrationStatus(status=constants.HV_MIGRATION_FAILED)
2365

    
2366
  def BalloonInstanceMemory(self, instance, mem):
2367
    """Balloon an instance memory to a certain value.
2368

2369
    @type instance: L{objects.Instance}
2370
    @param instance: instance to be accepted
2371
    @type mem: int
2372
    @param mem: actual memory size to use for instance runtime
2373

2374
    """
2375
    self._CallMonitorCommand(instance.name, "balloon %d" % mem)
2376

    
2377
  def GetNodeInfo(self):
2378
    """Return information about the node.
2379

2380
    @return: a dict with the following keys (values in MiB):
2381
          - memory_total: the total memory size on the node
2382
          - memory_free: the available memory on the node for instances
2383
          - memory_dom0: the memory used by the node itself, if available
2384
          - hv_version: the hypervisor version in the form (major, minor,
2385
                        revision)
2386

2387
    """
2388
    result = self.GetLinuxNodeInfo()
2389
    # FIXME: this is the global kvm version, but the actual version can be
2390
    # customized as an hv parameter. we should use the nodegroup's default kvm
2391
    # path parameter here.
2392
    _, v_major, v_min, v_rev = self._GetKVMVersion(constants.KVM_PATH)
2393
    result[constants.HV_NODEINFO_KEY_VERSION] = (v_major, v_min, v_rev)
2394
    return result
2395

    
2396
  @classmethod
2397
  def GetInstanceConsole(cls, instance, hvparams, beparams):
2398
    """Return a command for connecting to the console of an instance.
2399

2400
    """
2401
    if hvparams[constants.HV_SERIAL_CONSOLE]:
2402
      cmd = [pathutils.KVM_CONSOLE_WRAPPER,
2403
             constants.SOCAT_PATH, utils.ShellQuote(instance.name),
2404
             utils.ShellQuote(cls._InstanceMonitor(instance.name)),
2405
             "STDIO,%s" % cls._SocatUnixConsoleParams(),
2406
             "UNIX-CONNECT:%s" % cls._InstanceSerial(instance.name)]
2407
      return objects.InstanceConsole(instance=instance.name,
2408
                                     kind=constants.CONS_SSH,
2409
                                     host=instance.primary_node,
2410
                                     user=constants.SSH_CONSOLE_USER,
2411
                                     command=cmd)
2412

    
2413
    vnc_bind_address = hvparams[constants.HV_VNC_BIND_ADDRESS]
2414
    if vnc_bind_address and instance.network_port > constants.VNC_BASE_PORT:
2415
      display = instance.network_port - constants.VNC_BASE_PORT
2416
      return objects.InstanceConsole(instance=instance.name,
2417
                                     kind=constants.CONS_VNC,
2418
                                     host=vnc_bind_address,
2419
                                     port=instance.network_port,
2420
                                     display=display)
2421

    
2422
    spice_bind = hvparams[constants.HV_KVM_SPICE_BIND]
2423
    if spice_bind:
2424
      return objects.InstanceConsole(instance=instance.name,
2425
                                     kind=constants.CONS_SPICE,
2426
                                     host=spice_bind,
2427
                                     port=instance.network_port)
2428

    
2429
    return objects.InstanceConsole(instance=instance.name,
2430
                                   kind=constants.CONS_MESSAGE,
2431
                                   message=("No serial shell for instance %s" %
2432
                                            instance.name))
2433

    
2434
  def Verify(self):
2435
    """Verify the hypervisor.
2436

2437
    Check that the required binaries exist.
2438

2439
    @return: Problem description if something is wrong, C{None} otherwise
2440

2441
    """
2442
    msgs = []
2443
    # FIXME: this is the global kvm binary, but the actual path can be
2444
    # customized as an hv parameter; we should use the nodegroup's
2445
    # default kvm path parameter here.
2446
    if not os.path.exists(constants.KVM_PATH):
2447
      msgs.append("The KVM binary ('%s') does not exist" % constants.KVM_PATH)
2448
    if not os.path.exists(constants.SOCAT_PATH):
2449
      msgs.append("The socat binary ('%s') does not exist" %
2450
                  constants.SOCAT_PATH)
2451

    
2452
    return self._FormatVerifyResults(msgs)
2453

    
2454
  @classmethod
2455
  def CheckParameterSyntax(cls, hvparams):
2456
    """Check the given parameters for validity.
2457

2458
    @type hvparams:  dict
2459
    @param hvparams: dictionary with parameter names/value
2460
    @raise errors.HypervisorError: when a parameter is not valid
2461

2462
    """
2463
    super(KVMHypervisor, cls).CheckParameterSyntax(hvparams)
2464

    
2465
    kernel_path = hvparams[constants.HV_KERNEL_PATH]
2466
    if kernel_path:
2467
      if not hvparams[constants.HV_ROOT_PATH]:
2468
        raise errors.HypervisorError("Need a root partition for the instance,"
2469
                                     " if a kernel is defined")
2470

    
2471
    if (hvparams[constants.HV_VNC_X509_VERIFY] and
2472
        not hvparams[constants.HV_VNC_X509]):
2473
      raise errors.HypervisorError("%s must be defined, if %s is" %
2474
                                   (constants.HV_VNC_X509,
2475
                                    constants.HV_VNC_X509_VERIFY))
2476

    
2477
    if hvparams[constants.HV_SERIAL_CONSOLE]:
2478
      serial_speed = hvparams[constants.HV_SERIAL_SPEED]
2479
      valid_speeds = constants.VALID_SERIAL_SPEEDS
2480
      if not serial_speed or serial_speed not in valid_speeds:
2481
        raise errors.HypervisorError("Invalid serial console speed, must be"
2482
                                     " one of: %s" %
2483
                                     utils.CommaJoin(valid_speeds))
2484

    
2485
    boot_order = hvparams[constants.HV_BOOT_ORDER]
2486
    if (boot_order == constants.HT_BO_CDROM and
2487
        not hvparams[constants.HV_CDROM_IMAGE_PATH]):
2488
      raise errors.HypervisorError("Cannot boot from cdrom without an"
2489
                                   " ISO path")
2490

    
2491
    security_model = hvparams[constants.HV_SECURITY_MODEL]
2492
    if security_model == constants.HT_SM_USER:
2493
      if not hvparams[constants.HV_SECURITY_DOMAIN]:
2494
        raise errors.HypervisorError("A security domain (user to run kvm as)"
2495
                                     " must be specified")
2496
    elif (security_model == constants.HT_SM_NONE or
2497
          security_model == constants.HT_SM_POOL):
2498
      if hvparams[constants.HV_SECURITY_DOMAIN]:
2499
        raise errors.HypervisorError("Cannot have a security domain when the"
2500
                                     " security model is 'none' or 'pool'")
2501

    
2502
    spice_bind = hvparams[constants.HV_KVM_SPICE_BIND]
2503
    spice_ip_version = hvparams[constants.HV_KVM_SPICE_IP_VERSION]
2504
    if spice_bind:
2505
      if spice_ip_version != constants.IFACE_NO_IP_VERSION_SPECIFIED:
2506
        # if an IP version is specified, the spice_bind parameter must be an
2507
        # IP of that family
2508
        if (netutils.IP4Address.IsValid(spice_bind) and
2509
            spice_ip_version != constants.IP4_VERSION):
2510
          raise errors.HypervisorError("SPICE: Got an IPv4 address (%s), but"
2511
                                       " the specified IP version is %s" %
2512
                                       (spice_bind, spice_ip_version))
2513

    
2514
        if (netutils.IP6Address.IsValid(spice_bind) and
2515
            spice_ip_version != constants.IP6_VERSION):
2516
          raise errors.HypervisorError("SPICE: Got an IPv6 address (%s), but"
2517
                                       " the specified IP version is %s" %
2518
                                       (spice_bind, spice_ip_version))
2519
    else:
2520
      # All the other SPICE parameters depend on spice_bind being set. Raise an
2521
      # error if any of them is set without it.
2522
      for param in _SPICE_ADDITIONAL_PARAMS:
2523
        if hvparams[param]:
2524
          raise errors.HypervisorError("SPICE: %s requires %s to be set" %
2525
                                       (param, constants.HV_KVM_SPICE_BIND))
2526

    
2527
  @classmethod
2528
  def ValidateParameters(cls, hvparams):
2529
    """Check the given parameters for validity.
2530

2531
    @type hvparams:  dict
2532
    @param hvparams: dictionary with parameter names/value
2533
    @raise errors.HypervisorError: when a parameter is not valid
2534

2535
    """
2536
    super(KVMHypervisor, cls).ValidateParameters(hvparams)
2537

    
2538
    kvm_path = hvparams[constants.HV_KVM_PATH]
2539

    
2540
    security_model = hvparams[constants.HV_SECURITY_MODEL]
2541
    if security_model == constants.HT_SM_USER:
2542
      username = hvparams[constants.HV_SECURITY_DOMAIN]
2543
      try:
2544
        pwd.getpwnam(username)
2545
      except KeyError:
2546
        raise errors.HypervisorError("Unknown security domain user %s"
2547
                                     % username)
2548

    
2549
    spice_bind = hvparams[constants.HV_KVM_SPICE_BIND]
2550
    if spice_bind:
2551
      # only one of VNC and SPICE can be used currently.
2552
      if hvparams[constants.HV_VNC_BIND_ADDRESS]:
2553
        raise errors.HypervisorError("Both SPICE and VNC are configured, but"
2554
                                     " only one of them can be used at a"
2555
                                     " given time")
2556

    
2557
      # check that KVM supports SPICE
2558
      kvmhelp = cls._GetKVMOutput(kvm_path, cls._KVMOPT_HELP)
2559
      if not cls._SPICE_RE.search(kvmhelp):
2560
        raise errors.HypervisorError("SPICE is configured, but it is not"
2561
                                     " supported according to 'kvm --help'")
2562

    
2563
      # if spice_bind is not an IP address, it must be a valid interface
2564
      bound_to_addr = (netutils.IP4Address.IsValid(spice_bind) or
2565
                       netutils.IP6Address.IsValid(spice_bind))
2566
      if not bound_to_addr and not netutils.IsValidInterface(spice_bind):
2567
        raise errors.HypervisorError("SPICE: The %s parameter must be either"
2568
                                     " a valid IP address or interface name" %
2569
                                     constants.HV_KVM_SPICE_BIND)
2570

    
2571
    machine_version = hvparams[constants.HV_KVM_MACHINE_VERSION]
2572
    if machine_version:
2573
      output = cls._GetKVMOutput(kvm_path, cls._KVMOPT_MLIST)
2574
      if not cls._CHECK_MACHINE_VERSION_RE(machine_version).search(output):
2575
        raise errors.HypervisorError("Unsupported machine version: %s" %
2576
                                     machine_version)
2577

    
2578
  @classmethod
2579
  def PowercycleNode(cls):
2580
    """KVM powercycle, just a wrapper over Linux powercycle.
2581

2582
    """
2583
    cls.LinuxPowercycle()