Statistics
| Branch: | Tag: | Revision:

root / lib / bootstrap.py @ 57c7bc57

History | View | Annotate | Download (31.1 kB)

1 a0c9f010 Michael Hanselmann
#
2 a0c9f010 Michael Hanselmann
#
3 a0c9f010 Michael Hanselmann
4 7925d409 Apollon Oikonomopoulos
# Copyright (C) 2006, 2007, 2008, 2010, 2011 Google Inc.
5 a0c9f010 Michael Hanselmann
#
6 a0c9f010 Michael Hanselmann
# This program is free software; you can redistribute it and/or modify
7 a0c9f010 Michael Hanselmann
# it under the terms of the GNU General Public License as published by
8 a0c9f010 Michael Hanselmann
# the Free Software Foundation; either version 2 of the License, or
9 a0c9f010 Michael Hanselmann
# (at your option) any later version.
10 a0c9f010 Michael Hanselmann
#
11 a0c9f010 Michael Hanselmann
# This program is distributed in the hope that it will be useful, but
12 a0c9f010 Michael Hanselmann
# WITHOUT ANY WARRANTY; without even the implied warranty of
13 a0c9f010 Michael Hanselmann
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
14 a0c9f010 Michael Hanselmann
# General Public License for more details.
15 a0c9f010 Michael Hanselmann
#
16 a0c9f010 Michael Hanselmann
# You should have received a copy of the GNU General Public License
17 a0c9f010 Michael Hanselmann
# along with this program; if not, write to the Free Software
18 a0c9f010 Michael Hanselmann
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
19 a0c9f010 Michael Hanselmann
# 02110-1301, USA.
20 a0c9f010 Michael Hanselmann
21 a0c9f010 Michael Hanselmann
22 a0c9f010 Michael Hanselmann
"""Functions to bootstrap a new cluster.
23 a0c9f010 Michael Hanselmann

24 a0c9f010 Michael Hanselmann
"""
25 a0c9f010 Michael Hanselmann
26 a0c9f010 Michael Hanselmann
import os
27 a0c9f010 Michael Hanselmann
import os.path
28 a0c9f010 Michael Hanselmann
import re
29 b1b6ea87 Iustin Pop
import logging
30 d693c864 Iustin Pop
import time
31 a0c9f010 Michael Hanselmann
32 a0c9f010 Michael Hanselmann
from ganeti import rpc
33 a0c9f010 Michael Hanselmann
from ganeti import ssh
34 a0c9f010 Michael Hanselmann
from ganeti import utils
35 a0c9f010 Michael Hanselmann
from ganeti import errors
36 a0c9f010 Michael Hanselmann
from ganeti import config
37 a0c9f010 Michael Hanselmann
from ganeti import constants
38 b9eeeb02 Michael Hanselmann
from ganeti import objects
39 a0c9f010 Michael Hanselmann
from ganeti import ssconf
40 a33848a5 Guido Trotter
from ganeti import serializer
41 a5728081 Guido Trotter
from ganeti import hypervisor
42 a721e23a Luca Bigliardi
from ganeti import bdev
43 a744b676 Manuel Franceschini
from ganeti import netutils
44 d367b66c Manuel Franceschini
from ganeti import backend
45 3b6b6129 Michael Hanselmann
from ganeti import luxi
46 ff699aa9 Michael Hanselmann
from ganeti import jstore
47 3b6b6129 Michael Hanselmann
48 a0c9f010 Michael Hanselmann
49 88b92fe3 Guido Trotter
# Execution context ID passed to InitConfig's temporary reservation manager
50 88b92fe3 Guido Trotter
_INITCONF_ECID = "initconfig-ecid"
51 88b92fe3 Guido Trotter
52 3b6b6129 Michael Hanselmann
#: Number of seconds within which a freshly started daemon must be responsive
53 3b6b6129 Michael Hanselmann
_DAEMON_READY_TIMEOUT = 10.0
54 3b6b6129 Michael Hanselmann
55 e38220e4 Michael Hanselmann
56 531baf8e Iustin Pop
def _InitSSHSetup():
  """Create a fresh SSH keypair for the Ganeti run-as user.

  Any existing private/public key file is backed up and removed, a new
  DSA keypair with an empty passphrase is generated through
  C{ssh-keygen}, and the resulting public key is added to the user's
  authorized keys file.

  @raise errors.OpExecError: if C{ssh-keygen} reports a failure

  """
  (private_path, public_path, authorized_path) = \
    ssh.GetUserFiles(constants.GANETI_RUNAS)

  # Keep a backup of whatever key material is already there, then remove
  # it before generating the new keypair
  for key_path in (private_path, public_path):
    if os.path.exists(key_path):
      utils.CreateBackup(key_path)
    utils.RemoveFile(key_path)

  keygen_cmd = ["ssh-keygen", "-t", "dsa", "-f", private_path, "-q", "-N", ""]
  keygen = utils.RunCmd(keygen_cmd)
  if keygen.failed:
    raise errors.OpExecError("Could not generate ssh keypair, error %s" %
                             keygen.output)

  new_public_key = utils.ReadFile(public_path)
  utils.AddAuthorizedKey(authorized_path, new_public_key)
78 a0c9f010 Michael Hanselmann
79 a0c9f010 Michael Hanselmann
80 c008906b Michael Hanselmann
def GenerateHmacKey(file_name):
81 c008906b Michael Hanselmann
  """Writes a new HMAC key.
82 c008906b Michael Hanselmann

83 c008906b Michael Hanselmann
  @type file_name: str
84 c008906b Michael Hanselmann
  @param file_name: Path to output file
85 c008906b Michael Hanselmann

86 c008906b Michael Hanselmann
  """
87 43575108 Michael Hanselmann
  utils.WriteFile(file_name, data="%s\n" % utils.GenerateSecret(), mode=0400,
88 43575108 Michael Hanselmann
                  backup=True)
89 43575108 Michael Hanselmann
90 43575108 Michael Hanselmann
91 b6267745 Andrea Spadaccini
def GenerateClusterCrypto(new_cluster_cert, new_rapi_cert, new_spice_cert,
92 b6267745 Andrea Spadaccini
                          new_confd_hmac_key, new_cds,
93 b6267745 Andrea Spadaccini
                          rapi_cert_pem=None, spice_cert_pem=None,
94 b6267745 Andrea Spadaccini
                          spice_cacert_pem=None, cds=None,
95 aeefe835 Iustin Pop
                          nodecert_file=constants.NODED_CERT_FILE,
96 aeefe835 Iustin Pop
                          rapicert_file=constants.RAPI_CERT_FILE,
97 b6267745 Andrea Spadaccini
                          spicecert_file=constants.SPICE_CERT_FILE,
98 b6267745 Andrea Spadaccini
                          spicecacert_file=constants.SPICE_CACERT_FILE,
99 fc0726b9 Michael Hanselmann
                          hmackey_file=constants.CONFD_HMAC_KEY,
100 fc0726b9 Michael Hanselmann
                          cds_file=constants.CLUSTER_DOMAIN_SECRET_FILE):
101 43575108 Michael Hanselmann
  """Updates the cluster certificates, keys and secrets.
102 43575108 Michael Hanselmann

103 43575108 Michael Hanselmann
  @type new_cluster_cert: bool
104 43575108 Michael Hanselmann
  @param new_cluster_cert: Whether to generate a new cluster certificate
105 43575108 Michael Hanselmann
  @type new_rapi_cert: bool
106 43575108 Michael Hanselmann
  @param new_rapi_cert: Whether to generate a new RAPI certificate
107 b6267745 Andrea Spadaccini
  @type new_spice_cert: bool
108 b6267745 Andrea Spadaccini
  @param new_spice_cert: Whether to generate a new SPICE certificate
109 6b7d5878 Michael Hanselmann
  @type new_confd_hmac_key: bool
110 6b7d5878 Michael Hanselmann
  @param new_confd_hmac_key: Whether to generate a new HMAC key
111 3db3eb2a Michael Hanselmann
  @type new_cds: bool
112 3db3eb2a Michael Hanselmann
  @param new_cds: Whether to generate a new cluster domain secret
113 43575108 Michael Hanselmann
  @type rapi_cert_pem: string
114 43575108 Michael Hanselmann
  @param rapi_cert_pem: New RAPI certificate in PEM format
115 b6267745 Andrea Spadaccini
  @type spice_cert_pem: string
116 b6267745 Andrea Spadaccini
  @param spice_cert_pem: New SPICE certificate in PEM format
117 b6267745 Andrea Spadaccini
  @type spice_cacert_pem: string
118 b6267745 Andrea Spadaccini
  @param spice_cacert_pem: Certificate of the CA that signed the SPICE
119 b6267745 Andrea Spadaccini
                           certificate, in PEM format
120 3db3eb2a Michael Hanselmann
  @type cds: string
121 3db3eb2a Michael Hanselmann
  @param cds: New cluster domain secret
122 aeefe835 Iustin Pop
  @type nodecert_file: string
123 aeefe835 Iustin Pop
  @param nodecert_file: optional override of the node cert file path
124 aeefe835 Iustin Pop
  @type rapicert_file: string
125 aeefe835 Iustin Pop
  @param rapicert_file: optional override of the rapi cert file path
126 b6267745 Andrea Spadaccini
  @type spicecert_file: string
127 b6267745 Andrea Spadaccini
  @param spicecert_file: optional override of the spice cert file path
128 b6267745 Andrea Spadaccini
  @type spicecacert_file: string
129 b6267745 Andrea Spadaccini
  @param spicecacert_file: optional override of the spice CA cert file path
130 aeefe835 Iustin Pop
  @type hmackey_file: string
131 aeefe835 Iustin Pop
  @param hmackey_file: optional override of the hmac key file path
132 43575108 Michael Hanselmann

133 43575108 Michael Hanselmann
  """
134 168c1de2 Michael Hanselmann
  # noded SSL certificate
135 aeefe835 Iustin Pop
  cluster_cert_exists = os.path.exists(nodecert_file)
136 43575108 Michael Hanselmann
  if new_cluster_cert or not cluster_cert_exists:
137 43575108 Michael Hanselmann
    if cluster_cert_exists:
138 aeefe835 Iustin Pop
      utils.CreateBackup(nodecert_file)
139 43575108 Michael Hanselmann
140 aeefe835 Iustin Pop
    logging.debug("Generating new cluster certificate at %s", nodecert_file)
141 af2ae1c0 Iustin Pop
    utils.GenerateSelfSignedSslCert(nodecert_file)
142 43575108 Michael Hanselmann
143 6b7d5878 Michael Hanselmann
  # confd HMAC key
144 aeefe835 Iustin Pop
  if new_confd_hmac_key or not os.path.exists(hmackey_file):
145 aeefe835 Iustin Pop
    logging.debug("Writing new confd HMAC key to %s", hmackey_file)
146 aeefe835 Iustin Pop
    GenerateHmacKey(hmackey_file)
147 43575108 Michael Hanselmann
148 43575108 Michael Hanselmann
  # RAPI
149 aeefe835 Iustin Pop
  rapi_cert_exists = os.path.exists(rapicert_file)
150 43575108 Michael Hanselmann
151 43575108 Michael Hanselmann
  if rapi_cert_pem:
152 43575108 Michael Hanselmann
    # Assume rapi_pem contains a valid PEM-formatted certificate and key
153 aeefe835 Iustin Pop
    logging.debug("Writing RAPI certificate at %s", rapicert_file)
154 aeefe835 Iustin Pop
    utils.WriteFile(rapicert_file, data=rapi_cert_pem, backup=True)
155 43575108 Michael Hanselmann
156 43575108 Michael Hanselmann
  elif new_rapi_cert or not rapi_cert_exists:
157 43575108 Michael Hanselmann
    if rapi_cert_exists:
158 aeefe835 Iustin Pop
      utils.CreateBackup(rapicert_file)
159 43575108 Michael Hanselmann
160 aeefe835 Iustin Pop
    logging.debug("Generating new RAPI certificate at %s", rapicert_file)
161 af2ae1c0 Iustin Pop
    utils.GenerateSelfSignedSslCert(rapicert_file)
162 c008906b Michael Hanselmann
163 b6267745 Andrea Spadaccini
  # SPICE
164 b6267745 Andrea Spadaccini
  spice_cert_exists = os.path.exists(spicecert_file)
165 b6267745 Andrea Spadaccini
  spice_cacert_exists = os.path.exists(spicecacert_file)
166 b6267745 Andrea Spadaccini
  if spice_cert_pem:
167 b6267745 Andrea Spadaccini
    # spice_cert_pem implies also spice_cacert_pem
168 b6267745 Andrea Spadaccini
    logging.debug("Writing SPICE certificate at %s", spicecert_file)
169 b6267745 Andrea Spadaccini
    utils.WriteFile(spicecert_file, data=spice_cert_pem, backup=True)
170 b6267745 Andrea Spadaccini
    logging.debug("Writing SPICE CA certificate at %s", spicecacert_file)
171 b6267745 Andrea Spadaccini
    utils.WriteFile(spicecacert_file, data=spice_cacert_pem, backup=True)
172 b6267745 Andrea Spadaccini
  elif new_spice_cert or not spice_cert_exists:
173 b6267745 Andrea Spadaccini
    if spice_cert_exists:
174 b6267745 Andrea Spadaccini
      utils.CreateBackup(spicecert_file)
175 b6267745 Andrea Spadaccini
    if spice_cacert_exists:
176 b6267745 Andrea Spadaccini
      utils.CreateBackup(spicecacert_file)
177 b6267745 Andrea Spadaccini
178 b6267745 Andrea Spadaccini
    logging.debug("Generating new self-signed SPICE certificate at %s",
179 b6267745 Andrea Spadaccini
                  spicecert_file)
180 b6267745 Andrea Spadaccini
    (_, cert_pem) = utils.GenerateSelfSignedSslCert(spicecert_file)
181 b6267745 Andrea Spadaccini
182 b6267745 Andrea Spadaccini
    # Self-signed certificate -> the public certificate is also the CA public
183 b6267745 Andrea Spadaccini
    # certificate
184 b6267745 Andrea Spadaccini
    logging.debug("Writing the public certificate to %s",
185 b6267745 Andrea Spadaccini
                  spicecert_file)
186 b6267745 Andrea Spadaccini
    utils.io.WriteFile(spicecacert_file, mode=0400, data=cert_pem)
187 b6267745 Andrea Spadaccini
188 3db3eb2a Michael Hanselmann
  # Cluster domain secret
189 3db3eb2a Michael Hanselmann
  if cds:
190 fc0726b9 Michael Hanselmann
    logging.debug("Writing cluster domain secret to %s", cds_file)
191 fc0726b9 Michael Hanselmann
    utils.WriteFile(cds_file, data=cds, backup=True)
192 fc0726b9 Michael Hanselmann
193 fc0726b9 Michael Hanselmann
  elif new_cds or not os.path.exists(cds_file):
194 fc0726b9 Michael Hanselmann
    logging.debug("Generating new cluster domain secret at %s", cds_file)
195 fc0726b9 Michael Hanselmann
    GenerateHmacKey(cds_file)
196 3db3eb2a Michael Hanselmann
197 c008906b Michael Hanselmann
198 8f215968 Michael Hanselmann
def _InitGanetiServerSetup(master_name):
  """Prepare the cluster secrets and bring up the initial node daemon.

  A new cluster certificate is requested from L{GenerateClusterCrypto},
  the node daemon is started through the daemon utility and the function
  then waits until the daemon on the master node answers.

  @type master_name: str
  @param master_name: Name of the master node
  @raise errors.OpExecError: if the node daemon cannot be started

  """
  # Only the cluster certificate is forcibly regenerated
  GenerateClusterCrypto(new_cluster_cert=True,
                        new_rapi_cert=False,
                        new_spice_cert=False,
                        new_confd_hmac_key=False,
                        new_cds=False)

  start_cmd = [constants.DAEMON_UTIL, "start", constants.NODED]
  started = utils.RunCmd(start_cmd)
  if started.failed:
    failure_info = (started.cmd, started.exit_code, started.output)
    raise errors.OpExecError("Could not start the node daemon, command %s"
                             " had exitcode %s and error %s" % failure_info)

  _WaitForNodeDaemon(master_name)
218 5627f375 Michael Hanselmann
219 5627f375 Michael Hanselmann
220 5627f375 Michael Hanselmann
def _WaitForNodeDaemon(node_name):
  """Block until the node daemon on a node answers a version query.

  @param node_name: name of the node whose daemon is polled
  @raise errors.OpExecError: if the daemon did not answer within
      L{_DAEMON_READY_TIMEOUT} seconds

  """
  def _PollVersion():
    """Ask the node for its version; request a retry on failure."""
    answers = rpc.BootstrapRunner().call_version([node_name])
    if answers[node_name].fail_msg:
      raise utils.RetryAgain()

  try:
    utils.Retry(_PollVersion, 1.0, _DAEMON_READY_TIMEOUT)
  except utils.RetryTimeout:
    timeout_info = (node_name, _DAEMON_READY_TIMEOUT)
    raise errors.OpExecError("Node daemon on %s didn't answer queries within"
                             " %s seconds" % timeout_info)
234 3b6b6129 Michael Hanselmann
235 3b6b6129 Michael Hanselmann
236 3b6b6129 Michael Hanselmann
def _WaitForMasterDaemon():
  """Block until the master daemon answers a configuration query.

  @raise errors.OpExecError: if the daemon did not answer within
      L{_DAEMON_READY_TIMEOUT} seconds

  """
  def _QueryClusterName():
    """Fetch the cluster name via luxi; request a retry on any error."""
    try:
      values = luxi.Client().QueryConfigValues(["cluster_name"])
      (name, ) = values
    except Exception:
      # Any failure is treated as "daemon not ready yet"
      raise utils.RetryAgain()

    logging.debug("Received cluster name %s from master", name)

  try:
    utils.Retry(_QueryClusterName, 1.0, _DAEMON_READY_TIMEOUT)
  except utils.RetryTimeout:
    raise errors.OpExecError("Master daemon didn't answer queries within"
                             " %s seconds" % _DAEMON_READY_TIMEOUT)
254 5627f375 Michael Hanselmann
255 a0c9f010 Michael Hanselmann
256 0e3baaf3 Iustin Pop
def _InitFileStorage(file_storage_dir):
257 0e3baaf3 Iustin Pop
  """Initialize if needed the file storage.
258 0e3baaf3 Iustin Pop

259 0e3baaf3 Iustin Pop
  @param file_storage_dir: the user-supplied value
260 0e3baaf3 Iustin Pop
  @return: either empty string (if file storage was disabled at build
261 0e3baaf3 Iustin Pop
      time) or the normalized path to the storage directory
262 0e3baaf3 Iustin Pop

263 0e3baaf3 Iustin Pop
  """
264 0e3baaf3 Iustin Pop
  file_storage_dir = os.path.normpath(file_storage_dir)
265 0e3baaf3 Iustin Pop
266 0e3baaf3 Iustin Pop
  if not os.path.isabs(file_storage_dir):
267 0376655e Guido Trotter
    raise errors.OpPrereqError("File storage directory '%s' is not an absolute"
268 0376655e Guido Trotter
                               " path" % file_storage_dir, errors.ECODE_INVAL)
269 0e3baaf3 Iustin Pop
270 0e3baaf3 Iustin Pop
  if not os.path.exists(file_storage_dir):
271 0e3baaf3 Iustin Pop
    try:
272 0e3baaf3 Iustin Pop
      os.makedirs(file_storage_dir, 0750)
273 0e3baaf3 Iustin Pop
    except OSError, err:
274 0e3baaf3 Iustin Pop
      raise errors.OpPrereqError("Cannot create file storage directory"
275 0e3baaf3 Iustin Pop
                                 " '%s': %s" % (file_storage_dir, err),
276 0e3baaf3 Iustin Pop
                                 errors.ECODE_ENVIRON)
277 0e3baaf3 Iustin Pop
278 0e3baaf3 Iustin Pop
  if not os.path.isdir(file_storage_dir):
279 0e3baaf3 Iustin Pop
    raise errors.OpPrereqError("The file storage directory '%s' is not"
280 0e3baaf3 Iustin Pop
                               " a directory." % file_storage_dir,
281 0e3baaf3 Iustin Pop
                               errors.ECODE_ENVIRON)
282 0e3baaf3 Iustin Pop
  return file_storage_dir
283 0e3baaf3 Iustin Pop
284 0e3baaf3 Iustin Pop
285 b459a848 Andrea Spadaccini
def InitCluster(cluster_name, mac_prefix, # pylint: disable=R0913
286 5a8648eb Andrea Spadaccini
                master_netmask, master_netdev, file_storage_dir,
287 5a8648eb Andrea Spadaccini
                shared_file_storage_dir, candidate_pool_size, secondary_ip=None,
288 5a8648eb Andrea Spadaccini
                vg_name=None, beparams=None, nicparams=None, ndparams=None,
289 5a8648eb Andrea Spadaccini
                hvparams=None, enabled_hypervisors=None, modify_etc_hosts=True,
290 6204ee71 René Nussbaumer
                modify_ssh_setup=True, maintain_node_health=False,
291 6204ee71 René Nussbaumer
                drbd_helper=None, uid_pool=None, default_iallocator=None,
292 bf689b7a Andrea Spadaccini
                primary_ip_version=None, prealloc_wipe_disks=False,
293 bf689b7a Andrea Spadaccini
                use_external_mip_script=False):
294 a0c9f010 Michael Hanselmann
  """Initialise the cluster.
295 a0c9f010 Michael Hanselmann

296 ce735215 Guido Trotter
  @type candidate_pool_size: int
297 ce735215 Guido Trotter
  @param candidate_pool_size: master candidate pool size
298 ce735215 Guido Trotter

299 a0c9f010 Michael Hanselmann
  """
300 ce735215 Guido Trotter
  # TODO: complete the docstring
301 a0c9f010 Michael Hanselmann
  if config.ConfigWriter.IsCluster():
302 debac808 Iustin Pop
    raise errors.OpPrereqError("Cluster is already initialised",
303 debac808 Iustin Pop
                               errors.ECODE_STATE)
304 a0c9f010 Michael Hanselmann
305 b119bccb Guido Trotter
  if not enabled_hypervisors:
306 b119bccb Guido Trotter
    raise errors.OpPrereqError("Enabled hypervisors list must contain at"
307 debac808 Iustin Pop
                               " least one member", errors.ECODE_INVAL)
308 b119bccb Guido Trotter
  invalid_hvs = set(enabled_hypervisors) - constants.HYPER_TYPES
309 b119bccb Guido Trotter
  if invalid_hvs:
310 b119bccb Guido Trotter
    raise errors.OpPrereqError("Enabled hypervisors contains invalid"
311 debac808 Iustin Pop
                               " entries: %s" % invalid_hvs,
312 debac808 Iustin Pop
                               errors.ECODE_INVAL)
313 b119bccb Guido Trotter
314 5a8648eb Andrea Spadaccini
  try:
315 5a8648eb Andrea Spadaccini
    ipcls = netutils.IPAddress.GetClassFromIpVersion(primary_ip_version)
316 5a8648eb Andrea Spadaccini
  except errors.ProgrammerError:
317 2f20d07b Manuel Franceschini
    raise errors.OpPrereqError("Invalid primary ip version: %d." %
318 2f20d07b Manuel Franceschini
                               primary_ip_version)
319 2f20d07b Manuel Franceschini
320 2f20d07b Manuel Franceschini
  hostname = netutils.GetHostname(family=ipcls.family)
321 2f20d07b Manuel Franceschini
  if not ipcls.IsValid(hostname.ip):
322 2f20d07b Manuel Franceschini
    raise errors.OpPrereqError("This host's IP (%s) is not a valid IPv%d"
323 2f20d07b Manuel Franceschini
                               " address." % (hostname.ip, primary_ip_version))
324 2f20d07b Manuel Franceschini
325 2f20d07b Manuel Franceschini
  if ipcls.IsLoopback(hostname.ip):
326 8b312c1d Manuel Franceschini
    raise errors.OpPrereqError("This host's IP (%s) resolves to a loopback"
327 8b312c1d Manuel Franceschini
                               " address. Please fix DNS or %s." %
328 debac808 Iustin Pop
                               (hostname.ip, constants.ETC_HOSTS),
329 debac808 Iustin Pop
                               errors.ECODE_ENVIRON)
330 a0c9f010 Michael Hanselmann
331 2f20d07b Manuel Franceschini
  if not ipcls.Own(hostname.ip):
332 a0c9f010 Michael Hanselmann
    raise errors.OpPrereqError("Inconsistency: this host's name resolves"
333 a0c9f010 Michael Hanselmann
                               " to %s,\nbut this ip address does not"
334 7c4c22f5 Manuel Franceschini
                               " belong to this host" %
335 debac808 Iustin Pop
                               hostname.ip, errors.ECODE_ENVIRON)
336 a0c9f010 Michael Hanselmann
337 2f20d07b Manuel Franceschini
  clustername = netutils.GetHostname(name=cluster_name, family=ipcls.family)
338 a0c9f010 Michael Hanselmann
339 2f20d07b Manuel Franceschini
  if netutils.TcpPing(clustername.ip, constants.DEFAULT_NODED_PORT, timeout=5):
340 7c4c22f5 Manuel Franceschini
    raise errors.OpPrereqError("Cluster IP already active",
341 debac808 Iustin Pop
                               errors.ECODE_NOTUNIQUE)
342 a0c9f010 Michael Hanselmann
343 2f20d07b Manuel Franceschini
  if not secondary_ip:
344 2f20d07b Manuel Franceschini
    if primary_ip_version == constants.IP6_VERSION:
345 2f20d07b Manuel Franceschini
      raise errors.OpPrereqError("When using a IPv6 primary address, a valid"
346 7c4c22f5 Manuel Franceschini
                                 " IPv4 address must be given as secondary",
347 7c4c22f5 Manuel Franceschini
                                 errors.ECODE_INVAL)
348 b9eeeb02 Michael Hanselmann
    secondary_ip = hostname.ip
349 a0c9f010 Michael Hanselmann
350 2f20d07b Manuel Franceschini
  if not netutils.IP4Address.IsValid(secondary_ip):
351 2f20d07b Manuel Franceschini
    raise errors.OpPrereqError("Secondary IP address (%s) has to be a valid"
352 2f20d07b Manuel Franceschini
                               " IPv4 address." % secondary_ip,
353 2f20d07b Manuel Franceschini
                               errors.ECODE_INVAL)
354 2f20d07b Manuel Franceschini
355 2f20d07b Manuel Franceschini
  if not netutils.IP4Address.Own(secondary_ip):
356 2f20d07b Manuel Franceschini
    raise errors.OpPrereqError("You gave %s as secondary IP,"
357 2f20d07b Manuel Franceschini
                               " but it does not belong to this host." %
358 2f20d07b Manuel Franceschini
                               secondary_ip, errors.ECODE_ENVIRON)
359 2f20d07b Manuel Franceschini
360 5a8648eb Andrea Spadaccini
  if master_netmask is not None:
361 5a8648eb Andrea Spadaccini
    if not ipcls.ValidateNetmask(master_netmask):
362 5a8648eb Andrea Spadaccini
      raise errors.OpPrereqError("CIDR netmask (%s) not valid for IPv%s " %
363 5a8648eb Andrea Spadaccini
                                  (master_netmask, primary_ip_version))
364 5a8648eb Andrea Spadaccini
  else:
365 5a8648eb Andrea Spadaccini
    master_netmask = ipcls.iplen
366 5a8648eb Andrea Spadaccini
367 a0c9f010 Michael Hanselmann
  if vg_name is not None:
368 a0c9f010 Michael Hanselmann
    # Check if volume group is valid
369 a0c9f010 Michael Hanselmann
    vgstatus = utils.CheckVolumeGroupSize(utils.ListVolumeGroups(), vg_name,
370 a0c9f010 Michael Hanselmann
                                          constants.MIN_VG_SIZE)
371 a0c9f010 Michael Hanselmann
    if vgstatus:
372 a0c9f010 Michael Hanselmann
      raise errors.OpPrereqError("Error: %s\nspecify --no-lvm-storage if"
373 debac808 Iustin Pop
                                 " you are not using lvm" % vgstatus,
374 debac808 Iustin Pop
                                 errors.ECODE_INVAL)
375 a0c9f010 Michael Hanselmann
376 a721e23a Luca Bigliardi
  if drbd_helper is not None:
377 a721e23a Luca Bigliardi
    try:
378 a721e23a Luca Bigliardi
      curr_helper = bdev.BaseDRBD.GetUsermodeHelper()
379 a721e23a Luca Bigliardi
    except errors.BlockDeviceError, err:
380 a721e23a Luca Bigliardi
      raise errors.OpPrereqError("Error while checking drbd helper"
381 a721e23a Luca Bigliardi
                                 " (specify --no-drbd-storage if you are not"
382 a721e23a Luca Bigliardi
                                 " using drbd): %s" % str(err),
383 a721e23a Luca Bigliardi
                                 errors.ECODE_ENVIRON)
384 a721e23a Luca Bigliardi
    if drbd_helper != curr_helper:
385 a721e23a Luca Bigliardi
      raise errors.OpPrereqError("Error: requiring %s as drbd helper but %s"
386 a721e23a Luca Bigliardi
                                 " is the current helper" % (drbd_helper,
387 a721e23a Luca Bigliardi
                                                             curr_helper),
388 a721e23a Luca Bigliardi
                                 errors.ECODE_INVAL)
389 a721e23a Luca Bigliardi
390 0376655e Guido Trotter
  if constants.ENABLE_FILE_STORAGE:
391 0376655e Guido Trotter
    file_storage_dir = _InitFileStorage(file_storage_dir)
392 0376655e Guido Trotter
  else:
393 0376655e Guido Trotter
    file_storage_dir = ""
394 0376655e Guido Trotter
395 0376655e Guido Trotter
  if constants.ENABLE_SHARED_FILE_STORAGE:
396 0376655e Guido Trotter
    shared_file_storage_dir = _InitFileStorage(shared_file_storage_dir)
397 0376655e Guido Trotter
  else:
398 0376655e Guido Trotter
    shared_file_storage_dir = ""
399 a0c9f010 Michael Hanselmann
400 a0c9f010 Michael Hanselmann
  if not re.match("^[0-9a-z]{2}:[0-9a-z]{2}:[0-9a-z]{2}$", mac_prefix):
401 debac808 Iustin Pop
    raise errors.OpPrereqError("Invalid mac prefix given '%s'" % mac_prefix,
402 debac808 Iustin Pop
                               errors.ECODE_INVAL)
403 a0c9f010 Michael Hanselmann
404 a0c9f010 Michael Hanselmann
  result = utils.RunCmd(["ip", "link", "show", "dev", master_netdev])
405 a0c9f010 Michael Hanselmann
  if result.failed:
406 a0c9f010 Michael Hanselmann
    raise errors.OpPrereqError("Invalid master netdev given (%s): '%s'" %
407 a0c9f010 Michael Hanselmann
                               (master_netdev,
408 debac808 Iustin Pop
                                result.output.strip()), errors.ECODE_INVAL)
409 a0c9f010 Michael Hanselmann
410 9dae41ad Guido Trotter
  dirs = [(constants.RUN_GANETI_DIR, constants.RUN_DIRS_MODE)]
411 9dae41ad Guido Trotter
  utils.EnsureDirs(dirs)
412 9dae41ad Guido Trotter
413 a5728081 Guido Trotter
  utils.ForceDictType(beparams, constants.BES_PARAMETER_TYPES)
414 b6a30b0d Guido Trotter
  utils.ForceDictType(nicparams, constants.NICS_PARAMETER_TYPES)
415 b6a30b0d Guido Trotter
  objects.NIC.CheckParameterSyntax(nicparams)
416 b6a30b0d Guido Trotter
417 6204ee71 René Nussbaumer
  if ndparams is not None:
418 6204ee71 René Nussbaumer
    utils.ForceDictType(ndparams, constants.NDS_PARAMETER_TYPES)
419 6204ee71 René Nussbaumer
  else:
420 6204ee71 René Nussbaumer
    ndparams = dict(constants.NDC_DEFAULTS)
421 6204ee71 René Nussbaumer
422 a5728081 Guido Trotter
  # hvparams is a mapping of hypervisor->hvparams dict
423 a5728081 Guido Trotter
  for hv_name, hv_params in hvparams.iteritems():
424 a5728081 Guido Trotter
    utils.ForceDictType(hv_params, constants.HVS_PARAMETER_TYPES)
425 a5728081 Guido Trotter
    hv_class = hypervisor.GetHypervisor(hv_name)
426 a5728081 Guido Trotter
    hv_class.CheckParameterSyntax(hv_params)
427 d4b72030 Guido Trotter
428 a0c9f010 Michael Hanselmann
  # set up ssh config and /etc/hosts
429 13998ef2 Michael Hanselmann
  sshline = utils.ReadFile(constants.SSH_HOST_RSA_PUB)
430 a0c9f010 Michael Hanselmann
  sshkey = sshline.split(" ")[1]
431 a0c9f010 Michael Hanselmann
432 b86a6bcd Guido Trotter
  if modify_etc_hosts:
433 ea8ac9c9 René Nussbaumer
    utils.AddHostToEtcHosts(hostname.name, hostname.ip)
434 b86a6bcd Guido Trotter
435 b989b9d9 Ken Wehr
  if modify_ssh_setup:
436 b989b9d9 Ken Wehr
    _InitSSHSetup()
437 a0c9f010 Michael Hanselmann
438 bf4af505 Apollon Oikonomopoulos
  if default_iallocator is not None:
439 bf4af505 Apollon Oikonomopoulos
    alloc_script = utils.FindFile(default_iallocator,
440 bf4af505 Apollon Oikonomopoulos
                                  constants.IALLOCATOR_SEARCH_PATH,
441 bf4af505 Apollon Oikonomopoulos
                                  os.path.isfile)
442 bf4af505 Apollon Oikonomopoulos
    if alloc_script is None:
443 bf4af505 Apollon Oikonomopoulos
      raise errors.OpPrereqError("Invalid default iallocator script '%s'"
444 bf4af505 Apollon Oikonomopoulos
                                 " specified" % default_iallocator,
445 bf4af505 Apollon Oikonomopoulos
                                 errors.ECODE_INVAL)
446 d1e9c98d Iustin Pop
  elif constants.HTOOLS:
447 d1e9c98d Iustin Pop
    # htools was enabled at build-time, we default to it
448 d1e9c98d Iustin Pop
    if utils.FindFile(constants.IALLOC_HAIL,
449 d1e9c98d Iustin Pop
                      constants.IALLOCATOR_SEARCH_PATH,
450 d1e9c98d Iustin Pop
                      os.path.isfile):
451 d1e9c98d Iustin Pop
      default_iallocator = constants.IALLOC_HAIL
452 bf4af505 Apollon Oikonomopoulos
453 430b923c Iustin Pop
  now = time.time()
454 430b923c Iustin Pop
455 a0c9f010 Michael Hanselmann
  # init of cluster config file
456 b9eeeb02 Michael Hanselmann
  cluster_config = objects.Cluster(
457 b9eeeb02 Michael Hanselmann
    serial_no=1,
458 b9eeeb02 Michael Hanselmann
    rsahostkeypub=sshkey,
459 b9eeeb02 Michael Hanselmann
    highest_used_port=(constants.FIRST_DRBD_PORT - 1),
460 b9eeeb02 Michael Hanselmann
    mac_prefix=mac_prefix,
461 b9eeeb02 Michael Hanselmann
    volume_group_name=vg_name,
462 b9eeeb02 Michael Hanselmann
    tcpudp_port_pool=set(),
463 f6bd6e98 Michael Hanselmann
    master_node=hostname.name,
464 f6bd6e98 Michael Hanselmann
    master_ip=clustername.ip,
465 5a8648eb Andrea Spadaccini
    master_netmask=master_netmask,
466 f6bd6e98 Michael Hanselmann
    master_netdev=master_netdev,
467 f6bd6e98 Michael Hanselmann
    cluster_name=clustername.name,
468 f6bd6e98 Michael Hanselmann
    file_storage_dir=file_storage_dir,
469 4b97f902 Apollon Oikonomopoulos
    shared_file_storage_dir=shared_file_storage_dir,
470 ea3a925f Alexander Schreiber
    enabled_hypervisors=enabled_hypervisors,
471 4ef7f423 Guido Trotter
    beparams={constants.PP_DEFAULT: beparams},
472 b6a30b0d Guido Trotter
    nicparams={constants.PP_DEFAULT: nicparams},
473 6204ee71 René Nussbaumer
    ndparams=ndparams,
474 ea3a925f Alexander Schreiber
    hvparams=hvparams,
475 ce735215 Guido Trotter
    candidate_pool_size=candidate_pool_size,
476 022c3a0b Guido Trotter
    modify_etc_hosts=modify_etc_hosts,
477 b989b9d9 Ken Wehr
    modify_ssh_setup=modify_ssh_setup,
478 39b0f0c2 Balazs Lecz
    uid_pool=uid_pool,
479 430b923c Iustin Pop
    ctime=now,
480 430b923c Iustin Pop
    mtime=now,
481 3953242f Iustin Pop
    maintain_node_health=maintain_node_health,
482 a721e23a Luca Bigliardi
    drbd_usermode_helper=drbd_helper,
483 bf4af505 Apollon Oikonomopoulos
    default_iallocator=default_iallocator,
484 2f20d07b Manuel Franceschini
    primary_ip_family=ipcls.family,
485 3d914585 René Nussbaumer
    prealloc_wipe_disks=prealloc_wipe_disks,
486 bf689b7a Andrea Spadaccini
    use_external_mip_script=use_external_mip_script,
487 b9eeeb02 Michael Hanselmann
    )
488 b9eeeb02 Michael Hanselmann
  master_node_config = objects.Node(name=hostname.name,
489 b9eeeb02 Michael Hanselmann
                                    primary_ip=hostname.ip,
490 b9222f32 Guido Trotter
                                    secondary_ip=secondary_ip,
491 c044f32c Guido Trotter
                                    serial_no=1,
492 c044f32c Guido Trotter
                                    master_candidate=True,
493 af64c0ea Iustin Pop
                                    offline=False, drained=False,
494 435e4bd6 Michael Hanselmann
                                    ctime=now, mtime=now,
495 c044f32c Guido Trotter
                                    )
496 9e1333b9 Guido Trotter
  InitConfig(constants.CONFIG_VERSION, cluster_config, master_node_config)
497 d367b66c Manuel Franceschini
  cfg = config.ConfigWriter(offline=True)
498 9e1333b9 Guido Trotter
  ssh.WriteKnownHostsFile(cfg, constants.SSH_KNOWN_HOSTS_FILE)
499 a4eae71f Michael Hanselmann
  cfg.Update(cfg.GetClusterInfo(), logging.error)
500 d367b66c Manuel Franceschini
  backend.WriteSsconfFiles(cfg.GetSsconfValues())
501 d367b66c Manuel Franceschini
502 d367b66c Manuel Franceschini
  # set up the inter-node password and certificate
503 d367b66c Manuel Franceschini
  _InitGanetiServerSetup(hostname.name)
504 827f753e Guido Trotter
505 952d7515 Michael Hanselmann
  logging.debug("Starting daemons")
506 952d7515 Michael Hanselmann
  result = utils.RunCmd([constants.DAEMON_UTIL, "start-all"])
507 952d7515 Michael Hanselmann
  if result.failed:
508 952d7515 Michael Hanselmann
    raise errors.OpExecError("Could not start daemons, command %s"
509 952d7515 Michael Hanselmann
                             " had exitcode %s and error %s" %
510 952d7515 Michael Hanselmann
                             (result.cmd, result.exit_code, result.output))
511 b3f1cf6f Iustin Pop
512 3b6b6129 Michael Hanselmann
  _WaitForMasterDaemon()
513 b3f1cf6f Iustin Pop
514 b1b6ea87 Iustin Pop
515 02f99608 Oleksiy Mishchenko
def InitConfig(version, cluster_config, master_node_config,
516 02f99608 Oleksiy Mishchenko
               cfg_file=constants.CLUSTER_CONF_FILE):
517 7b3a8fb5 Iustin Pop
  """Create the initial cluster configuration.
518 7b3a8fb5 Iustin Pop

519 7b3a8fb5 Iustin Pop
  It will contain the current node, which will also be the master
520 7b3a8fb5 Iustin Pop
  node, and no instances.
521 7b3a8fb5 Iustin Pop

522 7b3a8fb5 Iustin Pop
  @type version: int
523 c41eea6e Iustin Pop
  @param version: configuration version
524 c41eea6e Iustin Pop
  @type cluster_config: L{objects.Cluster}
525 c41eea6e Iustin Pop
  @param cluster_config: cluster configuration
526 c41eea6e Iustin Pop
  @type master_node_config: L{objects.Node}
527 c41eea6e Iustin Pop
  @param master_node_config: master node configuration
528 c41eea6e Iustin Pop
  @type cfg_file: string
529 c41eea6e Iustin Pop
  @param cfg_file: configuration file path
530 c41eea6e Iustin Pop

531 7b3a8fb5 Iustin Pop
  """
532 88b92fe3 Guido Trotter
  uuid_generator = config.TemporaryReservationManager()
533 88b92fe3 Guido Trotter
  cluster_config.uuid = uuid_generator.Generate([], utils.NewUUID,
534 88b92fe3 Guido Trotter
                                                _INITCONF_ECID)
535 88b92fe3 Guido Trotter
  master_node_config.uuid = uuid_generator.Generate([], utils.NewUUID,
536 88b92fe3 Guido Trotter
                                                    _INITCONF_ECID)
537 7b3a8fb5 Iustin Pop
  nodes = {
538 7b3a8fb5 Iustin Pop
    master_node_config.name: master_node_config,
539 7b3a8fb5 Iustin Pop
    }
540 88b92fe3 Guido Trotter
  default_nodegroup = objects.NodeGroup(
541 88b92fe3 Guido Trotter
    uuid=uuid_generator.Generate([], utils.NewUUID, _INITCONF_ECID),
542 75cf411a Adeodato Simo
    name=constants.INITIAL_NODE_GROUP_NAME,
543 88b92fe3 Guido Trotter
    members=[master_node_config.name],
544 88b92fe3 Guido Trotter
    )
545 88b92fe3 Guido Trotter
  nodegroups = {
546 88b92fe3 Guido Trotter
    default_nodegroup.uuid: default_nodegroup,
547 88b92fe3 Guido Trotter
    }
548 d693c864 Iustin Pop
  now = time.time()
549 7b3a8fb5 Iustin Pop
  config_data = objects.ConfigData(version=version,
550 7b3a8fb5 Iustin Pop
                                   cluster=cluster_config,
551 88b92fe3 Guido Trotter
                                   nodegroups=nodegroups,
552 7b3a8fb5 Iustin Pop
                                   nodes=nodes,
553 7b3a8fb5 Iustin Pop
                                   instances={},
554 d693c864 Iustin Pop
                                   serial_no=1,
555 d693c864 Iustin Pop
                                   ctime=now, mtime=now)
556 a33848a5 Guido Trotter
  utils.WriteFile(cfg_file,
557 a33848a5 Guido Trotter
                  data=serializer.Dump(config_data.ToDict()),
558 a33848a5 Guido Trotter
                  mode=0600)
559 02f99608 Oleksiy Mishchenko
560 02f99608 Oleksiy Mishchenko
561 140aa4a8 Iustin Pop
def FinalizeClusterDestroy(master):
  """Run the closing steps of a cluster destroy.

  Completes the destroy begun in cmdlib.LUDestroyOpcode by issuing, in
  this order, three calls through a bootstrap RPC runner: deactivate
  the master IP, stop the master, and make the node leave the cluster.
  A failure reported by any of the calls is only logged as a warning;
  the following calls are still made.

  @param master: name of the master node, the target of all three calls

  """
  cluster_cfg = config.ConfigWriter()
  modify_ssh_setup = cluster_cfg.GetClusterInfo().modify_ssh_setup
  bootstrap_rpc = rpc.BootstrapRunner()

  # the network parameters from the configuration are sent to the node
  # given by the caller
  net_params = cluster_cfg.GetMasterNetworkParameters()
  net_params.name = master
  use_external_script = cluster_cfg.GetUseExternalMipScript()

  ip_result = bootstrap_rpc.call_node_deactivate_master_ip(net_params.name,
                                                           net_params,
                                                           use_external_script)
  ip_error = ip_result.fail_msg
  if ip_error:
    logging.warning("Could not disable the master IP: %s", ip_error)

  stop_result = bootstrap_rpc.call_node_stop_master(master)
  stop_error = stop_result.fail_msg
  if stop_error:
    logging.warning("Could not disable the master role: %s", stop_error)

  leave_result = bootstrap_rpc.call_node_leave_cluster(master,
                                                       modify_ssh_setup)
  leave_error = leave_result.fail_msg
  if leave_error:
    logging.warning("Could not shutdown the node daemon and cleanup"
                    " the node: %s", leave_error)
592 140aa4a8 Iustin Pop
593 140aa4a8 Iustin Pop
594 87622829 Iustin Pop
def SetupNodeDaemon(cluster_name, node, ssh_key_check):
  """Prepare a new node so that it can be added to the cluster.

  This function must be called before the actual opcode. It copies the
  needed certificate and key files to the remote node over ssh, then
  runs a remote command which stops all daemons and starts the node
  daemon, and finally waits for the node daemon. After that the master
  can do the rest via normal rpc calls.

  @param cluster_name: the cluster name
  @param node: the name of the new node
  @param ssh_key_check: whether to do a strict key check
  @raise errors.OpExecError: if the remote command fails

  """
  primary_family = ssconf.SimpleStore().GetPrimaryIPFamily()
  use_ipv6 = (primary_family == netutils.IP6Address.family)
  sshrunner = ssh.SshRunner(cluster_name, ipv6=use_ipv6)

  # the node daemon is bound to the "any" address of the primary family
  if use_ipv6:
    bind_address = constants.IP6_ADDRESS_ANY
  else:
    bind_address = constants.IP4_ADDRESS_ANY

  # ship the certificates and the HMAC key before restarting anything
  files_to_copy = (
    constants.NODED_CERT_FILE,
    constants.RAPI_CERT_FILE,
    constants.SPICE_CERT_FILE,
    constants.SPICE_CACERT_FILE,
    constants.CONFD_HMAC_KEY,
    )
  for filename in files_to_copy:
    sshrunner.CopyFileToNode(node, filename)

  # only the bind address is interpolated through ShellQuote, the other
  # values come straight from the constants module
  daemon_util = constants.DAEMON_UTIL
  mycommand = ("%s stop-all; %s start %s -b %s" %
               (daemon_util, daemon_util, constants.NODED,
                utils.ShellQuote(bind_address)))

  result = sshrunner.Run(node, "root", mycommand,
                         batch=False,
                         ask_key=ssh_key_check,
                         use_cluster_key=True,
                         strict_host_check=ssh_key_check)
  if result.failed:
    failure = (node, result.fail_reason, result.output)
    raise errors.OpExecError("Remote command on node %s, error: %s,"
                             " output: %s" % failure)

  _WaitForNodeDaemon(node)
637 5627f375 Michael Hanselmann
638 b1b6ea87 Iustin Pop
639 8e2524c3 Guido Trotter
def MasterFailover(no_voting=False):
640 b1b6ea87 Iustin Pop
  """Failover the master node.
641 b1b6ea87 Iustin Pop

642 b1b6ea87 Iustin Pop
  This checks that we are not already the master, and will cause the
643 b1b6ea87 Iustin Pop
  current master to cease being master, and the non-master to become
644 b1b6ea87 Iustin Pop
  new master.
645 b1b6ea87 Iustin Pop

646 8e2524c3 Guido Trotter
  @type no_voting: boolean
647 8e2524c3 Guido Trotter
  @param no_voting: force the operation without remote nodes agreement
648 8e2524c3 Guido Trotter
                      (dangerous)
649 8e2524c3 Guido Trotter

650 b1b6ea87 Iustin Pop
  """
651 8135a2db Iustin Pop
  sstore = ssconf.SimpleStore()
652 b1b6ea87 Iustin Pop
653 8135a2db Iustin Pop
  old_master, new_master = ssconf.GetMasterAndMyself(sstore)
654 8135a2db Iustin Pop
  node_list = sstore.GetNodeList()
655 8135a2db Iustin Pop
  mc_list = sstore.GetMasterCandidates()
656 b1b6ea87 Iustin Pop
657 b1b6ea87 Iustin Pop
  if old_master == new_master:
658 b1b6ea87 Iustin Pop
    raise errors.OpPrereqError("This commands must be run on the node"
659 b1b6ea87 Iustin Pop
                               " where you want the new master to be."
660 b1b6ea87 Iustin Pop
                               " %s is already the master" %
661 debac808 Iustin Pop
                               old_master, errors.ECODE_INVAL)
662 d5927e48 Iustin Pop
663 8135a2db Iustin Pop
  if new_master not in mc_list:
664 8135a2db Iustin Pop
    mc_no_master = [name for name in mc_list if name != old_master]
665 8135a2db Iustin Pop
    raise errors.OpPrereqError("This node is not among the nodes marked"
666 8135a2db Iustin Pop
                               " as master candidates. Only these nodes"
667 8135a2db Iustin Pop
                               " can become masters. Current list of"
668 8135a2db Iustin Pop
                               " master candidates is:\n"
669 debac808 Iustin Pop
                               "%s" % ('\n'.join(mc_no_master)),
670 debac808 Iustin Pop
                               errors.ECODE_STATE)
671 8135a2db Iustin Pop
672 8e2524c3 Guido Trotter
  if not no_voting:
673 8e2524c3 Guido Trotter
    vote_list = GatherMasterVotes(node_list)
674 8e2524c3 Guido Trotter
675 8e2524c3 Guido Trotter
    if vote_list:
676 8e2524c3 Guido Trotter
      voted_master = vote_list[0][0]
677 8e2524c3 Guido Trotter
      if voted_master is None:
678 8e2524c3 Guido Trotter
        raise errors.OpPrereqError("Cluster is inconsistent, most nodes did"
679 debac808 Iustin Pop
                                   " not respond.", errors.ECODE_ENVIRON)
680 8e2524c3 Guido Trotter
      elif voted_master != old_master:
681 8e2524c3 Guido Trotter
        raise errors.OpPrereqError("I have a wrong configuration, I believe"
682 8e2524c3 Guido Trotter
                                   " the master is %s but the other nodes"
683 8e2524c3 Guido Trotter
                                   " voted %s. Please resync the configuration"
684 8e2524c3 Guido Trotter
                                   " of this node." %
685 debac808 Iustin Pop
                                   (old_master, voted_master),
686 debac808 Iustin Pop
                                   errors.ECODE_STATE)
687 b1b6ea87 Iustin Pop
  # end checks
688 b1b6ea87 Iustin Pop
689 b1b6ea87 Iustin Pop
  rcode = 0
690 b1b6ea87 Iustin Pop
691 d5927e48 Iustin Pop
  logging.info("Setting master to %s, old master: %s", new_master, old_master)
692 b1b6ea87 Iustin Pop
693 21004460 Iustin Pop
  try:
694 21004460 Iustin Pop
    # instantiate a real config writer, as we now know we have the
695 21004460 Iustin Pop
    # configuration data
696 eb180fe2 Iustin Pop
    cfg = config.ConfigWriter(accept_foreign=True)
697 21004460 Iustin Pop
698 21004460 Iustin Pop
    cluster_info = cfg.GetClusterInfo()
699 21004460 Iustin Pop
    cluster_info.master_node = new_master
700 21004460 Iustin Pop
    # this will also regenerate the ssconf files, since we updated the
701 21004460 Iustin Pop
    # cluster info
702 21004460 Iustin Pop
    cfg.Update(cluster_info, logging.error)
703 21004460 Iustin Pop
  except errors.ConfigurationError, err:
704 21004460 Iustin Pop
    logging.error("Error while trying to set the new master: %s",
705 21004460 Iustin Pop
                  str(err))
706 21004460 Iustin Pop
    return 1
707 21004460 Iustin Pop
708 21004460 Iustin Pop
  # if cfg.Update worked, then it means the old master daemon won't be
709 21004460 Iustin Pop
  # able now to write its own config file (we rely on locking in both
710 21004460 Iustin Pop
  # backend.UploadFile() and ConfigWriter._Write(); hence the next
711 21004460 Iustin Pop
  # step is to kill the old master
712 21004460 Iustin Pop
713 21004460 Iustin Pop
  logging.info("Stopping the master daemon on node %s", old_master)
714 21004460 Iustin Pop
715 7c74bbe0 Andrea Spadaccini
  runner = rpc.BootstrapRunner()
716 f9d20654 Andrea Spadaccini
  master_params = cfg.GetMasterNetworkParameters()
717 c79198a0 Andrea Spadaccini
  master_params.name = old_master
718 57c7bc57 Andrea Spadaccini
  ems = cfg.GetUseExternalMipScript()
719 c79198a0 Andrea Spadaccini
  result = runner.call_node_deactivate_master_ip(master_params.name,
720 57c7bc57 Andrea Spadaccini
                                                 master_params, ems)
721 c79198a0 Andrea Spadaccini
722 7c74bbe0 Andrea Spadaccini
  msg = result.fail_msg
723 7c74bbe0 Andrea Spadaccini
  if msg:
724 7c74bbe0 Andrea Spadaccini
    logging.warning("Could not disable the master IP: %s", msg)
725 7c74bbe0 Andrea Spadaccini
726 7c74bbe0 Andrea Spadaccini
  result = runner.call_node_stop_master(old_master)
727 3cebe102 Michael Hanselmann
  msg = result.fail_msg
728 6c00d19a Iustin Pop
  if msg:
729 d5927e48 Iustin Pop
    logging.error("Could not disable the master role on the old master"
730 6c00d19a Iustin Pop
                 " %s, please disable manually: %s", old_master, msg)
731 b1b6ea87 Iustin Pop
732 21004460 Iustin Pop
  logging.info("Checking master IP non-reachability...")
733 21004460 Iustin Pop
734 425f0f54 Iustin Pop
  master_ip = sstore.GetMasterIP()
735 425f0f54 Iustin Pop
  total_timeout = 30
736 e687ec01 Michael Hanselmann
737 d23ef431 Michael Hanselmann
  # Here we have a phase where no master should be running
738 425f0f54 Iustin Pop
  def _check_ip():
739 a744b676 Manuel Franceschini
    if netutils.TcpPing(master_ip, constants.DEFAULT_NODED_PORT):
740 425f0f54 Iustin Pop
      raise utils.RetryAgain()
741 425f0f54 Iustin Pop
742 425f0f54 Iustin Pop
  try:
743 425f0f54 Iustin Pop
    utils.Retry(_check_ip, (1, 1.5, 5), total_timeout)
744 425f0f54 Iustin Pop
  except utils.RetryTimeout:
745 425f0f54 Iustin Pop
    logging.warning("The master IP is still reachable after %s seconds,"
746 425f0f54 Iustin Pop
                    " continuing but activating the master on the current"
747 425f0f54 Iustin Pop
                    " node will probably fail", total_timeout)
748 b1b6ea87 Iustin Pop
749 ff699aa9 Michael Hanselmann
  if jstore.CheckDrainFlag():
750 ff699aa9 Michael Hanselmann
    logging.info("Undraining job queue")
751 ff699aa9 Michael Hanselmann
    jstore.SetDrainFlag(False)
752 ff699aa9 Michael Hanselmann
753 21004460 Iustin Pop
  logging.info("Starting the master daemons on the new master")
754 d5927e48 Iustin Pop
755 db04ce5d Michael Hanselmann
  result = rpc.BootstrapRunner().call_node_start_master_daemons(new_master,
756 db04ce5d Michael Hanselmann
                                                                no_voting)
757 3cebe102 Michael Hanselmann
  msg = result.fail_msg
758 b726aff0 Iustin Pop
  if msg:
759 d5927e48 Iustin Pop
    logging.error("Could not start the master role on the new master"
760 b726aff0 Iustin Pop
                  " %s, please check: %s", new_master, msg)
761 b1b6ea87 Iustin Pop
    rcode = 1
762 b1b6ea87 Iustin Pop
763 21004460 Iustin Pop
  logging.info("Master failed over from %s to %s", old_master, new_master)
764 b1b6ea87 Iustin Pop
  return rcode
765 d7cdb55d Iustin Pop
766 d7cdb55d Iustin Pop
767 8eb148ae Iustin Pop
def GetMaster():
  """Return the name of the current master node.

  The value is read through ssconf. The function lives in bootstrap
  because gnt-cluster needs it, and it is better to abstract the lookup
  here, where ssconf is used by other functions too, than to have
  gnt-cluster import ssconf directly.

  """
  # the second element ("myself") is of no interest here
  (master_name, _) = ssconf.GetMasterAndMyself(ssconf.SimpleStore())
  return master_name
781 8eb148ae Iustin Pop
782 8eb148ae Iustin Pop
783 d7cdb55d Iustin Pop
def GatherMasterVotes(node_list):
  """Check the agreement on who is the master.

  This function will return a list of (node, number of votes), ordered
  by the number of votes, highest first. Nodes which could not be
  contacted or which returned invalid data are counted under the key
  C{None}.

  Note that the sum of votes is the number of nodes this machine
  knows, whereas the number of entries in the list could be different
  (if some nodes vote for another master).

  We remove ourselves from the list since we know that (bugs aside)
  since we use the same source for configuration information for both
  backend and bootstrap, we'll always vote for ourselves.

  @type node_list: list
  @param node_list: the list of nodes to query for master info; the current
      node will be removed if it is in the list (the list passed by the
      caller is modified in place)
  @rtype: list
  @return: list of (node, votes); empty if no node is left to query after
      removing the current one; on equal vote counts the C{None} entry
      comes after the named nodes

  """
  myself = netutils.Hostname.GetSysName()
  try:
    node_list.remove(myself)
  except ValueError:
    # we were not in the list to begin with
    pass
  if not node_list:
    # no nodes left (possibly after removing myself)
    return []

  results = rpc.BootstrapRunner().call_master_info(node_list)
  if not isinstance(results, dict):
    # this should not happen (unless internal error in rpc)
    logging.critical("Can't complete rpc call, aborting master startup")
    return [(None, len(node_list))]

  votes = {}
  for (node, nres) in results.items():
    data = nres.payload
    msg = nres.fail_msg
    if msg:
      logging.warning("Error contacting node %s: %s", node, msg)
      choice = None
    # for now we accept both length 3, 4 and 5 (data[3] is primary ip version
    # and data[4] is the master netmask)
    elif not isinstance(data, (tuple, list)) or len(data) < 3:
      logging.warning("Invalid data received from node %s: %s", node, data)
      choice = None
    else:
      choice = data[2]
    votes[choice] = votes.get(choice, 0) + 1

  # sort first on number of votes then on name, since we want None
  # sorted later if we have the half of the nodes not responding, and
  # half voting all for the same master; the middle key element states
  # "None goes last" explicitly, so None is never compared with a name
  return sorted(votes.items(),
                key=lambda item: (item[1], item[0] is not None, item[0]),
                reverse=True)