Statistics
| Branch: | Tag: | Revision:

root / lib / bootstrap.py @ 11e90588

History | View | Annotate | Download (36.6 kB)

1 a0c9f010 Michael Hanselmann
#
2 a0c9f010 Michael Hanselmann
#
3 a0c9f010 Michael Hanselmann
4 57dc299a Iustin Pop
# Copyright (C) 2006, 2007, 2008, 2010, 2011, 2012 Google Inc.
5 a0c9f010 Michael Hanselmann
#
6 a0c9f010 Michael Hanselmann
# This program is free software; you can redistribute it and/or modify
7 a0c9f010 Michael Hanselmann
# it under the terms of the GNU General Public License as published by
8 a0c9f010 Michael Hanselmann
# the Free Software Foundation; either version 2 of the License, or
9 a0c9f010 Michael Hanselmann
# (at your option) any later version.
10 a0c9f010 Michael Hanselmann
#
11 a0c9f010 Michael Hanselmann
# This program is distributed in the hope that it will be useful, but
12 a0c9f010 Michael Hanselmann
# WITHOUT ANY WARRANTY; without even the implied warranty of
13 a0c9f010 Michael Hanselmann
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
14 a0c9f010 Michael Hanselmann
# General Public License for more details.
15 a0c9f010 Michael Hanselmann
#
16 a0c9f010 Michael Hanselmann
# You should have received a copy of the GNU General Public License
17 a0c9f010 Michael Hanselmann
# along with this program; if not, write to the Free Software
18 a0c9f010 Michael Hanselmann
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
19 a0c9f010 Michael Hanselmann
# 02110-1301, USA.
20 a0c9f010 Michael Hanselmann
21 a0c9f010 Michael Hanselmann
22 a0c9f010 Michael Hanselmann
"""Functions to bootstrap a new cluster.
23 a0c9f010 Michael Hanselmann

24 a0c9f010 Michael Hanselmann
"""
25 a0c9f010 Michael Hanselmann
26 a0c9f010 Michael Hanselmann
import os
27 a0c9f010 Michael Hanselmann
import os.path
28 a0c9f010 Michael Hanselmann
import re
29 b1b6ea87 Iustin Pop
import logging
30 d693c864 Iustin Pop
import time
31 a698cdbb Michael Hanselmann
import tempfile
32 a0c9f010 Michael Hanselmann
33 a0c9f010 Michael Hanselmann
from ganeti import rpc
34 a0c9f010 Michael Hanselmann
from ganeti import ssh
35 a0c9f010 Michael Hanselmann
from ganeti import utils
36 a0c9f010 Michael Hanselmann
from ganeti import errors
37 a0c9f010 Michael Hanselmann
from ganeti import config
38 a0c9f010 Michael Hanselmann
from ganeti import constants
39 b9eeeb02 Michael Hanselmann
from ganeti import objects
40 a0c9f010 Michael Hanselmann
from ganeti import ssconf
41 a33848a5 Guido Trotter
from ganeti import serializer
42 a5728081 Guido Trotter
from ganeti import hypervisor
43 a721e23a Luca Bigliardi
from ganeti import bdev
44 a744b676 Manuel Franceschini
from ganeti import netutils
45 3b6b6129 Michael Hanselmann
from ganeti import luxi
46 ff699aa9 Michael Hanselmann
from ganeti import jstore
47 7ede9c6a Michael Hanselmann
from ganeti import pathutils
48 3b6b6129 Michael Hanselmann
49 a0c9f010 Michael Hanselmann
50 88b92fe3 Guido Trotter
#: Execution context ID used with InitConfig's temporary reservation manager
_INITCONF_ECID = "initconfig-ecid"

#: Number of seconds within which a freshly started daemon must respond
_DAEMON_READY_TIMEOUT = 10.0
55 3b6b6129 Michael Hanselmann
56 e38220e4 Michael Hanselmann
57 531baf8e Iustin Pop
def _InitSSHSetup():
  """Setup the SSH configuration for the cluster.

  Existing private/public key files of the SSH login user are backed up
  and removed, a new DSA keypair with an empty passphrase is generated
  using C{ssh-keygen}, and the new public key is added to the user's
  authorized keys file.

  @raise errors.OpExecError: if C{ssh-keygen} fails

  """
  (priv_key, pub_key, auth_keys) = \
    ssh.GetUserFiles(constants.SSH_LOGIN_USER)

  # Get the old keypair out of the way, keeping a backup of what existed
  for key_file in (priv_key, pub_key):
    if os.path.exists(key_file):
      utils.CreateBackup(key_file)
    utils.RemoveFile(key_file)

  keygen_cmd = ["ssh-keygen", "-t", "dsa", "-f", priv_key, "-q", "-N", ""]
  keygen = utils.RunCmd(keygen_cmd)
  if keygen.failed:
    raise errors.OpExecError("Could not generate ssh keypair, error %s" %
                             keygen.output)

  new_pub_key = utils.ReadFile(pub_key)
  utils.AddAuthorizedKey(auth_keys, new_pub_key)
79 a0c9f010 Michael Hanselmann
80 a0c9f010 Michael Hanselmann
81 c008906b Michael Hanselmann
def GenerateHmacKey(file_name):
82 c008906b Michael Hanselmann
  """Writes a new HMAC key.
83 c008906b Michael Hanselmann

84 c008906b Michael Hanselmann
  @type file_name: str
85 c008906b Michael Hanselmann
  @param file_name: Path to output file
86 c008906b Michael Hanselmann

87 c008906b Michael Hanselmann
  """
88 43575108 Michael Hanselmann
  utils.WriteFile(file_name, data="%s\n" % utils.GenerateSecret(), mode=0400,
89 43575108 Michael Hanselmann
                  backup=True)
90 43575108 Michael Hanselmann
91 43575108 Michael Hanselmann
92 b6267745 Andrea Spadaccini
def GenerateClusterCrypto(new_cluster_cert, new_rapi_cert, new_spice_cert,
93 b6267745 Andrea Spadaccini
                          new_confd_hmac_key, new_cds,
94 b6267745 Andrea Spadaccini
                          rapi_cert_pem=None, spice_cert_pem=None,
95 b6267745 Andrea Spadaccini
                          spice_cacert_pem=None, cds=None,
96 7ede9c6a Michael Hanselmann
                          nodecert_file=pathutils.NODED_CERT_FILE,
97 7ede9c6a Michael Hanselmann
                          rapicert_file=pathutils.RAPI_CERT_FILE,
98 7ede9c6a Michael Hanselmann
                          spicecert_file=pathutils.SPICE_CERT_FILE,
99 7ede9c6a Michael Hanselmann
                          spicecacert_file=pathutils.SPICE_CACERT_FILE,
100 7ede9c6a Michael Hanselmann
                          hmackey_file=pathutils.CONFD_HMAC_KEY,
101 7ede9c6a Michael Hanselmann
                          cds_file=pathutils.CLUSTER_DOMAIN_SECRET_FILE):
102 43575108 Michael Hanselmann
  """Updates the cluster certificates, keys and secrets.
103 43575108 Michael Hanselmann

104 43575108 Michael Hanselmann
  @type new_cluster_cert: bool
105 43575108 Michael Hanselmann
  @param new_cluster_cert: Whether to generate a new cluster certificate
106 43575108 Michael Hanselmann
  @type new_rapi_cert: bool
107 43575108 Michael Hanselmann
  @param new_rapi_cert: Whether to generate a new RAPI certificate
108 b6267745 Andrea Spadaccini
  @type new_spice_cert: bool
109 b6267745 Andrea Spadaccini
  @param new_spice_cert: Whether to generate a new SPICE certificate
110 6b7d5878 Michael Hanselmann
  @type new_confd_hmac_key: bool
111 6b7d5878 Michael Hanselmann
  @param new_confd_hmac_key: Whether to generate a new HMAC key
112 3db3eb2a Michael Hanselmann
  @type new_cds: bool
113 3db3eb2a Michael Hanselmann
  @param new_cds: Whether to generate a new cluster domain secret
114 43575108 Michael Hanselmann
  @type rapi_cert_pem: string
115 43575108 Michael Hanselmann
  @param rapi_cert_pem: New RAPI certificate in PEM format
116 b6267745 Andrea Spadaccini
  @type spice_cert_pem: string
117 b6267745 Andrea Spadaccini
  @param spice_cert_pem: New SPICE certificate in PEM format
118 b6267745 Andrea Spadaccini
  @type spice_cacert_pem: string
119 b6267745 Andrea Spadaccini
  @param spice_cacert_pem: Certificate of the CA that signed the SPICE
120 b6267745 Andrea Spadaccini
                           certificate, in PEM format
121 3db3eb2a Michael Hanselmann
  @type cds: string
122 3db3eb2a Michael Hanselmann
  @param cds: New cluster domain secret
123 aeefe835 Iustin Pop
  @type nodecert_file: string
124 aeefe835 Iustin Pop
  @param nodecert_file: optional override of the node cert file path
125 aeefe835 Iustin Pop
  @type rapicert_file: string
126 aeefe835 Iustin Pop
  @param rapicert_file: optional override of the rapi cert file path
127 b6267745 Andrea Spadaccini
  @type spicecert_file: string
128 b6267745 Andrea Spadaccini
  @param spicecert_file: optional override of the spice cert file path
129 b6267745 Andrea Spadaccini
  @type spicecacert_file: string
130 b6267745 Andrea Spadaccini
  @param spicecacert_file: optional override of the spice CA cert file path
131 aeefe835 Iustin Pop
  @type hmackey_file: string
132 aeefe835 Iustin Pop
  @param hmackey_file: optional override of the hmac key file path
133 43575108 Michael Hanselmann

134 43575108 Michael Hanselmann
  """
135 168c1de2 Michael Hanselmann
  # noded SSL certificate
136 aeefe835 Iustin Pop
  cluster_cert_exists = os.path.exists(nodecert_file)
137 43575108 Michael Hanselmann
  if new_cluster_cert or not cluster_cert_exists:
138 43575108 Michael Hanselmann
    if cluster_cert_exists:
139 aeefe835 Iustin Pop
      utils.CreateBackup(nodecert_file)
140 43575108 Michael Hanselmann
141 aeefe835 Iustin Pop
    logging.debug("Generating new cluster certificate at %s", nodecert_file)
142 af2ae1c0 Iustin Pop
    utils.GenerateSelfSignedSslCert(nodecert_file)
143 43575108 Michael Hanselmann
144 6b7d5878 Michael Hanselmann
  # confd HMAC key
145 aeefe835 Iustin Pop
  if new_confd_hmac_key or not os.path.exists(hmackey_file):
146 aeefe835 Iustin Pop
    logging.debug("Writing new confd HMAC key to %s", hmackey_file)
147 aeefe835 Iustin Pop
    GenerateHmacKey(hmackey_file)
148 43575108 Michael Hanselmann
149 43575108 Michael Hanselmann
  # RAPI
150 aeefe835 Iustin Pop
  rapi_cert_exists = os.path.exists(rapicert_file)
151 43575108 Michael Hanselmann
152 43575108 Michael Hanselmann
  if rapi_cert_pem:
153 43575108 Michael Hanselmann
    # Assume rapi_pem contains a valid PEM-formatted certificate and key
154 aeefe835 Iustin Pop
    logging.debug("Writing RAPI certificate at %s", rapicert_file)
155 aeefe835 Iustin Pop
    utils.WriteFile(rapicert_file, data=rapi_cert_pem, backup=True)
156 43575108 Michael Hanselmann
157 43575108 Michael Hanselmann
  elif new_rapi_cert or not rapi_cert_exists:
158 43575108 Michael Hanselmann
    if rapi_cert_exists:
159 aeefe835 Iustin Pop
      utils.CreateBackup(rapicert_file)
160 43575108 Michael Hanselmann
161 aeefe835 Iustin Pop
    logging.debug("Generating new RAPI certificate at %s", rapicert_file)
162 af2ae1c0 Iustin Pop
    utils.GenerateSelfSignedSslCert(rapicert_file)
163 c008906b Michael Hanselmann
164 b6267745 Andrea Spadaccini
  # SPICE
165 b6267745 Andrea Spadaccini
  spice_cert_exists = os.path.exists(spicecert_file)
166 b6267745 Andrea Spadaccini
  spice_cacert_exists = os.path.exists(spicecacert_file)
167 b6267745 Andrea Spadaccini
  if spice_cert_pem:
168 b6267745 Andrea Spadaccini
    # spice_cert_pem implies also spice_cacert_pem
169 b6267745 Andrea Spadaccini
    logging.debug("Writing SPICE certificate at %s", spicecert_file)
170 b6267745 Andrea Spadaccini
    utils.WriteFile(spicecert_file, data=spice_cert_pem, backup=True)
171 b6267745 Andrea Spadaccini
    logging.debug("Writing SPICE CA certificate at %s", spicecacert_file)
172 b6267745 Andrea Spadaccini
    utils.WriteFile(spicecacert_file, data=spice_cacert_pem, backup=True)
173 b6267745 Andrea Spadaccini
  elif new_spice_cert or not spice_cert_exists:
174 b6267745 Andrea Spadaccini
    if spice_cert_exists:
175 b6267745 Andrea Spadaccini
      utils.CreateBackup(spicecert_file)
176 b6267745 Andrea Spadaccini
    if spice_cacert_exists:
177 b6267745 Andrea Spadaccini
      utils.CreateBackup(spicecacert_file)
178 b6267745 Andrea Spadaccini
179 b6267745 Andrea Spadaccini
    logging.debug("Generating new self-signed SPICE certificate at %s",
180 b6267745 Andrea Spadaccini
                  spicecert_file)
181 b6267745 Andrea Spadaccini
    (_, cert_pem) = utils.GenerateSelfSignedSslCert(spicecert_file)
182 b6267745 Andrea Spadaccini
183 b6267745 Andrea Spadaccini
    # Self-signed certificate -> the public certificate is also the CA public
184 b6267745 Andrea Spadaccini
    # certificate
185 b6267745 Andrea Spadaccini
    logging.debug("Writing the public certificate to %s",
186 b6267745 Andrea Spadaccini
                  spicecert_file)
187 b6267745 Andrea Spadaccini
    utils.io.WriteFile(spicecacert_file, mode=0400, data=cert_pem)
188 b6267745 Andrea Spadaccini
189 3db3eb2a Michael Hanselmann
  # Cluster domain secret
190 3db3eb2a Michael Hanselmann
  if cds:
191 fc0726b9 Michael Hanselmann
    logging.debug("Writing cluster domain secret to %s", cds_file)
192 fc0726b9 Michael Hanselmann
    utils.WriteFile(cds_file, data=cds, backup=True)
193 fc0726b9 Michael Hanselmann
194 fc0726b9 Michael Hanselmann
  elif new_cds or not os.path.exists(cds_file):
195 fc0726b9 Michael Hanselmann
    logging.debug("Generating new cluster domain secret at %s", cds_file)
196 fc0726b9 Michael Hanselmann
    GenerateHmacKey(cds_file)
197 3db3eb2a Michael Hanselmann
198 c008906b Michael Hanselmann
199 8f215968 Michael Hanselmann
def _InitGanetiServerSetup(master_name):
  """Setup the necessary configuration for the initial node daemon.

  This generates the cluster secrets (forcing a new cluster certificate),
  starts the node daemon and waits until it answers on the master node.

  @type master_name: str
  @param master_name: Name of the master node
  @raise errors.OpExecError: if the node daemon could not be started

  """
  # Only the cluster certificate is forcibly regenerated; the other flags
  # are passed as False
  GenerateClusterCrypto(new_cluster_cert=True, new_rapi_cert=False,
                        new_spice_cert=False, new_confd_hmac_key=False,
                        new_cds=False)

  started = utils.RunCmd([pathutils.DAEMON_UTIL, "start", constants.NODED])
  if started.failed:
    raise errors.OpExecError("Could not start the node daemon, command %s"
                             " had exitcode %s and error %s" %
                             (started.cmd, started.exit_code, started.output))

  _WaitForNodeDaemon(master_name)
219 5627f375 Michael Hanselmann
220 5627f375 Michael Hanselmann
221 5627f375 Michael Hanselmann
def _WaitForNodeDaemon(node_name):
  """Wait for node daemon to become responsive.

  The version RPC of the node daemon is retried through L{utils.Retry}
  until it returns without a failure message.

  @param node_name: Name of the node whose daemon is queried
  @raise errors.OpExecError: if no successful answer was received within
      L{_DAEMON_READY_TIMEOUT} seconds

  """
  def _ProbeNodeDaemon():
    # Pylint bug <http://www.logilab.org/ticket/35642>
    # pylint: disable=E1101
    answers = rpc.BootstrapRunner().call_version([node_name])
    if answers[node_name].fail_msg:
      raise utils.RetryAgain()

  try:
    utils.Retry(_ProbeNodeDaemon, 1.0, _DAEMON_READY_TIMEOUT)
  except utils.RetryTimeout:
    message = ("Node daemon on %s didn't answer queries within"
               " %s seconds" % (node_name, _DAEMON_READY_TIMEOUT))
    raise errors.OpExecError(message)
237 3b6b6129 Michael Hanselmann
238 3b6b6129 Michael Hanselmann
239 3b6b6129 Michael Hanselmann
def _WaitForMasterDaemon():
  """Wait for master daemon to become responsive.

  The cluster name is queried through a LUXI client; any exception raised
  while doing so leads to another attempt via L{utils.Retry}.

  @raise errors.OpExecError: if no answer was received within
      L{_DAEMON_READY_TIMEOUT} seconds

  """
  def _ProbeMasterDaemon():
    try:
      client = luxi.Client()
      (cluster_name, ) = client.QueryConfigValues(["cluster_name"])
    except Exception:
      # Any failure is treated as "daemon not ready yet"
      raise utils.RetryAgain()
    else:
      logging.debug("Received cluster name %s from master", cluster_name)

  try:
    utils.Retry(_ProbeMasterDaemon, 1.0, _DAEMON_READY_TIMEOUT)
  except utils.RetryTimeout:
    message = ("Master daemon didn't answer queries within"
               " %s seconds" % _DAEMON_READY_TIMEOUT)
    raise errors.OpExecError(message)
257 5627f375 Michael Hanselmann
258 a0c9f010 Michael Hanselmann
259 a5da38fa Michael Hanselmann
def _WaitForSshDaemon(hostname, port, family):
  """Wait for SSH daemon to become responsive.

  The host name is resolved once for the given address family; the
  resulting IP address and port are then checked with
  L{netutils.TcpPing} through L{utils.Retry}.

  @param hostname: Name of the host running the SSH daemon
  @param port: TCP port to check
  @param family: Address family passed to L{netutils.GetHostname}
  @raise errors.OpExecError: if the daemon didn't become responsive within
      L{_DAEMON_READY_TIMEOUT} seconds

  """
  hostip = netutils.GetHostname(name=hostname, family=family).ip

  def _ProbeSshDaemon():
    reachable = netutils.TcpPing(hostip, port, timeout=1.0,
                                 live_port_needed=True)
    if not reachable:
      raise utils.RetryAgain()

    logging.debug("SSH daemon on %s:%s (IP address %s) has become"
                  " responsive", hostname, port, hostip)

  try:
    utils.Retry(_ProbeSshDaemon, 1.0, _DAEMON_READY_TIMEOUT)
  except utils.RetryTimeout:
    raise errors.OpExecError("SSH daemon on %s:%s (IP address %s) didn't"
                             " become responsive within %s seconds" %
                             (hostname, port, hostip, _DAEMON_READY_TIMEOUT))
278 a5da38fa Michael Hanselmann
279 a5da38fa Michael Hanselmann
280 a698cdbb Michael Hanselmann
def RunNodeSetupCmd(cluster_name, node, basecmd, debug, verbose,
                    use_cluster_key, ask_key, strict_host_check, data):
  """Runs a command to configure something on a remote machine.

  The command is run over SSH as the SSH login user, with C{data}
  serialized to JSON and supplied on its standard input. After a
  successful run this function waits for the SSH daemon on the node to
  respond.

  @type cluster_name: string
  @param cluster_name: Cluster name
  @type node: string
  @param node: Node name
  @type basecmd: string
  @param basecmd: Base command (path on the remote machine)
  @type debug: bool
  @param debug: Enable debug output
  @type verbose: bool
  @param verbose: Enable verbose output
  @type use_cluster_key: bool
  @param use_cluster_key: See L{ssh.SshRunner.BuildCmd}
  @type ask_key: bool
  @param ask_key: See L{ssh.SshRunner.BuildCmd}
  @type strict_host_check: bool
  @param strict_host_check: See L{ssh.SshRunner.BuildCmd}
  @param data: JSON-serializable input data for script (passed to stdin)
  @raise errors.OpExecError: if the remote command fails

  """
  # Pass --debug/--verbose to the external script if set on our invocation
  optional_flags = [(debug, "--debug"), (verbose, "--verbose")]
  remote_cmd = [basecmd]
  remote_cmd.extend([flag for (enabled, flag) in optional_flags if enabled])

  family = ssconf.SimpleStore().GetPrimaryIPFamily()
  use_ipv6 = (family == netutils.IP6Address.family)
  runner = ssh.SshRunner(cluster_name, ipv6=use_ipv6)
  ssh_cmd = runner.BuildCmd(node, constants.SSH_LOGIN_USER,
                            utils.ShellQuoteArgs(remote_cmd),
                            batch=False, ask_key=ask_key, quiet=False,
                            strict_host_check=strict_host_check,
                            use_cluster_key=use_cluster_key)

  # The input data is handed to the command through a temporary file
  stdin_file = tempfile.TemporaryFile()
  try:
    stdin_file.write(serializer.DumpJson(data))
    stdin_file.seek(0)

    outcome = utils.RunCmd(ssh_cmd, interactive=True, input_fd=stdin_file)
  finally:
    stdin_file.close()

  if outcome.failed:
    raise errors.OpExecError("Command '%s' failed: %s" %
                             (outcome.cmd, outcome.fail_reason))

  ssh_port = netutils.GetDaemonPort(constants.SSH)
  _WaitForSshDaemon(node, ssh_port, family)
335 a5da38fa Michael Hanselmann
336 a698cdbb Michael Hanselmann
337 0e3baaf3 Iustin Pop
def _InitFileStorage(file_storage_dir):
338 0e3baaf3 Iustin Pop
  """Initialize if needed the file storage.
339 0e3baaf3 Iustin Pop

340 0e3baaf3 Iustin Pop
  @param file_storage_dir: the user-supplied value
341 0e3baaf3 Iustin Pop
  @return: either empty string (if file storage was disabled at build
342 0e3baaf3 Iustin Pop
      time) or the normalized path to the storage directory
343 0e3baaf3 Iustin Pop

344 0e3baaf3 Iustin Pop
  """
345 0e3baaf3 Iustin Pop
  file_storage_dir = os.path.normpath(file_storage_dir)
346 0e3baaf3 Iustin Pop
347 0e3baaf3 Iustin Pop
  if not os.path.isabs(file_storage_dir):
348 0376655e Guido Trotter
    raise errors.OpPrereqError("File storage directory '%s' is not an absolute"
349 0376655e Guido Trotter
                               " path" % file_storage_dir, errors.ECODE_INVAL)
350 0e3baaf3 Iustin Pop
351 0e3baaf3 Iustin Pop
  if not os.path.exists(file_storage_dir):
352 0e3baaf3 Iustin Pop
    try:
353 0e3baaf3 Iustin Pop
      os.makedirs(file_storage_dir, 0750)
354 0e3baaf3 Iustin Pop
    except OSError, err:
355 0e3baaf3 Iustin Pop
      raise errors.OpPrereqError("Cannot create file storage directory"
356 0e3baaf3 Iustin Pop
                                 " '%s': %s" % (file_storage_dir, err),
357 0e3baaf3 Iustin Pop
                                 errors.ECODE_ENVIRON)
358 0e3baaf3 Iustin Pop
359 0e3baaf3 Iustin Pop
  if not os.path.isdir(file_storage_dir):
360 0e3baaf3 Iustin Pop
    raise errors.OpPrereqError("The file storage directory '%s' is not"
361 0e3baaf3 Iustin Pop
                               " a directory." % file_storage_dir,
362 0e3baaf3 Iustin Pop
                               errors.ECODE_ENVIRON)
363 0e3baaf3 Iustin Pop
  return file_storage_dir
364 0e3baaf3 Iustin Pop
365 0e3baaf3 Iustin Pop
366 18bb6d28 Agata Murawska
def InitCluster(cluster_name, mac_prefix, # pylint: disable=R0913, R0914
367 5a8648eb Andrea Spadaccini
                master_netmask, master_netdev, file_storage_dir,
368 5a8648eb Andrea Spadaccini
                shared_file_storage_dir, candidate_pool_size, secondary_ip=None,
369 5a8648eb Andrea Spadaccini
                vg_name=None, beparams=None, nicparams=None, ndparams=None,
370 bc5d0215 Andrea Spadaccini
                hvparams=None, diskparams=None, enabled_hypervisors=None,
371 bc5d0215 Andrea Spadaccini
                modify_etc_hosts=True, modify_ssh_setup=True,
372 bc5d0215 Andrea Spadaccini
                maintain_node_health=False, drbd_helper=None, uid_pool=None,
373 18bb6d28 Agata Murawska
                default_iallocator=None, primary_ip_version=None, ipolicy=None,
374 c4929a8b René Nussbaumer
                prealloc_wipe_disks=False, use_external_mip_script=False,
375 3bde79ee Helga Velroyen
                hv_state=None, disk_state=None, enabled_disk_templates=None):
376 a0c9f010 Michael Hanselmann
  """Initialise the cluster.
377 a0c9f010 Michael Hanselmann

378 ce735215 Guido Trotter
  @type candidate_pool_size: int
379 ce735215 Guido Trotter
  @param candidate_pool_size: master candidate pool size
380 3bde79ee Helga Velroyen
  @type enabled_disk_templates: list of string
381 3bde79ee Helga Velroyen
  @param enabled_disk_templates: list of disk_templates to be used in this
382 c074a9e8 Helga Velroyen
    cluster
383 ce735215 Guido Trotter

384 a0c9f010 Michael Hanselmann
  """
385 ce735215 Guido Trotter
  # TODO: complete the docstring
386 a0c9f010 Michael Hanselmann
  if config.ConfigWriter.IsCluster():
387 debac808 Iustin Pop
    raise errors.OpPrereqError("Cluster is already initialised",
388 debac808 Iustin Pop
                               errors.ECODE_STATE)
389 a0c9f010 Michael Hanselmann
390 b119bccb Guido Trotter
  if not enabled_hypervisors:
391 b119bccb Guido Trotter
    raise errors.OpPrereqError("Enabled hypervisors list must contain at"
392 debac808 Iustin Pop
                               " least one member", errors.ECODE_INVAL)
393 b119bccb Guido Trotter
  invalid_hvs = set(enabled_hypervisors) - constants.HYPER_TYPES
394 b119bccb Guido Trotter
  if invalid_hvs:
395 b119bccb Guido Trotter
    raise errors.OpPrereqError("Enabled hypervisors contains invalid"
396 debac808 Iustin Pop
                               " entries: %s" % invalid_hvs,
397 debac808 Iustin Pop
                               errors.ECODE_INVAL)
398 b119bccb Guido Trotter
399 3bde79ee Helga Velroyen
  if not enabled_disk_templates:
400 3bde79ee Helga Velroyen
    raise errors.OpPrereqError("Enabled disk templates list must contain at"
401 c074a9e8 Helga Velroyen
                               " least one member", errors.ECODE_INVAL)
402 3bde79ee Helga Velroyen
  invalid_disk_templates = \
403 3bde79ee Helga Velroyen
    set(enabled_disk_templates) - constants.DISK_TEMPLATES
404 3bde79ee Helga Velroyen
  if invalid_disk_templates:
405 3bde79ee Helga Velroyen
    raise errors.OpPrereqError("Enabled disk templates list contains invalid"
406 3bde79ee Helga Velroyen
                               " entries: %s" % invalid_disk_templates,
407 c074a9e8 Helga Velroyen
                               errors.ECODE_INVAL)
408 c074a9e8 Helga Velroyen
409 5a8648eb Andrea Spadaccini
  try:
410 5a8648eb Andrea Spadaccini
    ipcls = netutils.IPAddress.GetClassFromIpVersion(primary_ip_version)
411 5a8648eb Andrea Spadaccini
  except errors.ProgrammerError:
412 2f20d07b Manuel Franceschini
    raise errors.OpPrereqError("Invalid primary ip version: %d." %
413 2cfbc784 Iustin Pop
                               primary_ip_version, errors.ECODE_INVAL)
414 2f20d07b Manuel Franceschini
415 2f20d07b Manuel Franceschini
  hostname = netutils.GetHostname(family=ipcls.family)
416 2f20d07b Manuel Franceschini
  if not ipcls.IsValid(hostname.ip):
417 2f20d07b Manuel Franceschini
    raise errors.OpPrereqError("This host's IP (%s) is not a valid IPv%d"
418 2cfbc784 Iustin Pop
                               " address." % (hostname.ip, primary_ip_version),
419 2cfbc784 Iustin Pop
                               errors.ECODE_INVAL)
420 2f20d07b Manuel Franceschini
421 2f20d07b Manuel Franceschini
  if ipcls.IsLoopback(hostname.ip):
422 8b312c1d Manuel Franceschini
    raise errors.OpPrereqError("This host's IP (%s) resolves to a loopback"
423 8b312c1d Manuel Franceschini
                               " address. Please fix DNS or %s." %
424 ee045466 Michael Hanselmann
                               (hostname.ip, pathutils.ETC_HOSTS),
425 debac808 Iustin Pop
                               errors.ECODE_ENVIRON)
426 a0c9f010 Michael Hanselmann
427 2f20d07b Manuel Franceschini
  if not ipcls.Own(hostname.ip):
428 a0c9f010 Michael Hanselmann
    raise errors.OpPrereqError("Inconsistency: this host's name resolves"
429 a0c9f010 Michael Hanselmann
                               " to %s,\nbut this ip address does not"
430 7c4c22f5 Manuel Franceschini
                               " belong to this host" %
431 debac808 Iustin Pop
                               hostname.ip, errors.ECODE_ENVIRON)
432 a0c9f010 Michael Hanselmann
433 2f20d07b Manuel Franceschini
  clustername = netutils.GetHostname(name=cluster_name, family=ipcls.family)
434 a0c9f010 Michael Hanselmann
435 2f20d07b Manuel Franceschini
  if netutils.TcpPing(clustername.ip, constants.DEFAULT_NODED_PORT, timeout=5):
436 7c4c22f5 Manuel Franceschini
    raise errors.OpPrereqError("Cluster IP already active",
437 debac808 Iustin Pop
                               errors.ECODE_NOTUNIQUE)
438 a0c9f010 Michael Hanselmann
439 2f20d07b Manuel Franceschini
  if not secondary_ip:
440 2f20d07b Manuel Franceschini
    if primary_ip_version == constants.IP6_VERSION:
441 2f20d07b Manuel Franceschini
      raise errors.OpPrereqError("When using a IPv6 primary address, a valid"
442 7c4c22f5 Manuel Franceschini
                                 " IPv4 address must be given as secondary",
443 7c4c22f5 Manuel Franceschini
                                 errors.ECODE_INVAL)
444 b9eeeb02 Michael Hanselmann
    secondary_ip = hostname.ip
445 a0c9f010 Michael Hanselmann
446 2f20d07b Manuel Franceschini
  if not netutils.IP4Address.IsValid(secondary_ip):
447 2f20d07b Manuel Franceschini
    raise errors.OpPrereqError("Secondary IP address (%s) has to be a valid"
448 2f20d07b Manuel Franceschini
                               " IPv4 address." % secondary_ip,
449 2f20d07b Manuel Franceschini
                               errors.ECODE_INVAL)
450 2f20d07b Manuel Franceschini
451 2f20d07b Manuel Franceschini
  if not netutils.IP4Address.Own(secondary_ip):
452 2f20d07b Manuel Franceschini
    raise errors.OpPrereqError("You gave %s as secondary IP,"
453 2f20d07b Manuel Franceschini
                               " but it does not belong to this host." %
454 2f20d07b Manuel Franceschini
                               secondary_ip, errors.ECODE_ENVIRON)
455 2f20d07b Manuel Franceschini
456 5a8648eb Andrea Spadaccini
  if master_netmask is not None:
457 5a8648eb Andrea Spadaccini
    if not ipcls.ValidateNetmask(master_netmask):
458 5a8648eb Andrea Spadaccini
      raise errors.OpPrereqError("CIDR netmask (%s) not valid for IPv%s " %
459 2cfbc784 Iustin Pop
                                  (master_netmask, primary_ip_version),
460 2cfbc784 Iustin Pop
                                 errors.ECODE_INVAL)
461 5a8648eb Andrea Spadaccini
  else:
462 5a8648eb Andrea Spadaccini
    master_netmask = ipcls.iplen
463 5a8648eb Andrea Spadaccini
464 a0c9f010 Michael Hanselmann
  if vg_name is not None:
465 a0c9f010 Michael Hanselmann
    # Check if volume group is valid
466 a0c9f010 Michael Hanselmann
    vgstatus = utils.CheckVolumeGroupSize(utils.ListVolumeGroups(), vg_name,
467 a0c9f010 Michael Hanselmann
                                          constants.MIN_VG_SIZE)
468 a0c9f010 Michael Hanselmann
    if vgstatus:
469 a0c9f010 Michael Hanselmann
      raise errors.OpPrereqError("Error: %s\nspecify --no-lvm-storage if"
470 debac808 Iustin Pop
                                 " you are not using lvm" % vgstatus,
471 debac808 Iustin Pop
                                 errors.ECODE_INVAL)
472 a0c9f010 Michael Hanselmann
473 a721e23a Luca Bigliardi
  if drbd_helper is not None:
474 a721e23a Luca Bigliardi
    try:
475 a721e23a Luca Bigliardi
      curr_helper = bdev.BaseDRBD.GetUsermodeHelper()
476 a721e23a Luca Bigliardi
    except errors.BlockDeviceError, err:
477 a721e23a Luca Bigliardi
      raise errors.OpPrereqError("Error while checking drbd helper"
478 a721e23a Luca Bigliardi
                                 " (specify --no-drbd-storage if you are not"
479 a721e23a Luca Bigliardi
                                 " using drbd): %s" % str(err),
480 a721e23a Luca Bigliardi
                                 errors.ECODE_ENVIRON)
481 a721e23a Luca Bigliardi
    if drbd_helper != curr_helper:
482 a721e23a Luca Bigliardi
      raise errors.OpPrereqError("Error: requiring %s as drbd helper but %s"
483 a721e23a Luca Bigliardi
                                 " is the current helper" % (drbd_helper,
484 a721e23a Luca Bigliardi
                                                             curr_helper),
485 a721e23a Luca Bigliardi
                                 errors.ECODE_INVAL)
486 a721e23a Luca Bigliardi
487 32ba31be Michael Hanselmann
  logging.debug("Stopping daemons (if any are running)")
488 32ba31be Michael Hanselmann
  result = utils.RunCmd([pathutils.DAEMON_UTIL, "stop-all"])
489 32ba31be Michael Hanselmann
  if result.failed:
490 32ba31be Michael Hanselmann
    raise errors.OpExecError("Could not stop daemons, command %s"
491 32ba31be Michael Hanselmann
                             " had exitcode %s and error '%s'" %
492 32ba31be Michael Hanselmann
                             (result.cmd, result.exit_code, result.output))
493 32ba31be Michael Hanselmann
494 0376655e Guido Trotter
  if constants.ENABLE_FILE_STORAGE:
495 0376655e Guido Trotter
    file_storage_dir = _InitFileStorage(file_storage_dir)
496 0376655e Guido Trotter
  else:
497 0376655e Guido Trotter
    file_storage_dir = ""
498 0376655e Guido Trotter
499 0376655e Guido Trotter
  if constants.ENABLE_SHARED_FILE_STORAGE:
500 0376655e Guido Trotter
    shared_file_storage_dir = _InitFileStorage(shared_file_storage_dir)
501 0376655e Guido Trotter
  else:
502 0376655e Guido Trotter
    shared_file_storage_dir = ""
503 a0c9f010 Michael Hanselmann
504 a0c9f010 Michael Hanselmann
  if not re.match("^[0-9a-z]{2}:[0-9a-z]{2}:[0-9a-z]{2}$", mac_prefix):
505 debac808 Iustin Pop
    raise errors.OpPrereqError("Invalid mac prefix given '%s'" % mac_prefix,
506 debac808 Iustin Pop
                               errors.ECODE_INVAL)
507 a0c9f010 Michael Hanselmann
508 a0c9f010 Michael Hanselmann
  result = utils.RunCmd(["ip", "link", "show", "dev", master_netdev])
509 a0c9f010 Michael Hanselmann
  if result.failed:
510 a0c9f010 Michael Hanselmann
    raise errors.OpPrereqError("Invalid master netdev given (%s): '%s'" %
511 a0c9f010 Michael Hanselmann
                               (master_netdev,
512 debac808 Iustin Pop
                                result.output.strip()), errors.ECODE_INVAL)
513 a0c9f010 Michael Hanselmann
514 7ede9c6a Michael Hanselmann
  dirs = [(pathutils.RUN_DIR, constants.RUN_DIRS_MODE)]
515 9dae41ad Guido Trotter
  utils.EnsureDirs(dirs)
516 9dae41ad Guido Trotter
517 b2e233a5 Guido Trotter
  objects.UpgradeBeParams(beparams)
518 a5728081 Guido Trotter
  utils.ForceDictType(beparams, constants.BES_PARAMETER_TYPES)
519 b6a30b0d Guido Trotter
  utils.ForceDictType(nicparams, constants.NICS_PARAMETER_TYPES)
520 18bb6d28 Agata Murawska
521 b6a30b0d Guido Trotter
  objects.NIC.CheckParameterSyntax(nicparams)
522 57dc299a Iustin Pop
523 2cc673a3 Iustin Pop
  full_ipolicy = objects.FillIPolicy(constants.IPOLICY_DEFAULTS, ipolicy)
524 b6a30b0d Guido Trotter
525 6204ee71 René Nussbaumer
  if ndparams is not None:
526 6204ee71 René Nussbaumer
    utils.ForceDictType(ndparams, constants.NDS_PARAMETER_TYPES)
527 6204ee71 René Nussbaumer
  else:
528 6204ee71 René Nussbaumer
    ndparams = dict(constants.NDC_DEFAULTS)
529 6204ee71 René Nussbaumer
530 c4929a8b René Nussbaumer
  # This is ugly, as we modify the dict itself
531 57dc299a Iustin Pop
  # FIXME: Make utils.ForceDictType pure functional or write a wrapper
532 57dc299a Iustin Pop
  # around it
533 c4929a8b René Nussbaumer
  if hv_state:
534 c4929a8b René Nussbaumer
    for hvname, hvs_data in hv_state.items():
535 c4929a8b René Nussbaumer
      utils.ForceDictType(hvs_data, constants.HVSTS_PARAMETER_TYPES)
536 c4929a8b René Nussbaumer
      hv_state[hvname] = objects.Cluster.SimpleFillHvState(hvs_data)
537 c4929a8b René Nussbaumer
  else:
538 c4929a8b René Nussbaumer
    hv_state = dict((hvname, constants.HVST_DEFAULTS)
539 c4929a8b René Nussbaumer
                    for hvname in enabled_hypervisors)
540 c4929a8b René Nussbaumer
541 c4929a8b René Nussbaumer
  # FIXME: disk_state has no default values yet
542 c4929a8b René Nussbaumer
  if disk_state:
543 c4929a8b René Nussbaumer
    for storage, ds_data in disk_state.items():
544 c4929a8b René Nussbaumer
      if storage not in constants.DS_VALID_TYPES:
545 c4929a8b René Nussbaumer
        raise errors.OpPrereqError("Invalid storage type in disk state: %s" %
546 c4929a8b René Nussbaumer
                                   storage, errors.ECODE_INVAL)
547 c4929a8b René Nussbaumer
      for ds_name, state in ds_data.items():
548 c4929a8b René Nussbaumer
        utils.ForceDictType(state, constants.DSS_PARAMETER_TYPES)
549 c4929a8b René Nussbaumer
        ds_data[ds_name] = objects.Cluster.SimpleFillDiskState(state)
550 c4929a8b René Nussbaumer
551 a5728081 Guido Trotter
  # hvparams is a mapping of hypervisor->hvparams dict
552 a5728081 Guido Trotter
  for hv_name, hv_params in hvparams.iteritems():
553 a5728081 Guido Trotter
    utils.ForceDictType(hv_params, constants.HVS_PARAMETER_TYPES)
554 a5728081 Guido Trotter
    hv_class = hypervisor.GetHypervisor(hv_name)
555 a5728081 Guido Trotter
    hv_class.CheckParameterSyntax(hv_params)
556 d4b72030 Guido Trotter
557 bc5d0215 Andrea Spadaccini
  # diskparams is a mapping of disk-template->diskparams dict
558 bc5d0215 Andrea Spadaccini
  for template, dt_params in diskparams.items():
559 bc5d0215 Andrea Spadaccini
    param_keys = set(dt_params.keys())
560 bc5d0215 Andrea Spadaccini
    default_param_keys = set(constants.DISK_DT_DEFAULTS[template].keys())
561 bc5d0215 Andrea Spadaccini
    if not (param_keys <= default_param_keys):
562 bc5d0215 Andrea Spadaccini
      unknown_params = param_keys - default_param_keys
563 bc5d0215 Andrea Spadaccini
      raise errors.OpPrereqError("Invalid parameters for disk template %s:"
564 bc5d0215 Andrea Spadaccini
                                 " %s" % (template,
565 2cfbc784 Iustin Pop
                                          utils.CommaJoin(unknown_params)),
566 2cfbc784 Iustin Pop
                                 errors.ECODE_INVAL)
567 bc5d0215 Andrea Spadaccini
    utils.ForceDictType(dt_params, constants.DISK_DT_TYPES)
568 35c48839 Michele Tartara
    if template == constants.DT_DRBD8 and vg_name is not None:
569 35c48839 Michele Tartara
      # The default METAVG value is equal to the VG name set at init time,
570 35c48839 Michele Tartara
      # if provided
571 35c48839 Michele Tartara
      dt_params[constants.DRBD_DEFAULT_METAVG] = vg_name
572 35c48839 Michele Tartara
573 e4a4391d René Nussbaumer
  try:
574 e4a4391d René Nussbaumer
    utils.VerifyDictOptions(diskparams, constants.DISK_DT_DEFAULTS)
575 e4a4391d René Nussbaumer
  except errors.OpPrereqError, err:
576 e4a4391d René Nussbaumer
    raise errors.OpPrereqError("While verify diskparam options: %s" % err,
577 e4a4391d René Nussbaumer
                               errors.ECODE_INVAL)
578 bc5d0215 Andrea Spadaccini
579 a0c9f010 Michael Hanselmann
  # set up ssh config and /etc/hosts
580 a9542a4f Thomas Thrainer
  rsa_sshkey = ""
581 a9542a4f Thomas Thrainer
  dsa_sshkey = ""
582 a9542a4f Thomas Thrainer
  if os.path.isfile(pathutils.SSH_HOST_RSA_PUB):
583 a9542a4f Thomas Thrainer
    sshline = utils.ReadFile(pathutils.SSH_HOST_RSA_PUB)
584 a9542a4f Thomas Thrainer
    rsa_sshkey = sshline.split(" ")[1]
585 a9542a4f Thomas Thrainer
  if os.path.isfile(pathutils.SSH_HOST_DSA_PUB):
586 a9542a4f Thomas Thrainer
    sshline = utils.ReadFile(pathutils.SSH_HOST_DSA_PUB)
587 a9542a4f Thomas Thrainer
    dsa_sshkey = sshline.split(" ")[1]
588 a9542a4f Thomas Thrainer
  if not rsa_sshkey and not dsa_sshkey:
589 a9542a4f Thomas Thrainer
    raise errors.OpPrereqError("Failed to find SSH public keys",
590 a9542a4f Thomas Thrainer
                               errors.ECODE_ENVIRON)
591 a0c9f010 Michael Hanselmann
592 b86a6bcd Guido Trotter
  if modify_etc_hosts:
593 ea8ac9c9 René Nussbaumer
    utils.AddHostToEtcHosts(hostname.name, hostname.ip)
594 b86a6bcd Guido Trotter
595 b989b9d9 Ken Wehr
  if modify_ssh_setup:
596 b989b9d9 Ken Wehr
    _InitSSHSetup()
597 a0c9f010 Michael Hanselmann
598 bf4af505 Apollon Oikonomopoulos
  if default_iallocator is not None:
599 bf4af505 Apollon Oikonomopoulos
    alloc_script = utils.FindFile(default_iallocator,
600 bf4af505 Apollon Oikonomopoulos
                                  constants.IALLOCATOR_SEARCH_PATH,
601 bf4af505 Apollon Oikonomopoulos
                                  os.path.isfile)
602 bf4af505 Apollon Oikonomopoulos
    if alloc_script is None:
603 bf4af505 Apollon Oikonomopoulos
      raise errors.OpPrereqError("Invalid default iallocator script '%s'"
604 bf4af505 Apollon Oikonomopoulos
                                 " specified" % default_iallocator,
605 bf4af505 Apollon Oikonomopoulos
                                 errors.ECODE_INVAL)
606 d1e9c98d Iustin Pop
  elif constants.HTOOLS:
607 d1e9c98d Iustin Pop
    # htools was enabled at build-time, we default to it
608 d1e9c98d Iustin Pop
    if utils.FindFile(constants.IALLOC_HAIL,
609 d1e9c98d Iustin Pop
                      constants.IALLOCATOR_SEARCH_PATH,
610 d1e9c98d Iustin Pop
                      os.path.isfile):
611 d1e9c98d Iustin Pop
      default_iallocator = constants.IALLOC_HAIL
612 bf4af505 Apollon Oikonomopoulos
613 430b923c Iustin Pop
  now = time.time()
614 430b923c Iustin Pop
615 a0c9f010 Michael Hanselmann
  # init of cluster config file
616 b9eeeb02 Michael Hanselmann
  cluster_config = objects.Cluster(
617 b9eeeb02 Michael Hanselmann
    serial_no=1,
618 a9542a4f Thomas Thrainer
    rsahostkeypub=rsa_sshkey,
619 a9542a4f Thomas Thrainer
    dsahostkeypub=dsa_sshkey,
620 b9eeeb02 Michael Hanselmann
    highest_used_port=(constants.FIRST_DRBD_PORT - 1),
621 b9eeeb02 Michael Hanselmann
    mac_prefix=mac_prefix,
622 b9eeeb02 Michael Hanselmann
    volume_group_name=vg_name,
623 b9eeeb02 Michael Hanselmann
    tcpudp_port_pool=set(),
624 f6bd6e98 Michael Hanselmann
    master_node=hostname.name,
625 f6bd6e98 Michael Hanselmann
    master_ip=clustername.ip,
626 5a8648eb Andrea Spadaccini
    master_netmask=master_netmask,
627 f6bd6e98 Michael Hanselmann
    master_netdev=master_netdev,
628 f6bd6e98 Michael Hanselmann
    cluster_name=clustername.name,
629 f6bd6e98 Michael Hanselmann
    file_storage_dir=file_storage_dir,
630 4b97f902 Apollon Oikonomopoulos
    shared_file_storage_dir=shared_file_storage_dir,
631 ea3a925f Alexander Schreiber
    enabled_hypervisors=enabled_hypervisors,
632 4ef7f423 Guido Trotter
    beparams={constants.PP_DEFAULT: beparams},
633 b6a30b0d Guido Trotter
    nicparams={constants.PP_DEFAULT: nicparams},
634 6204ee71 René Nussbaumer
    ndparams=ndparams,
635 ea3a925f Alexander Schreiber
    hvparams=hvparams,
636 bc5d0215 Andrea Spadaccini
    diskparams=diskparams,
637 ce735215 Guido Trotter
    candidate_pool_size=candidate_pool_size,
638 022c3a0b Guido Trotter
    modify_etc_hosts=modify_etc_hosts,
639 b989b9d9 Ken Wehr
    modify_ssh_setup=modify_ssh_setup,
640 39b0f0c2 Balazs Lecz
    uid_pool=uid_pool,
641 430b923c Iustin Pop
    ctime=now,
642 430b923c Iustin Pop
    mtime=now,
643 3953242f Iustin Pop
    maintain_node_health=maintain_node_health,
644 a721e23a Luca Bigliardi
    drbd_usermode_helper=drbd_helper,
645 bf4af505 Apollon Oikonomopoulos
    default_iallocator=default_iallocator,
646 2f20d07b Manuel Franceschini
    primary_ip_family=ipcls.family,
647 3d914585 René Nussbaumer
    prealloc_wipe_disks=prealloc_wipe_disks,
648 bf689b7a Andrea Spadaccini
    use_external_mip_script=use_external_mip_script,
649 57dc299a Iustin Pop
    ipolicy=full_ipolicy,
650 c4929a8b René Nussbaumer
    hv_state_static=hv_state,
651 c4929a8b René Nussbaumer
    disk_state_static=disk_state,
652 3bde79ee Helga Velroyen
    enabled_disk_templates=enabled_disk_templates,
653 b9eeeb02 Michael Hanselmann
    )
654 b9eeeb02 Michael Hanselmann
  master_node_config = objects.Node(name=hostname.name,
655 b9eeeb02 Michael Hanselmann
                                    primary_ip=hostname.ip,
656 b9222f32 Guido Trotter
                                    secondary_ip=secondary_ip,
657 c044f32c Guido Trotter
                                    serial_no=1,
658 c044f32c Guido Trotter
                                    master_candidate=True,
659 af64c0ea Iustin Pop
                                    offline=False, drained=False,
660 435e4bd6 Michael Hanselmann
                                    ctime=now, mtime=now,
661 c044f32c Guido Trotter
                                    )
662 9e1333b9 Guido Trotter
  InitConfig(constants.CONFIG_VERSION, cluster_config, master_node_config)
663 d367b66c Manuel Franceschini
  cfg = config.ConfigWriter(offline=True)
664 7ede9c6a Michael Hanselmann
  ssh.WriteKnownHostsFile(cfg, pathutils.SSH_KNOWN_HOSTS_FILE)
665 a4eae71f Michael Hanselmann
  cfg.Update(cfg.GetClusterInfo(), logging.error)
666 ee501db1 Michael Hanselmann
  ssconf.WriteSsconfFiles(cfg.GetSsconfValues())
667 d367b66c Manuel Franceschini
668 d367b66c Manuel Franceschini
  # set up the inter-node password and certificate
669 d367b66c Manuel Franceschini
  _InitGanetiServerSetup(hostname.name)
670 827f753e Guido Trotter
671 952d7515 Michael Hanselmann
  logging.debug("Starting daemons")
672 7ede9c6a Michael Hanselmann
  result = utils.RunCmd([pathutils.DAEMON_UTIL, "start-all"])
673 952d7515 Michael Hanselmann
  if result.failed:
674 952d7515 Michael Hanselmann
    raise errors.OpExecError("Could not start daemons, command %s"
675 952d7515 Michael Hanselmann
                             " had exitcode %s and error %s" %
676 952d7515 Michael Hanselmann
                             (result.cmd, result.exit_code, result.output))
677 b3f1cf6f Iustin Pop
678 3b6b6129 Michael Hanselmann
  _WaitForMasterDaemon()
679 b3f1cf6f Iustin Pop
680 b1b6ea87 Iustin Pop
681 02f99608 Oleksiy Mishchenko
def InitConfig(version, cluster_config, master_node_config,
682 7ede9c6a Michael Hanselmann
               cfg_file=pathutils.CLUSTER_CONF_FILE):
683 7b3a8fb5 Iustin Pop
  """Create the initial cluster configuration.
684 7b3a8fb5 Iustin Pop

685 7b3a8fb5 Iustin Pop
  It will contain the current node, which will also be the master
686 7b3a8fb5 Iustin Pop
  node, and no instances.
687 7b3a8fb5 Iustin Pop

688 7b3a8fb5 Iustin Pop
  @type version: int
689 c41eea6e Iustin Pop
  @param version: configuration version
690 c41eea6e Iustin Pop
  @type cluster_config: L{objects.Cluster}
691 c41eea6e Iustin Pop
  @param cluster_config: cluster configuration
692 c41eea6e Iustin Pop
  @type master_node_config: L{objects.Node}
693 c41eea6e Iustin Pop
  @param master_node_config: master node configuration
694 c41eea6e Iustin Pop
  @type cfg_file: string
695 c41eea6e Iustin Pop
  @param cfg_file: configuration file path
696 c41eea6e Iustin Pop

697 7b3a8fb5 Iustin Pop
  """
698 88b92fe3 Guido Trotter
  uuid_generator = config.TemporaryReservationManager()
699 88b92fe3 Guido Trotter
  cluster_config.uuid = uuid_generator.Generate([], utils.NewUUID,
700 88b92fe3 Guido Trotter
                                                _INITCONF_ECID)
701 88b92fe3 Guido Trotter
  master_node_config.uuid = uuid_generator.Generate([], utils.NewUUID,
702 88b92fe3 Guido Trotter
                                                    _INITCONF_ECID)
703 7b3a8fb5 Iustin Pop
  nodes = {
704 7b3a8fb5 Iustin Pop
    master_node_config.name: master_node_config,
705 7b3a8fb5 Iustin Pop
    }
706 88b92fe3 Guido Trotter
  default_nodegroup = objects.NodeGroup(
707 88b92fe3 Guido Trotter
    uuid=uuid_generator.Generate([], utils.NewUUID, _INITCONF_ECID),
708 75cf411a Adeodato Simo
    name=constants.INITIAL_NODE_GROUP_NAME,
709 88b92fe3 Guido Trotter
    members=[master_node_config.name],
710 99ccf8b9 René Nussbaumer
    diskparams={},
711 88b92fe3 Guido Trotter
    )
712 88b92fe3 Guido Trotter
  nodegroups = {
713 88b92fe3 Guido Trotter
    default_nodegroup.uuid: default_nodegroup,
714 88b92fe3 Guido Trotter
    }
715 d693c864 Iustin Pop
  now = time.time()
716 7b3a8fb5 Iustin Pop
  config_data = objects.ConfigData(version=version,
717 7b3a8fb5 Iustin Pop
                                   cluster=cluster_config,
718 88b92fe3 Guido Trotter
                                   nodegroups=nodegroups,
719 7b3a8fb5 Iustin Pop
                                   nodes=nodes,
720 7b3a8fb5 Iustin Pop
                                   instances={},
721 eaa4c57c Dimitris Aragiorgis
                                   networks={},
722 d693c864 Iustin Pop
                                   serial_no=1,
723 d693c864 Iustin Pop
                                   ctime=now, mtime=now)
724 a33848a5 Guido Trotter
  utils.WriteFile(cfg_file,
725 a33848a5 Guido Trotter
                  data=serializer.Dump(config_data.ToDict()),
726 a33848a5 Guido Trotter
                  mode=0600)
727 02f99608 Oleksiy Mishchenko
728 02f99608 Oleksiy Mishchenko
729 140aa4a8 Iustin Pop
def FinalizeClusterDestroy(master):
  """Run the final steps of a cluster destroy.

  This completes the destroy begun in cmdlib.LUDestroyOpcode by sending
  three RPC calls to the given node, in order: deactivate the master IP,
  stop the master, and make the node leave the cluster. A failure of any
  of these calls is only logged as a warning and the following steps
  are still attempted.

  @param master: the master node, used as target of all three calls

  """
  cfg = config.ConfigWriter()
  cleanup_ssh = cfg.GetClusterInfo().modify_ssh_setup
  rpc_runner = rpc.BootstrapRunner()

  # The network parameters come from the configuration, but the call is
  # addressed to the node we were given
  net_params = cfg.GetMasterNetworkParameters()
  net_params.name = master
  use_ext_script = cfg.GetUseExternalMipScript()

  ip_result = rpc_runner.call_node_deactivate_master_ip(net_params.name,
                                                        net_params,
                                                        use_ext_script)
  ip_failure = ip_result.fail_msg
  if ip_failure:
    logging.warning("Could not disable the master IP: %s", ip_failure)

  stop_result = rpc_runner.call_node_stop_master(master)
  stop_failure = stop_result.fail_msg
  if stop_failure:
    logging.warning("Could not disable the master role: %s", stop_failure)

  leave_result = rpc_runner.call_node_leave_cluster(master, cleanup_ssh)
  leave_failure = leave_result.fail_msg
  if leave_failure:
    logging.warning("Could not shutdown the node daemon and cleanup"
                    " the node: %s", leave_failure)
760 140aa4a8 Iustin Pop
761 140aa4a8 Iustin Pop
762 7b8ba235 Michael Hanselmann
def SetupNodeDaemon(opts, cluster_name, node):
  """Prepare a new node and start its node daemon.

  This function must be called before the actual opcode: it will ssh to
  the remote node, copy the needed files, and start ganeti-noded, so
  that the master can do the rest via normal rpc calls. It returns only
  after waiting for the node daemon on the new node.

  @param opts: the command line options; the attributes C{debug},
      C{verbose} and C{ssh_key_check} are read from it
  @param cluster_name: the cluster name
  @param node: the name of the new node

  """
  # Gather the payload pieces first, in the same order they are listed
  # in the setup data below
  noded_cert = utils.ReadFile(pathutils.NODED_CERT_FILE)
  ssconf_values = ssconf.SimpleStore().ReadAll()

  setup_data = {
    constants.NDS_CLUSTER_NAME: cluster_name,
    constants.NDS_NODE_DAEMON_CERTIFICATE: noded_cert,
    constants.NDS_SSCONF: ssconf_values,
    constants.NDS_START_NODE_DAEMON: True,
    }

  # opts.ssh_key_check is deliberately passed for two consecutive
  # positional arguments
  key_check = opts.ssh_key_check
  RunNodeSetupCmd(cluster_name, node, pathutils.NODE_DAEMON_SETUP,
                  opts.debug, opts.verbose,
                  True, key_check, key_check, setup_data)

  _WaitForNodeDaemon(node)
786 5627f375 Michael Hanselmann
787 b1b6ea87 Iustin Pop
788 8e2524c3 Guido Trotter
def MasterFailover(no_voting=False):
789 b1b6ea87 Iustin Pop
  """Failover the master node.
790 b1b6ea87 Iustin Pop

791 b1b6ea87 Iustin Pop
  This checks that we are not already the master, and will cause the
792 b1b6ea87 Iustin Pop
  current master to cease being master, and the non-master to become
793 b1b6ea87 Iustin Pop
  new master.
794 b1b6ea87 Iustin Pop

795 8e2524c3 Guido Trotter
  @type no_voting: boolean
796 8e2524c3 Guido Trotter
  @param no_voting: force the operation without remote nodes agreement
797 8e2524c3 Guido Trotter
                      (dangerous)
798 8e2524c3 Guido Trotter

799 b1b6ea87 Iustin Pop
  """
800 8135a2db Iustin Pop
  sstore = ssconf.SimpleStore()
801 b1b6ea87 Iustin Pop
802 8135a2db Iustin Pop
  old_master, new_master = ssconf.GetMasterAndMyself(sstore)
803 8135a2db Iustin Pop
  node_list = sstore.GetNodeList()
804 8135a2db Iustin Pop
  mc_list = sstore.GetMasterCandidates()
805 b1b6ea87 Iustin Pop
806 b1b6ea87 Iustin Pop
  if old_master == new_master:
807 b1b6ea87 Iustin Pop
    raise errors.OpPrereqError("This commands must be run on the node"
808 b1b6ea87 Iustin Pop
                               " where you want the new master to be."
809 b1b6ea87 Iustin Pop
                               " %s is already the master" %
810 debac808 Iustin Pop
                               old_master, errors.ECODE_INVAL)
811 d5927e48 Iustin Pop
812 8135a2db Iustin Pop
  if new_master not in mc_list:
813 8135a2db Iustin Pop
    mc_no_master = [name for name in mc_list if name != old_master]
814 8135a2db Iustin Pop
    raise errors.OpPrereqError("This node is not among the nodes marked"
815 8135a2db Iustin Pop
                               " as master candidates. Only these nodes"
816 8135a2db Iustin Pop
                               " can become masters. Current list of"
817 8135a2db Iustin Pop
                               " master candidates is:\n"
818 3ccb3a64 Michael Hanselmann
                               "%s" % ("\n".join(mc_no_master)),
819 debac808 Iustin Pop
                               errors.ECODE_STATE)
820 8135a2db Iustin Pop
821 8e2524c3 Guido Trotter
  if not no_voting:
822 8e2524c3 Guido Trotter
    vote_list = GatherMasterVotes(node_list)
823 8e2524c3 Guido Trotter
824 8e2524c3 Guido Trotter
    if vote_list:
825 8e2524c3 Guido Trotter
      voted_master = vote_list[0][0]
826 8e2524c3 Guido Trotter
      if voted_master is None:
827 8e2524c3 Guido Trotter
        raise errors.OpPrereqError("Cluster is inconsistent, most nodes did"
828 debac808 Iustin Pop
                                   " not respond.", errors.ECODE_ENVIRON)
829 8e2524c3 Guido Trotter
      elif voted_master != old_master:
830 8e2524c3 Guido Trotter
        raise errors.OpPrereqError("I have a wrong configuration, I believe"
831 8e2524c3 Guido Trotter
                                   " the master is %s but the other nodes"
832 8e2524c3 Guido Trotter
                                   " voted %s. Please resync the configuration"
833 8e2524c3 Guido Trotter
                                   " of this node." %
834 debac808 Iustin Pop
                                   (old_master, voted_master),
835 debac808 Iustin Pop
                                   errors.ECODE_STATE)
836 b1b6ea87 Iustin Pop
  # end checks
837 b1b6ea87 Iustin Pop
838 b1b6ea87 Iustin Pop
  rcode = 0
839 b1b6ea87 Iustin Pop
840 d5927e48 Iustin Pop
  logging.info("Setting master to %s, old master: %s", new_master, old_master)
841 b1b6ea87 Iustin Pop
842 21004460 Iustin Pop
  try:
843 21004460 Iustin Pop
    # instantiate a real config writer, as we now know we have the
844 21004460 Iustin Pop
    # configuration data
845 eb180fe2 Iustin Pop
    cfg = config.ConfigWriter(accept_foreign=True)
846 21004460 Iustin Pop
847 21004460 Iustin Pop
    cluster_info = cfg.GetClusterInfo()
848 21004460 Iustin Pop
    cluster_info.master_node = new_master
849 21004460 Iustin Pop
    # this will also regenerate the ssconf files, since we updated the
850 21004460 Iustin Pop
    # cluster info
851 21004460 Iustin Pop
    cfg.Update(cluster_info, logging.error)
852 21004460 Iustin Pop
  except errors.ConfigurationError, err:
853 21004460 Iustin Pop
    logging.error("Error while trying to set the new master: %s",
854 21004460 Iustin Pop
                  str(err))
855 21004460 Iustin Pop
    return 1
856 21004460 Iustin Pop
857 21004460 Iustin Pop
  # if cfg.Update worked, then it means the old master daemon won't be
858 21004460 Iustin Pop
  # able now to write its own config file (we rely on locking in both
859 21004460 Iustin Pop
  # backend.UploadFile() and ConfigWriter._Write(); hence the next
860 21004460 Iustin Pop
  # step is to kill the old master
861 21004460 Iustin Pop
862 21004460 Iustin Pop
  logging.info("Stopping the master daemon on node %s", old_master)
863 21004460 Iustin Pop
864 7c74bbe0 Andrea Spadaccini
  runner = rpc.BootstrapRunner()
865 f9d20654 Andrea Spadaccini
  master_params = cfg.GetMasterNetworkParameters()
866 c79198a0 Andrea Spadaccini
  master_params.name = old_master
867 57c7bc57 Andrea Spadaccini
  ems = cfg.GetUseExternalMipScript()
868 c79198a0 Andrea Spadaccini
  result = runner.call_node_deactivate_master_ip(master_params.name,
869 57c7bc57 Andrea Spadaccini
                                                 master_params, ems)
870 c79198a0 Andrea Spadaccini
871 7c74bbe0 Andrea Spadaccini
  msg = result.fail_msg
872 7c74bbe0 Andrea Spadaccini
  if msg:
873 7c74bbe0 Andrea Spadaccini
    logging.warning("Could not disable the master IP: %s", msg)
874 7c74bbe0 Andrea Spadaccini
875 7c74bbe0 Andrea Spadaccini
  result = runner.call_node_stop_master(old_master)
876 3cebe102 Michael Hanselmann
  msg = result.fail_msg
877 6c00d19a Iustin Pop
  if msg:
878 d5927e48 Iustin Pop
    logging.error("Could not disable the master role on the old master"
879 5ae4945a Iustin Pop
                  " %s, please disable manually: %s", old_master, msg)
880 b1b6ea87 Iustin Pop
881 21004460 Iustin Pop
  logging.info("Checking master IP non-reachability...")
882 21004460 Iustin Pop
883 425f0f54 Iustin Pop
  master_ip = sstore.GetMasterIP()
884 425f0f54 Iustin Pop
  total_timeout = 30
885 e687ec01 Michael Hanselmann
886 d23ef431 Michael Hanselmann
  # Here we have a phase where no master should be running
887 425f0f54 Iustin Pop
  def _check_ip():
888 a744b676 Manuel Franceschini
    if netutils.TcpPing(master_ip, constants.DEFAULT_NODED_PORT):
889 425f0f54 Iustin Pop
      raise utils.RetryAgain()
890 425f0f54 Iustin Pop
891 425f0f54 Iustin Pop
  try:
892 425f0f54 Iustin Pop
    utils.Retry(_check_ip, (1, 1.5, 5), total_timeout)
893 425f0f54 Iustin Pop
  except utils.RetryTimeout:
894 425f0f54 Iustin Pop
    logging.warning("The master IP is still reachable after %s seconds,"
895 425f0f54 Iustin Pop
                    " continuing but activating the master on the current"
896 425f0f54 Iustin Pop
                    " node will probably fail", total_timeout)
897 b1b6ea87 Iustin Pop
898 ff699aa9 Michael Hanselmann
  if jstore.CheckDrainFlag():
899 ff699aa9 Michael Hanselmann
    logging.info("Undraining job queue")
900 ff699aa9 Michael Hanselmann
    jstore.SetDrainFlag(False)
901 ff699aa9 Michael Hanselmann
902 21004460 Iustin Pop
  logging.info("Starting the master daemons on the new master")
903 d5927e48 Iustin Pop
904 db04ce5d Michael Hanselmann
  result = rpc.BootstrapRunner().call_node_start_master_daemons(new_master,
905 db04ce5d Michael Hanselmann
                                                                no_voting)
906 3cebe102 Michael Hanselmann
  msg = result.fail_msg
907 b726aff0 Iustin Pop
  if msg:
908 d5927e48 Iustin Pop
    logging.error("Could not start the master role on the new master"
909 b726aff0 Iustin Pop
                  " %s, please check: %s", new_master, msg)
910 b1b6ea87 Iustin Pop
    rcode = 1
911 b1b6ea87 Iustin Pop
912 21004460 Iustin Pop
  logging.info("Master failed over from %s to %s", old_master, new_master)
913 b1b6ea87 Iustin Pop
  return rcode
914 d7cdb55d Iustin Pop
915 d7cdb55d Iustin Pop
916 8eb148ae Iustin Pop
def GetMaster():
  """Return the current master node, as recorded in ssconf.

  gnt-cluster needs this information; rather than have it import ssconf
  directly, the lookup is wrapped here, since bootstrap already uses
  ssconf in other functions.

  @return: the first element of the pair returned by
      L{ssconf.GetMasterAndMyself}

  """
  # The second element (this node) is not needed here
  (master_name, _) = ssconf.GetMasterAndMyself(ssconf.SimpleStore())
  return master_name
930 8eb148ae Iustin Pop
931 8eb148ae Iustin Pop
932 d7cdb55d Iustin Pop
def GatherMasterVotes(node_list):
  """Check the agreement on who is the master.

  Every node left in C{node_list} is queried through the bootstrap RPC
  runner (C{call_master_info}) and the answers are tallied. This function
  returns a list of (node, number of votes), ordered by decreasing number
  of votes. Errors (RPC failure or invalid reply data) are denoted by the
  key 'None'.

  Note that the sum of votes is the number of nodes this machine
  knows, whereas the number of entries in the list could be different
  (if some nodes vote for another master).

  We remove ourselves from the list since we know that (bugs aside),
  as we use the same source for configuration information for both
  backend and bootstrap, we'll always vote for ourselves.

  @type node_list: list
  @param node_list: the list of nodes to query for master info; the current
      node will be removed if it is in the list (the list is modified in
      place)
  @rtype: list
  @return: list of (node, votes); an empty list if no nodes are left to
      query after removing the current node

  """
  myself = netutils.Hostname.GetSysName()
  try:
    node_list.remove(myself)
  except ValueError:
    # the current node was not in the list, nothing to remove
    pass
  if not node_list:
    # no nodes left (eventually after removing myself)
    return []

  results = rpc.BootstrapRunner().call_master_info(node_list)
  if not isinstance(results, dict):
    # this should not happen (unless internal error in rpc)
    logging.critical("Can't complete rpc call, aborting master startup")
    return [(None, len(node_list))]

  votes = {}
  for node in results:
    nres = results[node]
    data = nres.payload
    msg = nres.fail_msg
    if msg:
      logging.warning("Error contacting node %s: %s", node, msg)
      voted_for = None
    # for now replies of length 3, 4 and 5 are all accepted (data[3] is the
    # primary ip version and data[4] is the master netmask)
    elif not isinstance(data, (tuple, list)) or len(data) < 3:
      logging.warning("Invalid data received from node %s: %s", node, data)
      voted_for = None
    else:
      voted_for = data[2]
    # failures are all accumulated under the None key
    votes[voted_for] = votes.get(voted_for, 0) + 1

  def _VoteSortKey(item):
    """Build a sort key that never compares None against a node name.

    """
    (name, count) = item
    if name is None:
      return (count, False, "")
    return (count, True, name)

  vote_list = list(votes.items())
  # sort first on number of votes then on name, since we want None
  # sorted later if we have the half of the nodes not responding, and
  # half voting all for the same master; the explicit "is a real node"
  # flag in the key keeps that ordering without relying on None being
  # orderable against strings (which raises TypeError on Python 3)
  vote_list.sort(key=_VoteSortKey, reverse=True)

  return vote_list