Statistics
| Branch: | Tag: | Revision:

root / lib / bootstrap.py @ 7af7da68

History | View | Annotate | Download (36.2 kB)

1 a0c9f010 Michael Hanselmann
#
2 a0c9f010 Michael Hanselmann
#
3 a0c9f010 Michael Hanselmann
4 57dc299a Iustin Pop
# Copyright (C) 2006, 2007, 2008, 2010, 2011, 2012 Google Inc.
5 a0c9f010 Michael Hanselmann
#
6 a0c9f010 Michael Hanselmann
# This program is free software; you can redistribute it and/or modify
7 a0c9f010 Michael Hanselmann
# it under the terms of the GNU General Public License as published by
8 a0c9f010 Michael Hanselmann
# the Free Software Foundation; either version 2 of the License, or
9 a0c9f010 Michael Hanselmann
# (at your option) any later version.
10 a0c9f010 Michael Hanselmann
#
11 a0c9f010 Michael Hanselmann
# This program is distributed in the hope that it will be useful, but
12 a0c9f010 Michael Hanselmann
# WITHOUT ANY WARRANTY; without even the implied warranty of
13 a0c9f010 Michael Hanselmann
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
14 a0c9f010 Michael Hanselmann
# General Public License for more details.
15 a0c9f010 Michael Hanselmann
#
16 a0c9f010 Michael Hanselmann
# You should have received a copy of the GNU General Public License
17 a0c9f010 Michael Hanselmann
# along with this program; if not, write to the Free Software
18 a0c9f010 Michael Hanselmann
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
19 a0c9f010 Michael Hanselmann
# 02110-1301, USA.
20 a0c9f010 Michael Hanselmann
21 a0c9f010 Michael Hanselmann
22 a0c9f010 Michael Hanselmann
"""Functions to bootstrap a new cluster.
23 a0c9f010 Michael Hanselmann

24 a0c9f010 Michael Hanselmann
"""
25 a0c9f010 Michael Hanselmann
26 a0c9f010 Michael Hanselmann
import os
27 a0c9f010 Michael Hanselmann
import os.path
28 a0c9f010 Michael Hanselmann
import re
29 b1b6ea87 Iustin Pop
import logging
30 d693c864 Iustin Pop
import time
31 a698cdbb Michael Hanselmann
import tempfile
32 a0c9f010 Michael Hanselmann
33 a0c9f010 Michael Hanselmann
from ganeti import rpc
34 a0c9f010 Michael Hanselmann
from ganeti import ssh
35 a0c9f010 Michael Hanselmann
from ganeti import utils
36 a0c9f010 Michael Hanselmann
from ganeti import errors
37 a0c9f010 Michael Hanselmann
from ganeti import config
38 a0c9f010 Michael Hanselmann
from ganeti import constants
39 b9eeeb02 Michael Hanselmann
from ganeti import objects
40 a0c9f010 Michael Hanselmann
from ganeti import ssconf
41 a33848a5 Guido Trotter
from ganeti import serializer
42 a5728081 Guido Trotter
from ganeti import hypervisor
43 a721e23a Luca Bigliardi
from ganeti import bdev
44 a744b676 Manuel Franceschini
from ganeti import netutils
45 3b6b6129 Michael Hanselmann
from ganeti import luxi
46 ff699aa9 Michael Hanselmann
from ganeti import jstore
47 7ede9c6a Michael Hanselmann
from ganeti import pathutils
48 3b6b6129 Michael Hanselmann
49 a0c9f010 Michael Hanselmann
50 88b92fe3 Guido Trotter
# ec_id for InitConfig's temporary reservation manager
51 88b92fe3 Guido Trotter
_INITCONF_ECID = "initconfig-ecid"
52 88b92fe3 Guido Trotter
53 3b6b6129 Michael Hanselmann
#: Number of seconds within which a daemon must become responsive
54 3b6b6129 Michael Hanselmann
_DAEMON_READY_TIMEOUT = 10.0
55 3b6b6129 Michael Hanselmann
56 e38220e4 Michael Hanselmann
57 531baf8e Iustin Pop
def _InitSSHSetup():
  """Prepare the SSH key material used by the cluster.

  Existing private/public key files of the SSH login user are backed up
  and removed, a new DSA keypair is generated with C{ssh-keygen} (empty
  passphrase) and the resulting public key is passed to
  L{utils.AddAuthorizedKey} for the user's authorized keys file.

  @raise errors.OpExecError: if C{ssh-keygen} reports a failure

  """
  (private_path, public_path, authorized_path) = \
    ssh.GetUserFiles(constants.SSH_LOGIN_USER)

  # Keep a copy of any key that is about to be replaced
  for key_path in (private_path, public_path):
    if os.path.exists(key_path):
      utils.CreateBackup(key_path)
    utils.RemoveFile(key_path)

  keygen_cmd = ["ssh-keygen", "-t", "dsa", "-f", private_path, "-q", "-N", ""]
  keygen = utils.RunCmd(keygen_cmd)
  if keygen.failed:
    raise errors.OpExecError("Could not generate ssh keypair, error %s" %
                             keygen.output)

  new_public_key = utils.ReadFile(public_path)
  utils.AddAuthorizedKey(authorized_path, new_public_key)
79 a0c9f010 Michael Hanselmann
80 a0c9f010 Michael Hanselmann
81 c008906b Michael Hanselmann
def GenerateHmacKey(file_name):
82 c008906b Michael Hanselmann
  """Writes a new HMAC key.
83 c008906b Michael Hanselmann

84 c008906b Michael Hanselmann
  @type file_name: str
85 c008906b Michael Hanselmann
  @param file_name: Path to output file
86 c008906b Michael Hanselmann

87 c008906b Michael Hanselmann
  """
88 43575108 Michael Hanselmann
  utils.WriteFile(file_name, data="%s\n" % utils.GenerateSecret(), mode=0400,
89 43575108 Michael Hanselmann
                  backup=True)
90 43575108 Michael Hanselmann
91 43575108 Michael Hanselmann
92 b6267745 Andrea Spadaccini
def GenerateClusterCrypto(new_cluster_cert, new_rapi_cert, new_spice_cert,
93 b6267745 Andrea Spadaccini
                          new_confd_hmac_key, new_cds,
94 b6267745 Andrea Spadaccini
                          rapi_cert_pem=None, spice_cert_pem=None,
95 b6267745 Andrea Spadaccini
                          spice_cacert_pem=None, cds=None,
96 7ede9c6a Michael Hanselmann
                          nodecert_file=pathutils.NODED_CERT_FILE,
97 7ede9c6a Michael Hanselmann
                          rapicert_file=pathutils.RAPI_CERT_FILE,
98 7ede9c6a Michael Hanselmann
                          spicecert_file=pathutils.SPICE_CERT_FILE,
99 7ede9c6a Michael Hanselmann
                          spicecacert_file=pathutils.SPICE_CACERT_FILE,
100 7ede9c6a Michael Hanselmann
                          hmackey_file=pathutils.CONFD_HMAC_KEY,
101 7ede9c6a Michael Hanselmann
                          cds_file=pathutils.CLUSTER_DOMAIN_SECRET_FILE):
102 43575108 Michael Hanselmann
  """Updates the cluster certificates, keys and secrets.
103 43575108 Michael Hanselmann

104 43575108 Michael Hanselmann
  @type new_cluster_cert: bool
105 43575108 Michael Hanselmann
  @param new_cluster_cert: Whether to generate a new cluster certificate
106 43575108 Michael Hanselmann
  @type new_rapi_cert: bool
107 43575108 Michael Hanselmann
  @param new_rapi_cert: Whether to generate a new RAPI certificate
108 b6267745 Andrea Spadaccini
  @type new_spice_cert: bool
109 b6267745 Andrea Spadaccini
  @param new_spice_cert: Whether to generate a new SPICE certificate
110 6b7d5878 Michael Hanselmann
  @type new_confd_hmac_key: bool
111 6b7d5878 Michael Hanselmann
  @param new_confd_hmac_key: Whether to generate a new HMAC key
112 3db3eb2a Michael Hanselmann
  @type new_cds: bool
113 3db3eb2a Michael Hanselmann
  @param new_cds: Whether to generate a new cluster domain secret
114 43575108 Michael Hanselmann
  @type rapi_cert_pem: string
115 43575108 Michael Hanselmann
  @param rapi_cert_pem: New RAPI certificate in PEM format
116 b6267745 Andrea Spadaccini
  @type spice_cert_pem: string
117 b6267745 Andrea Spadaccini
  @param spice_cert_pem: New SPICE certificate in PEM format
118 b6267745 Andrea Spadaccini
  @type spice_cacert_pem: string
119 b6267745 Andrea Spadaccini
  @param spice_cacert_pem: Certificate of the CA that signed the SPICE
120 b6267745 Andrea Spadaccini
                           certificate, in PEM format
121 3db3eb2a Michael Hanselmann
  @type cds: string
122 3db3eb2a Michael Hanselmann
  @param cds: New cluster domain secret
123 aeefe835 Iustin Pop
  @type nodecert_file: string
124 aeefe835 Iustin Pop
  @param nodecert_file: optional override of the node cert file path
125 aeefe835 Iustin Pop
  @type rapicert_file: string
126 aeefe835 Iustin Pop
  @param rapicert_file: optional override of the rapi cert file path
127 b6267745 Andrea Spadaccini
  @type spicecert_file: string
128 b6267745 Andrea Spadaccini
  @param spicecert_file: optional override of the spice cert file path
129 b6267745 Andrea Spadaccini
  @type spicecacert_file: string
130 b6267745 Andrea Spadaccini
  @param spicecacert_file: optional override of the spice CA cert file path
131 aeefe835 Iustin Pop
  @type hmackey_file: string
132 aeefe835 Iustin Pop
  @param hmackey_file: optional override of the hmac key file path
133 43575108 Michael Hanselmann

134 43575108 Michael Hanselmann
  """
135 168c1de2 Michael Hanselmann
  # noded SSL certificate
136 aeefe835 Iustin Pop
  cluster_cert_exists = os.path.exists(nodecert_file)
137 43575108 Michael Hanselmann
  if new_cluster_cert or not cluster_cert_exists:
138 43575108 Michael Hanselmann
    if cluster_cert_exists:
139 aeefe835 Iustin Pop
      utils.CreateBackup(nodecert_file)
140 43575108 Michael Hanselmann
141 aeefe835 Iustin Pop
    logging.debug("Generating new cluster certificate at %s", nodecert_file)
142 af2ae1c0 Iustin Pop
    utils.GenerateSelfSignedSslCert(nodecert_file)
143 43575108 Michael Hanselmann
144 6b7d5878 Michael Hanselmann
  # confd HMAC key
145 aeefe835 Iustin Pop
  if new_confd_hmac_key or not os.path.exists(hmackey_file):
146 aeefe835 Iustin Pop
    logging.debug("Writing new confd HMAC key to %s", hmackey_file)
147 aeefe835 Iustin Pop
    GenerateHmacKey(hmackey_file)
148 43575108 Michael Hanselmann
149 43575108 Michael Hanselmann
  # RAPI
150 aeefe835 Iustin Pop
  rapi_cert_exists = os.path.exists(rapicert_file)
151 43575108 Michael Hanselmann
152 43575108 Michael Hanselmann
  if rapi_cert_pem:
153 43575108 Michael Hanselmann
    # Assume rapi_pem contains a valid PEM-formatted certificate and key
154 aeefe835 Iustin Pop
    logging.debug("Writing RAPI certificate at %s", rapicert_file)
155 aeefe835 Iustin Pop
    utils.WriteFile(rapicert_file, data=rapi_cert_pem, backup=True)
156 43575108 Michael Hanselmann
157 43575108 Michael Hanselmann
  elif new_rapi_cert or not rapi_cert_exists:
158 43575108 Michael Hanselmann
    if rapi_cert_exists:
159 aeefe835 Iustin Pop
      utils.CreateBackup(rapicert_file)
160 43575108 Michael Hanselmann
161 aeefe835 Iustin Pop
    logging.debug("Generating new RAPI certificate at %s", rapicert_file)
162 af2ae1c0 Iustin Pop
    utils.GenerateSelfSignedSslCert(rapicert_file)
163 c008906b Michael Hanselmann
164 b6267745 Andrea Spadaccini
  # SPICE
165 b6267745 Andrea Spadaccini
  spice_cert_exists = os.path.exists(spicecert_file)
166 b6267745 Andrea Spadaccini
  spice_cacert_exists = os.path.exists(spicecacert_file)
167 b6267745 Andrea Spadaccini
  if spice_cert_pem:
168 b6267745 Andrea Spadaccini
    # spice_cert_pem implies also spice_cacert_pem
169 b6267745 Andrea Spadaccini
    logging.debug("Writing SPICE certificate at %s", spicecert_file)
170 b6267745 Andrea Spadaccini
    utils.WriteFile(spicecert_file, data=spice_cert_pem, backup=True)
171 b6267745 Andrea Spadaccini
    logging.debug("Writing SPICE CA certificate at %s", spicecacert_file)
172 b6267745 Andrea Spadaccini
    utils.WriteFile(spicecacert_file, data=spice_cacert_pem, backup=True)
173 b6267745 Andrea Spadaccini
  elif new_spice_cert or not spice_cert_exists:
174 b6267745 Andrea Spadaccini
    if spice_cert_exists:
175 b6267745 Andrea Spadaccini
      utils.CreateBackup(spicecert_file)
176 b6267745 Andrea Spadaccini
    if spice_cacert_exists:
177 b6267745 Andrea Spadaccini
      utils.CreateBackup(spicecacert_file)
178 b6267745 Andrea Spadaccini
179 b6267745 Andrea Spadaccini
    logging.debug("Generating new self-signed SPICE certificate at %s",
180 b6267745 Andrea Spadaccini
                  spicecert_file)
181 b6267745 Andrea Spadaccini
    (_, cert_pem) = utils.GenerateSelfSignedSslCert(spicecert_file)
182 b6267745 Andrea Spadaccini
183 b6267745 Andrea Spadaccini
    # Self-signed certificate -> the public certificate is also the CA public
184 b6267745 Andrea Spadaccini
    # certificate
185 b6267745 Andrea Spadaccini
    logging.debug("Writing the public certificate to %s",
186 b6267745 Andrea Spadaccini
                  spicecert_file)
187 b6267745 Andrea Spadaccini
    utils.io.WriteFile(spicecacert_file, mode=0400, data=cert_pem)
188 b6267745 Andrea Spadaccini
189 3db3eb2a Michael Hanselmann
  # Cluster domain secret
190 3db3eb2a Michael Hanselmann
  if cds:
191 fc0726b9 Michael Hanselmann
    logging.debug("Writing cluster domain secret to %s", cds_file)
192 fc0726b9 Michael Hanselmann
    utils.WriteFile(cds_file, data=cds, backup=True)
193 fc0726b9 Michael Hanselmann
194 fc0726b9 Michael Hanselmann
  elif new_cds or not os.path.exists(cds_file):
195 fc0726b9 Michael Hanselmann
    logging.debug("Generating new cluster domain secret at %s", cds_file)
196 fc0726b9 Michael Hanselmann
    GenerateHmacKey(cds_file)
197 3db3eb2a Michael Hanselmann
198 c008906b Michael Hanselmann
199 8f215968 Michael Hanselmann
def _InitGanetiServerSetup(master_name):
  """Bring up the initial node daemon on the master node.

  The cluster crypto material is generated first (requesting a new cluster
  certificate only), then the node daemon is started through the
  daemon-util helper and finally polled until it responds.

  @type master_name: str
  @param master_name: Name of the master node
  @raise errors.OpExecError: if the node daemon could not be started

  """
  # Only the cluster certificate is regenerated unconditionally
  GenerateClusterCrypto(new_cluster_cert=True,
                        new_rapi_cert=False,
                        new_spice_cert=False,
                        new_confd_hmac_key=False,
                        new_cds=False)

  start_cmd = [pathutils.DAEMON_UTIL, "start", constants.NODED]
  started = utils.RunCmd(start_cmd)
  if started.failed:
    details = (started.cmd, started.exit_code, started.output)
    raise errors.OpExecError("Could not start the node daemon, command %s"
                             " had exitcode %s and error %s" % details)

  _WaitForNodeDaemon(master_name)
219 5627f375 Michael Hanselmann
220 5627f375 Michael Hanselmann
221 5627f375 Michael Hanselmann
def _WaitForNodeDaemon(node_name):
  """Block until the node daemon on a node answers a version query.

  The query is repeated through L{utils.Retry}, called with 1.0 and
  L{_DAEMON_READY_TIMEOUT} as its delay and timeout arguments.

  @param node_name: Name of the node whose daemon is queried
  @raise errors.OpExecError: if no successful answer arrived in time

  """
  def _QueryVersion():
    # Pylint bug <http://www.logilab.org/ticket/35642>
    # pylint: disable=E1101
    answers = rpc.BootstrapRunner().call_version([node_name])
    if answers[node_name].fail_msg:
      raise utils.RetryAgain()

  try:
    utils.Retry(_QueryVersion, 1.0, _DAEMON_READY_TIMEOUT)
  except utils.RetryTimeout:
    failure = ("Node daemon on %s didn't answer queries within"
               " %s seconds" % (node_name, _DAEMON_READY_TIMEOUT))
    raise errors.OpExecError(failure)
237 3b6b6129 Michael Hanselmann
238 3b6b6129 Michael Hanselmann
239 3b6b6129 Michael Hanselmann
def _WaitForMasterDaemon():
  """Block until the master daemon answers a configuration query.

  A LUXI client is created on every attempt and asked for the cluster
  name; any exception raised while doing so triggers another attempt.

  @raise errors.OpExecError: if no answer arrived within
      L{_DAEMON_READY_TIMEOUT} seconds

  """
  def _AskClusterName():
    try:
      values = luxi.Client().QueryConfigValues(["cluster_name"])
      (name, ) = values
    except Exception:
      # Any failure is treated as "not ready yet"
      raise utils.RetryAgain()

    logging.debug("Received cluster name %s from master", name)

  try:
    utils.Retry(_AskClusterName, 1.0, _DAEMON_READY_TIMEOUT)
  except utils.RetryTimeout:
    failure = ("Master daemon didn't answer queries within"
               " %s seconds" % _DAEMON_READY_TIMEOUT)
    raise errors.OpExecError(failure)
257 5627f375 Michael Hanselmann
258 a0c9f010 Michael Hanselmann
259 a5da38fa Michael Hanselmann
def _WaitForSshDaemon(hostname, port, family):
  """Block until the SSH daemon on a host accepts TCP connections.

  The host name is resolved once for the given address family; the
  resulting IP address is then pinged on C{port} until it responds.

  @param hostname: Name of the host running the SSH daemon
  @param port: TCP port to probe
  @param family: Address family used for resolving C{hostname}
  @raise errors.OpExecError: if the port did not respond within
      L{_DAEMON_READY_TIMEOUT} seconds

  """
  resolved = netutils.GetHostname(name=hostname, family=family)
  hostip = resolved.ip

  def _ProbePort():
    alive = netutils.TcpPing(hostip, port, timeout=1.0,
                             live_port_needed=True)
    if not alive:
      raise utils.RetryAgain()

    logging.debug("SSH daemon on %s:%s (IP address %s) has become"
                  " responsive", hostname, port, hostip)

  try:
    utils.Retry(_ProbePort, 1.0, _DAEMON_READY_TIMEOUT)
  except utils.RetryTimeout:
    details = (hostname, port, hostip, _DAEMON_READY_TIMEOUT)
    raise errors.OpExecError("SSH daemon on %s:%s (IP address %s) didn't"
                             " become responsive within %s seconds" % details)
278 a5da38fa Michael Hanselmann
279 a5da38fa Michael Hanselmann
280 a698cdbb Michael Hanselmann
def RunNodeSetupCmd(cluster_name, node, basecmd, debug, verbose,
                    use_cluster_key, ask_key, strict_host_check, data):
  """Runs a setup command on a remote machine via SSH.

  The command receives C{data}, serialized as JSON, on its standard input.
  After the command succeeded, the function waits for the SSH daemon on
  the node to respond.

  @type cluster_name: string
  @param cluster_name: Cluster name
  @type node: string
  @param node: Node name
  @type basecmd: string
  @param basecmd: Base command (path on the remote machine)
  @type debug: bool
  @param debug: Enable debug output
  @type verbose: bool
  @param verbose: Enable verbose output
  @type use_cluster_key: bool
  @param use_cluster_key: See L{ssh.SshRunner.BuildCmd}
  @type ask_key: bool
  @param ask_key: See L{ssh.SshRunner.BuildCmd}
  @type strict_host_check: bool
  @param strict_host_check: See L{ssh.SshRunner.BuildCmd}
  @param data: JSON-serializable input data for script (passed to stdin)
  @raise errors.OpExecError: if the remote command failed

  """
  # Forward --debug/--verbose to the remote script when set for this call
  remote_args = [basecmd]
  for (enabled, flag) in [(debug, "--debug"), (verbose, "--verbose")]:
    if enabled:
      remote_args.append(flag)

  family = ssconf.SimpleStore().GetPrimaryIPFamily()
  use_ipv6 = (family == netutils.IP6Address.family)
  runner = ssh.SshRunner(cluster_name, ipv6=use_ipv6)
  quoted_cmd = utils.ShellQuoteArgs(remote_args)
  ssh_cmd = runner.BuildCmd(node, constants.SSH_LOGIN_USER, quoted_cmd,
                            batch=False, ask_key=ask_key, quiet=False,
                            strict_host_check=strict_host_check,
                            use_cluster_key=use_cluster_key)

  # The serialized input is handed over through a temporary file used as
  # the command's input file descriptor
  stdin_file = tempfile.TemporaryFile()
  try:
    stdin_file.write(serializer.DumpJson(data))
    stdin_file.seek(0)

    outcome = utils.RunCmd(ssh_cmd, interactive=True, input_fd=stdin_file)
  finally:
    stdin_file.close()

  if outcome.failed:
    raise errors.OpExecError("Command '%s' failed: %s" %
                             (outcome.cmd, outcome.fail_reason))

  ssh_port = netutils.GetDaemonPort(constants.SSH)
  _WaitForSshDaemon(node, ssh_port, family)
335 a5da38fa Michael Hanselmann
336 a698cdbb Michael Hanselmann
337 0e3baaf3 Iustin Pop
def _InitFileStorage(file_storage_dir):
338 0e3baaf3 Iustin Pop
  """Initialize if needed the file storage.
339 0e3baaf3 Iustin Pop

340 0e3baaf3 Iustin Pop
  @param file_storage_dir: the user-supplied value
341 0e3baaf3 Iustin Pop
  @return: either empty string (if file storage was disabled at build
342 0e3baaf3 Iustin Pop
      time) or the normalized path to the storage directory
343 0e3baaf3 Iustin Pop

344 0e3baaf3 Iustin Pop
  """
345 0e3baaf3 Iustin Pop
  file_storage_dir = os.path.normpath(file_storage_dir)
346 0e3baaf3 Iustin Pop
347 0e3baaf3 Iustin Pop
  if not os.path.isabs(file_storage_dir):
348 0376655e Guido Trotter
    raise errors.OpPrereqError("File storage directory '%s' is not an absolute"
349 0376655e Guido Trotter
                               " path" % file_storage_dir, errors.ECODE_INVAL)
350 0e3baaf3 Iustin Pop
351 0e3baaf3 Iustin Pop
  if not os.path.exists(file_storage_dir):
352 0e3baaf3 Iustin Pop
    try:
353 0e3baaf3 Iustin Pop
      os.makedirs(file_storage_dir, 0750)
354 0e3baaf3 Iustin Pop
    except OSError, err:
355 0e3baaf3 Iustin Pop
      raise errors.OpPrereqError("Cannot create file storage directory"
356 0e3baaf3 Iustin Pop
                                 " '%s': %s" % (file_storage_dir, err),
357 0e3baaf3 Iustin Pop
                                 errors.ECODE_ENVIRON)
358 0e3baaf3 Iustin Pop
359 0e3baaf3 Iustin Pop
  if not os.path.isdir(file_storage_dir):
360 0e3baaf3 Iustin Pop
    raise errors.OpPrereqError("The file storage directory '%s' is not"
361 0e3baaf3 Iustin Pop
                               " a directory." % file_storage_dir,
362 0e3baaf3 Iustin Pop
                               errors.ECODE_ENVIRON)
363 0e3baaf3 Iustin Pop
  return file_storage_dir
364 0e3baaf3 Iustin Pop
365 0e3baaf3 Iustin Pop
366 18bb6d28 Agata Murawska
def InitCluster(cluster_name, mac_prefix, # pylint: disable=R0913, R0914
367 5a8648eb Andrea Spadaccini
                master_netmask, master_netdev, file_storage_dir,
368 5a8648eb Andrea Spadaccini
                shared_file_storage_dir, candidate_pool_size, secondary_ip=None,
369 5a8648eb Andrea Spadaccini
                vg_name=None, beparams=None, nicparams=None, ndparams=None,
370 bc5d0215 Andrea Spadaccini
                hvparams=None, diskparams=None, enabled_hypervisors=None,
371 bc5d0215 Andrea Spadaccini
                modify_etc_hosts=True, modify_ssh_setup=True,
372 bc5d0215 Andrea Spadaccini
                maintain_node_health=False, drbd_helper=None, uid_pool=None,
373 18bb6d28 Agata Murawska
                default_iallocator=None, primary_ip_version=None, ipolicy=None,
374 c4929a8b René Nussbaumer
                prealloc_wipe_disks=False, use_external_mip_script=False,
375 3bde79ee Helga Velroyen
                hv_state=None, disk_state=None, enabled_disk_templates=None):
376 a0c9f010 Michael Hanselmann
  """Initialise the cluster.
377 a0c9f010 Michael Hanselmann

378 ce735215 Guido Trotter
  @type candidate_pool_size: int
379 ce735215 Guido Trotter
  @param candidate_pool_size: master candidate pool size
380 3bde79ee Helga Velroyen
  @type enabled_disk_templates: list of string
381 3bde79ee Helga Velroyen
  @param enabled_disk_templates: list of disk_templates to be used in this
382 c074a9e8 Helga Velroyen
    cluster
383 ce735215 Guido Trotter

384 a0c9f010 Michael Hanselmann
  """
385 ce735215 Guido Trotter
  # TODO: complete the docstring
386 a0c9f010 Michael Hanselmann
  if config.ConfigWriter.IsCluster():
387 debac808 Iustin Pop
    raise errors.OpPrereqError("Cluster is already initialised",
388 debac808 Iustin Pop
                               errors.ECODE_STATE)
389 a0c9f010 Michael Hanselmann
390 b119bccb Guido Trotter
  if not enabled_hypervisors:
391 b119bccb Guido Trotter
    raise errors.OpPrereqError("Enabled hypervisors list must contain at"
392 debac808 Iustin Pop
                               " least one member", errors.ECODE_INVAL)
393 b119bccb Guido Trotter
  invalid_hvs = set(enabled_hypervisors) - constants.HYPER_TYPES
394 b119bccb Guido Trotter
  if invalid_hvs:
395 b119bccb Guido Trotter
    raise errors.OpPrereqError("Enabled hypervisors contains invalid"
396 debac808 Iustin Pop
                               " entries: %s" % invalid_hvs,
397 debac808 Iustin Pop
                               errors.ECODE_INVAL)
398 b119bccb Guido Trotter
399 3bde79ee Helga Velroyen
  if not enabled_disk_templates:
400 3bde79ee Helga Velroyen
    raise errors.OpPrereqError("Enabled disk templates list must contain at"
401 c074a9e8 Helga Velroyen
                               " least one member", errors.ECODE_INVAL)
402 3bde79ee Helga Velroyen
  invalid_disk_templates = \
403 3bde79ee Helga Velroyen
    set(enabled_disk_templates) - constants.DISK_TEMPLATES
404 3bde79ee Helga Velroyen
  if invalid_disk_templates:
405 3bde79ee Helga Velroyen
    raise errors.OpPrereqError("Enabled disk templates list contains invalid"
406 3bde79ee Helga Velroyen
                               " entries: %s" % invalid_disk_templates,
407 c074a9e8 Helga Velroyen
                               errors.ECODE_INVAL)
408 c074a9e8 Helga Velroyen
409 5a8648eb Andrea Spadaccini
  try:
410 5a8648eb Andrea Spadaccini
    ipcls = netutils.IPAddress.GetClassFromIpVersion(primary_ip_version)
411 5a8648eb Andrea Spadaccini
  except errors.ProgrammerError:
412 2f20d07b Manuel Franceschini
    raise errors.OpPrereqError("Invalid primary ip version: %d." %
413 2cfbc784 Iustin Pop
                               primary_ip_version, errors.ECODE_INVAL)
414 2f20d07b Manuel Franceschini
415 2f20d07b Manuel Franceschini
  hostname = netutils.GetHostname(family=ipcls.family)
416 2f20d07b Manuel Franceschini
  if not ipcls.IsValid(hostname.ip):
417 2f20d07b Manuel Franceschini
    raise errors.OpPrereqError("This host's IP (%s) is not a valid IPv%d"
418 2cfbc784 Iustin Pop
                               " address." % (hostname.ip, primary_ip_version),
419 2cfbc784 Iustin Pop
                               errors.ECODE_INVAL)
420 2f20d07b Manuel Franceschini
421 2f20d07b Manuel Franceschini
  if ipcls.IsLoopback(hostname.ip):
422 8b312c1d Manuel Franceschini
    raise errors.OpPrereqError("This host's IP (%s) resolves to a loopback"
423 8b312c1d Manuel Franceschini
                               " address. Please fix DNS or %s." %
424 ee045466 Michael Hanselmann
                               (hostname.ip, pathutils.ETC_HOSTS),
425 debac808 Iustin Pop
                               errors.ECODE_ENVIRON)
426 a0c9f010 Michael Hanselmann
427 2f20d07b Manuel Franceschini
  if not ipcls.Own(hostname.ip):
428 a0c9f010 Michael Hanselmann
    raise errors.OpPrereqError("Inconsistency: this host's name resolves"
429 a0c9f010 Michael Hanselmann
                               " to %s,\nbut this ip address does not"
430 7c4c22f5 Manuel Franceschini
                               " belong to this host" %
431 debac808 Iustin Pop
                               hostname.ip, errors.ECODE_ENVIRON)
432 a0c9f010 Michael Hanselmann
433 2f20d07b Manuel Franceschini
  clustername = netutils.GetHostname(name=cluster_name, family=ipcls.family)
434 a0c9f010 Michael Hanselmann
435 2f20d07b Manuel Franceschini
  if netutils.TcpPing(clustername.ip, constants.DEFAULT_NODED_PORT, timeout=5):
436 7c4c22f5 Manuel Franceschini
    raise errors.OpPrereqError("Cluster IP already active",
437 debac808 Iustin Pop
                               errors.ECODE_NOTUNIQUE)
438 a0c9f010 Michael Hanselmann
439 2f20d07b Manuel Franceschini
  if not secondary_ip:
440 2f20d07b Manuel Franceschini
    if primary_ip_version == constants.IP6_VERSION:
441 2f20d07b Manuel Franceschini
      raise errors.OpPrereqError("When using a IPv6 primary address, a valid"
442 7c4c22f5 Manuel Franceschini
                                 " IPv4 address must be given as secondary",
443 7c4c22f5 Manuel Franceschini
                                 errors.ECODE_INVAL)
444 b9eeeb02 Michael Hanselmann
    secondary_ip = hostname.ip
445 a0c9f010 Michael Hanselmann
446 2f20d07b Manuel Franceschini
  if not netutils.IP4Address.IsValid(secondary_ip):
447 2f20d07b Manuel Franceschini
    raise errors.OpPrereqError("Secondary IP address (%s) has to be a valid"
448 2f20d07b Manuel Franceschini
                               " IPv4 address." % secondary_ip,
449 2f20d07b Manuel Franceschini
                               errors.ECODE_INVAL)
450 2f20d07b Manuel Franceschini
451 2f20d07b Manuel Franceschini
  if not netutils.IP4Address.Own(secondary_ip):
452 2f20d07b Manuel Franceschini
    raise errors.OpPrereqError("You gave %s as secondary IP,"
453 2f20d07b Manuel Franceschini
                               " but it does not belong to this host." %
454 2f20d07b Manuel Franceschini
                               secondary_ip, errors.ECODE_ENVIRON)
455 2f20d07b Manuel Franceschini
456 5a8648eb Andrea Spadaccini
  if master_netmask is not None:
457 5a8648eb Andrea Spadaccini
    if not ipcls.ValidateNetmask(master_netmask):
458 5a8648eb Andrea Spadaccini
      raise errors.OpPrereqError("CIDR netmask (%s) not valid for IPv%s " %
459 2cfbc784 Iustin Pop
                                  (master_netmask, primary_ip_version),
460 2cfbc784 Iustin Pop
                                 errors.ECODE_INVAL)
461 5a8648eb Andrea Spadaccini
  else:
462 5a8648eb Andrea Spadaccini
    master_netmask = ipcls.iplen
463 5a8648eb Andrea Spadaccini
464 a0c9f010 Michael Hanselmann
  if vg_name is not None:
465 a0c9f010 Michael Hanselmann
    # Check if volume group is valid
466 a0c9f010 Michael Hanselmann
    vgstatus = utils.CheckVolumeGroupSize(utils.ListVolumeGroups(), vg_name,
467 a0c9f010 Michael Hanselmann
                                          constants.MIN_VG_SIZE)
468 a0c9f010 Michael Hanselmann
    if vgstatus:
469 a0c9f010 Michael Hanselmann
      raise errors.OpPrereqError("Error: %s\nspecify --no-lvm-storage if"
470 debac808 Iustin Pop
                                 " you are not using lvm" % vgstatus,
471 debac808 Iustin Pop
                                 errors.ECODE_INVAL)
472 a0c9f010 Michael Hanselmann
473 a721e23a Luca Bigliardi
  if drbd_helper is not None:
474 a721e23a Luca Bigliardi
    try:
475 a721e23a Luca Bigliardi
      curr_helper = bdev.BaseDRBD.GetUsermodeHelper()
476 a721e23a Luca Bigliardi
    except errors.BlockDeviceError, err:
477 a721e23a Luca Bigliardi
      raise errors.OpPrereqError("Error while checking drbd helper"
478 a721e23a Luca Bigliardi
                                 " (specify --no-drbd-storage if you are not"
479 a721e23a Luca Bigliardi
                                 " using drbd): %s" % str(err),
480 a721e23a Luca Bigliardi
                                 errors.ECODE_ENVIRON)
481 a721e23a Luca Bigliardi
    if drbd_helper != curr_helper:
482 a721e23a Luca Bigliardi
      raise errors.OpPrereqError("Error: requiring %s as drbd helper but %s"
483 a721e23a Luca Bigliardi
                                 " is the current helper" % (drbd_helper,
484 a721e23a Luca Bigliardi
                                                             curr_helper),
485 a721e23a Luca Bigliardi
                                 errors.ECODE_INVAL)
486 a721e23a Luca Bigliardi
487 32ba31be Michael Hanselmann
  logging.debug("Stopping daemons (if any are running)")
488 32ba31be Michael Hanselmann
  result = utils.RunCmd([pathutils.DAEMON_UTIL, "stop-all"])
489 32ba31be Michael Hanselmann
  if result.failed:
490 32ba31be Michael Hanselmann
    raise errors.OpExecError("Could not stop daemons, command %s"
491 32ba31be Michael Hanselmann
                             " had exitcode %s and error '%s'" %
492 32ba31be Michael Hanselmann
                             (result.cmd, result.exit_code, result.output))
493 32ba31be Michael Hanselmann
494 0376655e Guido Trotter
  if constants.ENABLE_FILE_STORAGE:
495 0376655e Guido Trotter
    file_storage_dir = _InitFileStorage(file_storage_dir)
496 0376655e Guido Trotter
  else:
497 0376655e Guido Trotter
    file_storage_dir = ""
498 0376655e Guido Trotter
499 0376655e Guido Trotter
  if constants.ENABLE_SHARED_FILE_STORAGE:
500 0376655e Guido Trotter
    shared_file_storage_dir = _InitFileStorage(shared_file_storage_dir)
501 0376655e Guido Trotter
  else:
502 0376655e Guido Trotter
    shared_file_storage_dir = ""
503 a0c9f010 Michael Hanselmann
504 a0c9f010 Michael Hanselmann
  if not re.match("^[0-9a-z]{2}:[0-9a-z]{2}:[0-9a-z]{2}$", mac_prefix):
505 debac808 Iustin Pop
    raise errors.OpPrereqError("Invalid mac prefix given '%s'" % mac_prefix,
506 debac808 Iustin Pop
                               errors.ECODE_INVAL)
507 a0c9f010 Michael Hanselmann
508 a0c9f010 Michael Hanselmann
  result = utils.RunCmd(["ip", "link", "show", "dev", master_netdev])
509 a0c9f010 Michael Hanselmann
  if result.failed:
510 a0c9f010 Michael Hanselmann
    raise errors.OpPrereqError("Invalid master netdev given (%s): '%s'" %
511 a0c9f010 Michael Hanselmann
                               (master_netdev,
512 debac808 Iustin Pop
                                result.output.strip()), errors.ECODE_INVAL)
513 a0c9f010 Michael Hanselmann
514 7ede9c6a Michael Hanselmann
  dirs = [(pathutils.RUN_DIR, constants.RUN_DIRS_MODE)]
515 9dae41ad Guido Trotter
  utils.EnsureDirs(dirs)
516 9dae41ad Guido Trotter
517 b2e233a5 Guido Trotter
  objects.UpgradeBeParams(beparams)
518 a5728081 Guido Trotter
  utils.ForceDictType(beparams, constants.BES_PARAMETER_TYPES)
519 b6a30b0d Guido Trotter
  utils.ForceDictType(nicparams, constants.NICS_PARAMETER_TYPES)
520 18bb6d28 Agata Murawska
521 b6a30b0d Guido Trotter
  objects.NIC.CheckParameterSyntax(nicparams)
522 57dc299a Iustin Pop
523 2cc673a3 Iustin Pop
  full_ipolicy = objects.FillIPolicy(constants.IPOLICY_DEFAULTS, ipolicy)
524 b6a30b0d Guido Trotter
525 6204ee71 Renรฉ Nussbaumer
  if ndparams is not None:
526 6204ee71 Renรฉ Nussbaumer
    utils.ForceDictType(ndparams, constants.NDS_PARAMETER_TYPES)
527 6204ee71 Renรฉ Nussbaumer
  else:
528 6204ee71 Renรฉ Nussbaumer
    ndparams = dict(constants.NDC_DEFAULTS)
529 6204ee71 Renรฉ Nussbaumer
530 c4929a8b Renรฉ Nussbaumer
  # This is ugly, as we modify the dict itself
531 57dc299a Iustin Pop
  # FIXME: Make utils.ForceDictType pure functional or write a wrapper
532 57dc299a Iustin Pop
  # around it
533 c4929a8b Renรฉ Nussbaumer
  if hv_state:
534 c4929a8b Renรฉ Nussbaumer
    for hvname, hvs_data in hv_state.items():
535 c4929a8b Renรฉ Nussbaumer
      utils.ForceDictType(hvs_data, constants.HVSTS_PARAMETER_TYPES)
536 c4929a8b Renรฉ Nussbaumer
      hv_state[hvname] = objects.Cluster.SimpleFillHvState(hvs_data)
537 c4929a8b Renรฉ Nussbaumer
  else:
538 c4929a8b Renรฉ Nussbaumer
    hv_state = dict((hvname, constants.HVST_DEFAULTS)
539 c4929a8b Renรฉ Nussbaumer
                    for hvname in enabled_hypervisors)
540 c4929a8b Renรฉ Nussbaumer
541 c4929a8b Renรฉ Nussbaumer
  # FIXME: disk_state has no default values yet
542 c4929a8b Renรฉ Nussbaumer
  if disk_state:
543 c4929a8b Renรฉ Nussbaumer
    for storage, ds_data in disk_state.items():
544 c4929a8b Renรฉ Nussbaumer
      if storage not in constants.DS_VALID_TYPES:
545 c4929a8b Renรฉ Nussbaumer
        raise errors.OpPrereqError("Invalid storage type in disk state: %s" %
546 c4929a8b Renรฉ Nussbaumer
                                   storage, errors.ECODE_INVAL)
547 c4929a8b Renรฉ Nussbaumer
      for ds_name, state in ds_data.items():
548 c4929a8b Renรฉ Nussbaumer
        utils.ForceDictType(state, constants.DSS_PARAMETER_TYPES)
549 c4929a8b Renรฉ Nussbaumer
        ds_data[ds_name] = objects.Cluster.SimpleFillDiskState(state)
550 c4929a8b Renรฉ Nussbaumer
551 a5728081 Guido Trotter
  # hvparams is a mapping of hypervisor->hvparams dict
552 a5728081 Guido Trotter
  for hv_name, hv_params in hvparams.iteritems():
553 a5728081 Guido Trotter
    utils.ForceDictType(hv_params, constants.HVS_PARAMETER_TYPES)
554 a5728081 Guido Trotter
    hv_class = hypervisor.GetHypervisor(hv_name)
555 a5728081 Guido Trotter
    hv_class.CheckParameterSyntax(hv_params)
556 d4b72030 Guido Trotter
557 bc5d0215 Andrea Spadaccini
  # diskparams is a mapping of disk-template->diskparams dict
558 bc5d0215 Andrea Spadaccini
  for template, dt_params in diskparams.items():
559 bc5d0215 Andrea Spadaccini
    param_keys = set(dt_params.keys())
560 bc5d0215 Andrea Spadaccini
    default_param_keys = set(constants.DISK_DT_DEFAULTS[template].keys())
561 bc5d0215 Andrea Spadaccini
    if not (param_keys <= default_param_keys):
562 bc5d0215 Andrea Spadaccini
      unknown_params = param_keys - default_param_keys
563 bc5d0215 Andrea Spadaccini
      raise errors.OpPrereqError("Invalid parameters for disk template %s:"
564 bc5d0215 Andrea Spadaccini
                                 " %s" % (template,
565 2cfbc784 Iustin Pop
                                          utils.CommaJoin(unknown_params)),
566 2cfbc784 Iustin Pop
                                 errors.ECODE_INVAL)
567 bc5d0215 Andrea Spadaccini
    utils.ForceDictType(dt_params, constants.DISK_DT_TYPES)
568 35c48839 Michele Tartara
    if template == constants.DT_DRBD8 and vg_name is not None:
569 35c48839 Michele Tartara
      # The default METAVG value is equal to the VG name set at init time,
570 35c48839 Michele Tartara
      # if provided
571 35c48839 Michele Tartara
      dt_params[constants.DRBD_DEFAULT_METAVG] = vg_name
572 35c48839 Michele Tartara
573 e4a4391d Renรฉ Nussbaumer
  try:
574 e4a4391d Renรฉ Nussbaumer
    utils.VerifyDictOptions(diskparams, constants.DISK_DT_DEFAULTS)
575 e4a4391d Renรฉ Nussbaumer
  except errors.OpPrereqError, err:
576 e4a4391d Renรฉ Nussbaumer
    raise errors.OpPrereqError("While verify diskparam options: %s" % err,
577 e4a4391d Renรฉ Nussbaumer
                               errors.ECODE_INVAL)
578 bc5d0215 Andrea Spadaccini
579 a0c9f010 Michael Hanselmann
  # set up ssh config and /etc/hosts
580 7ede9c6a Michael Hanselmann
  sshline = utils.ReadFile(pathutils.SSH_HOST_RSA_PUB)
581 a0c9f010 Michael Hanselmann
  sshkey = sshline.split(" ")[1]
582 a0c9f010 Michael Hanselmann
583 b86a6bcd Guido Trotter
  if modify_etc_hosts:
584 ea8ac9c9 Renรฉ Nussbaumer
    utils.AddHostToEtcHosts(hostname.name, hostname.ip)
585 b86a6bcd Guido Trotter
586 b989b9d9 Ken Wehr
  if modify_ssh_setup:
587 b989b9d9 Ken Wehr
    _InitSSHSetup()
588 a0c9f010 Michael Hanselmann
589 bf4af505 Apollon Oikonomopoulos
  if default_iallocator is not None:
590 bf4af505 Apollon Oikonomopoulos
    alloc_script = utils.FindFile(default_iallocator,
591 bf4af505 Apollon Oikonomopoulos
                                  constants.IALLOCATOR_SEARCH_PATH,
592 bf4af505 Apollon Oikonomopoulos
                                  os.path.isfile)
593 bf4af505 Apollon Oikonomopoulos
    if alloc_script is None:
594 bf4af505 Apollon Oikonomopoulos
      raise errors.OpPrereqError("Invalid default iallocator script '%s'"
595 bf4af505 Apollon Oikonomopoulos
                                 " specified" % default_iallocator,
596 bf4af505 Apollon Oikonomopoulos
                                 errors.ECODE_INVAL)
597 d1e9c98d Iustin Pop
  elif constants.HTOOLS:
598 d1e9c98d Iustin Pop
    # htools was enabled at build-time, we default to it
599 d1e9c98d Iustin Pop
    if utils.FindFile(constants.IALLOC_HAIL,
600 d1e9c98d Iustin Pop
                      constants.IALLOCATOR_SEARCH_PATH,
601 d1e9c98d Iustin Pop
                      os.path.isfile):
602 d1e9c98d Iustin Pop
      default_iallocator = constants.IALLOC_HAIL
603 bf4af505 Apollon Oikonomopoulos
604 430b923c Iustin Pop
  now = time.time()
605 430b923c Iustin Pop
606 a0c9f010 Michael Hanselmann
  # init of cluster config file
607 b9eeeb02 Michael Hanselmann
  cluster_config = objects.Cluster(
608 b9eeeb02 Michael Hanselmann
    serial_no=1,
609 b9eeeb02 Michael Hanselmann
    rsahostkeypub=sshkey,
610 b9eeeb02 Michael Hanselmann
    highest_used_port=(constants.FIRST_DRBD_PORT - 1),
611 b9eeeb02 Michael Hanselmann
    mac_prefix=mac_prefix,
612 b9eeeb02 Michael Hanselmann
    volume_group_name=vg_name,
613 b9eeeb02 Michael Hanselmann
    tcpudp_port_pool=set(),
614 f6bd6e98 Michael Hanselmann
    master_node=hostname.name,
615 f6bd6e98 Michael Hanselmann
    master_ip=clustername.ip,
616 5a8648eb Andrea Spadaccini
    master_netmask=master_netmask,
617 f6bd6e98 Michael Hanselmann
    master_netdev=master_netdev,
618 f6bd6e98 Michael Hanselmann
    cluster_name=clustername.name,
619 f6bd6e98 Michael Hanselmann
    file_storage_dir=file_storage_dir,
620 4b97f902 Apollon Oikonomopoulos
    shared_file_storage_dir=shared_file_storage_dir,
621 ea3a925f Alexander Schreiber
    enabled_hypervisors=enabled_hypervisors,
622 4ef7f423 Guido Trotter
    beparams={constants.PP_DEFAULT: beparams},
623 b6a30b0d Guido Trotter
    nicparams={constants.PP_DEFAULT: nicparams},
624 6204ee71 Renรฉ Nussbaumer
    ndparams=ndparams,
625 ea3a925f Alexander Schreiber
    hvparams=hvparams,
626 bc5d0215 Andrea Spadaccini
    diskparams=diskparams,
627 ce735215 Guido Trotter
    candidate_pool_size=candidate_pool_size,
628 022c3a0b Guido Trotter
    modify_etc_hosts=modify_etc_hosts,
629 b989b9d9 Ken Wehr
    modify_ssh_setup=modify_ssh_setup,
630 39b0f0c2 Balazs Lecz
    uid_pool=uid_pool,
631 430b923c Iustin Pop
    ctime=now,
632 430b923c Iustin Pop
    mtime=now,
633 3953242f Iustin Pop
    maintain_node_health=maintain_node_health,
634 a721e23a Luca Bigliardi
    drbd_usermode_helper=drbd_helper,
635 bf4af505 Apollon Oikonomopoulos
    default_iallocator=default_iallocator,
636 2f20d07b Manuel Franceschini
    primary_ip_family=ipcls.family,
637 3d914585 Renรฉ Nussbaumer
    prealloc_wipe_disks=prealloc_wipe_disks,
638 bf689b7a Andrea Spadaccini
    use_external_mip_script=use_external_mip_script,
639 57dc299a Iustin Pop
    ipolicy=full_ipolicy,
640 c4929a8b Renรฉ Nussbaumer
    hv_state_static=hv_state,
641 c4929a8b Renรฉ Nussbaumer
    disk_state_static=disk_state,
642 3bde79ee Helga Velroyen
    enabled_disk_templates=enabled_disk_templates,
643 b9eeeb02 Michael Hanselmann
    )
644 b9eeeb02 Michael Hanselmann
  master_node_config = objects.Node(name=hostname.name,
645 b9eeeb02 Michael Hanselmann
                                    primary_ip=hostname.ip,
646 b9222f32 Guido Trotter
                                    secondary_ip=secondary_ip,
647 c044f32c Guido Trotter
                                    serial_no=1,
648 c044f32c Guido Trotter
                                    master_candidate=True,
649 af64c0ea Iustin Pop
                                    offline=False, drained=False,
650 435e4bd6 Michael Hanselmann
                                    ctime=now, mtime=now,
651 c044f32c Guido Trotter
                                    )
652 9e1333b9 Guido Trotter
  InitConfig(constants.CONFIG_VERSION, cluster_config, master_node_config)
653 d367b66c Manuel Franceschini
  cfg = config.ConfigWriter(offline=True)
654 7ede9c6a Michael Hanselmann
  ssh.WriteKnownHostsFile(cfg, pathutils.SSH_KNOWN_HOSTS_FILE)
655 a4eae71f Michael Hanselmann
  cfg.Update(cfg.GetClusterInfo(), logging.error)
656 ee501db1 Michael Hanselmann
  ssconf.WriteSsconfFiles(cfg.GetSsconfValues())
657 d367b66c Manuel Franceschini
658 d367b66c Manuel Franceschini
  # set up the inter-node password and certificate
659 d367b66c Manuel Franceschini
  _InitGanetiServerSetup(hostname.name)
660 827f753e Guido Trotter
661 952d7515 Michael Hanselmann
  logging.debug("Starting daemons")
662 7ede9c6a Michael Hanselmann
  result = utils.RunCmd([pathutils.DAEMON_UTIL, "start-all"])
663 952d7515 Michael Hanselmann
  if result.failed:
664 952d7515 Michael Hanselmann
    raise errors.OpExecError("Could not start daemons, command %s"
665 952d7515 Michael Hanselmann
                             " had exitcode %s and error %s" %
666 952d7515 Michael Hanselmann
                             (result.cmd, result.exit_code, result.output))
667 b3f1cf6f Iustin Pop
668 3b6b6129 Michael Hanselmann
  _WaitForMasterDaemon()
669 b3f1cf6f Iustin Pop
670 b1b6ea87 Iustin Pop
671 02f99608 Oleksiy Mishchenko
def InitConfig(version, cluster_config, master_node_config,
               cfg_file=pathutils.CLUSTER_CONF_FILE):
  """Write the very first configuration file of a new cluster.

  The resulting configuration holds a single node (the given master
  node), a single node group whose only member is that node, and
  neither instances nor networks. Both C{cluster_config} and
  C{master_node_config} get a freshly generated C{uuid} assigned in
  place before being serialized.

  @type version: int
  @param version: configuration version
  @type cluster_config: L{objects.Cluster}
  @param cluster_config: cluster configuration
  @type master_node_config: L{objects.Node}
  @param master_node_config: master node configuration
  @type cfg_file: string
  @param cfg_file: configuration file path

  """
  reservations = config.TemporaryReservationManager()

  def _FreshUuid():
    # All UUIDs come from the same reservation manager and context id
    return reservations.Generate([], utils.NewUUID, _INITCONF_ECID)

  cluster_config.uuid = _FreshUuid()
  master_node_config.uuid = _FreshUuid()

  master_name = master_node_config.name
  initial_group = objects.NodeGroup(
    uuid=_FreshUuid(),
    name=constants.INITIAL_NODE_GROUP_NAME,
    members=[master_name],
    diskparams={},
    )

  timestamp = time.time()
  initial_config = objects.ConfigData(
    version=version,
    cluster=cluster_config,
    nodegroups={initial_group.uuid: initial_group},
    nodes={master_name: master_node_config},
    instances={},
    networks={},
    serial_no=1,
    ctime=timestamp,
    mtime=timestamp,
    )

  # The file is created readable and writable by its owner only
  serialized = serializer.Dump(initial_config.ToDict())
  utils.WriteFile(cfg_file, data=serialized, mode=0o600)
717 02f99608 Oleksiy Mishchenko
718 02f99608 Oleksiy Mishchenko
719 140aa4a8 Iustin Pop
def FinalizeClusterDestroy(master):
  """Run the closing steps of a cluster destroy.

  This completes the destroy begun in cmdlib.LUDestroyOpcode. Using the
  bootstrap RPC runner it, in this order, deactivates the master IP,
  stops the master role and asks the node to leave the cluster. Every
  step is best-effort: a reported failure is only logged as a warning
  and the following steps are still attempted.

  @param master: the master node; used as the target of all three RPC
      calls and stored as C{name} in the master network parameters

  """
  config_writer = config.ConfigWriter()
  cleanup_ssh = config_writer.GetClusterInfo().modify_ssh_setup
  bootstrap_rpc = rpc.BootstrapRunner()

  net_params = config_writer.GetMasterNetworkParameters()
  net_params.name = master
  use_external_script = config_writer.GetUseExternalMipScript()

  # Step 1: take down the master IP
  ip_failure = bootstrap_rpc.call_node_deactivate_master_ip(
    net_params.name, net_params, use_external_script).fail_msg
  if ip_failure:
    logging.warning("Could not disable the master IP: %s", ip_failure)

  # Step 2: stop the master role
  role_failure = bootstrap_rpc.call_node_stop_master(master).fail_msg
  if role_failure:
    logging.warning("Could not disable the master role: %s", role_failure)

  # Step 3: make the node leave the cluster
  leave_failure = bootstrap_rpc.call_node_leave_cluster(
    master, cleanup_ssh).fail_msg
  if leave_failure:
    logging.warning("Could not shutdown the node daemon and cleanup"
                    " the node: %s", leave_failure)
750 140aa4a8 Iustin Pop
751 140aa4a8 Iustin Pop
752 7b8ba235 Michael Hanselmann
def SetupNodeDaemon(opts, cluster_name, node):
  """Prepare a new node so that it can be added to the cluster.

  This function must be called before the actual opcode. It runs the
  node daemon setup command for the new node, handing it the cluster
  name, the node daemon certificate and the current ssconf values and
  requesting that the node daemon be started; afterwards it waits for
  the node daemon, so that the master can do the rest via normal rpc
  calls.

  @param opts: the options object; its C{debug}, C{verbose} and
      C{ssh_key_check} attributes are read
  @param cluster_name: the cluster name
  @param node: the name of the new node

  """
  noded_certificate = utils.ReadFile(pathutils.NODED_CERT_FILE)
  ssconf_values = ssconf.SimpleStore().ReadAll()

  setup_data = {
    constants.NDS_CLUSTER_NAME: cluster_name,
    constants.NDS_NODE_DAEMON_CERTIFICATE: noded_certificate,
    constants.NDS_SSCONF: ssconf_values,
    constants.NDS_START_NODE_DAEMON: True,
    }

  # The same ssh_key_check option is passed for two consecutive
  # positional arguments of the setup command
  key_check = opts.ssh_key_check
  RunNodeSetupCmd(cluster_name, node, pathutils.NODE_DAEMON_SETUP,
                  opts.debug, opts.verbose,
                  True, key_check, key_check, setup_data)

  _WaitForNodeDaemon(node)
776 5627f375 Michael Hanselmann
777 b1b6ea87 Iustin Pop
778 8e2524c3 Guido Trotter
def MasterFailover(no_voting=False):
  """Make the node this is run on the new cluster master.

  First a number of checks are done: the local node must not be the
  master already, it must be a master candidate and, unless
  C{no_voting} is set, the other nodes must agree on who the current
  master is. Then the configuration is updated to name the local node
  as master, the old master gets its master IP deactivated and its
  master role stopped, and finally the master daemons are started on
  the new master.

  @type no_voting: boolean
  @param no_voting: force the operation without remote nodes agreement
                      (dangerous)
  @rtype: int
  @return: 0 on success, 1 if the configuration could not be updated or
      if starting the master daemons on the new master failed
  @raise errors.OpPrereqError: if one of the initial checks fails

  """
  store = ssconf.SimpleStore()

  (current_master, this_node) = ssconf.GetMasterAndMyself(store)
  all_nodes = store.GetNodeList()
  candidates = store.GetMasterCandidates()

  if current_master == this_node:
    raise errors.OpPrereqError("This commands must be run on the node"
                               " where you want the new master to be."
                               " %s is already the master" %
                               current_master, errors.ECODE_INVAL)

  if this_node not in candidates:
    # The current master is left out of the list shown to the user
    shown_candidates = "\n".join(name for name in candidates
                                 if name != current_master)
    raise errors.OpPrereqError("This node is not among the nodes marked"
                               " as master candidates. Only these nodes"
                               " can become masters. Current list of"
                               " master candidates is:\n"
                               "%s" % shown_candidates,
                               errors.ECODE_STATE)

  if not no_voting:
    votes = GatherMasterVotes(all_nodes)

    # An empty result means there was nobody to ask, nothing to verify
    if votes:
      winner = votes[0][0]
      if winner is None:
        raise errors.OpPrereqError("Cluster is inconsistent, most nodes did"
                                   " not respond.", errors.ECODE_ENVIRON)
      if winner != current_master:
        raise errors.OpPrereqError("I have a wrong configuration, I believe"
                                   " the master is %s but the other nodes"
                                   " voted %s. Please resync the configuration"
                                   " of this node." %
                                   (current_master, winner),
                                   errors.ECODE_STATE)
  # end checks

  logging.info("Setting master to %s, old master: %s",
               this_node, current_master)

  try:
    # instantiate a real config writer, as we now know we have the
    # configuration data
    cfg = config.ConfigWriter(accept_foreign=True)

    cluster = cfg.GetClusterInfo()
    cluster.master_node = this_node
    # this will also regenerate the ssconf files, since we updated the
    # cluster info
    cfg.Update(cluster, logging.error)
  except errors.ConfigurationError as err:
    logging.error("Error while trying to set the new master: %s",
                  str(err))
    return 1

  # if cfg.Update worked, then it means the old master daemon won't be
  # able now to write its own config file (we rely on locking in both
  # backend.UploadFile() and ConfigWriter._Write()); hence the next
  # step is to kill the old master

  logging.info("Stopping the master daemon on node %s", current_master)

  bootstrap_rpc = rpc.BootstrapRunner()
  net_params = cfg.GetMasterNetworkParameters()
  net_params.name = current_master
  use_external_script = cfg.GetUseExternalMipScript()

  ip_failure = bootstrap_rpc.call_node_deactivate_master_ip(
    net_params.name, net_params, use_external_script).fail_msg
  if ip_failure:
    logging.warning("Could not disable the master IP: %s", ip_failure)

  stop_failure = bootstrap_rpc.call_node_stop_master(current_master).fail_msg
  if stop_failure:
    logging.error("Could not disable the master role on the old master"
                  " %s, please disable manually: %s",
                  current_master, stop_failure)

  logging.info("Checking master IP non-reachability...")

  master_ip = store.GetMasterIP()
  total_timeout = 30

  # Here we have a phase where no master should be running
  def _EnsureMasterIpDown():
    # Keep retrying for as long as the node daemon port still answers
    if netutils.TcpPing(master_ip, constants.DEFAULT_NODED_PORT):
      raise utils.RetryAgain()

  try:
    utils.Retry(_EnsureMasterIpDown, (1, 1.5, 5), total_timeout)
  except utils.RetryTimeout:
    logging.warning("The master IP is still reachable after %s seconds,"
                    " continuing but activating the master on the current"
                    " node will probably fail", total_timeout)

  if jstore.CheckDrainFlag():
    logging.info("Undraining job queue")
    jstore.SetDrainFlag(False)

  logging.info("Starting the master daemons on the new master")

  start_failure = rpc.BootstrapRunner().call_node_start_master_daemons(
    this_node, no_voting).fail_msg
  if start_failure:
    logging.error("Could not start the master role on the new master"
                  " %s, please check: %s", this_node, start_failure)
    exit_code = 1
  else:
    exit_code = 0

  logging.info("Master failed over from %s to %s", current_master, this_node)
  return exit_code
904 d7cdb55d Iustin Pop
905 d7cdb55d Iustin Pop
906 8eb148ae Iustin Pop
def GetMaster():
  """Return the current master node.

  gnt-cluster needs this information; rather than having it import
  ssconf directly, the lookup is wrapped here in bootstrap, which uses
  ssconf in other functions anyway.

  @return: the first element of the pair returned by
      L{ssconf.GetMasterAndMyself}

  """
  # Only the master is of interest, the local node is discarded
  (current_master, _) = ssconf.GetMasterAndMyself(ssconf.SimpleStore())
  return current_master
920 8eb148ae Iustin Pop
921 8eb148ae Iustin Pop
922 d7cdb55d Iustin Pop
def GatherMasterVotes(node_list):
  """Check the agreement on who is the master.

  This function will return a list of (node, number of votes), ordered
  by decreasing number of votes. Nodes that reported an RPC failure or
  returned malformed data are counted under the key C{None}.

  Note that the sum of votes is the number of nodes this machine
  knows, whereas the number of entries in the list could be different
  (if some nodes vote for another master).

  We remove ourselves from the list since we know that (bugs aside)
  since we use the same source for configuration information for both
  backend and bootstrap, we'll always vote for ourselves.

  @type node_list: list
  @param node_list: the list of nodes to query for master info; the current
      node will be removed if it is in the list (the list is modified
      in place)
  @rtype: list
  @return: list of (node, votes); empty if no nodes are left to query,
      and C{[(None, len(node_list))]} if the RPC layer did not return a
      dictionary

  """
  myself = netutils.Hostname.GetSysName()
  try:
    node_list.remove(myself)
  except ValueError:
    # we were not part of the list, nothing to remove
    pass
  if not node_list:
    # no nodes left (possibly after removing myself)
    return []

  results = rpc.BootstrapRunner().call_master_info(node_list)
  if not isinstance(results, dict):
    # this should not happen (unless internal error in rpc)
    logging.critical("Can't complete rpc call, aborting master startup")
    return [(None, len(node_list))]

  votes = {}
  for (node, nres) in results.items():
    data = nres.payload
    msg = nres.fail_msg
    if msg:
      logging.warning("Error contacting node %s: %s", node, msg)
      voted_for = None
    # replies of length 3, 4 or 5 are accepted (data[3] is the primary ip
    # version and data[4] is the master netmask); only data[2] is used here
    elif not isinstance(data, (tuple, list)) or len(data) < 3:
      logging.warning("Invalid data received from node %s: %s", node, data)
      voted_for = None
    else:
      voted_for = data[2]
    votes[voted_for] = votes.get(voted_for, 0) + 1

  # Sort first on number of votes, then on name, since we want None
  # sorted later if we have half of the nodes not responding, and half
  # voting all for the same master. The explicit "is not None" element
  # settles that tie without ever comparing None against a node name,
  # which would raise TypeError on Python 3.
  return sorted(votes.items(),
                key=lambda x: (x[1], x[0] is not None, x[0]),
                reverse=True)