Statistics
| Branch: | Tag: | Revision:

root / lib / bootstrap.py @ bbfa259c

History | View | Annotate | Download (36 kB)

1 a0c9f010 Michael Hanselmann
#
2 a0c9f010 Michael Hanselmann
#
3 a0c9f010 Michael Hanselmann
4 57dc299a Iustin Pop
# Copyright (C) 2006, 2007, 2008, 2010, 2011, 2012 Google Inc.
5 a0c9f010 Michael Hanselmann
#
6 a0c9f010 Michael Hanselmann
# This program is free software; you can redistribute it and/or modify
7 a0c9f010 Michael Hanselmann
# it under the terms of the GNU General Public License as published by
8 a0c9f010 Michael Hanselmann
# the Free Software Foundation; either version 2 of the License, or
9 a0c9f010 Michael Hanselmann
# (at your option) any later version.
10 a0c9f010 Michael Hanselmann
#
11 a0c9f010 Michael Hanselmann
# This program is distributed in the hope that it will be useful, but
12 a0c9f010 Michael Hanselmann
# WITHOUT ANY WARRANTY; without even the implied warranty of
13 a0c9f010 Michael Hanselmann
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
14 a0c9f010 Michael Hanselmann
# General Public License for more details.
15 a0c9f010 Michael Hanselmann
#
16 a0c9f010 Michael Hanselmann
# You should have received a copy of the GNU General Public License
17 a0c9f010 Michael Hanselmann
# along with this program; if not, write to the Free Software
18 a0c9f010 Michael Hanselmann
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
19 a0c9f010 Michael Hanselmann
# 02110-1301, USA.
20 a0c9f010 Michael Hanselmann
21 a0c9f010 Michael Hanselmann
22 a0c9f010 Michael Hanselmann
"""Functions to bootstrap a new cluster.
23 a0c9f010 Michael Hanselmann

24 a0c9f010 Michael Hanselmann
"""
25 a0c9f010 Michael Hanselmann
26 a0c9f010 Michael Hanselmann
import os
27 a0c9f010 Michael Hanselmann
import os.path
28 a0c9f010 Michael Hanselmann
import re
29 b1b6ea87 Iustin Pop
import logging
30 d693c864 Iustin Pop
import time
31 a698cdbb Michael Hanselmann
import tempfile
32 a0c9f010 Michael Hanselmann
33 a0c9f010 Michael Hanselmann
from ganeti import rpc
34 a0c9f010 Michael Hanselmann
from ganeti import ssh
35 a0c9f010 Michael Hanselmann
from ganeti import utils
36 a0c9f010 Michael Hanselmann
from ganeti import errors
37 a0c9f010 Michael Hanselmann
from ganeti import config
38 a0c9f010 Michael Hanselmann
from ganeti import constants
39 b9eeeb02 Michael Hanselmann
from ganeti import objects
40 a0c9f010 Michael Hanselmann
from ganeti import ssconf
41 a33848a5 Guido Trotter
from ganeti import serializer
42 a5728081 Guido Trotter
from ganeti import hypervisor
43 a721e23a Luca Bigliardi
from ganeti import bdev
44 a744b676 Manuel Franceschini
from ganeti import netutils
45 3b6b6129 Michael Hanselmann
from ganeti import luxi
46 ff699aa9 Michael Hanselmann
from ganeti import jstore
47 7ede9c6a Michael Hanselmann
from ganeti import pathutils
48 3b6b6129 Michael Hanselmann
49 a0c9f010 Michael Hanselmann
50 88b92fe3 Guido Trotter
# ec_id for InitConfig's temporary reservation manager
51 88b92fe3 Guido Trotter
_INITCONF_ECID = "initconfig-ecid"
52 88b92fe3 Guido Trotter
53 3b6b6129 Michael Hanselmann
#: Number of seconds within which a daemon must become responsive
54 3b6b6129 Michael Hanselmann
_DAEMON_READY_TIMEOUT = 10.0
55 3b6b6129 Michael Hanselmann
56 e38220e4 Michael Hanselmann
57 531baf8e Iustin Pop
def _InitSSHSetup():
  """Create a fresh SSH keypair for the cluster's SSH login user.

  Any existing private or public key file is backed up and removed, a new
  DSA keypair with an empty passphrase is generated using C{ssh-keygen},
  and the new public key is added to the user's authorized keys file.

  @raise errors.OpExecError: if C{ssh-keygen} fails

  """
  (private_path, public_path, authorized_path) = \
    ssh.GetUserFiles(constants.SSH_LOGIN_USER)

  # Keep a backup of each old key file before getting rid of it; the
  # removal is attempted even if the file was not there
  for key_path in (private_path, public_path):
    if os.path.exists(key_path):
      utils.CreateBackup(key_path)
    utils.RemoveFile(key_path)

  keygen_cmd = ["ssh-keygen", "-t", "dsa", "-f", private_path, "-q", "-N", ""]
  keygen = utils.RunCmd(keygen_cmd)
  if keygen.failed:
    raise errors.OpExecError("Could not generate ssh keypair, error %s" %
                             keygen.output)

  new_pubkey = utils.ReadFile(public_path)
  utils.AddAuthorizedKey(authorized_path, new_pubkey)
79 a0c9f010 Michael Hanselmann
80 a0c9f010 Michael Hanselmann
81 c008906b Michael Hanselmann
def GenerateHmacKey(file_name):
82 c008906b Michael Hanselmann
  """Writes a new HMAC key.
83 c008906b Michael Hanselmann

84 c008906b Michael Hanselmann
  @type file_name: str
85 c008906b Michael Hanselmann
  @param file_name: Path to output file
86 c008906b Michael Hanselmann

87 c008906b Michael Hanselmann
  """
88 43575108 Michael Hanselmann
  utils.WriteFile(file_name, data="%s\n" % utils.GenerateSecret(), mode=0400,
89 43575108 Michael Hanselmann
                  backup=True)
90 43575108 Michael Hanselmann
91 43575108 Michael Hanselmann
92 b6267745 Andrea Spadaccini
def GenerateClusterCrypto(new_cluster_cert, new_rapi_cert, new_spice_cert,
93 b6267745 Andrea Spadaccini
                          new_confd_hmac_key, new_cds,
94 b6267745 Andrea Spadaccini
                          rapi_cert_pem=None, spice_cert_pem=None,
95 b6267745 Andrea Spadaccini
                          spice_cacert_pem=None, cds=None,
96 7ede9c6a Michael Hanselmann
                          nodecert_file=pathutils.NODED_CERT_FILE,
97 7ede9c6a Michael Hanselmann
                          rapicert_file=pathutils.RAPI_CERT_FILE,
98 7ede9c6a Michael Hanselmann
                          spicecert_file=pathutils.SPICE_CERT_FILE,
99 7ede9c6a Michael Hanselmann
                          spicecacert_file=pathutils.SPICE_CACERT_FILE,
100 7ede9c6a Michael Hanselmann
                          hmackey_file=pathutils.CONFD_HMAC_KEY,
101 7ede9c6a Michael Hanselmann
                          cds_file=pathutils.CLUSTER_DOMAIN_SECRET_FILE):
102 43575108 Michael Hanselmann
  """Updates the cluster certificates, keys and secrets.
103 43575108 Michael Hanselmann

104 43575108 Michael Hanselmann
  @type new_cluster_cert: bool
105 43575108 Michael Hanselmann
  @param new_cluster_cert: Whether to generate a new cluster certificate
106 43575108 Michael Hanselmann
  @type new_rapi_cert: bool
107 43575108 Michael Hanselmann
  @param new_rapi_cert: Whether to generate a new RAPI certificate
108 b6267745 Andrea Spadaccini
  @type new_spice_cert: bool
109 b6267745 Andrea Spadaccini
  @param new_spice_cert: Whether to generate a new SPICE certificate
110 6b7d5878 Michael Hanselmann
  @type new_confd_hmac_key: bool
111 6b7d5878 Michael Hanselmann
  @param new_confd_hmac_key: Whether to generate a new HMAC key
112 3db3eb2a Michael Hanselmann
  @type new_cds: bool
113 3db3eb2a Michael Hanselmann
  @param new_cds: Whether to generate a new cluster domain secret
114 43575108 Michael Hanselmann
  @type rapi_cert_pem: string
115 43575108 Michael Hanselmann
  @param rapi_cert_pem: New RAPI certificate in PEM format
116 b6267745 Andrea Spadaccini
  @type spice_cert_pem: string
117 b6267745 Andrea Spadaccini
  @param spice_cert_pem: New SPICE certificate in PEM format
118 b6267745 Andrea Spadaccini
  @type spice_cacert_pem: string
119 b6267745 Andrea Spadaccini
  @param spice_cacert_pem: Certificate of the CA that signed the SPICE
120 b6267745 Andrea Spadaccini
                           certificate, in PEM format
121 3db3eb2a Michael Hanselmann
  @type cds: string
122 3db3eb2a Michael Hanselmann
  @param cds: New cluster domain secret
123 aeefe835 Iustin Pop
  @type nodecert_file: string
124 aeefe835 Iustin Pop
  @param nodecert_file: optional override of the node cert file path
125 aeefe835 Iustin Pop
  @type rapicert_file: string
126 aeefe835 Iustin Pop
  @param rapicert_file: optional override of the rapi cert file path
127 b6267745 Andrea Spadaccini
  @type spicecert_file: string
128 b6267745 Andrea Spadaccini
  @param spicecert_file: optional override of the spice cert file path
129 b6267745 Andrea Spadaccini
  @type spicecacert_file: string
130 b6267745 Andrea Spadaccini
  @param spicecacert_file: optional override of the spice CA cert file path
131 aeefe835 Iustin Pop
  @type hmackey_file: string
132 aeefe835 Iustin Pop
  @param hmackey_file: optional override of the hmac key file path
133 43575108 Michael Hanselmann

134 43575108 Michael Hanselmann
  """
135 168c1de2 Michael Hanselmann
  # noded SSL certificate
136 aeefe835 Iustin Pop
  cluster_cert_exists = os.path.exists(nodecert_file)
137 43575108 Michael Hanselmann
  if new_cluster_cert or not cluster_cert_exists:
138 43575108 Michael Hanselmann
    if cluster_cert_exists:
139 aeefe835 Iustin Pop
      utils.CreateBackup(nodecert_file)
140 43575108 Michael Hanselmann
141 aeefe835 Iustin Pop
    logging.debug("Generating new cluster certificate at %s", nodecert_file)
142 af2ae1c0 Iustin Pop
    utils.GenerateSelfSignedSslCert(nodecert_file)
143 43575108 Michael Hanselmann
144 6b7d5878 Michael Hanselmann
  # confd HMAC key
145 aeefe835 Iustin Pop
  if new_confd_hmac_key or not os.path.exists(hmackey_file):
146 aeefe835 Iustin Pop
    logging.debug("Writing new confd HMAC key to %s", hmackey_file)
147 aeefe835 Iustin Pop
    GenerateHmacKey(hmackey_file)
148 43575108 Michael Hanselmann
149 43575108 Michael Hanselmann
  # RAPI
150 aeefe835 Iustin Pop
  rapi_cert_exists = os.path.exists(rapicert_file)
151 43575108 Michael Hanselmann
152 43575108 Michael Hanselmann
  if rapi_cert_pem:
153 43575108 Michael Hanselmann
    # Assume rapi_pem contains a valid PEM-formatted certificate and key
154 aeefe835 Iustin Pop
    logging.debug("Writing RAPI certificate at %s", rapicert_file)
155 aeefe835 Iustin Pop
    utils.WriteFile(rapicert_file, data=rapi_cert_pem, backup=True)
156 43575108 Michael Hanselmann
157 43575108 Michael Hanselmann
  elif new_rapi_cert or not rapi_cert_exists:
158 43575108 Michael Hanselmann
    if rapi_cert_exists:
159 aeefe835 Iustin Pop
      utils.CreateBackup(rapicert_file)
160 43575108 Michael Hanselmann
161 aeefe835 Iustin Pop
    logging.debug("Generating new RAPI certificate at %s", rapicert_file)
162 af2ae1c0 Iustin Pop
    utils.GenerateSelfSignedSslCert(rapicert_file)
163 c008906b Michael Hanselmann
164 b6267745 Andrea Spadaccini
  # SPICE
165 b6267745 Andrea Spadaccini
  spice_cert_exists = os.path.exists(spicecert_file)
166 b6267745 Andrea Spadaccini
  spice_cacert_exists = os.path.exists(spicecacert_file)
167 b6267745 Andrea Spadaccini
  if spice_cert_pem:
168 b6267745 Andrea Spadaccini
    # spice_cert_pem implies also spice_cacert_pem
169 b6267745 Andrea Spadaccini
    logging.debug("Writing SPICE certificate at %s", spicecert_file)
170 b6267745 Andrea Spadaccini
    utils.WriteFile(spicecert_file, data=spice_cert_pem, backup=True)
171 b6267745 Andrea Spadaccini
    logging.debug("Writing SPICE CA certificate at %s", spicecacert_file)
172 b6267745 Andrea Spadaccini
    utils.WriteFile(spicecacert_file, data=spice_cacert_pem, backup=True)
173 b6267745 Andrea Spadaccini
  elif new_spice_cert or not spice_cert_exists:
174 b6267745 Andrea Spadaccini
    if spice_cert_exists:
175 b6267745 Andrea Spadaccini
      utils.CreateBackup(spicecert_file)
176 b6267745 Andrea Spadaccini
    if spice_cacert_exists:
177 b6267745 Andrea Spadaccini
      utils.CreateBackup(spicecacert_file)
178 b6267745 Andrea Spadaccini
179 b6267745 Andrea Spadaccini
    logging.debug("Generating new self-signed SPICE certificate at %s",
180 b6267745 Andrea Spadaccini
                  spicecert_file)
181 b6267745 Andrea Spadaccini
    (_, cert_pem) = utils.GenerateSelfSignedSslCert(spicecert_file)
182 b6267745 Andrea Spadaccini
183 b6267745 Andrea Spadaccini
    # Self-signed certificate -> the public certificate is also the CA public
184 b6267745 Andrea Spadaccini
    # certificate
185 b6267745 Andrea Spadaccini
    logging.debug("Writing the public certificate to %s",
186 b6267745 Andrea Spadaccini
                  spicecert_file)
187 b6267745 Andrea Spadaccini
    utils.io.WriteFile(spicecacert_file, mode=0400, data=cert_pem)
188 b6267745 Andrea Spadaccini
189 3db3eb2a Michael Hanselmann
  # Cluster domain secret
190 3db3eb2a Michael Hanselmann
  if cds:
191 fc0726b9 Michael Hanselmann
    logging.debug("Writing cluster domain secret to %s", cds_file)
192 fc0726b9 Michael Hanselmann
    utils.WriteFile(cds_file, data=cds, backup=True)
193 fc0726b9 Michael Hanselmann
194 fc0726b9 Michael Hanselmann
  elif new_cds or not os.path.exists(cds_file):
195 fc0726b9 Michael Hanselmann
    logging.debug("Generating new cluster domain secret at %s", cds_file)
196 fc0726b9 Michael Hanselmann
    GenerateHmacKey(cds_file)
197 3db3eb2a Michael Hanselmann
198 c008906b Michael Hanselmann
199 8f215968 Michael Hanselmann
def _InitGanetiServerSetup(master_name):
  """Prepare and start the initial node daemon.

  Generates the cluster secrets via L{GenerateClusterCrypto}, starts the
  node daemon through the daemon utility and then waits until the daemon
  on C{master_name} answers.

  @type master_name: str
  @param master_name: Name of the master node
  @raise errors.OpExecError: if the node daemon could not be started

  """
  # Force a new cluster certificate; none of the other secrets is forced
  GenerateClusterCrypto(True, False, False, False, False)

  start_cmd = [pathutils.DAEMON_UTIL, "start", constants.NODED]
  start = utils.RunCmd(start_cmd)
  if start.failed:
    raise errors.OpExecError("Could not start the node daemon, command %s"
                             " had exitcode %s and error %s" %
                             (start.cmd, start.exit_code, start.output))

  _WaitForNodeDaemon(master_name)
219 5627f375 Michael Hanselmann
220 5627f375 Michael Hanselmann
221 5627f375 Michael Hanselmann
def _WaitForNodeDaemon(node_name):
  """Block until the node daemon on a node answers a version call.

  @param node_name: name of the node whose daemon is queried
  @raise errors.OpExecError: if no successful answer was received before
      the retry loop timed out (L{_DAEMON_READY_TIMEOUT})

  """
  def _QueryVersion():
    # Pylint bug <http://www.logilab.org/ticket/35642>
    # pylint: disable=E1101
    answers = rpc.BootstrapRunner().call_version([node_name])
    if answers[node_name].fail_msg:
      # Not usable yet, ask the retry loop for another attempt
      raise utils.RetryAgain()

  try:
    utils.Retry(_QueryVersion, 1.0, _DAEMON_READY_TIMEOUT)
  except utils.RetryTimeout:
    raise errors.OpExecError("Node daemon on %s didn't answer queries within"
                             " %s seconds" % (node_name, _DAEMON_READY_TIMEOUT))
237 3b6b6129 Michael Hanselmann
238 3b6b6129 Michael Hanselmann
239 3b6b6129 Michael Hanselmann
def _WaitForMasterDaemon():
  """Block until the master daemon answers a config query.

  @raise errors.OpExecError: if the cluster name could not be queried
      before the retry loop timed out (L{_DAEMON_READY_TIMEOUT})

  """
  def _QueryClusterName():
    try:
      client = luxi.Client()
      (name, ) = client.QueryConfigValues(["cluster_name"])
    except Exception:
      # Any failure is treated as "not ready yet"
      raise utils.RetryAgain()
    else:
      logging.debug("Received cluster name %s from master", name)

  try:
    utils.Retry(_QueryClusterName, 1.0, _DAEMON_READY_TIMEOUT)
  except utils.RetryTimeout:
    raise errors.OpExecError("Master daemon didn't answer queries within"
                             " %s seconds" % _DAEMON_READY_TIMEOUT)
257 5627f375 Michael Hanselmann
258 a0c9f010 Michael Hanselmann
259 a5da38fa Michael Hanselmann
def _WaitForSshDaemon(hostname, port, family):
  """Block until the SSH daemon on a host accepts TCP connections.

  The host name is resolved once, up front; the resulting IP address is
  the one being pinged.

  @param hostname: name of the host to check
  @param port: TCP port to ping
  @param family: address family passed to L{netutils.GetHostname}
  @raise errors.OpExecError: if the port did not become reachable before
      the retry loop timed out (L{_DAEMON_READY_TIMEOUT})

  """
  resolved = netutils.GetHostname(name=hostname, family=family)
  hostip = resolved.ip

  def _PingSshPort():
    reachable = netutils.TcpPing(hostip, port, timeout=1.0,
                                 live_port_needed=True)
    if not reachable:
      raise utils.RetryAgain()

    logging.debug("SSH daemon on %s:%s (IP address %s) has become"
                  " responsive", hostname, port, hostip)

  try:
    utils.Retry(_PingSshPort, 1.0, _DAEMON_READY_TIMEOUT)
  except utils.RetryTimeout:
    raise errors.OpExecError("SSH daemon on %s:%s (IP address %s) didn't"
                             " become responsive within %s seconds" %
                             (hostname, port, hostip, _DAEMON_READY_TIMEOUT))
278 a5da38fa Michael Hanselmann
279 a5da38fa Michael Hanselmann
280 a698cdbb Michael Hanselmann
def RunNodeSetupCmd(cluster_name, node, basecmd, debug, verbose,
                    use_cluster_key, ask_key, strict_host_check, data):
  """Runs a setup command on a remote machine through SSH.

  The command is run interactively with the JSON-serialized C{data} on its
  standard input. After it succeeded, this function waits for the SSH
  daemon on the node to respond.

  @type cluster_name: string
  @param cluster_name: Cluster name
  @type node: string
  @param node: Node name
  @type basecmd: string
  @param basecmd: Base command (path on the remote machine)
  @type debug: bool
  @param debug: Enable debug output
  @type verbose: bool
  @param verbose: Enable verbose output
  @type use_cluster_key: bool
  @param use_cluster_key: See L{ssh.SshRunner.BuildCmd}
  @type ask_key: bool
  @param ask_key: See L{ssh.SshRunner.BuildCmd}
  @type strict_host_check: bool
  @param strict_host_check: See L{ssh.SshRunner.BuildCmd}
  @param data: JSON-serializable input data for script (passed to stdin)
  @raise errors.OpExecError: if the command failed

  """
  remote_cmd = [basecmd]

  # Hand our own --debug/--verbose settings down to the external script
  for (enabled, flag) in [(debug, "--debug"), (verbose, "--verbose")]:
    if enabled:
      remote_cmd.append(flag)

  family = ssconf.SimpleStore().GetPrimaryIPFamily()
  use_ipv6 = (family == netutils.IP6Address.family)
  runner = ssh.SshRunner(cluster_name, ipv6=use_ipv6)
  ssh_cmd = runner.BuildCmd(node, constants.SSH_LOGIN_USER,
                            utils.ShellQuoteArgs(remote_cmd),
                            batch=False, ask_key=ask_key, quiet=False,
                            strict_host_check=strict_host_check,
                            use_cluster_key=use_cluster_key)

  # The serialized data is put into a temporary file which is rewound and
  # then used as the command's input
  stdin_file = tempfile.TemporaryFile()
  try:
    stdin_file.write(serializer.DumpJson(data))
    stdin_file.seek(0)

    result = utils.RunCmd(ssh_cmd, interactive=True, input_fd=stdin_file)
  finally:
    stdin_file.close()

  if result.failed:
    raise errors.OpExecError("Command '%s' failed: %s" %
                             (result.cmd, result.fail_reason))

  ssh_port = netutils.GetDaemonPort(constants.SSH)
  _WaitForSshDaemon(node, ssh_port, family)
335 a5da38fa Michael Hanselmann
336 a698cdbb Michael Hanselmann
337 0e3baaf3 Iustin Pop
def _InitFileStorage(file_storage_dir):
338 0e3baaf3 Iustin Pop
  """Initialize if needed the file storage.
339 0e3baaf3 Iustin Pop

340 0e3baaf3 Iustin Pop
  @param file_storage_dir: the user-supplied value
341 0e3baaf3 Iustin Pop
  @return: either empty string (if file storage was disabled at build
342 0e3baaf3 Iustin Pop
      time) or the normalized path to the storage directory
343 0e3baaf3 Iustin Pop

344 0e3baaf3 Iustin Pop
  """
345 0e3baaf3 Iustin Pop
  file_storage_dir = os.path.normpath(file_storage_dir)
346 0e3baaf3 Iustin Pop
347 0e3baaf3 Iustin Pop
  if not os.path.isabs(file_storage_dir):
348 0376655e Guido Trotter
    raise errors.OpPrereqError("File storage directory '%s' is not an absolute"
349 0376655e Guido Trotter
                               " path" % file_storage_dir, errors.ECODE_INVAL)
350 0e3baaf3 Iustin Pop
351 0e3baaf3 Iustin Pop
  if not os.path.exists(file_storage_dir):
352 0e3baaf3 Iustin Pop
    try:
353 0e3baaf3 Iustin Pop
      os.makedirs(file_storage_dir, 0750)
354 0e3baaf3 Iustin Pop
    except OSError, err:
355 0e3baaf3 Iustin Pop
      raise errors.OpPrereqError("Cannot create file storage directory"
356 0e3baaf3 Iustin Pop
                                 " '%s': %s" % (file_storage_dir, err),
357 0e3baaf3 Iustin Pop
                                 errors.ECODE_ENVIRON)
358 0e3baaf3 Iustin Pop
359 0e3baaf3 Iustin Pop
  if not os.path.isdir(file_storage_dir):
360 0e3baaf3 Iustin Pop
    raise errors.OpPrereqError("The file storage directory '%s' is not"
361 0e3baaf3 Iustin Pop
                               " a directory." % file_storage_dir,
362 0e3baaf3 Iustin Pop
                               errors.ECODE_ENVIRON)
363 0e3baaf3 Iustin Pop
  return file_storage_dir
364 0e3baaf3 Iustin Pop
365 0e3baaf3 Iustin Pop
366 18bb6d28 Agata Murawska
def InitCluster(cluster_name, mac_prefix, # pylint: disable=R0913, R0914
367 5a8648eb Andrea Spadaccini
                master_netmask, master_netdev, file_storage_dir,
368 5a8648eb Andrea Spadaccini
                shared_file_storage_dir, candidate_pool_size, secondary_ip=None,
369 5a8648eb Andrea Spadaccini
                vg_name=None, beparams=None, nicparams=None, ndparams=None,
370 bc5d0215 Andrea Spadaccini
                hvparams=None, diskparams=None, enabled_hypervisors=None,
371 bc5d0215 Andrea Spadaccini
                modify_etc_hosts=True, modify_ssh_setup=True,
372 bc5d0215 Andrea Spadaccini
                maintain_node_health=False, drbd_helper=None, uid_pool=None,
373 18bb6d28 Agata Murawska
                default_iallocator=None, primary_ip_version=None, ipolicy=None,
374 c4929a8b René Nussbaumer
                prealloc_wipe_disks=False, use_external_mip_script=False,
375 3bde79ee Helga Velroyen
                hv_state=None, disk_state=None, enabled_disk_templates=None):
376 a0c9f010 Michael Hanselmann
  """Initialise the cluster.
377 a0c9f010 Michael Hanselmann

378 ce735215 Guido Trotter
  @type candidate_pool_size: int
379 ce735215 Guido Trotter
  @param candidate_pool_size: master candidate pool size
380 3bde79ee Helga Velroyen
  @type enabled_disk_templates: list of string
381 3bde79ee Helga Velroyen
  @param enabled_disk_templates: list of disk_templates to be used in this
382 c074a9e8 Helga Velroyen
    cluster
383 ce735215 Guido Trotter

384 a0c9f010 Michael Hanselmann
  """
385 ce735215 Guido Trotter
  # TODO: complete the docstring
386 a0c9f010 Michael Hanselmann
  if config.ConfigWriter.IsCluster():
387 debac808 Iustin Pop
    raise errors.OpPrereqError("Cluster is already initialised",
388 debac808 Iustin Pop
                               errors.ECODE_STATE)
389 a0c9f010 Michael Hanselmann
390 b119bccb Guido Trotter
  if not enabled_hypervisors:
391 b119bccb Guido Trotter
    raise errors.OpPrereqError("Enabled hypervisors list must contain at"
392 debac808 Iustin Pop
                               " least one member", errors.ECODE_INVAL)
393 b119bccb Guido Trotter
  invalid_hvs = set(enabled_hypervisors) - constants.HYPER_TYPES
394 b119bccb Guido Trotter
  if invalid_hvs:
395 b119bccb Guido Trotter
    raise errors.OpPrereqError("Enabled hypervisors contains invalid"
396 debac808 Iustin Pop
                               " entries: %s" % invalid_hvs,
397 debac808 Iustin Pop
                               errors.ECODE_INVAL)
398 b119bccb Guido Trotter
399 3bde79ee Helga Velroyen
  if not enabled_disk_templates:
400 3bde79ee Helga Velroyen
    raise errors.OpPrereqError("Enabled disk templates list must contain at"
401 c074a9e8 Helga Velroyen
                               " least one member", errors.ECODE_INVAL)
402 3bde79ee Helga Velroyen
  invalid_disk_templates = \
403 3bde79ee Helga Velroyen
    set(enabled_disk_templates) - constants.DISK_TEMPLATES
404 3bde79ee Helga Velroyen
  if invalid_disk_templates:
405 3bde79ee Helga Velroyen
    raise errors.OpPrereqError("Enabled disk templates list contains invalid"
406 3bde79ee Helga Velroyen
                               " entries: %s" % invalid_disk_templates,
407 c074a9e8 Helga Velroyen
                               errors.ECODE_INVAL)
408 c074a9e8 Helga Velroyen
409 5a8648eb Andrea Spadaccini
  try:
410 5a8648eb Andrea Spadaccini
    ipcls = netutils.IPAddress.GetClassFromIpVersion(primary_ip_version)
411 5a8648eb Andrea Spadaccini
  except errors.ProgrammerError:
412 2f20d07b Manuel Franceschini
    raise errors.OpPrereqError("Invalid primary ip version: %d." %
413 2cfbc784 Iustin Pop
                               primary_ip_version, errors.ECODE_INVAL)
414 2f20d07b Manuel Franceschini
415 2f20d07b Manuel Franceschini
  hostname = netutils.GetHostname(family=ipcls.family)
416 2f20d07b Manuel Franceschini
  if not ipcls.IsValid(hostname.ip):
417 2f20d07b Manuel Franceschini
    raise errors.OpPrereqError("This host's IP (%s) is not a valid IPv%d"
418 2cfbc784 Iustin Pop
                               " address." % (hostname.ip, primary_ip_version),
419 2cfbc784 Iustin Pop
                               errors.ECODE_INVAL)
420 2f20d07b Manuel Franceschini
421 2f20d07b Manuel Franceschini
  if ipcls.IsLoopback(hostname.ip):
422 8b312c1d Manuel Franceschini
    raise errors.OpPrereqError("This host's IP (%s) resolves to a loopback"
423 8b312c1d Manuel Franceschini
                               " address. Please fix DNS or %s." %
424 ee045466 Michael Hanselmann
                               (hostname.ip, pathutils.ETC_HOSTS),
425 debac808 Iustin Pop
                               errors.ECODE_ENVIRON)
426 a0c9f010 Michael Hanselmann
427 2f20d07b Manuel Franceschini
  if not ipcls.Own(hostname.ip):
428 a0c9f010 Michael Hanselmann
    raise errors.OpPrereqError("Inconsistency: this host's name resolves"
429 a0c9f010 Michael Hanselmann
                               " to %s,\nbut this ip address does not"
430 7c4c22f5 Manuel Franceschini
                               " belong to this host" %
431 debac808 Iustin Pop
                               hostname.ip, errors.ECODE_ENVIRON)
432 a0c9f010 Michael Hanselmann
433 2f20d07b Manuel Franceschini
  clustername = netutils.GetHostname(name=cluster_name, family=ipcls.family)
434 a0c9f010 Michael Hanselmann
435 2f20d07b Manuel Franceschini
  if netutils.TcpPing(clustername.ip, constants.DEFAULT_NODED_PORT, timeout=5):
436 7c4c22f5 Manuel Franceschini
    raise errors.OpPrereqError("Cluster IP already active",
437 debac808 Iustin Pop
                               errors.ECODE_NOTUNIQUE)
438 a0c9f010 Michael Hanselmann
439 2f20d07b Manuel Franceschini
  if not secondary_ip:
440 2f20d07b Manuel Franceschini
    if primary_ip_version == constants.IP6_VERSION:
441 2f20d07b Manuel Franceschini
      raise errors.OpPrereqError("When using a IPv6 primary address, a valid"
442 7c4c22f5 Manuel Franceschini
                                 " IPv4 address must be given as secondary",
443 7c4c22f5 Manuel Franceschini
                                 errors.ECODE_INVAL)
444 b9eeeb02 Michael Hanselmann
    secondary_ip = hostname.ip
445 a0c9f010 Michael Hanselmann
446 2f20d07b Manuel Franceschini
  if not netutils.IP4Address.IsValid(secondary_ip):
447 2f20d07b Manuel Franceschini
    raise errors.OpPrereqError("Secondary IP address (%s) has to be a valid"
448 2f20d07b Manuel Franceschini
                               " IPv4 address." % secondary_ip,
449 2f20d07b Manuel Franceschini
                               errors.ECODE_INVAL)
450 2f20d07b Manuel Franceschini
451 2f20d07b Manuel Franceschini
  if not netutils.IP4Address.Own(secondary_ip):
452 2f20d07b Manuel Franceschini
    raise errors.OpPrereqError("You gave %s as secondary IP,"
453 2f20d07b Manuel Franceschini
                               " but it does not belong to this host." %
454 2f20d07b Manuel Franceschini
                               secondary_ip, errors.ECODE_ENVIRON)
455 2f20d07b Manuel Franceschini
456 5a8648eb Andrea Spadaccini
  if master_netmask is not None:
457 5a8648eb Andrea Spadaccini
    if not ipcls.ValidateNetmask(master_netmask):
458 5a8648eb Andrea Spadaccini
      raise errors.OpPrereqError("CIDR netmask (%s) not valid for IPv%s " %
459 2cfbc784 Iustin Pop
                                  (master_netmask, primary_ip_version),
460 2cfbc784 Iustin Pop
                                 errors.ECODE_INVAL)
461 5a8648eb Andrea Spadaccini
  else:
462 5a8648eb Andrea Spadaccini
    master_netmask = ipcls.iplen
463 5a8648eb Andrea Spadaccini
464 a0c9f010 Michael Hanselmann
  if vg_name is not None:
465 a0c9f010 Michael Hanselmann
    # Check if volume group is valid
466 a0c9f010 Michael Hanselmann
    vgstatus = utils.CheckVolumeGroupSize(utils.ListVolumeGroups(), vg_name,
467 a0c9f010 Michael Hanselmann
                                          constants.MIN_VG_SIZE)
468 a0c9f010 Michael Hanselmann
    if vgstatus:
469 a0c9f010 Michael Hanselmann
      raise errors.OpPrereqError("Error: %s\nspecify --no-lvm-storage if"
470 debac808 Iustin Pop
                                 " you are not using lvm" % vgstatus,
471 debac808 Iustin Pop
                                 errors.ECODE_INVAL)
472 a0c9f010 Michael Hanselmann
473 a721e23a Luca Bigliardi
  if drbd_helper is not None:
474 a721e23a Luca Bigliardi
    try:
475 a721e23a Luca Bigliardi
      curr_helper = bdev.BaseDRBD.GetUsermodeHelper()
476 a721e23a Luca Bigliardi
    except errors.BlockDeviceError, err:
477 a721e23a Luca Bigliardi
      raise errors.OpPrereqError("Error while checking drbd helper"
478 a721e23a Luca Bigliardi
                                 " (specify --no-drbd-storage if you are not"
479 a721e23a Luca Bigliardi
                                 " using drbd): %s" % str(err),
480 a721e23a Luca Bigliardi
                                 errors.ECODE_ENVIRON)
481 a721e23a Luca Bigliardi
    if drbd_helper != curr_helper:
482 a721e23a Luca Bigliardi
      raise errors.OpPrereqError("Error: requiring %s as drbd helper but %s"
483 a721e23a Luca Bigliardi
                                 " is the current helper" % (drbd_helper,
484 a721e23a Luca Bigliardi
                                                             curr_helper),
485 a721e23a Luca Bigliardi
                                 errors.ECODE_INVAL)
486 a721e23a Luca Bigliardi
487 32ba31be Michael Hanselmann
  logging.debug("Stopping daemons (if any are running)")
488 32ba31be Michael Hanselmann
  result = utils.RunCmd([pathutils.DAEMON_UTIL, "stop-all"])
489 32ba31be Michael Hanselmann
  if result.failed:
490 32ba31be Michael Hanselmann
    raise errors.OpExecError("Could not stop daemons, command %s"
491 32ba31be Michael Hanselmann
                             " had exitcode %s and error '%s'" %
492 32ba31be Michael Hanselmann
                             (result.cmd, result.exit_code, result.output))
493 32ba31be Michael Hanselmann
494 0376655e Guido Trotter
  if constants.ENABLE_FILE_STORAGE:
495 0376655e Guido Trotter
    file_storage_dir = _InitFileStorage(file_storage_dir)
496 0376655e Guido Trotter
  else:
497 0376655e Guido Trotter
    file_storage_dir = ""
498 0376655e Guido Trotter
499 0376655e Guido Trotter
  if constants.ENABLE_SHARED_FILE_STORAGE:
500 0376655e Guido Trotter
    shared_file_storage_dir = _InitFileStorage(shared_file_storage_dir)
501 0376655e Guido Trotter
  else:
502 0376655e Guido Trotter
    shared_file_storage_dir = ""
503 a0c9f010 Michael Hanselmann
504 a0c9f010 Michael Hanselmann
  if not re.match("^[0-9a-z]{2}:[0-9a-z]{2}:[0-9a-z]{2}$", mac_prefix):
505 debac808 Iustin Pop
    raise errors.OpPrereqError("Invalid mac prefix given '%s'" % mac_prefix,
506 debac808 Iustin Pop
                               errors.ECODE_INVAL)
507 a0c9f010 Michael Hanselmann
508 a0c9f010 Michael Hanselmann
  result = utils.RunCmd(["ip", "link", "show", "dev", master_netdev])
509 a0c9f010 Michael Hanselmann
  if result.failed:
510 a0c9f010 Michael Hanselmann
    raise errors.OpPrereqError("Invalid master netdev given (%s): '%s'" %
511 a0c9f010 Michael Hanselmann
                               (master_netdev,
512 debac808 Iustin Pop
                                result.output.strip()), errors.ECODE_INVAL)
513 a0c9f010 Michael Hanselmann
514 7ede9c6a Michael Hanselmann
  dirs = [(pathutils.RUN_DIR, constants.RUN_DIRS_MODE)]
515 9dae41ad Guido Trotter
  utils.EnsureDirs(dirs)
516 9dae41ad Guido Trotter
517 b2e233a5 Guido Trotter
  objects.UpgradeBeParams(beparams)
518 a5728081 Guido Trotter
  utils.ForceDictType(beparams, constants.BES_PARAMETER_TYPES)
519 b6a30b0d Guido Trotter
  utils.ForceDictType(nicparams, constants.NICS_PARAMETER_TYPES)
520 18bb6d28 Agata Murawska
521 b6a30b0d Guido Trotter
  objects.NIC.CheckParameterSyntax(nicparams)
522 57dc299a Iustin Pop
523 2cc673a3 Iustin Pop
  full_ipolicy = objects.FillIPolicy(constants.IPOLICY_DEFAULTS, ipolicy)
524 b6a30b0d Guido Trotter
525 6204ee71 Renรฉ Nussbaumer
  if ndparams is not None:
526 6204ee71 Renรฉ Nussbaumer
    utils.ForceDictType(ndparams, constants.NDS_PARAMETER_TYPES)
527 6204ee71 Renรฉ Nussbaumer
  else:
528 6204ee71 Renรฉ Nussbaumer
    ndparams = dict(constants.NDC_DEFAULTS)
529 6204ee71 Renรฉ Nussbaumer
530 c4929a8b Renรฉ Nussbaumer
  # This is ugly, as we modify the dict itself
531 57dc299a Iustin Pop
  # FIXME: Make utils.ForceDictType pure functional or write a wrapper
532 57dc299a Iustin Pop
  # around it
533 c4929a8b Renรฉ Nussbaumer
  if hv_state:
534 c4929a8b Renรฉ Nussbaumer
    for hvname, hvs_data in hv_state.items():
535 c4929a8b Renรฉ Nussbaumer
      utils.ForceDictType(hvs_data, constants.HVSTS_PARAMETER_TYPES)
536 c4929a8b Renรฉ Nussbaumer
      hv_state[hvname] = objects.Cluster.SimpleFillHvState(hvs_data)
537 c4929a8b Renรฉ Nussbaumer
  else:
538 c4929a8b Renรฉ Nussbaumer
    hv_state = dict((hvname, constants.HVST_DEFAULTS)
539 c4929a8b Renรฉ Nussbaumer
                    for hvname in enabled_hypervisors)
540 c4929a8b Renรฉ Nussbaumer
541 c4929a8b Renรฉ Nussbaumer
  # FIXME: disk_state has no default values yet
542 c4929a8b Renรฉ Nussbaumer
  if disk_state:
543 c4929a8b Renรฉ Nussbaumer
    for storage, ds_data in disk_state.items():
544 c4929a8b Renรฉ Nussbaumer
      if storage not in constants.DS_VALID_TYPES:
545 c4929a8b Renรฉ Nussbaumer
        raise errors.OpPrereqError("Invalid storage type in disk state: %s" %
546 c4929a8b Renรฉ Nussbaumer
                                   storage, errors.ECODE_INVAL)
547 c4929a8b Renรฉ Nussbaumer
      for ds_name, state in ds_data.items():
548 c4929a8b Renรฉ Nussbaumer
        utils.ForceDictType(state, constants.DSS_PARAMETER_TYPES)
549 c4929a8b Renรฉ Nussbaumer
        ds_data[ds_name] = objects.Cluster.SimpleFillDiskState(state)
550 c4929a8b Renรฉ Nussbaumer
551 a5728081 Guido Trotter
  # hvparams is a mapping of hypervisor->hvparams dict
552 a5728081 Guido Trotter
  for hv_name, hv_params in hvparams.iteritems():
553 a5728081 Guido Trotter
    utils.ForceDictType(hv_params, constants.HVS_PARAMETER_TYPES)
554 a5728081 Guido Trotter
    hv_class = hypervisor.GetHypervisor(hv_name)
555 a5728081 Guido Trotter
    hv_class.CheckParameterSyntax(hv_params)
556 d4b72030 Guido Trotter
557 bc5d0215 Andrea Spadaccini
  # diskparams is a mapping of disk-template->diskparams dict
558 bc5d0215 Andrea Spadaccini
  for template, dt_params in diskparams.items():
559 bc5d0215 Andrea Spadaccini
    param_keys = set(dt_params.keys())
560 bc5d0215 Andrea Spadaccini
    default_param_keys = set(constants.DISK_DT_DEFAULTS[template].keys())
561 bc5d0215 Andrea Spadaccini
    if not (param_keys <= default_param_keys):
562 bc5d0215 Andrea Spadaccini
      unknown_params = param_keys - default_param_keys
563 bc5d0215 Andrea Spadaccini
      raise errors.OpPrereqError("Invalid parameters for disk template %s:"
564 bc5d0215 Andrea Spadaccini
                                 " %s" % (template,
565 2cfbc784 Iustin Pop
                                          utils.CommaJoin(unknown_params)),
566 2cfbc784 Iustin Pop
                                 errors.ECODE_INVAL)
567 bc5d0215 Andrea Spadaccini
    utils.ForceDictType(dt_params, constants.DISK_DT_TYPES)
568 e4a4391d Renรฉ Nussbaumer
  try:
569 e4a4391d Renรฉ Nussbaumer
    utils.VerifyDictOptions(diskparams, constants.DISK_DT_DEFAULTS)
570 e4a4391d Renรฉ Nussbaumer
  except errors.OpPrereqError, err:
571 e4a4391d Renรฉ Nussbaumer
    raise errors.OpPrereqError("While verify diskparam options: %s" % err,
572 e4a4391d Renรฉ Nussbaumer
                               errors.ECODE_INVAL)
573 bc5d0215 Andrea Spadaccini
574 a0c9f010 Michael Hanselmann
  # set up ssh config and /etc/hosts
575 7ede9c6a Michael Hanselmann
  sshline = utils.ReadFile(pathutils.SSH_HOST_RSA_PUB)
576 a0c9f010 Michael Hanselmann
  sshkey = sshline.split(" ")[1]
577 a0c9f010 Michael Hanselmann
578 b86a6bcd Guido Trotter
  if modify_etc_hosts:
579 ea8ac9c9 Renรฉ Nussbaumer
    utils.AddHostToEtcHosts(hostname.name, hostname.ip)
580 b86a6bcd Guido Trotter
581 b989b9d9 Ken Wehr
  if modify_ssh_setup:
582 b989b9d9 Ken Wehr
    _InitSSHSetup()
583 a0c9f010 Michael Hanselmann
584 bf4af505 Apollon Oikonomopoulos
  if default_iallocator is not None:
585 bf4af505 Apollon Oikonomopoulos
    alloc_script = utils.FindFile(default_iallocator,
586 bf4af505 Apollon Oikonomopoulos
                                  constants.IALLOCATOR_SEARCH_PATH,
587 bf4af505 Apollon Oikonomopoulos
                                  os.path.isfile)
588 bf4af505 Apollon Oikonomopoulos
    if alloc_script is None:
589 bf4af505 Apollon Oikonomopoulos
      raise errors.OpPrereqError("Invalid default iallocator script '%s'"
590 bf4af505 Apollon Oikonomopoulos
                                 " specified" % default_iallocator,
591 bf4af505 Apollon Oikonomopoulos
                                 errors.ECODE_INVAL)
592 d1e9c98d Iustin Pop
  elif constants.HTOOLS:
593 d1e9c98d Iustin Pop
    # htools was enabled at build-time, we default to it
594 d1e9c98d Iustin Pop
    if utils.FindFile(constants.IALLOC_HAIL,
595 d1e9c98d Iustin Pop
                      constants.IALLOCATOR_SEARCH_PATH,
596 d1e9c98d Iustin Pop
                      os.path.isfile):
597 d1e9c98d Iustin Pop
      default_iallocator = constants.IALLOC_HAIL
598 bf4af505 Apollon Oikonomopoulos
599 430b923c Iustin Pop
  now = time.time()
600 430b923c Iustin Pop
601 a0c9f010 Michael Hanselmann
  # init of cluster config file
602 b9eeeb02 Michael Hanselmann
  cluster_config = objects.Cluster(
603 b9eeeb02 Michael Hanselmann
    serial_no=1,
604 b9eeeb02 Michael Hanselmann
    rsahostkeypub=sshkey,
605 b9eeeb02 Michael Hanselmann
    highest_used_port=(constants.FIRST_DRBD_PORT - 1),
606 b9eeeb02 Michael Hanselmann
    mac_prefix=mac_prefix,
607 b9eeeb02 Michael Hanselmann
    volume_group_name=vg_name,
608 b9eeeb02 Michael Hanselmann
    tcpudp_port_pool=set(),
609 f6bd6e98 Michael Hanselmann
    master_node=hostname.name,
610 f6bd6e98 Michael Hanselmann
    master_ip=clustername.ip,
611 5a8648eb Andrea Spadaccini
    master_netmask=master_netmask,
612 f6bd6e98 Michael Hanselmann
    master_netdev=master_netdev,
613 f6bd6e98 Michael Hanselmann
    cluster_name=clustername.name,
614 f6bd6e98 Michael Hanselmann
    file_storage_dir=file_storage_dir,
615 4b97f902 Apollon Oikonomopoulos
    shared_file_storage_dir=shared_file_storage_dir,
616 ea3a925f Alexander Schreiber
    enabled_hypervisors=enabled_hypervisors,
617 4ef7f423 Guido Trotter
    beparams={constants.PP_DEFAULT: beparams},
618 b6a30b0d Guido Trotter
    nicparams={constants.PP_DEFAULT: nicparams},
619 6204ee71 Renรฉ Nussbaumer
    ndparams=ndparams,
620 ea3a925f Alexander Schreiber
    hvparams=hvparams,
621 bc5d0215 Andrea Spadaccini
    diskparams=diskparams,
622 ce735215 Guido Trotter
    candidate_pool_size=candidate_pool_size,
623 022c3a0b Guido Trotter
    modify_etc_hosts=modify_etc_hosts,
624 b989b9d9 Ken Wehr
    modify_ssh_setup=modify_ssh_setup,
625 39b0f0c2 Balazs Lecz
    uid_pool=uid_pool,
626 430b923c Iustin Pop
    ctime=now,
627 430b923c Iustin Pop
    mtime=now,
628 3953242f Iustin Pop
    maintain_node_health=maintain_node_health,
629 a721e23a Luca Bigliardi
    drbd_usermode_helper=drbd_helper,
630 bf4af505 Apollon Oikonomopoulos
    default_iallocator=default_iallocator,
631 2f20d07b Manuel Franceschini
    primary_ip_family=ipcls.family,
632 3d914585 Renรฉ Nussbaumer
    prealloc_wipe_disks=prealloc_wipe_disks,
633 bf689b7a Andrea Spadaccini
    use_external_mip_script=use_external_mip_script,
634 57dc299a Iustin Pop
    ipolicy=full_ipolicy,
635 c4929a8b Renรฉ Nussbaumer
    hv_state_static=hv_state,
636 c4929a8b Renรฉ Nussbaumer
    disk_state_static=disk_state,
637 3bde79ee Helga Velroyen
    enabled_disk_templates=enabled_disk_templates,
638 b9eeeb02 Michael Hanselmann
    )
639 b9eeeb02 Michael Hanselmann
  master_node_config = objects.Node(name=hostname.name,
640 b9eeeb02 Michael Hanselmann
                                    primary_ip=hostname.ip,
641 b9222f32 Guido Trotter
                                    secondary_ip=secondary_ip,
642 c044f32c Guido Trotter
                                    serial_no=1,
643 c044f32c Guido Trotter
                                    master_candidate=True,
644 af64c0ea Iustin Pop
                                    offline=False, drained=False,
645 435e4bd6 Michael Hanselmann
                                    ctime=now, mtime=now,
646 c044f32c Guido Trotter
                                    )
647 9e1333b9 Guido Trotter
  InitConfig(constants.CONFIG_VERSION, cluster_config, master_node_config)
648 d367b66c Manuel Franceschini
  cfg = config.ConfigWriter(offline=True)
649 7ede9c6a Michael Hanselmann
  ssh.WriteKnownHostsFile(cfg, pathutils.SSH_KNOWN_HOSTS_FILE)
650 a4eae71f Michael Hanselmann
  cfg.Update(cfg.GetClusterInfo(), logging.error)
651 ee501db1 Michael Hanselmann
  ssconf.WriteSsconfFiles(cfg.GetSsconfValues())
652 d367b66c Manuel Franceschini
653 d367b66c Manuel Franceschini
  # set up the inter-node password and certificate
654 d367b66c Manuel Franceschini
  _InitGanetiServerSetup(hostname.name)
655 827f753e Guido Trotter
656 952d7515 Michael Hanselmann
  logging.debug("Starting daemons")
657 7ede9c6a Michael Hanselmann
  result = utils.RunCmd([pathutils.DAEMON_UTIL, "start-all"])
658 952d7515 Michael Hanselmann
  if result.failed:
659 952d7515 Michael Hanselmann
    raise errors.OpExecError("Could not start daemons, command %s"
660 952d7515 Michael Hanselmann
                             " had exitcode %s and error %s" %
661 952d7515 Michael Hanselmann
                             (result.cmd, result.exit_code, result.output))
662 b3f1cf6f Iustin Pop
663 3b6b6129 Michael Hanselmann
  _WaitForMasterDaemon()
664 b3f1cf6f Iustin Pop
665 b1b6ea87 Iustin Pop
666 02f99608 Oleksiy Mishchenko
def InitConfig(version, cluster_config, master_node_config,
667 7ede9c6a Michael Hanselmann
               cfg_file=pathutils.CLUSTER_CONF_FILE):
668 7b3a8fb5 Iustin Pop
  """Create the initial cluster configuration.
669 7b3a8fb5 Iustin Pop

670 7b3a8fb5 Iustin Pop
  It will contain the current node, which will also be the master
671 7b3a8fb5 Iustin Pop
  node, and no instances.
672 7b3a8fb5 Iustin Pop

673 7b3a8fb5 Iustin Pop
  @type version: int
674 c41eea6e Iustin Pop
  @param version: configuration version
675 c41eea6e Iustin Pop
  @type cluster_config: L{objects.Cluster}
676 c41eea6e Iustin Pop
  @param cluster_config: cluster configuration
677 c41eea6e Iustin Pop
  @type master_node_config: L{objects.Node}
678 c41eea6e Iustin Pop
  @param master_node_config: master node configuration
679 c41eea6e Iustin Pop
  @type cfg_file: string
680 c41eea6e Iustin Pop
  @param cfg_file: configuration file path
681 c41eea6e Iustin Pop

682 7b3a8fb5 Iustin Pop
  """
683 88b92fe3 Guido Trotter
  uuid_generator = config.TemporaryReservationManager()
684 88b92fe3 Guido Trotter
  cluster_config.uuid = uuid_generator.Generate([], utils.NewUUID,
685 88b92fe3 Guido Trotter
                                                _INITCONF_ECID)
686 88b92fe3 Guido Trotter
  master_node_config.uuid = uuid_generator.Generate([], utils.NewUUID,
687 88b92fe3 Guido Trotter
                                                    _INITCONF_ECID)
688 7b3a8fb5 Iustin Pop
  nodes = {
689 7b3a8fb5 Iustin Pop
    master_node_config.name: master_node_config,
690 7b3a8fb5 Iustin Pop
    }
691 88b92fe3 Guido Trotter
  default_nodegroup = objects.NodeGroup(
692 88b92fe3 Guido Trotter
    uuid=uuid_generator.Generate([], utils.NewUUID, _INITCONF_ECID),
693 75cf411a Adeodato Simo
    name=constants.INITIAL_NODE_GROUP_NAME,
694 88b92fe3 Guido Trotter
    members=[master_node_config.name],
695 99ccf8b9 Renรฉ Nussbaumer
    diskparams={},
696 88b92fe3 Guido Trotter
    )
697 88b92fe3 Guido Trotter
  nodegroups = {
698 88b92fe3 Guido Trotter
    default_nodegroup.uuid: default_nodegroup,
699 88b92fe3 Guido Trotter
    }
700 d693c864 Iustin Pop
  now = time.time()
701 7b3a8fb5 Iustin Pop
  config_data = objects.ConfigData(version=version,
702 7b3a8fb5 Iustin Pop
                                   cluster=cluster_config,
703 88b92fe3 Guido Trotter
                                   nodegroups=nodegroups,
704 7b3a8fb5 Iustin Pop
                                   nodes=nodes,
705 7b3a8fb5 Iustin Pop
                                   instances={},
706 eaa4c57c Dimitris Aragiorgis
                                   networks={},
707 d693c864 Iustin Pop
                                   serial_no=1,
708 d693c864 Iustin Pop
                                   ctime=now, mtime=now)
709 a33848a5 Guido Trotter
  utils.WriteFile(cfg_file,
710 a33848a5 Guido Trotter
                  data=serializer.Dump(config_data.ToDict()),
711 a33848a5 Guido Trotter
                  mode=0600)
712 02f99608 Oleksiy Mishchenko
713 02f99608 Oleksiy Mishchenko
714 140aa4a8 Iustin Pop
def FinalizeClusterDestroy(master):
  """Run the last steps of a cluster destroy.

  This completes the destroy begun in cmdlib.LUDestroyOpcode by
  issuing, in order, the RPC calls that deactivate the master IP, stop
  the master role and make the node leave the cluster. A failure
  reported by any of these calls is only logged as a warning; the
  remaining calls are still made.

  @param master: the master node; it is used both as the target of the
      RPC calls and as the C{name} of the master network parameters

  """
  cfg = config.ConfigWriter()
  cluster = cfg.GetClusterInfo()
  modify_ssh_setup = cluster.modify_ssh_setup
  runner = rpc.BootstrapRunner()

  netparams = cfg.GetMasterNetworkParameters()
  netparams.name = master
  use_ext_script = cfg.GetUseExternalMipScript()

  # Step 1: take down the master IP
  ip_result = runner.call_node_deactivate_master_ip(netparams.name,
                                                    netparams,
                                                    use_ext_script)
  ip_error = ip_result.fail_msg
  if ip_error:
    logging.warning("Could not disable the master IP: %s", ip_error)

  # Step 2: stop the master role
  stop_result = runner.call_node_stop_master(master)
  stop_error = stop_result.fail_msg
  if stop_error:
    logging.warning("Could not disable the master role: %s", stop_error)

  # Step 3: make the node leave the cluster
  leave_result = runner.call_node_leave_cluster(master, modify_ssh_setup)
  leave_error = leave_result.fail_msg
  if leave_error:
    logging.warning("Could not shutdown the node daemon and cleanup"
                    " the node: %s", leave_error)
745 140aa4a8 Iustin Pop
746 140aa4a8 Iustin Pop
747 7b8ba235 Michael Hanselmann
def SetupNodeDaemon(opts, cluster_name, node):
  """Add a node to the cluster.

  This function must be called before the actual opcode, and will ssh
  to the remote node, copy the needed files, and start ganeti-noded,
  allowing the master to do the rest via normal rpc calls. It returns
  only after L{_WaitForNodeDaemon} has been called for the node.

  @param opts: options object; its C{debug}, C{verbose} and
      C{ssh_key_check} attributes are read
  @param cluster_name: the cluster name
  @param node: the name of the new node

  """
  # Collect everything the setup command needs to be given
  noded_cert = utils.ReadFile(pathutils.NODED_CERT_FILE)
  ssconf_values = ssconf.SimpleStore().ReadAll()

  setup_data = {
    constants.NDS_CLUSTER_NAME: cluster_name,
    constants.NDS_NODE_DAEMON_CERTIFICATE: noded_cert,
    constants.NDS_SSCONF: ssconf_values,
    constants.NDS_START_NODE_DAEMON: True,
    }

  debug = opts.debug
  verbose = opts.verbose
  # The same option value is deliberately passed for two consecutive
  # positional arguments of RunNodeSetupCmd
  key_check = opts.ssh_key_check

  RunNodeSetupCmd(cluster_name, node, pathutils.NODE_DAEMON_SETUP,
                  debug, verbose,
                  True, key_check, key_check, setup_data)

  _WaitForNodeDaemon(node)
771 5627f375 Michael Hanselmann
772 b1b6ea87 Iustin Pop
773 8e2524c3 Guido Trotter
def MasterFailover(no_voting=False):
774 b1b6ea87 Iustin Pop
  """Failover the master node.
775 b1b6ea87 Iustin Pop

776 b1b6ea87 Iustin Pop
  This checks that we are not already the master, and will cause the
777 b1b6ea87 Iustin Pop
  current master to cease being master, and the non-master to become
778 b1b6ea87 Iustin Pop
  new master.
779 b1b6ea87 Iustin Pop

780 8e2524c3 Guido Trotter
  @type no_voting: boolean
781 8e2524c3 Guido Trotter
  @param no_voting: force the operation without remote nodes agreement
782 8e2524c3 Guido Trotter
                      (dangerous)
783 8e2524c3 Guido Trotter

784 b1b6ea87 Iustin Pop
  """
785 8135a2db Iustin Pop
  sstore = ssconf.SimpleStore()
786 b1b6ea87 Iustin Pop
787 8135a2db Iustin Pop
  old_master, new_master = ssconf.GetMasterAndMyself(sstore)
788 8135a2db Iustin Pop
  node_list = sstore.GetNodeList()
789 8135a2db Iustin Pop
  mc_list = sstore.GetMasterCandidates()
790 b1b6ea87 Iustin Pop
791 b1b6ea87 Iustin Pop
  if old_master == new_master:
792 b1b6ea87 Iustin Pop
    raise errors.OpPrereqError("This commands must be run on the node"
793 b1b6ea87 Iustin Pop
                               " where you want the new master to be."
794 b1b6ea87 Iustin Pop
                               " %s is already the master" %
795 debac808 Iustin Pop
                               old_master, errors.ECODE_INVAL)
796 d5927e48 Iustin Pop
797 8135a2db Iustin Pop
  if new_master not in mc_list:
798 8135a2db Iustin Pop
    mc_no_master = [name for name in mc_list if name != old_master]
799 8135a2db Iustin Pop
    raise errors.OpPrereqError("This node is not among the nodes marked"
800 8135a2db Iustin Pop
                               " as master candidates. Only these nodes"
801 8135a2db Iustin Pop
                               " can become masters. Current list of"
802 8135a2db Iustin Pop
                               " master candidates is:\n"
803 3ccb3a64 Michael Hanselmann
                               "%s" % ("\n".join(mc_no_master)),
804 debac808 Iustin Pop
                               errors.ECODE_STATE)
805 8135a2db Iustin Pop
806 8e2524c3 Guido Trotter
  if not no_voting:
807 8e2524c3 Guido Trotter
    vote_list = GatherMasterVotes(node_list)
808 8e2524c3 Guido Trotter
809 8e2524c3 Guido Trotter
    if vote_list:
810 8e2524c3 Guido Trotter
      voted_master = vote_list[0][0]
811 8e2524c3 Guido Trotter
      if voted_master is None:
812 8e2524c3 Guido Trotter
        raise errors.OpPrereqError("Cluster is inconsistent, most nodes did"
813 debac808 Iustin Pop
                                   " not respond.", errors.ECODE_ENVIRON)
814 8e2524c3 Guido Trotter
      elif voted_master != old_master:
815 8e2524c3 Guido Trotter
        raise errors.OpPrereqError("I have a wrong configuration, I believe"
816 8e2524c3 Guido Trotter
                                   " the master is %s but the other nodes"
817 8e2524c3 Guido Trotter
                                   " voted %s. Please resync the configuration"
818 8e2524c3 Guido Trotter
                                   " of this node." %
819 debac808 Iustin Pop
                                   (old_master, voted_master),
820 debac808 Iustin Pop
                                   errors.ECODE_STATE)
821 b1b6ea87 Iustin Pop
  # end checks
822 b1b6ea87 Iustin Pop
823 b1b6ea87 Iustin Pop
  rcode = 0
824 b1b6ea87 Iustin Pop
825 d5927e48 Iustin Pop
  logging.info("Setting master to %s, old master: %s", new_master, old_master)
826 b1b6ea87 Iustin Pop
827 21004460 Iustin Pop
  try:
828 21004460 Iustin Pop
    # instantiate a real config writer, as we now know we have the
829 21004460 Iustin Pop
    # configuration data
830 eb180fe2 Iustin Pop
    cfg = config.ConfigWriter(accept_foreign=True)
831 21004460 Iustin Pop
832 21004460 Iustin Pop
    cluster_info = cfg.GetClusterInfo()
833 21004460 Iustin Pop
    cluster_info.master_node = new_master
834 21004460 Iustin Pop
    # this will also regenerate the ssconf files, since we updated the
835 21004460 Iustin Pop
    # cluster info
836 21004460 Iustin Pop
    cfg.Update(cluster_info, logging.error)
837 21004460 Iustin Pop
  except errors.ConfigurationError, err:
838 21004460 Iustin Pop
    logging.error("Error while trying to set the new master: %s",
839 21004460 Iustin Pop
                  str(err))
840 21004460 Iustin Pop
    return 1
841 21004460 Iustin Pop
842 21004460 Iustin Pop
  # if cfg.Update worked, then it means the old master daemon won't be
843 21004460 Iustin Pop
  # able now to write its own config file (we rely on locking in both
844 21004460 Iustin Pop
  # backend.UploadFile() and ConfigWriter._Write(); hence the next
845 21004460 Iustin Pop
  # step is to kill the old master
846 21004460 Iustin Pop
847 21004460 Iustin Pop
  logging.info("Stopping the master daemon on node %s", old_master)
848 21004460 Iustin Pop
849 7c74bbe0 Andrea Spadaccini
  runner = rpc.BootstrapRunner()
850 f9d20654 Andrea Spadaccini
  master_params = cfg.GetMasterNetworkParameters()
851 c79198a0 Andrea Spadaccini
  master_params.name = old_master
852 57c7bc57 Andrea Spadaccini
  ems = cfg.GetUseExternalMipScript()
853 c79198a0 Andrea Spadaccini
  result = runner.call_node_deactivate_master_ip(master_params.name,
854 57c7bc57 Andrea Spadaccini
                                                 master_params, ems)
855 c79198a0 Andrea Spadaccini
856 7c74bbe0 Andrea Spadaccini
  msg = result.fail_msg
857 7c74bbe0 Andrea Spadaccini
  if msg:
858 7c74bbe0 Andrea Spadaccini
    logging.warning("Could not disable the master IP: %s", msg)
859 7c74bbe0 Andrea Spadaccini
860 7c74bbe0 Andrea Spadaccini
  result = runner.call_node_stop_master(old_master)
861 3cebe102 Michael Hanselmann
  msg = result.fail_msg
862 6c00d19a Iustin Pop
  if msg:
863 d5927e48 Iustin Pop
    logging.error("Could not disable the master role on the old master"
864 5ae4945a Iustin Pop
                  " %s, please disable manually: %s", old_master, msg)
865 b1b6ea87 Iustin Pop
866 21004460 Iustin Pop
  logging.info("Checking master IP non-reachability...")
867 21004460 Iustin Pop
868 425f0f54 Iustin Pop
  master_ip = sstore.GetMasterIP()
869 425f0f54 Iustin Pop
  total_timeout = 30
870 e687ec01 Michael Hanselmann
871 d23ef431 Michael Hanselmann
  # Here we have a phase where no master should be running
872 425f0f54 Iustin Pop
  def _check_ip():
873 a744b676 Manuel Franceschini
    if netutils.TcpPing(master_ip, constants.DEFAULT_NODED_PORT):
874 425f0f54 Iustin Pop
      raise utils.RetryAgain()
875 425f0f54 Iustin Pop
876 425f0f54 Iustin Pop
  try:
877 425f0f54 Iustin Pop
    utils.Retry(_check_ip, (1, 1.5, 5), total_timeout)
878 425f0f54 Iustin Pop
  except utils.RetryTimeout:
879 425f0f54 Iustin Pop
    logging.warning("The master IP is still reachable after %s seconds,"
880 425f0f54 Iustin Pop
                    " continuing but activating the master on the current"
881 425f0f54 Iustin Pop
                    " node will probably fail", total_timeout)
882 b1b6ea87 Iustin Pop
883 ff699aa9 Michael Hanselmann
  if jstore.CheckDrainFlag():
884 ff699aa9 Michael Hanselmann
    logging.info("Undraining job queue")
885 ff699aa9 Michael Hanselmann
    jstore.SetDrainFlag(False)
886 ff699aa9 Michael Hanselmann
887 21004460 Iustin Pop
  logging.info("Starting the master daemons on the new master")
888 d5927e48 Iustin Pop
889 db04ce5d Michael Hanselmann
  result = rpc.BootstrapRunner().call_node_start_master_daemons(new_master,
890 db04ce5d Michael Hanselmann
                                                                no_voting)
891 3cebe102 Michael Hanselmann
  msg = result.fail_msg
892 b726aff0 Iustin Pop
  if msg:
893 d5927e48 Iustin Pop
    logging.error("Could not start the master role on the new master"
894 b726aff0 Iustin Pop
                  " %s, please check: %s", new_master, msg)
895 b1b6ea87 Iustin Pop
    rcode = 1
896 b1b6ea87 Iustin Pop
897 21004460 Iustin Pop
  logging.info("Master failed over from %s to %s", old_master, new_master)
898 b1b6ea87 Iustin Pop
  return rcode
899 d7cdb55d Iustin Pop
900 d7cdb55d Iustin Pop
901 8eb148ae Iustin Pop
def GetMaster():
  """Returns the current master node.

  gnt-cluster needs this information; rather than having it import
  ssconf directly, the lookup is abstracted here in bootstrap, which
  already uses ssconf in other functions.

  @return: the first element of the pair returned by
      L{ssconf.GetMasterAndMyself}

  """
  master, _ = ssconf.GetMasterAndMyself(ssconf.SimpleStore())
  return master
915 8eb148ae Iustin Pop
916 8eb148ae Iustin Pop
917 d7cdb55d Iustin Pop
def GatherMasterVotes(node_list):
  """Check the agreement on who is the master.

  This function will return a list of (node, number of votes), ordered
  by the number of votes (highest first). Errors will be denoted by the
  key 'None'.

  Note that the sum of votes is the number of nodes this machine
  knows, whereas the number of entries in the list could be different
  (if some nodes vote for another master).

  We remove ourselves from the list since we know that (bugs aside)
  since we use the same source for configuration information for both
  backend and bootstrap, we'll always vote for ourselves.

  @type node_list: list
  @param node_list: the list of nodes to query for master info; the current
      node will be removed if it is in the list (the list is modified
      in place)
  @rtype: list
  @return: list of (node, votes), sorted by decreasing number of votes;
      among entries with the same number of votes, node names come in
      reverse order and the error entry (C{None}) comes last

  """
  myself = netutils.Hostname.GetSysName()
  try:
    node_list.remove(myself)
  except ValueError:
    # we were not in the list, nothing to remove
    pass
  if not node_list:
    # no nodes left (possibly after removing myself)
    return []
  results = rpc.BootstrapRunner().call_master_info(node_list)
  if not isinstance(results, dict):
    # this should not happen (unless internal error in rpc)
    logging.critical("Can't complete rpc call, aborting master startup")
    return [(None, len(node_list))]

  votes = {}
  for (node, nres) in results.items():
    data = nres.payload
    msg = nres.fail_msg
    if msg:
      logging.warning("Error contacting node %s: %s", node, msg)
      voted_for = None
    # for now we accept both length 3, 4 and 5 (data[3] is primary ip version
    # and data[4] is the master netmask)
    elif not isinstance(data, (tuple, list)) or len(data) < 3:
      logging.warning("Invalid data received from node %s: %s", node, data)
      voted_for = None
    else:
      voted_for = data[2]
    # failures are accumulated under the None key
    votes[voted_for] = votes.get(voted_for, 0) + 1

  def _VoteSortKey(item):
    """Build a sort key that never compares None with a node name.

    """
    (name, count) = item
    # "name is not None" is False for the error entry, so with
    # reverse=True it ends up after real nodes having the same count;
    # the placeholder keeps None out of the name comparison, which
    # would raise TypeError on Python 3
    if name is None:
      return (count, False, "")
    return (count, True, name)

  # sort first on number of votes then on name, since we want None
  # sorted later if we have the half of the nodes not responding, and
  # half voting all for the same master
  return sorted(votes.items(), key=_VoteSortKey, reverse=True)