Statistics
| Branch: | Tag: | Revision:

root / lib / bootstrap.py @ 74676af4

History | View | Annotate | Download (37.4 kB)

1 a0c9f010 Michael Hanselmann
#
2 a0c9f010 Michael Hanselmann
#
3 a0c9f010 Michael Hanselmann
4 57dc299a Iustin Pop
# Copyright (C) 2006, 2007, 2008, 2010, 2011, 2012 Google Inc.
5 a0c9f010 Michael Hanselmann
#
6 a0c9f010 Michael Hanselmann
# This program is free software; you can redistribute it and/or modify
7 a0c9f010 Michael Hanselmann
# it under the terms of the GNU General Public License as published by
8 a0c9f010 Michael Hanselmann
# the Free Software Foundation; either version 2 of the License, or
9 a0c9f010 Michael Hanselmann
# (at your option) any later version.
10 a0c9f010 Michael Hanselmann
#
11 a0c9f010 Michael Hanselmann
# This program is distributed in the hope that it will be useful, but
12 a0c9f010 Michael Hanselmann
# WITHOUT ANY WARRANTY; without even the implied warranty of
13 a0c9f010 Michael Hanselmann
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
14 a0c9f010 Michael Hanselmann
# General Public License for more details.
15 a0c9f010 Michael Hanselmann
#
16 a0c9f010 Michael Hanselmann
# You should have received a copy of the GNU General Public License
17 a0c9f010 Michael Hanselmann
# along with this program; if not, write to the Free Software
18 a0c9f010 Michael Hanselmann
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
19 a0c9f010 Michael Hanselmann
# 02110-1301, USA.
20 a0c9f010 Michael Hanselmann
21 a0c9f010 Michael Hanselmann
22 a0c9f010 Michael Hanselmann
"""Functions to bootstrap a new cluster.
23 a0c9f010 Michael Hanselmann

24 a0c9f010 Michael Hanselmann
"""
25 a0c9f010 Michael Hanselmann
26 a0c9f010 Michael Hanselmann
import os
27 a0c9f010 Michael Hanselmann
import os.path
28 a0c9f010 Michael Hanselmann
import re
29 b1b6ea87 Iustin Pop
import logging
30 d693c864 Iustin Pop
import time
31 a698cdbb Michael Hanselmann
import tempfile
32 a0c9f010 Michael Hanselmann
33 a0c9f010 Michael Hanselmann
from ganeti import rpc
34 a0c9f010 Michael Hanselmann
from ganeti import ssh
35 a0c9f010 Michael Hanselmann
from ganeti import utils
36 a0c9f010 Michael Hanselmann
from ganeti import errors
37 a0c9f010 Michael Hanselmann
from ganeti import config
38 a0c9f010 Michael Hanselmann
from ganeti import constants
39 b9eeeb02 Michael Hanselmann
from ganeti import objects
40 a0c9f010 Michael Hanselmann
from ganeti import ssconf
41 a33848a5 Guido Trotter
from ganeti import serializer
42 a5728081 Guido Trotter
from ganeti import hypervisor
43 cde49218 Helga Velroyen
from ganeti.storage import drbd
44 a744b676 Manuel Franceschini
from ganeti import netutils
45 3b6b6129 Michael Hanselmann
from ganeti import luxi
46 ff699aa9 Michael Hanselmann
from ganeti import jstore
47 7ede9c6a Michael Hanselmann
from ganeti import pathutils
48 3b6b6129 Michael Hanselmann
49 a0c9f010 Michael Hanselmann
50 88b92fe3 Guido Trotter
# ec_id for InitConfig's temporary reservation manager
51 88b92fe3 Guido Trotter
_INITCONF_ECID = "initconfig-ecid"
52 88b92fe3 Guido Trotter
53 3b6b6129 Michael Hanselmann
#: Number of seconds within which a daemon must become responsive
54 3b6b6129 Michael Hanselmann
_DAEMON_READY_TIMEOUT = 10.0
55 3b6b6129 Michael Hanselmann
56 e38220e4 Michael Hanselmann
57 531baf8e Iustin Pop
def _InitSSHSetup():
  """Set up the SSH key material used by the cluster.

  The key files are looked up for C{constants.SSH_LOGIN_USER}. An existing
  private or public key file is backed up and removed, a new DSA keypair
  is created with C{ssh-keygen} (empty passphrase) and the resulting
  public key is added to the authorized keys file.

  @raise errors.OpExecError: if C{ssh-keygen} fails

  """
  (priv_key, pub_key, auth_keys) = \
    ssh.GetUserFiles(constants.SSH_LOGIN_USER)

  # Keep a backup of any old key file before getting rid of it
  for key_file in (priv_key, pub_key):
    if os.path.exists(key_file):
      utils.CreateBackup(key_file)
    utils.RemoveFile(key_file)

  keygen_cmd = ["ssh-keygen", "-t", "dsa", "-f", priv_key, "-q", "-N", ""]
  keygen = utils.RunCmd(keygen_cmd)
  if keygen.failed:
    raise errors.OpExecError("Could not generate ssh keypair, error %s" %
                             keygen.output)

  new_pub_key = utils.ReadFile(pub_key)
  utils.AddAuthorizedKey(auth_keys, new_pub_key)
79 a0c9f010 Michael Hanselmann
80 a0c9f010 Michael Hanselmann
81 c008906b Michael Hanselmann
def GenerateHmacKey(file_name):
82 c008906b Michael Hanselmann
  """Writes a new HMAC key.
83 c008906b Michael Hanselmann

84 c008906b Michael Hanselmann
  @type file_name: str
85 c008906b Michael Hanselmann
  @param file_name: Path to output file
86 c008906b Michael Hanselmann

87 c008906b Michael Hanselmann
  """
88 43575108 Michael Hanselmann
  utils.WriteFile(file_name, data="%s\n" % utils.GenerateSecret(), mode=0400,
89 43575108 Michael Hanselmann
                  backup=True)
90 43575108 Michael Hanselmann
91 43575108 Michael Hanselmann
92 b6267745 Andrea Spadaccini
def GenerateClusterCrypto(new_cluster_cert, new_rapi_cert, new_spice_cert,
93 b6267745 Andrea Spadaccini
                          new_confd_hmac_key, new_cds,
94 b6267745 Andrea Spadaccini
                          rapi_cert_pem=None, spice_cert_pem=None,
95 b6267745 Andrea Spadaccini
                          spice_cacert_pem=None, cds=None,
96 7ede9c6a Michael Hanselmann
                          nodecert_file=pathutils.NODED_CERT_FILE,
97 7ede9c6a Michael Hanselmann
                          rapicert_file=pathutils.RAPI_CERT_FILE,
98 7ede9c6a Michael Hanselmann
                          spicecert_file=pathutils.SPICE_CERT_FILE,
99 7ede9c6a Michael Hanselmann
                          spicecacert_file=pathutils.SPICE_CACERT_FILE,
100 7ede9c6a Michael Hanselmann
                          hmackey_file=pathutils.CONFD_HMAC_KEY,
101 7ede9c6a Michael Hanselmann
                          cds_file=pathutils.CLUSTER_DOMAIN_SECRET_FILE):
102 43575108 Michael Hanselmann
  """Updates the cluster certificates, keys and secrets.
103 43575108 Michael Hanselmann

104 43575108 Michael Hanselmann
  @type new_cluster_cert: bool
105 43575108 Michael Hanselmann
  @param new_cluster_cert: Whether to generate a new cluster certificate
106 43575108 Michael Hanselmann
  @type new_rapi_cert: bool
107 43575108 Michael Hanselmann
  @param new_rapi_cert: Whether to generate a new RAPI certificate
108 b6267745 Andrea Spadaccini
  @type new_spice_cert: bool
109 b6267745 Andrea Spadaccini
  @param new_spice_cert: Whether to generate a new SPICE certificate
110 6b7d5878 Michael Hanselmann
  @type new_confd_hmac_key: bool
111 6b7d5878 Michael Hanselmann
  @param new_confd_hmac_key: Whether to generate a new HMAC key
112 3db3eb2a Michael Hanselmann
  @type new_cds: bool
113 3db3eb2a Michael Hanselmann
  @param new_cds: Whether to generate a new cluster domain secret
114 43575108 Michael Hanselmann
  @type rapi_cert_pem: string
115 43575108 Michael Hanselmann
  @param rapi_cert_pem: New RAPI certificate in PEM format
116 b6267745 Andrea Spadaccini
  @type spice_cert_pem: string
117 b6267745 Andrea Spadaccini
  @param spice_cert_pem: New SPICE certificate in PEM format
118 b6267745 Andrea Spadaccini
  @type spice_cacert_pem: string
119 b6267745 Andrea Spadaccini
  @param spice_cacert_pem: Certificate of the CA that signed the SPICE
120 b6267745 Andrea Spadaccini
                           certificate, in PEM format
121 3db3eb2a Michael Hanselmann
  @type cds: string
122 3db3eb2a Michael Hanselmann
  @param cds: New cluster domain secret
123 aeefe835 Iustin Pop
  @type nodecert_file: string
124 aeefe835 Iustin Pop
  @param nodecert_file: optional override of the node cert file path
125 aeefe835 Iustin Pop
  @type rapicert_file: string
126 aeefe835 Iustin Pop
  @param rapicert_file: optional override of the rapi cert file path
127 b6267745 Andrea Spadaccini
  @type spicecert_file: string
128 b6267745 Andrea Spadaccini
  @param spicecert_file: optional override of the spice cert file path
129 b6267745 Andrea Spadaccini
  @type spicecacert_file: string
130 b6267745 Andrea Spadaccini
  @param spicecacert_file: optional override of the spice CA cert file path
131 aeefe835 Iustin Pop
  @type hmackey_file: string
132 aeefe835 Iustin Pop
  @param hmackey_file: optional override of the hmac key file path
133 43575108 Michael Hanselmann

134 43575108 Michael Hanselmann
  """
135 168c1de2 Michael Hanselmann
  # noded SSL certificate
136 aeefe835 Iustin Pop
  cluster_cert_exists = os.path.exists(nodecert_file)
137 43575108 Michael Hanselmann
  if new_cluster_cert or not cluster_cert_exists:
138 43575108 Michael Hanselmann
    if cluster_cert_exists:
139 aeefe835 Iustin Pop
      utils.CreateBackup(nodecert_file)
140 43575108 Michael Hanselmann
141 aeefe835 Iustin Pop
    logging.debug("Generating new cluster certificate at %s", nodecert_file)
142 af2ae1c0 Iustin Pop
    utils.GenerateSelfSignedSslCert(nodecert_file)
143 43575108 Michael Hanselmann
144 6b7d5878 Michael Hanselmann
  # confd HMAC key
145 aeefe835 Iustin Pop
  if new_confd_hmac_key or not os.path.exists(hmackey_file):
146 aeefe835 Iustin Pop
    logging.debug("Writing new confd HMAC key to %s", hmackey_file)
147 aeefe835 Iustin Pop
    GenerateHmacKey(hmackey_file)
148 43575108 Michael Hanselmann
149 43575108 Michael Hanselmann
  # RAPI
150 aeefe835 Iustin Pop
  rapi_cert_exists = os.path.exists(rapicert_file)
151 43575108 Michael Hanselmann
152 43575108 Michael Hanselmann
  if rapi_cert_pem:
153 43575108 Michael Hanselmann
    # Assume rapi_pem contains a valid PEM-formatted certificate and key
154 aeefe835 Iustin Pop
    logging.debug("Writing RAPI certificate at %s", rapicert_file)
155 aeefe835 Iustin Pop
    utils.WriteFile(rapicert_file, data=rapi_cert_pem, backup=True)
156 43575108 Michael Hanselmann
157 43575108 Michael Hanselmann
  elif new_rapi_cert or not rapi_cert_exists:
158 43575108 Michael Hanselmann
    if rapi_cert_exists:
159 aeefe835 Iustin Pop
      utils.CreateBackup(rapicert_file)
160 43575108 Michael Hanselmann
161 aeefe835 Iustin Pop
    logging.debug("Generating new RAPI certificate at %s", rapicert_file)
162 af2ae1c0 Iustin Pop
    utils.GenerateSelfSignedSslCert(rapicert_file)
163 c008906b Michael Hanselmann
164 b6267745 Andrea Spadaccini
  # SPICE
165 b6267745 Andrea Spadaccini
  spice_cert_exists = os.path.exists(spicecert_file)
166 b6267745 Andrea Spadaccini
  spice_cacert_exists = os.path.exists(spicecacert_file)
167 b6267745 Andrea Spadaccini
  if spice_cert_pem:
168 b6267745 Andrea Spadaccini
    # spice_cert_pem implies also spice_cacert_pem
169 b6267745 Andrea Spadaccini
    logging.debug("Writing SPICE certificate at %s", spicecert_file)
170 b6267745 Andrea Spadaccini
    utils.WriteFile(spicecert_file, data=spice_cert_pem, backup=True)
171 b6267745 Andrea Spadaccini
    logging.debug("Writing SPICE CA certificate at %s", spicecacert_file)
172 b6267745 Andrea Spadaccini
    utils.WriteFile(spicecacert_file, data=spice_cacert_pem, backup=True)
173 b6267745 Andrea Spadaccini
  elif new_spice_cert or not spice_cert_exists:
174 b6267745 Andrea Spadaccini
    if spice_cert_exists:
175 b6267745 Andrea Spadaccini
      utils.CreateBackup(spicecert_file)
176 b6267745 Andrea Spadaccini
    if spice_cacert_exists:
177 b6267745 Andrea Spadaccini
      utils.CreateBackup(spicecacert_file)
178 b6267745 Andrea Spadaccini
179 b6267745 Andrea Spadaccini
    logging.debug("Generating new self-signed SPICE certificate at %s",
180 b6267745 Andrea Spadaccini
                  spicecert_file)
181 b6267745 Andrea Spadaccini
    (_, cert_pem) = utils.GenerateSelfSignedSslCert(spicecert_file)
182 b6267745 Andrea Spadaccini
183 b6267745 Andrea Spadaccini
    # Self-signed certificate -> the public certificate is also the CA public
184 b6267745 Andrea Spadaccini
    # certificate
185 b6267745 Andrea Spadaccini
    logging.debug("Writing the public certificate to %s",
186 b6267745 Andrea Spadaccini
                  spicecert_file)
187 b6267745 Andrea Spadaccini
    utils.io.WriteFile(spicecacert_file, mode=0400, data=cert_pem)
188 b6267745 Andrea Spadaccini
189 3db3eb2a Michael Hanselmann
  # Cluster domain secret
190 3db3eb2a Michael Hanselmann
  if cds:
191 fc0726b9 Michael Hanselmann
    logging.debug("Writing cluster domain secret to %s", cds_file)
192 fc0726b9 Michael Hanselmann
    utils.WriteFile(cds_file, data=cds, backup=True)
193 fc0726b9 Michael Hanselmann
194 fc0726b9 Michael Hanselmann
  elif new_cds or not os.path.exists(cds_file):
195 fc0726b9 Michael Hanselmann
    logging.debug("Generating new cluster domain secret at %s", cds_file)
196 fc0726b9 Michael Hanselmann
    GenerateHmacKey(cds_file)
197 3db3eb2a Michael Hanselmann
198 c008906b Michael Hanselmann
199 8f215968 Michael Hanselmann
def _InitGanetiServerSetup(master_name):
  """Prepare and start the initial node daemon.

  Calls L{GenerateClusterCrypto} asking for a new cluster certificate
  only, starts the node daemon through the daemon utility and then waits
  for the daemon on the master node to answer.

  @type master_name: str
  @param master_name: Name of the master node
  @raise errors.OpExecError: if the node daemon could not be started

  """
  # Generate cluster secrets
  GenerateClusterCrypto(new_cluster_cert=True,
                        new_rapi_cert=False,
                        new_spice_cert=False,
                        new_confd_hmac_key=False,
                        new_cds=False)

  start_cmd = [pathutils.DAEMON_UTIL, "start", constants.NODED]
  started = utils.RunCmd(start_cmd)
  if started.failed:
    raise errors.OpExecError("Could not start the node daemon, command %s"
                             " had exitcode %s and error %s" %
                             (started.cmd, started.exit_code, started.output))

  _WaitForNodeDaemon(master_name)
219 5627f375 Michael Hanselmann
220 5627f375 Michael Hanselmann
221 5627f375 Michael Hanselmann
def _WaitForNodeDaemon(node_name):
  """Wait until the node daemon on a node answers a version query.

  The query is repeated through L{utils.Retry} until it succeeds or
  L{_DAEMON_READY_TIMEOUT} is exceeded.

  @param node_name: name of the node whose daemon is queried
  @raise errors.OpExecError: if the daemon did not answer in time

  """
  def _ProbeNodeDaemon():
    # Pylint bug <http://www.logilab.org/ticket/35642>
    # pylint: disable=E1101
    answers = rpc.BootstrapRunner().call_version([node_name])
    if answers[node_name].fail_msg:
      # Not responsive yet, have utils.Retry call us again
      raise utils.RetryAgain()

  try:
    utils.Retry(_ProbeNodeDaemon, 1.0, _DAEMON_READY_TIMEOUT)
  except utils.RetryTimeout:
    raise errors.OpExecError("Node daemon on %s didn't answer queries within"
                             " %s seconds" % (node_name, _DAEMON_READY_TIMEOUT))
237 3b6b6129 Michael Hanselmann
238 3b6b6129 Michael Hanselmann
239 3b6b6129 Michael Hanselmann
def _WaitForMasterDaemon():
  """Wait until the master daemon answers a configuration query.

  A LUXI client is created and asked for the cluster name; this is
  repeated through L{utils.Retry} until it succeeds or
  L{_DAEMON_READY_TIMEOUT} is exceeded.

  @raise errors.OpExecError: if the daemon did not answer in time

  """
  def _ProbeMasterDaemon():
    try:
      client = luxi.Client()
      (name, ) = client.QueryConfigValues(["cluster_name"])
    except Exception:
      # Any failure here is treated as "not ready yet"
      raise utils.RetryAgain()
    else:
      logging.debug("Received cluster name %s from master", name)

  try:
    utils.Retry(_ProbeMasterDaemon, 1.0, _DAEMON_READY_TIMEOUT)
  except utils.RetryTimeout:
    raise errors.OpExecError("Master daemon didn't answer queries within"
                             " %s seconds" % _DAEMON_READY_TIMEOUT)
257 5627f375 Michael Hanselmann
258 a0c9f010 Michael Hanselmann
259 a5da38fa Michael Hanselmann
def _WaitForSshDaemon(hostname, port, family):
  """Wait until the SSH daemon on a host accepts TCP connections.

  The host name is resolved once for the given address family; the
  resulting IP address is then pinged on C{port} through L{utils.Retry}
  until it answers or L{_DAEMON_READY_TIMEOUT} is exceeded.

  @param hostname: name of the host running the SSH daemon
  @param port: TCP port of the SSH daemon
  @param family: address family passed to L{netutils.GetHostname}
  @raise errors.OpExecError: if the daemon did not become responsive in time

  """
  hostip = netutils.GetHostname(name=hostname, family=family).ip

  def _ProbeSshDaemon():
    if not netutils.TcpPing(hostip, port, timeout=1.0, live_port_needed=True):
      raise utils.RetryAgain()

    logging.debug("SSH daemon on %s:%s (IP address %s) has become"
                  " responsive", hostname, port, hostip)

  try:
    utils.Retry(_ProbeSshDaemon, 1.0, _DAEMON_READY_TIMEOUT)
  except utils.RetryTimeout:
    raise errors.OpExecError("SSH daemon on %s:%s (IP address %s) didn't"
                             " become responsive within %s seconds" %
                             (hostname, port, hostip, _DAEMON_READY_TIMEOUT))
278 a5da38fa Michael Hanselmann
279 a5da38fa Michael Hanselmann
280 a698cdbb Michael Hanselmann
def RunNodeSetupCmd(cluster_name, node, basecmd, debug, verbose,
                    use_cluster_key, ask_key, strict_host_check, data):
  """Runs a setup command on a remote machine via SSH.

  The command is run interactively with the JSON-serialized C{data} as
  its standard input. After a successful run the function waits for the
  SSH daemon on the node to respond.

  @type cluster_name: string
  @param cluster_name: Cluster name
  @type node: string
  @param node: Node name
  @type basecmd: string
  @param basecmd: Base command (path on the remote machine)
  @type debug: bool
  @param debug: Enable debug output
  @type verbose: bool
  @param verbose: Enable verbose output
  @type use_cluster_key: bool
  @param use_cluster_key: See L{ssh.SshRunner.BuildCmd}
  @type ask_key: bool
  @param ask_key: See L{ssh.SshRunner.BuildCmd}
  @type strict_host_check: bool
  @param strict_host_check: See L{ssh.SshRunner.BuildCmd}
  @param data: JSON-serializable input data for script (passed to stdin)
  @raise errors.OpExecError: if the remote command fails

  """
  remote_cmd = [basecmd]

  # Pass --debug/--verbose to the external script if set on our invocation
  for (enabled, flag) in [(debug, "--debug"), (verbose, "--verbose")]:
    if enabled:
      remote_cmd.append(flag)

  family = ssconf.SimpleStore().GetPrimaryIPFamily()
  use_ipv6 = (family == netutils.IP6Address.family)
  runner = ssh.SshRunner(cluster_name, ipv6=use_ipv6)
  ssh_cmd = runner.BuildCmd(node, constants.SSH_LOGIN_USER,
                            utils.ShellQuoteArgs(remote_cmd),
                            batch=False, ask_key=ask_key, quiet=False,
                            strict_host_check=strict_host_check,
                            use_cluster_key=use_cluster_key)

  # The input data is handed to the command through a temporary file
  # which is rewound before use
  stdin_fh = tempfile.TemporaryFile()
  try:
    stdin_fh.write(serializer.DumpJson(data))
    stdin_fh.seek(0)

    result = utils.RunCmd(ssh_cmd, interactive=True, input_fd=stdin_fh)
  finally:
    stdin_fh.close()

  if result.failed:
    raise errors.OpExecError("Command '%s' failed: %s" %
                             (result.cmd, result.fail_reason))

  ssh_port = netutils.GetDaemonPort(constants.SSH)
  _WaitForSshDaemon(node, ssh_port, family)
335 a5da38fa Michael Hanselmann
336 a698cdbb Michael Hanselmann
337 5030cff3 Helga Velroyen
def _PrepareFileStorage(enabled_disk_templates, file_storage_dir):
  """Initializes the file storage directory if file storage is enabled.

  @param enabled_disk_templates: the enabled disk templates, as passed to
      L{utils.storage.IsFileStorageEnabled}
  @param file_storage_dir: the user-supplied file storage directory
  @return: the result of L{_InitFileStorageDir} if file storage is
      enabled, otherwise the empty string

  """
  if not utils.storage.IsFileStorageEnabled(enabled_disk_templates):
    return ""

  return _InitFileStorageDir(file_storage_dir)
346 5030cff3 Helga Velroyen
347 5030cff3 Helga Velroyen
348 5030cff3 Helga Velroyen
def _InitFileStorageDir(file_storage_dir):
349 0e3baaf3 Iustin Pop
  """Initialize if needed the file storage.
350 0e3baaf3 Iustin Pop

351 0e3baaf3 Iustin Pop
  @param file_storage_dir: the user-supplied value
352 0e3baaf3 Iustin Pop
  @return: either empty string (if file storage was disabled at build
353 0e3baaf3 Iustin Pop
      time) or the normalized path to the storage directory
354 0e3baaf3 Iustin Pop

355 0e3baaf3 Iustin Pop
  """
356 0e3baaf3 Iustin Pop
  file_storage_dir = os.path.normpath(file_storage_dir)
357 0e3baaf3 Iustin Pop
358 0e3baaf3 Iustin Pop
  if not os.path.isabs(file_storage_dir):
359 0376655e Guido Trotter
    raise errors.OpPrereqError("File storage directory '%s' is not an absolute"
360 0376655e Guido Trotter
                               " path" % file_storage_dir, errors.ECODE_INVAL)
361 0e3baaf3 Iustin Pop
362 0e3baaf3 Iustin Pop
  if not os.path.exists(file_storage_dir):
363 0e3baaf3 Iustin Pop
    try:
364 0e3baaf3 Iustin Pop
      os.makedirs(file_storage_dir, 0750)
365 0e3baaf3 Iustin Pop
    except OSError, err:
366 0e3baaf3 Iustin Pop
      raise errors.OpPrereqError("Cannot create file storage directory"
367 0e3baaf3 Iustin Pop
                                 " '%s': %s" % (file_storage_dir, err),
368 0e3baaf3 Iustin Pop
                                 errors.ECODE_ENVIRON)
369 0e3baaf3 Iustin Pop
370 0e3baaf3 Iustin Pop
  if not os.path.isdir(file_storage_dir):
371 0e3baaf3 Iustin Pop
    raise errors.OpPrereqError("The file storage directory '%s' is not"
372 0e3baaf3 Iustin Pop
                               " a directory." % file_storage_dir,
373 0e3baaf3 Iustin Pop
                               errors.ECODE_ENVIRON)
374 5030cff3 Helga Velroyen
375 5030cff3 Helga Velroyen
  # FIXME: check here if the file_storage_dir is in the set of allowed dirs
376 0e3baaf3 Iustin Pop
  return file_storage_dir
377 0e3baaf3 Iustin Pop
378 0e3baaf3 Iustin Pop
379 5030cff3 Helga Velroyen
def _InitCheckEnabledDiskTemplates(enabled_disk_templates):
  """Verifies the list of enabled disk templates.

  The list must not be empty and may only contain members of
  C{constants.DISK_TEMPLATES}.

  @param enabled_disk_templates: the disk templates to check
  @raise errors.OpPrereqError: if the list is empty or contains entries
      that are not in C{constants.DISK_TEMPLATES}

  """
  if not enabled_disk_templates:
    raise errors.OpPrereqError("Enabled disk templates list must contain at"
                               " least one member", errors.ECODE_INVAL)

  unknown_templates = (set(enabled_disk_templates) -
                       constants.DISK_TEMPLATES)
  if unknown_templates:
    raise errors.OpPrereqError("Enabled disk templates list contains invalid"
                               " entries: %s" % unknown_templates,
                               errors.ECODE_INVAL)
392 5030cff3 Helga Velroyen
393 5030cff3 Helga Velroyen
394 18bb6d28 Agata Murawska
def InitCluster(cluster_name, mac_prefix, # pylint: disable=R0913, R0914
395 5a8648eb Andrea Spadaccini
                master_netmask, master_netdev, file_storage_dir,
396 5a8648eb Andrea Spadaccini
                shared_file_storage_dir, candidate_pool_size, secondary_ip=None,
397 5a8648eb Andrea Spadaccini
                vg_name=None, beparams=None, nicparams=None, ndparams=None,
398 bc5d0215 Andrea Spadaccini
                hvparams=None, diskparams=None, enabled_hypervisors=None,
399 bc5d0215 Andrea Spadaccini
                modify_etc_hosts=True, modify_ssh_setup=True,
400 bc5d0215 Andrea Spadaccini
                maintain_node_health=False, drbd_helper=None, uid_pool=None,
401 18bb6d28 Agata Murawska
                default_iallocator=None, primary_ip_version=None, ipolicy=None,
402 c4929a8b Renรฉ Nussbaumer
                prealloc_wipe_disks=False, use_external_mip_script=False,
403 3bde79ee Helga Velroyen
                hv_state=None, disk_state=None, enabled_disk_templates=None):
404 a0c9f010 Michael Hanselmann
  """Initialise the cluster.
405 a0c9f010 Michael Hanselmann

406 ce735215 Guido Trotter
  @type candidate_pool_size: int
407 ce735215 Guido Trotter
  @param candidate_pool_size: master candidate pool size
408 3bde79ee Helga Velroyen
  @type enabled_disk_templates: list of string
409 3bde79ee Helga Velroyen
  @param enabled_disk_templates: list of disk_templates to be used in this
410 c074a9e8 Helga Velroyen
    cluster
411 ce735215 Guido Trotter

412 a0c9f010 Michael Hanselmann
  """
413 ce735215 Guido Trotter
  # TODO: complete the docstring
414 a0c9f010 Michael Hanselmann
  if config.ConfigWriter.IsCluster():
415 debac808 Iustin Pop
    raise errors.OpPrereqError("Cluster is already initialised",
416 debac808 Iustin Pop
                               errors.ECODE_STATE)
417 a0c9f010 Michael Hanselmann
418 b119bccb Guido Trotter
  if not enabled_hypervisors:
419 b119bccb Guido Trotter
    raise errors.OpPrereqError("Enabled hypervisors list must contain at"
420 debac808 Iustin Pop
                               " least one member", errors.ECODE_INVAL)
421 b119bccb Guido Trotter
  invalid_hvs = set(enabled_hypervisors) - constants.HYPER_TYPES
422 b119bccb Guido Trotter
  if invalid_hvs:
423 b119bccb Guido Trotter
    raise errors.OpPrereqError("Enabled hypervisors contains invalid"
424 debac808 Iustin Pop
                               " entries: %s" % invalid_hvs,
425 debac808 Iustin Pop
                               errors.ECODE_INVAL)
426 b119bccb Guido Trotter
427 5030cff3 Helga Velroyen
  _InitCheckEnabledDiskTemplates(enabled_disk_templates)
428 c074a9e8 Helga Velroyen
429 5a8648eb Andrea Spadaccini
  try:
430 5a8648eb Andrea Spadaccini
    ipcls = netutils.IPAddress.GetClassFromIpVersion(primary_ip_version)
431 5a8648eb Andrea Spadaccini
  except errors.ProgrammerError:
432 2f20d07b Manuel Franceschini
    raise errors.OpPrereqError("Invalid primary ip version: %d." %
433 2cfbc784 Iustin Pop
                               primary_ip_version, errors.ECODE_INVAL)
434 2f20d07b Manuel Franceschini
435 2f20d07b Manuel Franceschini
  hostname = netutils.GetHostname(family=ipcls.family)
436 2f20d07b Manuel Franceschini
  if not ipcls.IsValid(hostname.ip):
437 2f20d07b Manuel Franceschini
    raise errors.OpPrereqError("This host's IP (%s) is not a valid IPv%d"
438 2cfbc784 Iustin Pop
                               " address." % (hostname.ip, primary_ip_version),
439 2cfbc784 Iustin Pop
                               errors.ECODE_INVAL)
440 2f20d07b Manuel Franceschini
441 2f20d07b Manuel Franceschini
  if ipcls.IsLoopback(hostname.ip):
442 8b312c1d Manuel Franceschini
    raise errors.OpPrereqError("This host's IP (%s) resolves to a loopback"
443 8b312c1d Manuel Franceschini
                               " address. Please fix DNS or %s." %
444 ee045466 Michael Hanselmann
                               (hostname.ip, pathutils.ETC_HOSTS),
445 debac808 Iustin Pop
                               errors.ECODE_ENVIRON)
446 a0c9f010 Michael Hanselmann
447 2f20d07b Manuel Franceschini
  if not ipcls.Own(hostname.ip):
448 a0c9f010 Michael Hanselmann
    raise errors.OpPrereqError("Inconsistency: this host's name resolves"
449 a0c9f010 Michael Hanselmann
                               " to %s,\nbut this ip address does not"
450 7c4c22f5 Manuel Franceschini
                               " belong to this host" %
451 debac808 Iustin Pop
                               hostname.ip, errors.ECODE_ENVIRON)
452 a0c9f010 Michael Hanselmann
453 2f20d07b Manuel Franceschini
  clustername = netutils.GetHostname(name=cluster_name, family=ipcls.family)
454 a0c9f010 Michael Hanselmann
455 2f20d07b Manuel Franceschini
  if netutils.TcpPing(clustername.ip, constants.DEFAULT_NODED_PORT, timeout=5):
456 7c4c22f5 Manuel Franceschini
    raise errors.OpPrereqError("Cluster IP already active",
457 debac808 Iustin Pop
                               errors.ECODE_NOTUNIQUE)
458 a0c9f010 Michael Hanselmann
459 2f20d07b Manuel Franceschini
  if not secondary_ip:
460 2f20d07b Manuel Franceschini
    if primary_ip_version == constants.IP6_VERSION:
461 2f20d07b Manuel Franceschini
      raise errors.OpPrereqError("When using a IPv6 primary address, a valid"
462 7c4c22f5 Manuel Franceschini
                                 " IPv4 address must be given as secondary",
463 7c4c22f5 Manuel Franceschini
                                 errors.ECODE_INVAL)
464 b9eeeb02 Michael Hanselmann
    secondary_ip = hostname.ip
465 a0c9f010 Michael Hanselmann
466 2f20d07b Manuel Franceschini
  if not netutils.IP4Address.IsValid(secondary_ip):
467 2f20d07b Manuel Franceschini
    raise errors.OpPrereqError("Secondary IP address (%s) has to be a valid"
468 2f20d07b Manuel Franceschini
                               " IPv4 address." % secondary_ip,
469 2f20d07b Manuel Franceschini
                               errors.ECODE_INVAL)
470 2f20d07b Manuel Franceschini
471 2f20d07b Manuel Franceschini
  if not netutils.IP4Address.Own(secondary_ip):
472 2f20d07b Manuel Franceschini
    raise errors.OpPrereqError("You gave %s as secondary IP,"
473 2f20d07b Manuel Franceschini
                               " but it does not belong to this host." %
474 2f20d07b Manuel Franceschini
                               secondary_ip, errors.ECODE_ENVIRON)
475 2f20d07b Manuel Franceschini
476 5a8648eb Andrea Spadaccini
  if master_netmask is not None:
477 5a8648eb Andrea Spadaccini
    if not ipcls.ValidateNetmask(master_netmask):
478 5a8648eb Andrea Spadaccini
      raise errors.OpPrereqError("CIDR netmask (%s) not valid for IPv%s " %
479 2cfbc784 Iustin Pop
                                  (master_netmask, primary_ip_version),
480 2cfbc784 Iustin Pop
                                 errors.ECODE_INVAL)
481 5a8648eb Andrea Spadaccini
  else:
482 5a8648eb Andrea Spadaccini
    master_netmask = ipcls.iplen
483 5a8648eb Andrea Spadaccini
484 912737ba Helga Velroyen
  if vg_name:
485 a0c9f010 Michael Hanselmann
    # Check if volume group is valid
486 a0c9f010 Michael Hanselmann
    vgstatus = utils.CheckVolumeGroupSize(utils.ListVolumeGroups(), vg_name,
487 a0c9f010 Michael Hanselmann
                                          constants.MIN_VG_SIZE)
488 a0c9f010 Michael Hanselmann
    if vgstatus:
489 912737ba Helga Velroyen
      raise errors.OpPrereqError("Error: %s" % vgstatus, errors.ECODE_INVAL)
490 a0c9f010 Michael Hanselmann
491 a721e23a Luca Bigliardi
  if drbd_helper is not None:
492 a721e23a Luca Bigliardi
    try:
493 47e0abee Thomas Thrainer
      curr_helper = drbd.DRBD8.GetUsermodeHelper()
494 a721e23a Luca Bigliardi
    except errors.BlockDeviceError, err:
495 a721e23a Luca Bigliardi
      raise errors.OpPrereqError("Error while checking drbd helper"
496 a721e23a Luca Bigliardi
                                 " (specify --no-drbd-storage if you are not"
497 a721e23a Luca Bigliardi
                                 " using drbd): %s" % str(err),
498 a721e23a Luca Bigliardi
                                 errors.ECODE_ENVIRON)
499 a721e23a Luca Bigliardi
    if drbd_helper != curr_helper:
500 a721e23a Luca Bigliardi
      raise errors.OpPrereqError("Error: requiring %s as drbd helper but %s"
501 a721e23a Luca Bigliardi
                                 " is the current helper" % (drbd_helper,
502 a721e23a Luca Bigliardi
                                                             curr_helper),
503 a721e23a Luca Bigliardi
                                 errors.ECODE_INVAL)
504 a721e23a Luca Bigliardi
505 32ba31be Michael Hanselmann
  logging.debug("Stopping daemons (if any are running)")
506 32ba31be Michael Hanselmann
  result = utils.RunCmd([pathutils.DAEMON_UTIL, "stop-all"])
507 32ba31be Michael Hanselmann
  if result.failed:
508 32ba31be Michael Hanselmann
    raise errors.OpExecError("Could not stop daemons, command %s"
509 32ba31be Michael Hanselmann
                             " had exitcode %s and error '%s'" %
510 32ba31be Michael Hanselmann
                             (result.cmd, result.exit_code, result.output))
511 32ba31be Michael Hanselmann
512 5030cff3 Helga Velroyen
  file_storage_dir = _PrepareFileStorage(enabled_disk_templates,
513 5030cff3 Helga Velroyen
                                         file_storage_dir)
514 0376655e Guido Trotter
515 0376655e Guido Trotter
  if constants.ENABLE_SHARED_FILE_STORAGE:
516 5030cff3 Helga Velroyen
    shared_file_storage_dir = _InitFileStorageDir(shared_file_storage_dir)
517 0376655e Guido Trotter
  else:
518 0376655e Guido Trotter
    shared_file_storage_dir = ""
519 a0c9f010 Michael Hanselmann
520 a0c9f010 Michael Hanselmann
  if not re.match("^[0-9a-z]{2}:[0-9a-z]{2}:[0-9a-z]{2}$", mac_prefix):
521 debac808 Iustin Pop
    raise errors.OpPrereqError("Invalid mac prefix given '%s'" % mac_prefix,
522 debac808 Iustin Pop
                               errors.ECODE_INVAL)
523 a0c9f010 Michael Hanselmann
524 a0c9f010 Michael Hanselmann
  result = utils.RunCmd(["ip", "link", "show", "dev", master_netdev])
525 a0c9f010 Michael Hanselmann
  if result.failed:
526 a0c9f010 Michael Hanselmann
    raise errors.OpPrereqError("Invalid master netdev given (%s): '%s'" %
527 a0c9f010 Michael Hanselmann
                               (master_netdev,
528 debac808 Iustin Pop
                                result.output.strip()), errors.ECODE_INVAL)
529 a0c9f010 Michael Hanselmann
530 7ede9c6a Michael Hanselmann
  dirs = [(pathutils.RUN_DIR, constants.RUN_DIRS_MODE)]
531 9dae41ad Guido Trotter
  utils.EnsureDirs(dirs)
532 9dae41ad Guido Trotter
533 b2e233a5 Guido Trotter
  objects.UpgradeBeParams(beparams)
534 a5728081 Guido Trotter
  utils.ForceDictType(beparams, constants.BES_PARAMETER_TYPES)
535 b6a30b0d Guido Trotter
  utils.ForceDictType(nicparams, constants.NICS_PARAMETER_TYPES)
536 18bb6d28 Agata Murawska
537 b6a30b0d Guido Trotter
  objects.NIC.CheckParameterSyntax(nicparams)
538 57dc299a Iustin Pop
539 2cc673a3 Iustin Pop
  full_ipolicy = objects.FillIPolicy(constants.IPOLICY_DEFAULTS, ipolicy)
540 b6a30b0d Guido Trotter
541 6204ee71 Renรฉ Nussbaumer
  if ndparams is not None:
542 6204ee71 Renรฉ Nussbaumer
    utils.ForceDictType(ndparams, constants.NDS_PARAMETER_TYPES)
543 6204ee71 Renรฉ Nussbaumer
  else:
544 6204ee71 Renรฉ Nussbaumer
    ndparams = dict(constants.NDC_DEFAULTS)
545 6204ee71 Renรฉ Nussbaumer
546 c4929a8b Renรฉ Nussbaumer
  # This is ugly, as we modify the dict itself
547 57dc299a Iustin Pop
  # FIXME: Make utils.ForceDictType pure functional or write a wrapper
548 57dc299a Iustin Pop
  # around it
549 c4929a8b Renรฉ Nussbaumer
  if hv_state:
550 c4929a8b Renรฉ Nussbaumer
    for hvname, hvs_data in hv_state.items():
551 c4929a8b Renรฉ Nussbaumer
      utils.ForceDictType(hvs_data, constants.HVSTS_PARAMETER_TYPES)
552 c4929a8b Renรฉ Nussbaumer
      hv_state[hvname] = objects.Cluster.SimpleFillHvState(hvs_data)
553 c4929a8b Renรฉ Nussbaumer
  else:
554 c4929a8b Renรฉ Nussbaumer
    hv_state = dict((hvname, constants.HVST_DEFAULTS)
555 c4929a8b Renรฉ Nussbaumer
                    for hvname in enabled_hypervisors)
556 c4929a8b Renรฉ Nussbaumer
557 c4929a8b Renรฉ Nussbaumer
  # FIXME: disk_state has no default values yet
558 c4929a8b Renรฉ Nussbaumer
  if disk_state:
559 c4929a8b Renรฉ Nussbaumer
    for storage, ds_data in disk_state.items():
560 c4929a8b Renรฉ Nussbaumer
      if storage not in constants.DS_VALID_TYPES:
561 c4929a8b Renรฉ Nussbaumer
        raise errors.OpPrereqError("Invalid storage type in disk state: %s" %
562 c4929a8b Renรฉ Nussbaumer
                                   storage, errors.ECODE_INVAL)
563 c4929a8b Renรฉ Nussbaumer
      for ds_name, state in ds_data.items():
564 c4929a8b Renรฉ Nussbaumer
        utils.ForceDictType(state, constants.DSS_PARAMETER_TYPES)
565 c4929a8b Renรฉ Nussbaumer
        ds_data[ds_name] = objects.Cluster.SimpleFillDiskState(state)
566 c4929a8b Renรฉ Nussbaumer
567 a5728081 Guido Trotter
  # hvparams is a mapping of hypervisor->hvparams dict
568 a5728081 Guido Trotter
  for hv_name, hv_params in hvparams.iteritems():
569 a5728081 Guido Trotter
    utils.ForceDictType(hv_params, constants.HVS_PARAMETER_TYPES)
570 a5728081 Guido Trotter
    hv_class = hypervisor.GetHypervisor(hv_name)
571 a5728081 Guido Trotter
    hv_class.CheckParameterSyntax(hv_params)
572 d4b72030 Guido Trotter
573 bc5d0215 Andrea Spadaccini
  # diskparams is a mapping of disk-template->diskparams dict
574 bc5d0215 Andrea Spadaccini
  for template, dt_params in diskparams.items():
575 bc5d0215 Andrea Spadaccini
    param_keys = set(dt_params.keys())
576 bc5d0215 Andrea Spadaccini
    default_param_keys = set(constants.DISK_DT_DEFAULTS[template].keys())
577 bc5d0215 Andrea Spadaccini
    if not (param_keys <= default_param_keys):
578 bc5d0215 Andrea Spadaccini
      unknown_params = param_keys - default_param_keys
579 bc5d0215 Andrea Spadaccini
      raise errors.OpPrereqError("Invalid parameters for disk template %s:"
580 bc5d0215 Andrea Spadaccini
                                 " %s" % (template,
581 2cfbc784 Iustin Pop
                                          utils.CommaJoin(unknown_params)),
582 2cfbc784 Iustin Pop
                                 errors.ECODE_INVAL)
583 bc5d0215 Andrea Spadaccini
    utils.ForceDictType(dt_params, constants.DISK_DT_TYPES)
584 35c48839 Michele Tartara
    if template == constants.DT_DRBD8 and vg_name is not None:
585 35c48839 Michele Tartara
      # The default METAVG value is equal to the VG name set at init time,
586 35c48839 Michele Tartara
      # if provided
587 35c48839 Michele Tartara
      dt_params[constants.DRBD_DEFAULT_METAVG] = vg_name
588 35c48839 Michele Tartara
589 e4a4391d Renรฉ Nussbaumer
  try:
590 e4a4391d Renรฉ Nussbaumer
    utils.VerifyDictOptions(diskparams, constants.DISK_DT_DEFAULTS)
591 e4a4391d Renรฉ Nussbaumer
  except errors.OpPrereqError, err:
592 e4a4391d Renรฉ Nussbaumer
    raise errors.OpPrereqError("While verify diskparam options: %s" % err,
593 e4a4391d Renรฉ Nussbaumer
                               errors.ECODE_INVAL)
594 bc5d0215 Andrea Spadaccini
595 a0c9f010 Michael Hanselmann
  # set up ssh config and /etc/hosts
596 7ede9c6a Michael Hanselmann
  sshline = utils.ReadFile(pathutils.SSH_HOST_RSA_PUB)
597 a0c9f010 Michael Hanselmann
  sshkey = sshline.split(" ")[1]
598 a0c9f010 Michael Hanselmann
599 b86a6bcd Guido Trotter
  if modify_etc_hosts:
600 ea8ac9c9 Renรฉ Nussbaumer
    utils.AddHostToEtcHosts(hostname.name, hostname.ip)
601 b86a6bcd Guido Trotter
602 b989b9d9 Ken Wehr
  if modify_ssh_setup:
603 b989b9d9 Ken Wehr
    _InitSSHSetup()
604 a0c9f010 Michael Hanselmann
605 bf4af505 Apollon Oikonomopoulos
  if default_iallocator is not None:
606 bf4af505 Apollon Oikonomopoulos
    alloc_script = utils.FindFile(default_iallocator,
607 bf4af505 Apollon Oikonomopoulos
                                  constants.IALLOCATOR_SEARCH_PATH,
608 bf4af505 Apollon Oikonomopoulos
                                  os.path.isfile)
609 bf4af505 Apollon Oikonomopoulos
    if alloc_script is None:
610 bf4af505 Apollon Oikonomopoulos
      raise errors.OpPrereqError("Invalid default iallocator script '%s'"
611 bf4af505 Apollon Oikonomopoulos
                                 " specified" % default_iallocator,
612 bf4af505 Apollon Oikonomopoulos
                                 errors.ECODE_INVAL)
613 d1e9c98d Iustin Pop
  elif constants.HTOOLS:
614 d1e9c98d Iustin Pop
    # htools was enabled at build-time, we default to it
615 d1e9c98d Iustin Pop
    if utils.FindFile(constants.IALLOC_HAIL,
616 d1e9c98d Iustin Pop
                      constants.IALLOCATOR_SEARCH_PATH,
617 d1e9c98d Iustin Pop
                      os.path.isfile):
618 d1e9c98d Iustin Pop
      default_iallocator = constants.IALLOC_HAIL
619 bf4af505 Apollon Oikonomopoulos
620 430b923c Iustin Pop
  now = time.time()
621 430b923c Iustin Pop
622 a0c9f010 Michael Hanselmann
  # init of cluster config file
623 b9eeeb02 Michael Hanselmann
  cluster_config = objects.Cluster(
624 b9eeeb02 Michael Hanselmann
    serial_no=1,
625 b9eeeb02 Michael Hanselmann
    rsahostkeypub=sshkey,
626 b9eeeb02 Michael Hanselmann
    highest_used_port=(constants.FIRST_DRBD_PORT - 1),
627 b9eeeb02 Michael Hanselmann
    mac_prefix=mac_prefix,
628 b9eeeb02 Michael Hanselmann
    volume_group_name=vg_name,
629 b9eeeb02 Michael Hanselmann
    tcpudp_port_pool=set(),
630 f6bd6e98 Michael Hanselmann
    master_ip=clustername.ip,
631 5a8648eb Andrea Spadaccini
    master_netmask=master_netmask,
632 f6bd6e98 Michael Hanselmann
    master_netdev=master_netdev,
633 f6bd6e98 Michael Hanselmann
    cluster_name=clustername.name,
634 f6bd6e98 Michael Hanselmann
    file_storage_dir=file_storage_dir,
635 4b97f902 Apollon Oikonomopoulos
    shared_file_storage_dir=shared_file_storage_dir,
636 ea3a925f Alexander Schreiber
    enabled_hypervisors=enabled_hypervisors,
637 4ef7f423 Guido Trotter
    beparams={constants.PP_DEFAULT: beparams},
638 b6a30b0d Guido Trotter
    nicparams={constants.PP_DEFAULT: nicparams},
639 6204ee71 Renรฉ Nussbaumer
    ndparams=ndparams,
640 ea3a925f Alexander Schreiber
    hvparams=hvparams,
641 bc5d0215 Andrea Spadaccini
    diskparams=diskparams,
642 ce735215 Guido Trotter
    candidate_pool_size=candidate_pool_size,
643 022c3a0b Guido Trotter
    modify_etc_hosts=modify_etc_hosts,
644 b989b9d9 Ken Wehr
    modify_ssh_setup=modify_ssh_setup,
645 39b0f0c2 Balazs Lecz
    uid_pool=uid_pool,
646 430b923c Iustin Pop
    ctime=now,
647 430b923c Iustin Pop
    mtime=now,
648 3953242f Iustin Pop
    maintain_node_health=maintain_node_health,
649 a721e23a Luca Bigliardi
    drbd_usermode_helper=drbd_helper,
650 bf4af505 Apollon Oikonomopoulos
    default_iallocator=default_iallocator,
651 2f20d07b Manuel Franceschini
    primary_ip_family=ipcls.family,
652 3d914585 Renรฉ Nussbaumer
    prealloc_wipe_disks=prealloc_wipe_disks,
653 bf689b7a Andrea Spadaccini
    use_external_mip_script=use_external_mip_script,
654 57dc299a Iustin Pop
    ipolicy=full_ipolicy,
655 c4929a8b Renรฉ Nussbaumer
    hv_state_static=hv_state,
656 c4929a8b Renรฉ Nussbaumer
    disk_state_static=disk_state,
657 3bde79ee Helga Velroyen
    enabled_disk_templates=enabled_disk_templates,
658 b9eeeb02 Michael Hanselmann
    )
659 b9eeeb02 Michael Hanselmann
  master_node_config = objects.Node(name=hostname.name,
660 b9eeeb02 Michael Hanselmann
                                    primary_ip=hostname.ip,
661 b9222f32 Guido Trotter
                                    secondary_ip=secondary_ip,
662 c044f32c Guido Trotter
                                    serial_no=1,
663 c044f32c Guido Trotter
                                    master_candidate=True,
664 af64c0ea Iustin Pop
                                    offline=False, drained=False,
665 435e4bd6 Michael Hanselmann
                                    ctime=now, mtime=now,
666 c044f32c Guido Trotter
                                    )
667 9e1333b9 Guido Trotter
  InitConfig(constants.CONFIG_VERSION, cluster_config, master_node_config)
668 d367b66c Manuel Franceschini
  cfg = config.ConfigWriter(offline=True)
669 7ede9c6a Michael Hanselmann
  ssh.WriteKnownHostsFile(cfg, pathutils.SSH_KNOWN_HOSTS_FILE)
670 a4eae71f Michael Hanselmann
  cfg.Update(cfg.GetClusterInfo(), logging.error)
671 ee501db1 Michael Hanselmann
  ssconf.WriteSsconfFiles(cfg.GetSsconfValues())
672 d367b66c Manuel Franceschini
673 d367b66c Manuel Franceschini
  # set up the inter-node password and certificate
674 d367b66c Manuel Franceschini
  _InitGanetiServerSetup(hostname.name)
675 827f753e Guido Trotter
676 952d7515 Michael Hanselmann
  logging.debug("Starting daemons")
677 7ede9c6a Michael Hanselmann
  result = utils.RunCmd([pathutils.DAEMON_UTIL, "start-all"])
678 952d7515 Michael Hanselmann
  if result.failed:
679 952d7515 Michael Hanselmann
    raise errors.OpExecError("Could not start daemons, command %s"
680 952d7515 Michael Hanselmann
                             " had exitcode %s and error %s" %
681 952d7515 Michael Hanselmann
                             (result.cmd, result.exit_code, result.output))
682 b3f1cf6f Iustin Pop
683 3b6b6129 Michael Hanselmann
  _WaitForMasterDaemon()
684 b3f1cf6f Iustin Pop
685 b1b6ea87 Iustin Pop
686 02f99608 Oleksiy Mishchenko
def InitConfig(version, cluster_config, master_node_config,
687 7ede9c6a Michael Hanselmann
               cfg_file=pathutils.CLUSTER_CONF_FILE):
688 7b3a8fb5 Iustin Pop
  """Create the initial cluster configuration.
689 7b3a8fb5 Iustin Pop

690 7b3a8fb5 Iustin Pop
  It will contain the current node, which will also be the master
691 7b3a8fb5 Iustin Pop
  node, and no instances.
692 7b3a8fb5 Iustin Pop

693 7b3a8fb5 Iustin Pop
  @type version: int
694 c41eea6e Iustin Pop
  @param version: configuration version
695 c41eea6e Iustin Pop
  @type cluster_config: L{objects.Cluster}
696 c41eea6e Iustin Pop
  @param cluster_config: cluster configuration
697 c41eea6e Iustin Pop
  @type master_node_config: L{objects.Node}
698 c41eea6e Iustin Pop
  @param master_node_config: master node configuration
699 c41eea6e Iustin Pop
  @type cfg_file: string
700 c41eea6e Iustin Pop
  @param cfg_file: configuration file path
701 c41eea6e Iustin Pop

702 7b3a8fb5 Iustin Pop
  """
703 88b92fe3 Guido Trotter
  uuid_generator = config.TemporaryReservationManager()
704 88b92fe3 Guido Trotter
  cluster_config.uuid = uuid_generator.Generate([], utils.NewUUID,
705 88b92fe3 Guido Trotter
                                                _INITCONF_ECID)
706 88b92fe3 Guido Trotter
  master_node_config.uuid = uuid_generator.Generate([], utils.NewUUID,
707 88b92fe3 Guido Trotter
                                                    _INITCONF_ECID)
708 1c3231aa Thomas Thrainer
  cluster_config.master_node = master_node_config.uuid
709 7b3a8fb5 Iustin Pop
  nodes = {
710 1c3231aa Thomas Thrainer
    master_node_config.uuid: master_node_config,
711 7b3a8fb5 Iustin Pop
    }
712 88b92fe3 Guido Trotter
  default_nodegroup = objects.NodeGroup(
713 88b92fe3 Guido Trotter
    uuid=uuid_generator.Generate([], utils.NewUUID, _INITCONF_ECID),
714 75cf411a Adeodato Simo
    name=constants.INITIAL_NODE_GROUP_NAME,
715 1c3231aa Thomas Thrainer
    members=[master_node_config.uuid],
716 99ccf8b9 Renรฉ Nussbaumer
    diskparams={},
717 88b92fe3 Guido Trotter
    )
718 88b92fe3 Guido Trotter
  nodegroups = {
719 88b92fe3 Guido Trotter
    default_nodegroup.uuid: default_nodegroup,
720 88b92fe3 Guido Trotter
    }
721 d693c864 Iustin Pop
  now = time.time()
722 7b3a8fb5 Iustin Pop
  config_data = objects.ConfigData(version=version,
723 7b3a8fb5 Iustin Pop
                                   cluster=cluster_config,
724 88b92fe3 Guido Trotter
                                   nodegroups=nodegroups,
725 7b3a8fb5 Iustin Pop
                                   nodes=nodes,
726 7b3a8fb5 Iustin Pop
                                   instances={},
727 eaa4c57c Dimitris Aragiorgis
                                   networks={},
728 d693c864 Iustin Pop
                                   serial_no=1,
729 d693c864 Iustin Pop
                                   ctime=now, mtime=now)
730 a33848a5 Guido Trotter
  utils.WriteFile(cfg_file,
731 a33848a5 Guido Trotter
                  data=serializer.Dump(config_data.ToDict()),
732 a33848a5 Guido Trotter
                  mode=0600)
733 02f99608 Oleksiy Mishchenko
734 02f99608 Oleksiy Mishchenko
735 1c3231aa Thomas Thrainer
def FinalizeClusterDestroy(master_uuid):
  """Run the final steps of destroying a cluster.

  This completes the destroy begun in cmdlib.LUDestroyOpcode: on the
  master node, the master IP is deactivated, the master role is stopped
  and the node is told to leave the cluster. Each step is best-effort;
  a failure is logged as a warning and the next step is still run.

  @param master_uuid: UUID of the master node

  """
  cfg = config.ConfigWriter()
  cleanup_ssh = cfg.GetClusterInfo().modify_ssh_setup
  rpc_runner = rpc.BootstrapRunner()

  master_name = cfg.GetNodeName(master_uuid)

  net_params = cfg.GetMasterNetworkParameters()
  net_params.uuid = master_uuid
  use_ext_script = cfg.GetUseExternalMipScript()

  failure = rpc_runner.call_node_deactivate_master_ip(master_name,
                                                      net_params,
                                                      use_ext_script).fail_msg
  if failure:
    logging.warning("Could not disable the master IP: %s", failure)

  failure = rpc_runner.call_node_stop_master(master_name).fail_msg
  if failure:
    logging.warning("Could not disable the master role: %s", failure)

  failure = rpc_runner.call_node_leave_cluster(master_name,
                                               cleanup_ssh).fail_msg
  if failure:
    logging.warning("Could not shutdown the node daemon and cleanup"
                    " the node: %s", failure)
768 140aa4a8 Iustin Pop
769 140aa4a8 Iustin Pop
770 7b8ba235 Michael Hanselmann
def SetupNodeDaemon(opts, cluster_name, node):
  """Prepare a new node so that it can be added to the cluster.

  This function must be called before the actual opcode. It runs the
  node daemon setup command for the new node, handing over the cluster
  name, the node daemon certificate and the ssconf values and asking for
  the node daemon to be started, and then waits for that daemon, so that
  the master can do the rest via normal rpc calls.

  @param opts: command line options; the C{debug}, C{verbose} and
    C{ssh_key_check} attributes are used
  @param cluster_name: the cluster name
  @param node: the name of the new node

  """
  noded_cert = utils.ReadFile(pathutils.NODED_CERT_FILE)
  ssconf_values = ssconf.SimpleStore().ReadAll()

  setup_data = {
    constants.NDS_CLUSTER_NAME: cluster_name,
    constants.NDS_NODE_DAEMON_CERTIFICATE: noded_cert,
    constants.NDS_SSCONF: ssconf_values,
    constants.NDS_START_NODE_DAEMON: True,
    }

  # NOTE(review): opts.ssh_key_check is deliberately kept for two
  # consecutive positional parameters; confirm their meaning against
  # the signature of RunNodeSetupCmd
  key_check = opts.ssh_key_check
  RunNodeSetupCmd(cluster_name, node, pathutils.NODE_DAEMON_SETUP,
                  opts.debug, opts.verbose,
                  True, key_check, key_check, setup_data)

  _WaitForNodeDaemon(node)
794 5627f375 Michael Hanselmann
795 b1b6ea87 Iustin Pop
796 8e2524c3 Guido Trotter
def MasterFailover(no_voting=False):
797 b1b6ea87 Iustin Pop
  """Failover the master node.
798 b1b6ea87 Iustin Pop

799 b1b6ea87 Iustin Pop
  This checks that we are not already the master, and will cause the
800 b1b6ea87 Iustin Pop
  current master to cease being master, and the non-master to become
801 b1b6ea87 Iustin Pop
  new master.
802 b1b6ea87 Iustin Pop

803 8e2524c3 Guido Trotter
  @type no_voting: boolean
804 8e2524c3 Guido Trotter
  @param no_voting: force the operation without remote nodes agreement
805 8e2524c3 Guido Trotter
                      (dangerous)
806 8e2524c3 Guido Trotter

807 b1b6ea87 Iustin Pop
  """
808 8135a2db Iustin Pop
  sstore = ssconf.SimpleStore()
809 b1b6ea87 Iustin Pop
810 8135a2db Iustin Pop
  old_master, new_master = ssconf.GetMasterAndMyself(sstore)
811 1c3231aa Thomas Thrainer
  node_names = sstore.GetNodeList()
812 8135a2db Iustin Pop
  mc_list = sstore.GetMasterCandidates()
813 b1b6ea87 Iustin Pop
814 b1b6ea87 Iustin Pop
  if old_master == new_master:
815 b1b6ea87 Iustin Pop
    raise errors.OpPrereqError("This commands must be run on the node"
816 b1b6ea87 Iustin Pop
                               " where you want the new master to be."
817 b1b6ea87 Iustin Pop
                               " %s is already the master" %
818 debac808 Iustin Pop
                               old_master, errors.ECODE_INVAL)
819 d5927e48 Iustin Pop
820 8135a2db Iustin Pop
  if new_master not in mc_list:
821 8135a2db Iustin Pop
    mc_no_master = [name for name in mc_list if name != old_master]
822 8135a2db Iustin Pop
    raise errors.OpPrereqError("This node is not among the nodes marked"
823 8135a2db Iustin Pop
                               " as master candidates. Only these nodes"
824 8135a2db Iustin Pop
                               " can become masters. Current list of"
825 8135a2db Iustin Pop
                               " master candidates is:\n"
826 3ccb3a64 Michael Hanselmann
                               "%s" % ("\n".join(mc_no_master)),
827 debac808 Iustin Pop
                               errors.ECODE_STATE)
828 8135a2db Iustin Pop
829 8e2524c3 Guido Trotter
  if not no_voting:
830 1c3231aa Thomas Thrainer
    vote_list = GatherMasterVotes(node_names)
831 8e2524c3 Guido Trotter
832 8e2524c3 Guido Trotter
    if vote_list:
833 8e2524c3 Guido Trotter
      voted_master = vote_list[0][0]
834 8e2524c3 Guido Trotter
      if voted_master is None:
835 8e2524c3 Guido Trotter
        raise errors.OpPrereqError("Cluster is inconsistent, most nodes did"
836 debac808 Iustin Pop
                                   " not respond.", errors.ECODE_ENVIRON)
837 8e2524c3 Guido Trotter
      elif voted_master != old_master:
838 8e2524c3 Guido Trotter
        raise errors.OpPrereqError("I have a wrong configuration, I believe"
839 8e2524c3 Guido Trotter
                                   " the master is %s but the other nodes"
840 8e2524c3 Guido Trotter
                                   " voted %s. Please resync the configuration"
841 8e2524c3 Guido Trotter
                                   " of this node." %
842 debac808 Iustin Pop
                                   (old_master, voted_master),
843 debac808 Iustin Pop
                                   errors.ECODE_STATE)
844 b1b6ea87 Iustin Pop
  # end checks
845 b1b6ea87 Iustin Pop
846 b1b6ea87 Iustin Pop
  rcode = 0
847 b1b6ea87 Iustin Pop
848 d5927e48 Iustin Pop
  logging.info("Setting master to %s, old master: %s", new_master, old_master)
849 b1b6ea87 Iustin Pop
850 21004460 Iustin Pop
  try:
851 21004460 Iustin Pop
    # instantiate a real config writer, as we now know we have the
852 21004460 Iustin Pop
    # configuration data
853 eb180fe2 Iustin Pop
    cfg = config.ConfigWriter(accept_foreign=True)
854 21004460 Iustin Pop
855 1c3231aa Thomas Thrainer
    old_master_node = cfg.GetNodeInfoByName(old_master)
856 1c3231aa Thomas Thrainer
    if old_master_node is None:
857 1c3231aa Thomas Thrainer
      raise errors.OpPrereqError("Could not find old master node '%s' in"
858 1c3231aa Thomas Thrainer
                                 " cluster configuration." % old_master,
859 1c3231aa Thomas Thrainer
                                 errors.ECODE_NOENT)
860 1c3231aa Thomas Thrainer
861 21004460 Iustin Pop
    cluster_info = cfg.GetClusterInfo()
862 1c3231aa Thomas Thrainer
    new_master_node = cfg.GetNodeInfoByName(new_master)
863 1c3231aa Thomas Thrainer
    if new_master_node is None:
864 1c3231aa Thomas Thrainer
      raise errors.OpPrereqError("Could not find new master node '%s' in"
865 1c3231aa Thomas Thrainer
                                 " cluster configuration." % new_master,
866 1c3231aa Thomas Thrainer
                                 errors.ECODE_NOENT)
867 1c3231aa Thomas Thrainer
868 1c3231aa Thomas Thrainer
    cluster_info.master_node = new_master_node.uuid
869 21004460 Iustin Pop
    # this will also regenerate the ssconf files, since we updated the
870 21004460 Iustin Pop
    # cluster info
871 21004460 Iustin Pop
    cfg.Update(cluster_info, logging.error)
872 21004460 Iustin Pop
  except errors.ConfigurationError, err:
873 21004460 Iustin Pop
    logging.error("Error while trying to set the new master: %s",
874 21004460 Iustin Pop
                  str(err))
875 21004460 Iustin Pop
    return 1
876 21004460 Iustin Pop
877 21004460 Iustin Pop
  # if cfg.Update worked, then it means the old master daemon won't be
878 21004460 Iustin Pop
  # able now to write its own config file (we rely on locking in both
879 21004460 Iustin Pop
  # backend.UploadFile() and ConfigWriter._Write(); hence the next
880 21004460 Iustin Pop
  # step is to kill the old master
881 21004460 Iustin Pop
882 21004460 Iustin Pop
  logging.info("Stopping the master daemon on node %s", old_master)
883 21004460 Iustin Pop
884 7c74bbe0 Andrea Spadaccini
  runner = rpc.BootstrapRunner()
885 f9d20654 Andrea Spadaccini
  master_params = cfg.GetMasterNetworkParameters()
886 1c3231aa Thomas Thrainer
  master_params.uuid = old_master_node.uuid
887 57c7bc57 Andrea Spadaccini
  ems = cfg.GetUseExternalMipScript()
888 1c3231aa Thomas Thrainer
  result = runner.call_node_deactivate_master_ip(old_master,
889 57c7bc57 Andrea Spadaccini
                                                 master_params, ems)
890 c79198a0 Andrea Spadaccini
891 7c74bbe0 Andrea Spadaccini
  msg = result.fail_msg
892 7c74bbe0 Andrea Spadaccini
  if msg:
893 7c74bbe0 Andrea Spadaccini
    logging.warning("Could not disable the master IP: %s", msg)
894 7c74bbe0 Andrea Spadaccini
895 7c74bbe0 Andrea Spadaccini
  result = runner.call_node_stop_master(old_master)
896 3cebe102 Michael Hanselmann
  msg = result.fail_msg
897 6c00d19a Iustin Pop
  if msg:
898 d5927e48 Iustin Pop
    logging.error("Could not disable the master role on the old master"
899 5ae4945a Iustin Pop
                  " %s, please disable manually: %s", old_master, msg)
900 b1b6ea87 Iustin Pop
901 21004460 Iustin Pop
  logging.info("Checking master IP non-reachability...")
902 21004460 Iustin Pop
903 425f0f54 Iustin Pop
  master_ip = sstore.GetMasterIP()
904 425f0f54 Iustin Pop
  total_timeout = 30
905 e687ec01 Michael Hanselmann
906 d23ef431 Michael Hanselmann
  # Here we have a phase where no master should be running
907 425f0f54 Iustin Pop
  def _check_ip():
908 a744b676 Manuel Franceschini
    if netutils.TcpPing(master_ip, constants.DEFAULT_NODED_PORT):
909 425f0f54 Iustin Pop
      raise utils.RetryAgain()
910 425f0f54 Iustin Pop
911 425f0f54 Iustin Pop
  try:
912 425f0f54 Iustin Pop
    utils.Retry(_check_ip, (1, 1.5, 5), total_timeout)
913 425f0f54 Iustin Pop
  except utils.RetryTimeout:
914 425f0f54 Iustin Pop
    logging.warning("The master IP is still reachable after %s seconds,"
915 425f0f54 Iustin Pop
                    " continuing but activating the master on the current"
916 425f0f54 Iustin Pop
                    " node will probably fail", total_timeout)
917 b1b6ea87 Iustin Pop
918 ff699aa9 Michael Hanselmann
  if jstore.CheckDrainFlag():
919 ff699aa9 Michael Hanselmann
    logging.info("Undraining job queue")
920 ff699aa9 Michael Hanselmann
    jstore.SetDrainFlag(False)
921 ff699aa9 Michael Hanselmann
922 21004460 Iustin Pop
  logging.info("Starting the master daemons on the new master")
923 d5927e48 Iustin Pop
924 db04ce5d Michael Hanselmann
  result = rpc.BootstrapRunner().call_node_start_master_daemons(new_master,
925 db04ce5d Michael Hanselmann
                                                                no_voting)
926 3cebe102 Michael Hanselmann
  msg = result.fail_msg
927 b726aff0 Iustin Pop
  if msg:
928 d5927e48 Iustin Pop
    logging.error("Could not start the master role on the new master"
929 b726aff0 Iustin Pop
                  " %s, please check: %s", new_master, msg)
930 b1b6ea87 Iustin Pop
    rcode = 1
931 b1b6ea87 Iustin Pop
932 21004460 Iustin Pop
  logging.info("Master failed over from %s to %s", old_master, new_master)
933 b1b6ea87 Iustin Pop
  return rcode
934 d7cdb55d Iustin Pop
935 d7cdb55d Iustin Pop
936 8eb148ae Iustin Pop
def GetMaster():
  """Returns the current master node.

  This is a separate function in bootstrap since it's needed by
  gnt-cluster, and instead of importing directly ssconf, it's better
  to abstract it in bootstrap, where we do use ssconf in other
  functions too.

  @return: the first element of the pair returned by
      L{ssconf.GetMasterAndMyself}, i.e. the master node

  """
  # only the master is of interest here, the second element is ignored
  master_name, _ = ssconf.GetMasterAndMyself(ssconf.SimpleStore())

  return master_name
950 8eb148ae Iustin Pop
951 8eb148ae Iustin Pop
952 1c3231aa Thomas Thrainer
def GatherMasterVotes(node_names):
  """Check the agreement on who is the master.

  This function will return a list of (node, number of votes), ordered
  by the number of votes. Errors will be denoted by the key 'None'.

  Note that the sum of votes is the number of nodes this machine
  knows, whereas the number of entries in the list could be different
  (if some nodes vote for another master).

  We remove ourselves from the list since we know that (bugs aside)
  since we use the same source for configuration information for both
  backend and bootstrap, we'll always vote for ourselves.

  @type node_names: list
  @param node_names: the list of nodes to query for master info; the current
      node will be removed if it is in the list (the list is modified in
      place)
  @rtype: list
  @return: list of (node, votes), highest number of votes first; on equal
      number of votes the error entry (C{None}) is sorted last; an empty
      list if there is no node left to query

  """
  myself = netutils.Hostname.GetSysName()
  try:
    node_names.remove(myself)
  except ValueError:
    pass
  if not node_names:
    # no nodes left (eventually after removing myself)
    return []
  results = rpc.BootstrapRunner().call_master_info(node_names)
  if not isinstance(results, dict):
    # this should not happen (unless internal error in rpc)
    logging.critical("Can't complete rpc call, aborting master startup")
    return [(None, len(node_names))]

  votes = {}
  for node_name in results:
    nres = results[node_name]
    data = nres.payload
    msg = nres.fail_msg
    if msg:
      logging.warning("Error contacting node %s: %s", node_name, msg)
      voted_for = None
    # for now we accept both length 3, 4 and 5 (data[3] is primary ip version
    # and data[4] is the master netmask)
    elif not isinstance(data, (tuple, list)) or len(data) < 3:
      logging.warning("Invalid data received from node %s: %s",
                      node_name, data)
      voted_for = None
    else:
      voted_for = data[2]
    # failures of any kind are accumulated under the None key
    votes[voted_for] = votes.get(voted_for, 0) + 1

  vote_list = list(votes.items())
  # sort first on number of votes then on name, since we want None
  # sorted later if we have the half of the nodes not responding, and
  # half voting all for the same master; the "is not None" element makes
  # this ordering explicit instead of relying on None implicitly comparing
  # lower than any name (which is not supported by all Python versions)
  vote_list.sort(key=lambda item: (item[1], item[0] is not None, item[0]),
                 reverse=True)

  return vote_list