Statistics
| Branch: | Tag: | Revision:

root / snf-cyclades-app / synnefo / logic / callbacks.py @ 368d879e

History | View | Annotate | Download (11.6 kB)

1
# Copyright 2011 GRNET S.A. All rights reserved.
2
#
3
# Redistribution and use in source and binary forms, with or without
4
# modification, are permitted provided that the following conditions
5
# are met:
6
#
7
#   1. Redistributions of source code must retain the above copyright
8
#      notice, this list of conditions and the following disclaimer.
9
#
10
#  2. Redistributions in binary form must reproduce the above copyright
11
#     notice, this list of conditions and the following disclaimer in the
12
#     documentation and/or other materials provided with the distribution.
13
#
14
# THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
15
# ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
16
# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
17
# ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
18
# FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
19
# DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
20
# OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
21
# HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
22
# LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
23
# OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
24
# SUCH DAMAGE.
25
#
26
# The views and conclusions contained in the software and documentation are
27
# those of the authors and should not be interpreted as representing official
28
# policies, either expressed or implied, of GRNET S.A.
29

    
30
# Callback functions used by the dispatcher to process incoming notifications
31
# from AMQP queues.
32

    
33
import logging
34
import json
35
from functools import wraps
36

    
37
from django.db import transaction
38
from synnefo.db.models import (Backend, VirtualMachine, Network,
39
                               BackendNetwork, pooled_rapi_client)
40
from synnefo.logic import utils, backend as backend_mod
41

    
42
from synnefo.lib.utils import merge_time
43

    
44
log = logging.getLogger(__name__)
45

    
46

    
47
def handle_message_delivery(func):
    """Wrap a message handler with JSON decoding and delivery bookkeeping.

    The returned callable takes ``(client, message, *args, **kwargs)``,
    decodes ``message['body']`` as JSON and passes the decoded payload to
    ``func``. Depending on the outcome the message is:

    - acknowledged (``client.basic_ack``) when ``func`` returns normally,
    - negatively acknowledged (``client.basic_nack``) when a ``ValueError``
      or a ``KeyError`` is raised while decoding or handling it,
    - rejected (``client.basic_reject``) on any other exception.

    Extra positional and keyword arguments are accepted but not forwarded
    to ``func``.

    """
    @wraps(func)
    def wrapper(client, message, *args, **kwargs):
        # Stays None until the body has been decoded, so the catch-all
        # handler can tell whether there is a payload to include in the log.
        payload = None
        try:
            payload = json.loads(message['body'])
            func(payload)
            client.basic_ack(message)
        except ValueError as err:
            log.error("Incoming message not in JSON format %s: %s",
                      err, message)
            client.basic_nack(message)
        except KeyError as err:
            log.error("Malformed incoming JSON, missing attribute %s: %s",
                      err, message)
            client.basic_nack(message)
        except Exception as err:
            if not payload:
                log.exception("Unexpected error: %s", err)
            else:
                log.exception("Unexpected error: %s, msg: %s", err, payload)
            client.basic_reject(message)

    return wrapper
76

    
77

    
78
def instance_from_msg(func):
    """Decorator that resolves the VirtualMachine a message refers to.

    The name in ``msg["instance"]`` is translated to a database id, the
    matching VirtualMachine row is fetched through ``select_for_update()``
    and ``func(vm, msg)`` is invoked. VirtualMachine and Network lookup
    errors raised along the way (including from ``func``) are logged and
    swallowed. The resulting callable is itself wrapped with
    ``handle_message_delivery``.

    """
    @handle_message_delivery
    @wraps(func)
    def wrapper(msg):
        try:
            instance_id = utils.id_from_instance_name(msg["instance"])
            locked_vms = VirtualMachine.objects.select_for_update()
            instance = locked_vms.get(id=instance_id)
            func(instance, msg)
        except VirtualMachine.InvalidBackendIdError:
            log.debug("Ignoring msg for unknown instance %s.", msg['instance'])
        except VirtualMachine.DoesNotExist:
            # instance_id is always bound here: the id translation above
            # must have succeeded for the DB lookup to have run.
            log.error("VM for instance %s with id %d not found in DB.",
                      msg['instance'], instance_id)
        except (Network.InvalidBackendIdError, Network.DoesNotExist):
            log.error("Invalid message, can not find network. msg: %s", msg)
    return wrapper
97

    
98

    
99
def network_from_msg(func):
    """Decorator that resolves the BackendNetwork a message refers to.

    The Network is looked up from ``msg["network"]`` (fetched through
    ``select_for_update()``) and the Backend from ``msg["cluster"]``. The
    BackendNetwork joining the two is fetched, or created when missing, and
    ``func(backend_network, msg)`` is invoked. Lookup errors raised along
    the way (including from ``func``) are logged and swallowed. The
    resulting callable is itself wrapped with ``handle_message_delivery``.

    """
    @handle_message_delivery
    @wraps(func)
    def wrapper(msg):
        try:
            net_id = utils.id_from_network_name(msg["network"])
            locked_networks = Network.objects.select_for_update()
            net = locked_networks.get(id=net_id)
            cluster = Backend.objects.get(clustername=msg['cluster'])
            backend_net, created = BackendNetwork.objects.get_or_create(
                network=net, backend=cluster)
            if created:
                log.info("Created missing BackendNetwork %s", backend_net)
            func(backend_net, msg)
        except Network.InvalidBackendIdError:
            log.debug("Ignoring msg for unknown network %s.", msg['network'])
        except Network.DoesNotExist:
            log.error("Network %s not found in DB.", msg['network'])
        except Backend.DoesNotExist:
            log.error("Backend %s not found in DB.", msg['cluster'])
        except BackendNetwork.DoesNotExist:
            log.error("Network %s on backend %s not found in DB.",
                      msg['network'], msg['cluster'])
    return wrapper
125

    
126

    
127
def if_update_required(func):
    """
    Decorator for checking if an incoming message needs to update the db.

    The wrapped callable is invoked as ``func(target, msg, event_time)``,
    where ``event_time`` is the result of ``merge_time(msg['event_time'])``
    and ``target`` is any object exposing a ``backendtime`` attribute.

    The database will not be updated in the following cases:
    - The message has been redelivered and the action has already been
      completed. In this case the event_time will be equal to the one
      in the database.
    - The message describes an earlier state in ganeti than the one that
      is described in the db. In this case the event_time will be smaller
      than the one in the database.

    Raises KeyError('event_time') when the event time is missing from the
    message or cannot be converted.

    """
    @wraps(func)
    def wrapper(target, msg):
        try:
            event_time = merge_time(msg['event_time'])
        except Exception:
            # Catch Exception rather than everything, so that
            # KeyboardInterrupt/SystemExit are not turned into a KeyError.
            # Read the raw value defensively: indexing msg again here would
            # raise from inside the handler and lose the log entry.
            if isinstance(msg, dict):
                raw_time = msg.get('event_time')
            else:
                raw_time = None
            log.error("Received message with malformed time: %s", raw_time)
            # Name the offending attribute so whoever logs the KeyError
            # can report which attribute was bad.
            raise KeyError('event_time')

        db_time = target.backendtime

        if db_time and event_time <= db_time:
            format_ = "%d/%m/%y %H:%M:%S:%f"
            log.debug("Ignoring message %s.\nevent_timestamp: %s"
                      " db_timestamp: %s",
                      msg,
                      event_time.strftime(format_),
                      db_time.strftime(format_))
            return
        # New message. Update the database!
        func(target, msg, event_time)

    return wrapper
163

    
164

    
165
@instance_from_msg
@if_update_required
def update_db(vm, msg, event_time):
    """Process a notification of type 'ganeti-op-status'.

    Messages of any other type are logged and ignored. A failed
    OP_INSTANCE_CREATE job that was submitted with opportunistic locking is
    resubmitted with opportunistic locking turned off, and the VM is
    pointed at the new job. Every other message is handed to
    ``backend_mod.process_op_status``.

    Raises KeyError when a required message attribute ('type', 'operation',
    'status', 'jobId', 'logmsg', or the instance name of a job that has to
    be retried) is missing.

    """
    log.debug("Processing ganeti-op-status msg: %s", msg)

    if msg['type'] != "ganeti-op-status":
        log.error("Message is of unknown type %s.", msg['type'])
        return

    operation = msg["operation"]
    status = msg["status"]
    jobID = msg["jobId"]
    logmsg = msg["logmsg"]
    nics = msg.get("instance_nics", None)
    job_fields = msg.get("job_fields", {})

    # Special case: OP_INSTANCE_CREATE with opportunistic locking may fail
    # if all Ganeti nodes are already locked. Retry the job without
    # opportunistic locking.
    if (operation == "OP_INSTANCE_CREATE" and status == "error" and
            job_fields.get("opportunistic_locking", False)):
        if vm.backendjobid != jobID:  # The job has already been retried!
            return
        # Remove extra fields that must not be passed on to CreateInstance.
        # They are optional, so their absence must not abort the retry.
        for field in ("OP_ID", "reason"):
            job_fields.pop(field, None)
        # Strip both spellings of the instance name from the job fields,
        # preferring "name". The two pops are done separately so that a
        # missing "instance_name" does not fail when "name" is present.
        fallback_name = job_fields.pop("instance_name", None)
        name = job_fields.pop("name", fallback_name)
        if name is None:
            # No usable name under either key: report a missing attribute.
            raise KeyError("instance_name")
        # Turn off opportunistic locking before retrying the job
        job_fields["opportunistic_locking"] = False
        with pooled_rapi_client(vm) as c:
            jobID = c.CreateInstance(name=name, **job_fields)
        # Update the VM fields
        vm.backendjobid = jobID
        # Update the task_job_id for commissions
        vm.task_job_id = jobID
        vm.backendjobstatus = None
        vm.save()
        log.info("Retrying failed creation of instance '%s' without"
                 " opportunistic locking. New job ID: '%s'", name, jobID)
        return

    backend_mod.process_op_status(vm, event_time, jobID,
                                  operation, status,
                                  logmsg, nics=nics,
                                  job_fields=job_fields)

    log.debug("Done processing ganeti-op-status msg for vm %s.",
              msg['instance'])
213

    
214

    
215
@network_from_msg
@if_update_required
def update_network(network, msg, event_time):
    """Process a notification of type 'ganeti-network-status'.

    Messages of any other type are logged and ignored. An
    OP_NETWORK_SET_PARAMS operation is forwarded, together with the job
    fields, to ``backend_mod.process_network_modify``; every other
    operation goes to ``backend_mod.process_network_status`` along with the
    message's 'logmsg'.

    """
    log.debug("Processing ganeti-network-status msg: %s", msg)

    msg_type = msg['type']
    if msg_type != "ganeti-network-status":
        log.error("Message is of unknown type %s.", msg_type)
        return

    opcode, status, jobid = msg['operation'], msg['status'], msg['jobId']
    job_fields = msg.get('job_fields', {})

    if opcode != "OP_NETWORK_SET_PARAMS":
        backend_mod.process_network_status(network, event_time, jobid, opcode,
                                           status, msg['logmsg'])
    else:
        backend_mod.process_network_modify(network, event_time, jobid, opcode,
                                           status, job_fields)

    log.debug("Done processing ganeti-network-status msg for network %s.",
              msg['network'])
239

    
240

    
241
@instance_from_msg
@if_update_required
def update_build_progress(vm, msg, event_time):
    """
    Process a create progress message.

    'image-copy-progress' messages update the build progress of the
    virtual machine. The other known types ('image-error', 'image-info',
    'image-warning', 'image-helper') produce a diagnostic entry for it.
    Messages of unknown type are logged and ignored.
    """
    log.debug("Processing ganeti-create-progress msg: %s", msg)

    msg_type = msg['type']
    known_types = ('image-copy-progress', 'image-error', 'image-info',
                   'image-warning', 'image-helper')
    if msg_type not in known_types:
        log.error("Message is of unknown type %s", msg_type)
        return

    if msg_type == 'image-copy-progress':
        # copy-progress only updates the progress; no diagnostic is added
        backend_mod.process_create_progress(vm, event_time, msg['progress'])
        return

    # Diagnostic defaults, refined below according to type and subtype.
    source = msg_type
    level = 'DEBUG'
    message = msg.get('messages', '')
    if isinstance(message, list):
        message = " ".join(message)

    details = msg.get('stderr', None)

    if msg_type == 'image-helper':
        subtype = msg.get('subtype', None)
        if subtype in ('task-start', 'task-end'):
            # For helper task events the task name becomes the diagnostic
            # message and the subtype is appended to the source.
            message = msg.get('task', message)
            source = "%s-%s" % (source, subtype)
        elif subtype == 'warning':
            level = 'WARNING'
        elif subtype == 'error':
            level = 'ERROR'
        elif subtype == 'info':
            level = 'INFO'
    elif msg_type == 'image-error':
        level = 'ERROR'
    elif msg_type == 'image-warning':
        level = 'WARNING'

    if not message.strip():
        # Fall back to a readable form of the source, e.g. "Image error".
        message = " ".join(source.split("-")).capitalize()

    # create the diagnostic entry
    backend_mod.create_instance_diagnostic(vm, message, source, level,
                                           event_time, details=details)

    log.debug("Done processing ganeti-create-progress msg for vm %s.",
              msg['instance'])
301

    
302

    
303
@handle_message_delivery
@transaction.commit_on_success()
def update_cluster(msg):
    """Refresh the stored data of the backend named in ``msg["cluster"]``.

    Messages without a cluster name are ignored. Otherwise the Backend row
    is fetched through ``select_for_update()`` and its disk templates and
    resources are updated via ``backend_mod``.

    """
    clustername = msg.get("cluster")
    if clustername is not None:
        locked_backends = Backend.objects.select_for_update()
        backend = locked_backends.get(clustername=clustername)
        backend_mod.update_backend_disk_templates(backend)
        backend_mod.update_backend_resources(backend)
312

    
313

    
314
def dummy_proc(client, message, *args, **kwargs):
    """Log the body of an incoming message and acknowledge it.

    Any exception raised while doing so is logged and swallowed. Extra
    positional and keyword arguments are accepted and ignored.

    """
    try:
        log.debug("Msg: %s", message['body'])
        client.basic_ack(message)
    except Exception as e:
        # Pass the exception as a logging argument, like every other log
        # call in this module, instead of pre-formatting the string.
        log.exception("Could not receive message %s", e)