Statistics
| Branch: | Tag: | Revision:

root / snf-cyclades-app / synnefo / logic / callbacks.py @ 7b4a61dc

History | View | Annotate | Download (11.3 kB)

1
# Copyright 2011 GRNET S.A. All rights reserved.
2
#
3
# Redistribution and use in source and binary forms, with or without
4
# modification, are permitted provided that the following conditions
5
# are met:
6
#
7
#   1. Redistributions of source code must retain the above copyright
8
#      notice, this list of conditions and the following disclaimer.
9
#
10
#  2. Redistributions in binary form must reproduce the above copyright
11
#     notice, this list of conditions and the following disclaimer in the
12
#     documentation and/or other materials provided with the distribution.
13
#
14
# THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
15
# ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
16
# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
17
# ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
18
# FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
19
# DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
20
# OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
21
# HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
22
# LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
23
# OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
24
# SUCH DAMAGE.
25
#
26
# The views and conclusions contained in the software and documentation are
27
# those of the authors and should not be interpreted as representing official
28
# policies, either expressed or implied, of GRNET S.A.
29

    
30
# Callback functions used by the dispatcher to process incoming notifications
31
# from AMQP queues.
32

    
33
import logging
34
import json
35
from functools import wraps
36

    
37
from synnefo.db.models import (Backend, VirtualMachine, Network,
38
                               BackendNetwork, pooled_rapi_client)
39
from synnefo.logic import utils, backend
40

    
41
from synnefo.lib.utils import merge_time
42

    
43
log = logging.getLogger(__name__)
44

    
45

    
46
def handle_message_delivery(func):
    """Generic decorator for message handling callbacks.

    The wrapper decodes ``message['body']`` from JSON, passes the decoded
    object to the wrapped callback and then settles the message with the
    client:

    * ``basic_ack`` when decoding and the callback both succeed,
    * ``basic_nack`` when a ``ValueError`` (reported as a non-JSON body) or
      a ``KeyError`` (reported as a missing attribute) is raised,
    * ``basic_reject`` for any other exception, which is logged together
      with its traceback.

    Extra positional and keyword arguments given to the wrapper are
    accepted but not forwarded to the callback.

    """
    @wraps(func)
    def wrapper(client, message, *args, **kwargs):
        # Stays None until the body has been decoded, so that the generic
        # handler below knows whether there is a payload worth logging.
        payload = None
        try:
            payload = json.loads(message['body'])
            func(payload)
            # Acknowledge inside the try block: a failure while acking is
            # handled exactly like a failure of the callback itself.
            client.basic_ack(message)
        except ValueError as err:
            log.error("Incoming message not in JSON format %s: %s",
                      err, message)
            client.basic_nack(message)
        except KeyError as err:
            log.error("Malformed incoming JSON, missing attribute %s: %s",
                      err, message)
            client.basic_nack(message)
        except Exception as err:
            if not payload:
                log.exception("Unexpected error: %s", err)
            else:
                log.exception("Unexpected error: %s, msg: %s", err, payload)
            client.basic_reject(message)

    return wrapper
75

    
76

    
77
def instance_from_msg(func):
    """Decorator that hands the VirtualMachine named in a message to `func`.

    The instance name found in ``msg["instance"]`` is converted to a
    database id, the matching VirtualMachine row is fetched with
    ``select_for_update()`` and the wrapped function is called as
    ``func(vm, msg)``.

    Lookup failures are logged and swallowed here, so they never reach the
    message delivery wrapper this decorator applies on top.

    """
    @handle_message_delivery
    @wraps(func)
    def wrapper(msg):
        try:
            vm_id = utils.id_from_instance_name(msg["instance"])
            locked_vms = VirtualMachine.objects.select_for_update()
            func(locked_vms.get(id=vm_id), msg)
        except VirtualMachine.InvalidBackendIdError:
            log.debug("Ignoring msg for unknown instance %s.", msg['instance'])
        except VirtualMachine.DoesNotExist:
            log.error("VM for instance %s with id %d not found in DB.",
                      msg['instance'], vm_id)
        except (Network.InvalidBackendIdError, Network.DoesNotExist):
            # Raised while processing the message, not by the VM lookup.
            log.error("Invalid message, can not find network. msg: %s", msg)
    return wrapper
96

    
97

    
98
def network_from_msg(func):
    """Decorator that hands the BackendNetwork named in a message to `func`.

    The Network is looked up from ``msg["network"]`` (fetched with
    ``select_for_update()``) and the Backend from ``msg['cluster']``. The
    BackendNetwork joining the two is fetched, or created when it does not
    exist yet, and the wrapped function is called as ``func(bnet, msg)``.

    Lookup failures are logged and swallowed here, so they never reach the
    message delivery wrapper this decorator applies on top.

    """
    @handle_message_delivery
    @wraps(func)
    def wrapper(msg):
        try:
            network_id = utils.id_from_network_name(msg["network"])
            locked_networks = Network.objects.select_for_update()
            network = locked_networks.get(id=network_id)
            cluster_backend = Backend.objects.get(clustername=msg['cluster'])
            backend_network, created = BackendNetwork.objects.get_or_create(
                network=network, backend=cluster_backend)
            if created:
                log.info("Created missing BackendNetwork %s", backend_network)
            func(backend_network, msg)
        except Network.InvalidBackendIdError:
            log.debug("Ignoring msg for unknown network %s.", msg['network'])
        except Network.DoesNotExist:
            log.error("Network %s not found in DB.", msg['network'])
        except Backend.DoesNotExist:
            log.error("Backend %s not found in DB.", msg['cluster'])
        except BackendNetwork.DoesNotExist:
            log.error("Network %s on backend %s not found in DB.",
                      msg['network'], msg['cluster'])
    return wrapper
124

    
125

    
126
def if_update_required(func):
    """
    Decorator for checking if an incoming message needs to update the db.

    The wrapped function is called as ``func(target, msg, event_time)``,
    where `event_time` is the result of ``merge_time(msg['event_time'])``.

    The database will not be updated in the following cases:
    - The message has been redelivered and the action has already been
      completed. In this case the event_time will be equal to the one
      in the database.
    - The message describes a state in ganeti that is older than the one
      described in the db. In this case the event_time will be smaller than
      the one in the database.

    Raises KeyError('event_time') when the event time of the message is
    missing or can not be parsed.

    """
    @wraps(func)
    def wrapper(target, msg):
        try:
            event_time = merge_time(msg['event_time'])
        except Exception:
            # Catch Exception rather than everything, so that SystemExit and
            # KeyboardInterrupt are not turned into a "malformed message".
            # Use .get() for the log line: the key may be the thing that is
            # missing, and indexing again would raise before logging.
            log.error("Received message with malformed time: %s",
                      msg.get('event_time'))
            # Callers treat KeyError as "malformed message"; name the
            # offending attribute so that their log entry is meaningful.
            raise KeyError('event_time')

        db_time = target.backendtime

        if db_time and event_time <= db_time:
            format_ = "%d/%m/%y %H:%M:%S:%f"
            log.debug("Ignoring message %s.\nevent_timestamp: %s"
                      " db_timestamp: %s",
                      msg,
                      event_time.strftime(format_),
                      db_time.strftime(format_))
            return
        # New message. Update the database!
        func(target, msg, event_time)

    return wrapper
162

    
163

    
164
@instance_from_msg
@if_update_required
def update_db(vm, msg, event_time):
    """Process a notification of type 'ganeti-op-status'.

    Messages of any other type are logged and ignored.

    A failed OP_INSTANCE_CREATE job that was submitted with opportunistic
    locking is resubmitted once without it, and the VM is pointed to the
    new job. Every other message is handed to `backend.process_op_status`.

    Raises KeyError when a required attribute ('type', 'operation',
    'status', 'jobId', 'logmsg') is missing from the message, or when a job
    to be retried carries neither a 'name' nor an 'instance_name' field.

    """
    log.debug("Processing ganeti-op-status msg: %s", msg)

    if msg['type'] != "ganeti-op-status":
        log.error("Message is of unknown type %s.", msg['type'])
        return

    operation = msg["operation"]
    status = msg["status"]
    jobID = msg["jobId"]
    logmsg = msg["logmsg"]
    nics = msg.get("nics", None)
    job_fields = msg.get("job_fields", {})

    # Special case: OP_INSTANCE_CREATE with opportunistic locking may fail
    # if all Ganeti nodes are already locked. Retry the job without
    # opportunistic locking..
    if (operation == "OP_INSTANCE_CREATE" and status == "error" and
            job_fields.get("opportunistic_locking", False)):
        if vm.backendjobid != jobID:  # The job has already been retried!
            return
        # Remove extra fields. They are optional, so tolerate their absence
        # instead of aborting the retry with a KeyError.
        for field in ("OP_ID", "reason"):
            job_fields.pop(field, None)
        # Remove 'pnode' and 'snode' if they were set by Ganeti iallocator.
        # Ganeti will fail if both allocator and nodes are specified.
        allocator = job_fields.pop("iallocator", None)
        if allocator is not None:
            for field in ("pnode", "snode"):
                job_fields.pop(field, None)
        # Pop both spellings so that neither is passed on as a job field,
        # and prefer 'name'. Popping 'instance_name' as the default argument
        # of the other pop would demand its presence even when 'name' exists.
        instance_name = job_fields.pop("instance_name", None)
        name = job_fields.pop("name", instance_name)
        if name is None:
            raise KeyError("instance_name")
        # Turn off opportunistic locking before retrying the job
        job_fields["opportunistic_locking"] = False
        with pooled_rapi_client(vm) as c:
            jobID = c.CreateInstance(name=name, **job_fields)
        # Update the VM fields
        vm.backendjobid = jobID
        vm.backendjobstatus = None
        vm.save()
        log.info("Retrying failed creation of instance '%s' without"
                 " opportunistic locking. New job ID: '%s'", name, jobID)
        return

    backend.process_op_status(vm, event_time, jobID, operation,
                              status, logmsg, nics)

    log.debug("Done processing ganeti-op-status msg for vm %s.",
              msg['instance'])
213

    
214

    
215
@network_from_msg
@if_update_required
def update_network(network, msg, event_time):
    """Process a notification of type 'ganeti-network-status'.

    Messages of any other type are logged and ignored. An
    OP_NETWORK_SET_PARAMS job is handed to `backend.process_network_modify`
    together with the reserved IPs that were added and removed; every other
    opcode goes to `backend.process_network_status` with the job's log
    message.

    """
    log.debug("Processing ganeti-network-status msg: %s", msg)

    msg_type = msg['type']
    if msg_type != "ganeti-network-status":
        log.error("Message is of unknown type %s.", msg_type)
        return

    opcode, status, jobid = msg['operation'], msg['status'], msg['jobId']

    if opcode != "OP_NETWORK_SET_PARAMS":
        backend.process_network_status(network, event_time, jobid, opcode,
                                       status, msg['logmsg'])
    else:
        added_ips = msg['add_reserved_ips']
        removed_ips = msg['remove_reserved_ips']
        backend.process_network_modify(network, event_time, jobid, opcode,
                                       status, added_ips, removed_ips)

    log.debug("Done processing ganeti-network-status msg for network %s.",
              msg['network'])
239

    
240

    
241
@instance_from_msg
@if_update_required
def update_build_progress(vm, msg, event_time):
    """
    Handle an image creation progress message for a virtual machine.

    'image-copy-progress' messages only update the build progress of the
    instance. Every other accepted type ('image-error', 'image-info',
    'image-warning', 'image-helper') is recorded as a diagnostic entry.
    Messages of any other type are logged and ignored.
    """
    log.debug("Processing ganeti-create-progress msg: %s", msg)

    msg_type = msg['type']
    accepted_types = ('image-copy-progress', 'image-error', 'image-info',
                      'image-warning', 'image-helper')
    if msg_type not in accepted_types:
        log.error("Message is of unknown type %s", msg_type)
        return

    if msg_type == 'image-copy-progress':
        # Copy progress only moves the build percentage; no diagnostic
        # entry is created for it.
        backend.process_create_progress(vm, event_time, msg['progress'])
        return

    # Defaults of the diagnostic entry; refined per message type below.
    source = msg_type
    level = 'DEBUG'
    details = msg.get('stderr', None)
    message = msg.get('messages', '')
    if isinstance(message, list):
        message = " ".join(message)

    if msg_type == 'image-helper':
        subtype = msg.get('subtype', None)
        # Task events: the subtype becomes part of the diagnostic source
        # and the task name, when given, becomes the diagnostic message.
        if subtype in ('task-start', 'task-end'):
            message = msg.get('task', message)
            source = "%s-%s" % (source, subtype)
        # The remaining helper subtypes only select the severity.
        for helper_subtype, helper_level in (('warning', 'WARNING'),
                                             ('error', 'ERROR'),
                                             ('info', 'INFO')):
            if subtype == helper_subtype:
                level = helper_level
    elif msg_type == 'image-error':
        level = 'ERROR'
    elif msg_type == 'image-warning':
        level = 'WARNING'

    # Fall back to a message derived from the source, e.g.
    # 'image-error' -> 'Image error'.
    if not message.strip():
        message = " ".join(source.split("-")).capitalize()

    # create the diagnostic entry
    backend.create_instance_diagnostic(vm, message, source, level, event_time,
                                       details=details)

    log.debug("Done processing ganeti-create-progress msg for vm %s.",
              msg['instance'])
301

    
302

    
303
def dummy_proc(client, message, *args, **kwargs):
    """Log the body of an incoming message and acknowledge it.

    The message is not processed in any way. Any exception raised while
    logging or acknowledging is logged with its traceback and suppressed.
    Extra positional and keyword arguments are accepted and ignored.

    """
    try:
        log.debug("Msg: %s", message['body'])
        client.basic_ack(message)
    except Exception as e:
        # Pass the exception as a logging argument, like every other log
        # call in this module, instead of formatting the string eagerly.
        log.exception("Could not receive message %s", e)