1 # Copyright 2011-2012 GRNET S.A. All rights reserved.
3 # Redistribution and use in source and binary forms, with or
4 # without modification, are permitted provided that the following
7 # 1. Redistributions of source code must retain the above
8 # copyright notice, this list of conditions and the following
11 # 2. Redistributions in binary form must reproduce the above
12 # copyright notice, this list of conditions and the following
13 # disclaimer in the documentation and/or other materials
14 # provided with the distribution.
16 # THIS SOFTWARE IS PROVIDED BY GRNET S.A. ``AS IS'' AND ANY EXPRESS
17 # OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
18 # WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
19 # PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL GRNET S.A OR
20 # CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
21 # SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
22 # LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
23 # USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
24 # AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25 # LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
26 # ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
27 # POSSIBILITY OF SUCH DAMAGE.
29 # The views and conclusions contained in the software and
30 # documentation are those of the authors and should not be
31 # interpreted as representing official policies, either expressed
32 # or implied, of GRNET S.A.
37 import uuid as uuidlib
42 from base import DEFAULT_QUOTA, DEFAULT_VERSIONING, NotAllowedError, QuotaError, BaseBackend
44 # Stripped-down version of the HashMap class found in tools.
47 def __init__(self, blocksize, blockhash):
48 super(HashMap, self).__init__()
49 self.blocksize = blocksize
50 self.blockhash = blockhash
52 def _hash_raw(self, v):
53 h = hashlib.new(self.blockhash)
59 return self._hash_raw('')
61 return self.__getitem__(0)
67 h += [('\x00' * len(h[0]))] * (s - len(h))
69 h = [self._hash_raw(h[x] + h[x + 1]) for x in range(0, len(h), 2)]
# Fallback modules and settings, used when the backend constructor is
# called without an explicit value for the corresponding argument.
DEFAULT_DB_MODULE = 'pithos.backends.lib.sqlalchemy'
DEFAULT_DB_CONNECTION = 'sqlite:///backend.db'
DEFAULT_BLOCK_MODULE = 'pithos.backends.lib.hashfiler'
DEFAULT_BLOCK_PATH = 'data/'
DEFAULT_BLOCK_UMASK = 0o022
# No queue defaults are active: a queue is only set up when both a queue
# module and a queue connection are passed to the backend explicitly.
#DEFAULT_QUEUE_MODULE = 'pithos.backends.lib.rabbitmq'
#DEFAULT_QUEUE_CONNECTION = 'rabbitmq://guest:guest@localhost:5672/pithos'

# Identification values for queue messages.
QUEUE_MESSAGE_KEY_PREFIX = 'pithos.%s'
QUEUE_CLIENT_ID = 'pithos'
QUEUE_INSTANCE_ID = '1'

# Cluster ids a version can belong to.
CLUSTER_NORMAL = 0
CLUSTER_HISTORY = 1
CLUSTER_DELETED = 2

logger = logging.getLogger(__name__)
95 def backend_method(func=None, autocommit=1):
98 return backend_method(func, autocommit)
103 def fn(self, *args, **kw):
104 self.wrapper.execute()
107 ret = func(self, *args, **kw)
108 for m in self.messages:
110 self.wrapper.commit()
113 self.wrapper.rollback()
118 class ModularBackend(BaseBackend):
119 """A modular backend.
121 Uses modules for SQL functions and storage.
124 def __init__(self, db_module=None, db_connection=None,
125 block_module=None, block_path=None, block_umask=None,
126 queue_module=None, queue_connection=None):
127 db_module = db_module or DEFAULT_DB_MODULE
128 db_connection = db_connection or DEFAULT_DB_CONNECTION
129 block_module = block_module or DEFAULT_BLOCK_MODULE
130 block_path = block_path or DEFAULT_BLOCK_PATH
131 block_umask = block_umask or DEFAULT_BLOCK_UMASK
132 #queue_module = queue_module or DEFAULT_QUEUE_MODULE
133 #queue_connection = queue_connection or DEFAULT_QUEUE_CONNECTION
135 self.hash_algorithm = 'sha256'
136 self.block_size = 4 * 1024 * 1024 # 4MB
138 self.default_policy = {'quota': DEFAULT_QUOTA, 'versioning': DEFAULT_VERSIONING}
142 return sys.modules[m]
144 self.db_module = load_module(db_module)
145 self.wrapper = self.db_module.DBWrapper(db_connection)
146 params = {'wrapper': self.wrapper}
147 self.permissions = self.db_module.Permissions(**params)
148 for x in ['READ', 'WRITE']:
149 setattr(self, x, getattr(self.db_module, x))
150 self.node = self.db_module.Node(**params)
151 for x in ['ROOTNODE', 'SERIAL', 'HASH', 'SIZE', 'TYPE', 'MTIME', 'MUSER', 'UUID', 'CHECKSUM', 'CLUSTER', 'MATCH_PREFIX', 'MATCH_EXACT']:
152 setattr(self, x, getattr(self.db_module, x))
154 self.block_module = load_module(block_module)
155 params = {'path': block_path,
156 'block_size': self.block_size,
157 'hash_algorithm': self.hash_algorithm,
158 'umask': block_umask}
159 self.store = self.block_module.Store(**params)
161 if queue_module and queue_connection:
162 self.queue_module = load_module(queue_module)
163 params = {'exchange': queue_connection,
164 'client_id': QUEUE_CLIENT_ID}
165 self.queue = self.queue_module.Queue(**params)
168 def send(self, *args):
174 self.queue = NoQueue()
def list_accounts(self, user, marker=None, limit=10000):
    """List the accounts that ``user`` is allowed to access.

    The complete list comes from ``self._allowed_accounts(user)``.
    ``marker`` and ``limit`` are handed to ``self._list_limits``, which
    yields the start offset and the page size used to slice that list.
    """
    logger.debug("list_accounts: %s %s %s", user, marker, limit)
    accounts = self._allowed_accounts(user)
    offset, page_size = self._list_limits(accounts, marker, limit)
    page_end = offset + page_size
    return accounts[offset:page_end]
190 def get_account_meta(self, user, account, domain, until=None, include_user_defined=True):
191 """Return a dictionary with the account metadata for the domain."""
193 logger.debug("get_account_meta: %s %s %s", account, domain, until)
194 path, node = self._lookup_account(account, user == account)
196 if until or node is None or account not in self._allowed_accounts(user):
197 raise NotAllowedError
199 props = self._get_properties(node, until)
200 mtime = props[self.MTIME]
204 count, bytes, tstamp = self._get_statistics(node, until)
205 tstamp = max(tstamp, mtime)
209 modified = self._get_statistics(node)[2] # Overall last modification.
210 modified = max(modified, mtime)
213 meta = {'name': account}
216 if props is not None and include_user_defined:
217 meta.update(dict(self.node.attribute_get(props[self.SERIAL], domain)))
218 if until is not None:
219 meta.update({'until_timestamp': tstamp})
220 meta.update({'name': account, 'count': count, 'bytes': bytes})
221 meta.update({'modified': modified})
225 def update_account_meta(self, user, account, domain, meta, replace=False):
226 """Update the metadata associated with the account for the domain."""
228 logger.debug("update_account_meta: %s %s %s %s", account, domain, meta, replace)
230 raise NotAllowedError
231 path, node = self._lookup_account(account, True)
232 self._put_metadata(user, node, domain, meta, replace)
235 def get_account_groups(self, user, account):
236 """Return a dictionary with the user groups defined for this account."""
238 logger.debug("get_account_groups: %s", account)
240 if account not in self._allowed_accounts(user):
241 raise NotAllowedError
243 self._lookup_account(account, True)
244 return self.permissions.group_dict(account)
247 def update_account_groups(self, user, account, groups, replace=False):
248 """Update the groups associated with the account."""
250 logger.debug("update_account_groups: %s %s %s", account, groups, replace)
252 raise NotAllowedError
253 self._lookup_account(account, True)
254 self._check_groups(groups)
256 self.permissions.group_destroy(account)
257 for k, v in groups.iteritems():
258 if not replace: # If not already deleted.
259 self.permissions.group_delete(account, k)
261 self.permissions.group_addmany(account, k, v)
264 def get_account_policy(self, user, account):
265 """Return a dictionary with the account policy."""
267 logger.debug("get_account_policy: %s", account)
269 if account not in self._allowed_accounts(user):
270 raise NotAllowedError
272 path, node = self._lookup_account(account, True)
273 return self._get_policy(node)
276 def update_account_policy(self, user, account, policy, replace=False):
277 """Update the policy associated with the account."""
279 logger.debug("update_account_policy: %s %s %s", account, policy, replace)
281 raise NotAllowedError
282 path, node = self._lookup_account(account, True)
283 self._check_policy(policy)
284 self._put_policy(node, policy, replace)
287 def put_account(self, user, account, policy={}):
288 """Create a new account with the given name."""
290 logger.debug("put_account: %s %s", account, policy)
292 raise NotAllowedError
293 node = self.node.node_lookup(account)
295 raise NameError('Account already exists')
297 self._check_policy(policy)
298 node = self._put_path(user, self.ROOTNODE, account)
299 self._put_policy(node, policy, True)
302 def delete_account(self, user, account):
303 """Delete the account with the given name."""
305 logger.debug("delete_account: %s", account)
307 raise NotAllowedError
308 node = self.node.node_lookup(account)
311 if not self.node.node_remove(node):
312 raise IndexError('Account is not empty')
313 self.permissions.group_destroy(account)
316 def list_containers(self, user, account, marker=None, limit=10000, shared=False, until=None, public=False):
317 """Return a list of containers existing under an account."""
319 logger.debug("list_containers: %s %s %s %s %s %s", account, marker, limit, shared, until, public)
321 if until or account not in self._allowed_accounts(user):
322 raise NotAllowedError
323 allowed = self._allowed_containers(user, account)
324 start, limit = self._list_limits(allowed, marker, limit)
325 return allowed[start:start + limit]
329 allowed.extend([x.split('/', 2)[1] for x in self.permissions.access_list_shared(account)])
331 allowed.extend([x[0].split('/', 2)[1] for x in self.permissions.public_list(account)])
332 allowed = list(set(allowed))
333 start, limit = self._list_limits(allowed, marker, limit)
334 return allowed[start:start + limit]
335 node = self.node.node_lookup(account)
336 return [x[0] for x in self._list_object_properties(node, account, '', '/', marker, limit, False, None, [], until)]
339 def list_container_meta(self, user, account, container, domain, until=None):
340 """Return a list with all the container's object meta keys for the domain."""
342 logger.debug("list_container_meta: %s %s %s %s", account, container, domain, until)
346 raise NotAllowedError
347 allowed = self.permissions.access_list_paths(user, '/'.join((account, container)))
349 raise NotAllowedError
350 path, node = self._lookup_container(account, container)
351 before = until if until is not None else inf
352 allowed = self._get_formatted_paths(allowed)
353 return self.node.latest_attribute_keys(node, domain, before, CLUSTER_DELETED, allowed)
356 def get_container_meta(self, user, account, container, domain, until=None, include_user_defined=True):
357 """Return a dictionary with the container metadata for the domain."""
359 logger.debug("get_container_meta: %s %s %s %s", account, container, domain, until)
361 if until or container not in self._allowed_containers(user, account):
362 raise NotAllowedError
363 path, node = self._lookup_container(account, container)
364 props = self._get_properties(node, until)
365 mtime = props[self.MTIME]
366 count, bytes, tstamp = self._get_statistics(node, until)
367 tstamp = max(tstamp, mtime)
371 modified = self._get_statistics(node)[2] # Overall last modification.
372 modified = max(modified, mtime)
375 meta = {'name': container}
378 if include_user_defined:
379 meta.update(dict(self.node.attribute_get(props[self.SERIAL], domain)))
380 if until is not None:
381 meta.update({'until_timestamp': tstamp})
382 meta.update({'name': container, 'count': count, 'bytes': bytes})
383 meta.update({'modified': modified})
387 def update_container_meta(self, user, account, container, domain, meta, replace=False):
388 """Update the metadata associated with the container for the domain."""
390 logger.debug("update_container_meta: %s %s %s %s %s", account, container, domain, meta, replace)
392 raise NotAllowedError
393 path, node = self._lookup_container(account, container)
394 src_version_id, dest_version_id = self._put_metadata(user, node, domain, meta, replace)
395 if src_version_id is not None:
396 versioning = self._get_policy(node)['versioning']
397 if versioning != 'auto':
398 self.node.version_remove(src_version_id)
401 def get_container_policy(self, user, account, container):
402 """Return a dictionary with the container policy."""
404 logger.debug("get_container_policy: %s %s", account, container)
406 if container not in self._allowed_containers(user, account):
407 raise NotAllowedError
409 path, node = self._lookup_container(account, container)
410 return self._get_policy(node)
413 def update_container_policy(self, user, account, container, policy, replace=False):
414 """Update the policy associated with the container."""
416 logger.debug("update_container_policy: %s %s %s %s", account, container, policy, replace)
418 raise NotAllowedError
419 path, node = self._lookup_container(account, container)
420 self._check_policy(policy)
421 self._put_policy(node, policy, replace)
424 def put_container(self, user, account, container, policy={}):
425 """Create a new container with the given name."""
427 logger.debug("put_container: %s %s %s", account, container, policy)
429 raise NotAllowedError
431 path, node = self._lookup_container(account, container)
435 raise NameError('Container already exists')
437 self._check_policy(policy)
438 path = '/'.join((account, container))
439 node = self._put_path(user, self._lookup_account(account, True)[1], path)
440 self._put_policy(node, policy, True)
443 def delete_container(self, user, account, container, until=None):
444 """Delete/purge the container with the given name."""
446 logger.debug("delete_container: %s %s %s", account, container, until)
448 raise NotAllowedError
449 path, node = self._lookup_container(account, container)
451 if until is not None:
452 hashes, size = self.node.node_purge_children(node, until, CLUSTER_HISTORY)
454 self.store.map_delete(h)
455 self.node.node_purge_children(node, until, CLUSTER_DELETED)
456 self._report_size_change(user, account, -size, {'action': 'container purge'})
459 if self._get_statistics(node)[0] > 0:
460 raise IndexError('Container is not empty')
461 hashes, size = self.node.node_purge_children(node, inf, CLUSTER_HISTORY)
463 self.store.map_delete(h)
464 self.node.node_purge_children(node, inf, CLUSTER_DELETED)
465 self.node.node_remove(node)
466 self._report_size_change(user, account, -size, {'action': 'container delete'})
468 def _list_objects(self, user, account, container, prefix, delimiter, marker, limit, virtual, domain, keys, shared, until, size_range, all_props, public):
469 if user != account and until:
470 raise NotAllowedError
471 allowed = self._list_object_permissions(user, account, container, prefix, shared, public)
472 if (shared or public) and not allowed:
474 path, node = self._lookup_container(account, container)
475 allowed = self._get_formatted_paths(allowed)
476 return self._list_object_properties(node, path, prefix, delimiter, marker, limit, virtual, domain, keys, until, size_range, allowed, all_props)
478 def _list_object_permissions(self, user, account, container, prefix, shared, public):
480 path = '/'.join((account, container, prefix)).rstrip('/')
482 allowed = self.permissions.access_list_paths(user, path)
484 raise NotAllowedError
488 allowed.extend(self.permissions.access_list_shared(path))
490 allowed.extend([x[0] for x in self.permissions.public_list(path)])
491 allowed = list(set(allowed))
def list_objects(self, user, account, container, prefix='', delimiter=None,
                 marker=None, limit=10000, virtual=True, domain=None,
                 keys=[], shared=False, until=None, size_range=None,
                 public=False):
    """Return a list of object (name, version_id) tuples existing under a container.

    Thin wrapper: logs the request and forwards every argument to
    ``self._list_objects`` with ``all_props`` switched off.
    """
    # ``keys`` keeps its historical list default; it is only forwarded here.
    logged = (account, container, prefix, delimiter, marker, limit, virtual,
              domain, keys, shared, until, size_range, public)
    logger.debug("list_objects: %s %s %s %s %s %s %s %s %s %s %s %s %s", *logged)
    all_props = False
    return self._list_objects(user, account, container, prefix, delimiter,
                              marker, limit, virtual, domain, keys, shared,
                              until, size_range, all_props, public)
504 def list_object_meta(self, user, account, container, prefix='', delimiter=None, marker=None, limit=10000, virtual=True, domain=None, keys=[], shared=False, until=None, size_range=None, public=False):
505 """Return a list of object metadata dicts existing under a container."""
507 logger.debug("list_object_meta: %s %s %s %s %s %s %s %s %s %s %s %s %s", account, container, prefix, delimiter, marker, limit, virtual, domain, keys, shared, until, size_range, public)
508 props = self._list_objects(user, account, container, prefix, delimiter, marker, limit, virtual, domain, keys, shared, until, size_range, True, public)
512 objects.append({'subdir': p[0]})
514 objects.append({'name': p[0],
515 'bytes': p[self.SIZE + 1],
516 'type': p[self.TYPE + 1],
517 'hash': p[self.HASH + 1],
518 'version': p[self.SERIAL + 1],
519 'version_timestamp': p[self.MTIME + 1],
520 'modified': p[self.MTIME + 1] if until is None else None,
521 'modified_by': p[self.MUSER + 1],
522 'uuid': p[self.UUID + 1],
523 'checksum': p[self.CHECKSUM + 1]})
def list_object_permissions(self, user, account, container, prefix=''):
    """Return a list of paths that enforce permissions under a container.

    Delegates to ``self._list_object_permissions`` asking for shared
    paths and not for public ones.
    """
    logger.debug("list_object_permissions: %s %s %s", account, container, prefix)
    shared, public = True, False
    paths = self._list_object_permissions(user, account, container, prefix,
                                          shared, public)
    return paths
534 def list_object_public(self, user, account, container, prefix=''):
535 """Return a dict mapping paths to public ids for objects that are public under a container."""
537 logger.debug("list_object_public: %s %s %s", account, container, prefix)
539 for path, p in self.permissions.public_list('/'.join((account, container, prefix))):
540 public[path] = p + ULTIMATE_ANSWER
544 def get_object_meta(self, user, account, container, name, domain, version=None, include_user_defined=True):
545 """Return a dictionary with the object metadata for the domain."""
547 logger.debug("get_object_meta: %s %s %s %s %s", account, container, name, domain, version)
548 self._can_read(user, account, container, name)
549 path, node = self._lookup_object(account, container, name)
550 props = self._get_version(node, version)
552 modified = props[self.MTIME]
555 modified = self._get_version(node)[self.MTIME] # Overall last modification.
556 except NameError: # Object may be deleted.
557 del_props = self.node.version_lookup(node, inf, CLUSTER_DELETED)
558 if del_props is None:
559 raise NameError('Object does not exist')
560 modified = del_props[self.MTIME]
563 if include_user_defined:
564 meta.update(dict(self.node.attribute_get(props[self.SERIAL], domain)))
565 meta.update({'name': name,
566 'bytes': props[self.SIZE],
567 'type': props[self.TYPE],
568 'hash': props[self.HASH],
569 'version': props[self.SERIAL],
570 'version_timestamp': props[self.MTIME],
571 'modified': modified,
572 'modified_by': props[self.MUSER],
573 'uuid': props[self.UUID],
574 'checksum': props[self.CHECKSUM]})
def update_object_meta(self, user, account, container, name, domain, meta,
                       replace=False):
    """Update the object's metadata for the domain and return the new version.

    Steps: check write access, resolve the object node, store the
    metadata through ``self._put_metadata`` (which yields the source and
    destination version ids), then apply the container's versioning
    policy to the source version.
    """
    logger.debug("update_object_meta: %s %s %s %s %s %s", account, container, name, domain, meta, replace)
    self._can_write(user, account, container, name)
    _path, object_node = self._lookup_object(account, container, name)
    version_ids = self._put_metadata(user, object_node, domain, meta, replace)
    previous_version, new_version = version_ids
    self._apply_versioning(account, container, previous_version)
    return new_version
589 def get_object_permissions(self, user, account, container, name):
590 """Return the action allowed on the object, the path
591 from which the object gets its permissions from,
592 along with a dictionary containing the permissions."""
594 logger.debug("get_object_permissions: %s %s %s", account, container, name)
596 permissions_path = self._get_permissions_path(account, container, name)
598 if self.permissions.access_check(permissions_path, self.WRITE, user):
600 elif self.permissions.access_check(permissions_path, self.READ, user):
603 raise NotAllowedError
604 self._lookup_object(account, container, name)
605 return (allowed, permissions_path, self.permissions.access_get(permissions_path))
608 def update_object_permissions(self, user, account, container, name, permissions):
609 """Update the permissions associated with the object."""
611 logger.debug("update_object_permissions: %s %s %s %s", account, container, name, permissions)
613 raise NotAllowedError
614 path = self._lookup_object(account, container, name)[0]
615 self._check_permissions(path, permissions)
616 self.permissions.access_set(path, permissions)
617 self._report_sharing_change(user, account, path, {'members':self.permissions.access_members(path)})
620 def get_object_public(self, user, account, container, name):
621 """Return the public id of the object if applicable."""
623 logger.debug("get_object_public: %s %s %s", account, container, name)
624 self._can_read(user, account, container, name)
625 path = self._lookup_object(account, container, name)[0]
626 p = self.permissions.public_get(path)
632 def update_object_public(self, user, account, container, name, public):
633 """Update the public status of the object."""
635 logger.debug("update_object_public: %s %s %s %s", account, container, name, public)
636 self._can_write(user, account, container, name)
637 path = self._lookup_object(account, container, name)[0]
639 self.permissions.public_unset(path)
641 self.permissions.public_set(path)
def get_object_hashmap(self, user, account, container, name, version=None):
    """Return the object's size and a list with partial hashes.

    The stored (hex) hash of the selected version is decoded and used to
    fetch the hashmap from the block store; each entry of that hashmap
    is returned hex-encoded.
    """
    logger.debug("get_object_hashmap: %s %s %s %s", account, container, name, version)
    self._can_read(user, account, container, name)
    _path, object_node = self._lookup_object(account, container, name)
    version_props = self._get_version(object_node, version)
    map_key = binascii.unhexlify(version_props[self.HASH])
    raw_hashes = self.store.map_get(map_key)
    size = version_props[self.SIZE]
    hex_hashes = []
    for raw in raw_hashes:
        hex_hashes.append(binascii.hexlify(raw))
    return size, hex_hashes
654 def _update_object_hash(self, user, account, container, name, size, type, hash, checksum, domain, meta, replace_meta, permissions, src_node=None, src_version_id=None, is_copy=False):
655 if permissions is not None and user != account:
656 raise NotAllowedError
657 self._can_write(user, account, container, name)
658 if permissions is not None:
659 path = '/'.join((account, container, name))
660 self._check_permissions(path, permissions)
662 account_path, account_node = self._lookup_account(account, True)
663 container_path, container_node = self._lookup_container(account, container)
664 path, node = self._put_object_node(container_path, container_node, name)
665 pre_version_id, dest_version_id = self._put_version_duplicate(user, node, src_node=src_node, size=size, type=type, hash=hash, checksum=checksum, is_copy=is_copy)
668 if src_version_id is None:
669 src_version_id = pre_version_id
670 self._put_metadata_duplicate(src_version_id, dest_version_id, domain, meta, replace_meta)
673 del_size = self._apply_versioning(account, container, pre_version_id)
674 size_delta = size - del_size
676 account_quota = long(self._get_policy(account_node)['quota'])
677 container_quota = long(self._get_policy(container_node)['quota'])
678 if (account_quota > 0 and self._get_statistics(account_node)[1] + size_delta > account_quota) or \
679 (container_quota > 0 and self._get_statistics(container_node)[1] + size_delta > container_quota):
680 # This must be executed in a transaction, so the version is never created if it fails.
682 self._report_size_change(user, account, size_delta, {'action': 'object update'})
684 if permissions is not None:
685 self.permissions.access_set(path, permissions)
686 self._report_sharing_change(user, account, path, {'members':self.permissions.access_members(path)})
688 self._report_object_change(user, account, path, details={'version': dest_version_id, 'action': 'object update'})
689 return dest_version_id
692 def update_object_hashmap(self, user, account, container, name, size, type, hashmap, checksum, domain, meta={}, replace_meta=False, permissions=None):
693 """Create/update an object with the specified size and partial hashes."""
695 logger.debug("update_object_hashmap: %s %s %s %s %s %s %s", account, container, name, size, type, hashmap, checksum)
696 if size == 0: # No such thing as an empty hashmap.
697 hashmap = [self.put_block('')]
698 map = HashMap(self.block_size, self.hash_algorithm)
699 map.extend([binascii.unhexlify(x) for x in hashmap])
700 missing = self.store.block_search(map)
703 ie.data = [binascii.hexlify(x) for x in missing]
707 dest_version_id = self._update_object_hash(user, account, container, name, size, type, binascii.hexlify(hash), checksum, domain, meta, replace_meta, permissions)
708 self.store.map_put(hash, map)
709 return dest_version_id
712 def update_object_checksum(self, user, account, container, name, version, checksum):
713 """Update an object's checksum."""
715 logger.debug("update_object_checksum: %s %s %s %s %s", account, container, name, version, checksum)
716 # Update objects with greater version and same hashmap and size (fix metadata updates).
717 self._can_write(user, account, container, name)
718 path, node = self._lookup_object(account, container, name)
719 props = self._get_version(node, version)
720 versions = self.node.node_get_versions(node)
722 if x[self.SERIAL] >= int(version) and x[self.HASH] == props[self.HASH] and x[self.SIZE] == props[self.SIZE]:
723 self.node.version_put_property(x[self.SERIAL], 'checksum', checksum)
def _copy_object(self, user, src_account, src_container, src_name,
                 dest_account, dest_container, dest_name, type,
                 dest_domain=None, dest_meta={}, replace_meta=False,
                 permissions=None, src_version=None, is_move=False):
    """Create the destination object from a source object's version.

    Checks read access on the source, reads the serial, hash and size of
    the requested source version and hands them to
    ``self._update_object_hash`` for the destination path. Returns the
    destination version id produced by that call.
    """
    self._can_read(user, src_account, src_container, src_name)
    _path, src_node = self._lookup_object(src_account, src_container, src_name)
    # TODO: Will do another fetch of the properties in duplicate version...
    # Fetching the version also verifies that the source exists.
    src_props = self._get_version(src_node, src_version)
    src_version_id = src_props[self.SERIAL]
    src_hash = src_props[self.HASH]
    src_size = src_props[self.SIZE]

    source = (src_account, src_container, src_name)
    target = (dest_account, dest_container, dest_name)
    # Only a genuine copy to a different path is flagged as a copy
    # (the original comment notes this means a new uuid).
    if is_move:
        is_copy = False
    else:
        is_copy = source != target
    return self._update_object_hash(
        user, dest_account, dest_container, dest_name, src_size, type,
        src_hash, None, dest_domain, dest_meta, replace_meta, permissions,
        src_node=src_node, src_version_id=src_version_id, is_copy=is_copy)
def copy_object(self, user, src_account, src_container, src_name,
                dest_account, dest_container, dest_name, type, domain,
                meta={}, replace_meta=False, permissions=None,
                src_version=None):
    """Copy an object's data and metadata.

    Logs the request and delegates to ``self._copy_object`` with the
    move flag off; the destination version id it yields is returned.
    """
    logger.debug("copy_object: %s %s %s %s %s %s %s %s %s %s %s %s", src_account, src_container, src_name, dest_account, dest_container, dest_name, type, domain, meta, replace_meta, permissions, src_version)
    is_move = False
    return self._copy_object(user, src_account, src_container, src_name,
                             dest_account, dest_container, dest_name, type,
                             domain, meta, replace_meta, permissions,
                             src_version, is_move)
def move_object(self, user, src_account, src_container, src_name,
                dest_account, dest_container, dest_name, type, domain,
                meta={}, replace_meta=False, permissions=None):
    """Move an object's data and metadata.

    Only the owner of the source account may move; anyone else gets
    ``NotAllowedError``. The object is first copied (latest version,
    move flag on) and, when source and destination paths differ, the
    source is then deleted. Returns the destination version id.
    """
    logger.debug("move_object: %s %s %s %s %s %s %s %s %s %s %s", src_account, src_container, src_name, dest_account, dest_container, dest_name, type, domain, meta, replace_meta, permissions)
    if user != src_account:
        raise NotAllowedError
    new_version_id = self._copy_object(
        user, src_account, src_container, src_name,
        dest_account, dest_container, dest_name, type,
        domain, meta, replace_meta, permissions, None, True)
    source = (src_account, src_container, src_name)
    destination = (dest_account, dest_container, dest_name)
    if source != destination:
        # Moving onto itself must not remove the object.
        self._delete_object(user, src_account, src_container, src_name)
    return new_version_id
758 def _delete_object(self, user, account, container, name, until=None):
760 raise NotAllowedError
762 if until is not None:
763 path = '/'.join((account, container, name))
764 node = self.node.node_lookup(path)
769 h, s = self.node.node_purge(node, until, CLUSTER_NORMAL)
772 h, s = self.node.node_purge(node, until, CLUSTER_HISTORY)
776 self.store.map_delete(h)
777 self.node.node_purge(node, until, CLUSTER_DELETED)
779 props = self._get_version(node)
781 self.permissions.access_clear(path)
782 self._report_size_change(user, account, -size, {'action': 'object purge'})
785 path, node = self._lookup_object(account, container, name)
786 src_version_id, dest_version_id = self._put_version_duplicate(user, node, size=0, type='', hash=None, checksum='', cluster=CLUSTER_DELETED)
787 del_size = self._apply_versioning(account, container, src_version_id)
789 self._report_size_change(user, account, -del_size, {'action': 'object delete'})
790 self._report_object_change(user, account, path, details={'action': 'object delete'})
791 self.permissions.access_clear(path)
def delete_object(self, user, account, container, name, until=None):
    """Delete/purge an object.

    Public entry point: logs the request and hands all arguments,
    including the optional ``until`` value, to ``self._delete_object``.
    Nothing is returned.
    """
    logger.debug("delete_object: %s %s %s %s", account, container, name, until)
    target = (account, container, name)
    self._delete_object(user, *(target + (until,)))
def list_versions(self, user, account, container, name):
    """Return all [version, version_timestamp] pairs for an object.

    Requires read access. Every version of the object's node is
    considered, skipping those that belong to the deleted cluster; each
    remaining one contributes a two-item list of its serial and mtime.
    """
    logger.debug("list_versions: %s %s %s", account, container, name)
    self._can_read(user, account, container, name)
    _path, object_node = self._lookup_object(account, container, name)
    listing = []
    for props in self.node.node_get_versions(object_node):
        if props[self.CLUSTER] == CLUSTER_DELETED:
            continue
        listing.append([props[self.SERIAL], props[self.MTIME]])
    return listing
811 def get_uuid(self, user, uuid):
812 """Return the (account, container, name) for the UUID given."""
814 logger.debug("get_uuid: %s", uuid)
815 info = self.node.latest_uuid(uuid)
819 account, container, name = path.split('/', 2)
820 self._can_read(user, account, container, name)
821 return (account, container, name)
824 def get_public(self, user, public):
825 """Return the (account, container, name) for the public id given."""
827 logger.debug("get_public: %s", public)
828 if public is None or public < ULTIMATE_ANSWER:
830 path = self.permissions.public_path(public - ULTIMATE_ANSWER)
833 account, container, name = path.split('/', 2)
834 self._can_read(user, account, container, name)
835 return (account, container, name)
837 @backend_method(autocommit=0)
838 def get_block(self, hash):
839 """Return a block's data."""
841 logger.debug("get_block: %s", hash)
842 block = self.store.block_get(binascii.unhexlify(hash))
844 raise NameError('Block does not exist')
@backend_method(autocommit=0)
def put_block(self, data):
    """Store a block and return the hash.

    The data goes to ``self.store.block_put``; the value it yields is
    returned hex-encoded.
    """
    logger.debug("put_block: %s", len(data))
    raw_hash = self.store.block_put(data)
    return binascii.hexlify(raw_hash)
@backend_method(autocommit=0)
def update_block(self, hash, data, offset=0):
    """Update a known block and return the hash.

    Data that starts at offset 0 and is exactly ``self.block_size`` long
    replaces the whole block, so it is stored through ``put_block``.
    Anything else is applied to the existing block (identified by its
    hex ``hash``) at ``offset`` via ``self.store.block_update``, and the
    resulting hash is returned hex-encoded.
    """
    logger.debug("update_block: %s %s %s", hash, len(data), offset)
    if offset != 0 or len(data) != self.block_size:
        # Partial update of the stored block.
        block_key = binascii.unhexlify(hash)
        updated_hash = self.store.block_update(block_key, offset, data)
        return binascii.hexlify(updated_hash)
    return self.put_block(data)
def _generate_uuid(self):
    """Return a newly generated random (version 4) UUID as a string."""
    fresh = uuidlib.uuid4()
    return str(fresh)
869 def _put_object_node(self, path, parent, name):
870 path = '/'.join((path, name))
871 node = self.node.node_lookup(path)
873 node = self.node.node_create(parent, path)
876 def _put_path(self, user, parent, path):
877 node = self.node.node_create(parent, path)
878 self.node.version_create(node, None, 0, '', None, user, self._generate_uuid(), '', CLUSTER_NORMAL)
# Look up the node for `account`. When the lookup yields None and `create` is
# true, the node is created under ROOTNODE through _put_path().
# NOTE(review): the return statement is not part of this listing;
# _report_size_change reads the node from index [1] of the result.
881 def _lookup_account(self, account, create=True):
882 node = self.node.node_lookup(account)
883 if node is None and create:
884 node = self._put_path(account, self.ROOTNODE, account) # User is account.
# Look up the node stored under the path "<account>/<container>".
# NOTE(review): the condition guarding the NameError and the return statement
# are not part of this listing; _apply_versioning unpacks the result as
# (path, node).
887 def _lookup_container(self, account, container):
888 path = '/'.join((account, container))
889 node = self.node.node_lookup(path)
891 raise NameError('Container does not exist')
# Look up the node stored under the path "<account>/<container>/<name>".
# NOTE(review): the condition guarding the NameError and the return statement
# are not part of this listing -- confirm in the full file.
894 def _lookup_object(self, account, container, name):
895 path = '/'.join((account, container, name))
896 node = self.node.node_lookup(path)
898 raise NameError('Object does not exist')
# Fetch the version properties of `node`, bounded by `until` when it is given
# and by `inf` otherwise.
# NOTE(review): the condition guarding the NameError and the return statement
# are not part of this listing -- confirm in the full file.
901 def _get_properties(self, node, until=None):
902 """Return properties until the timestamp given."""
904 before = until if until is not None else inf
905 props = self.node.version_lookup(node, before, CLUSTER_NORMAL)
# Only an explicit `until` falls back to versions kept in CLUSTER_HISTORY.
906 if props is None and until is not None:
907 props = self.node.version_lookup(node, before, CLUSTER_HISTORY)
909 raise NameError('Path does not exist')
# Two statistics queries are visible: statistics_get() for CLUSTER_NORMAL and
# statistics_latest() bounded by `until`, which is passed CLUSTER_DELETED.
# NOTE(review): the branching that selects between them and the return
# statement are not part of this listing -- confirm in the full file.
912 def _get_statistics(self, node, until=None):
913 """Return count, sum of size and latest timestamp of everything under node."""
916 stats = self.node.statistics_get(node, CLUSTER_NORMAL)
918 stats = self.node.statistics_latest(node, until, CLUSTER_DELETED)
# Fetch version properties for `node`. Two lookups are visible: the latest
# CLUSTER_NORMAL version, and a specific version (converted with int()) via
# version_get_properties(). Failures surface as NameError('Object does not
# exist') or IndexError('Version does not exist').
# NOTE(review): the branch conditions, any try/except around int(), and the
# return statement are not part of this listing -- confirm in the full file.
923 def _get_version(self, node, version=None):
925 props = self.node.version_lookup(node, inf, CLUSTER_NORMAL)
927 raise NameError('Object does not exist')
930 version = int(version)
932 raise IndexError('Version does not exist')
933 props = self.node.version_get_properties(version)
# A version sitting in CLUSTER_DELETED is reported the same way as a missing one.
934 if props is None or props[self.CLUSTER] == CLUSTER_DELETED:
935 raise IndexError('Version does not exist')
# Create a new version for `node` and return (pre_version_id, dest_version_id).
# NOTE(review): several else-branches and assignments are not part of this
# listing; the comments below describe only the visible statements.
938 def _put_version_duplicate(self, user, node, src_node=None, size=None, type=None, hash=None, checksum=None, cluster=CLUSTER_NORMAL, is_copy=False):
939 """Create a new version of the node."""
# Source properties are read from src_node when one is given, else from node.
941 props = self.node.version_lookup(node if src_node is None else src_node, inf, CLUSTER_NORMAL)
942 if props is not None:
943 src_version_id = props[self.SERIAL]
944 src_hash = props[self.HASH]
945 src_size = props[self.SIZE]
946 src_type = props[self.TYPE]
947 src_checksum = props[self.CHECKSUM]
949 src_version_id = None
954 if size is None: # Set metadata.
955 hash = src_hash # This way hash can be set to None (account or container).
960 checksum = src_checksum
# Copies, and nodes without a source version, get a fresh UUID; otherwise the
# UUID of the source version is carried over.
961 uuid = self._generate_uuid() if (is_copy or src_version_id is None) else props[self.UUID]
964 pre_version_id = src_version_id
966 pre_version_id = None
967 props = self.node.version_lookup(node, inf, CLUSTER_NORMAL)
968 if props is not None:
969 pre_version_id = props[self.SERIAL]
# The preceding version, when there is one, is moved to CLUSTER_HISTORY before
# the new version is created.
970 if pre_version_id is not None:
971 self.node.version_recluster(pre_version_id, CLUSTER_HISTORY)
973 dest_version_id, mtime = self.node.version_create(node, hash, size, type, src_version_id, user, uuid, checksum, cluster)
974 return pre_version_id, dest_version_id
# Fill in the attributes of dest_version_id for `domain`, after copying the
# attributes of src_version_id when one is given.
# NOTE(review): the branching on `replace` that selects between the two write
# paths below is not part of this listing -- confirm in the full file.
976 def _put_metadata_duplicate(self, src_version_id, dest_version_id, domain, meta, replace=False):
977 if src_version_id is not None:
978 self.node.attribute_copy(src_version_id, dest_version_id)
# Write path A: keys whose value is '' are deleted, all other pairs are set.
980 self.node.attribute_del(dest_version_id, domain, (k for k, v in meta.iteritems() if v == ''))
981 self.node.attribute_set(dest_version_id, domain, ((k, v) for k, v in meta.iteritems() if v != ''))
# Write path B: the domain's attributes are deleted, then every pair is set.
983 self.node.attribute_del(dest_version_id, domain)
984 self.node.attribute_set(dest_version_id, domain, ((k, v) for k, v in meta.iteritems()))
986 def _put_metadata(self, user, node, domain, meta, replace=False):
987 """Create a new version and store metadata."""
989 src_version_id, dest_version_id = self._put_version_duplicate(user, node)
990 self._put_metadata_duplicate(src_version_id, dest_version_id, domain, meta, replace)
991 return src_version_id, dest_version_id
# NOTE(review): most of this method is not part of this listing. Visible
# statements: `start` is set to one past the marker's index in `listing`, and a
# falsy limit or one above 10000 is special-cased. _list_object_properties
# unpacks the result as (start, limit).
993 def _list_limits(self, listing, marker, limit):
997 start = listing.index(marker) + 1
1000 if not limit or limit > 10000:
# List the latest versions under `parent` and return the requested slice.
# NOTE(review): the statements that define `sizeq` are not part of this
# listing -- confirm in the full file.
1004 def _list_object_properties(self, parent, path, prefix='', delimiter=None, marker=None, limit=10000, virtual=True, domain=None, keys=[], until=None, size_range=None, allowed=[], all_props=False):
# Prefix and marker are given relative to `path`; the query uses them with
# "<path>/" prepended.
1005 cont_prefix = path + '/'
1006 prefix = cont_prefix + prefix
1007 start = cont_prefix + marker if marker else None
1008 before = until if until is not None else inf
# Key filtering is applied only when a domain is given.
1009 filterq = keys if domain else []
1012 objects, prefixes = self.node.latest_version_list(parent, prefix, delimiter, start, limit, before, CLUSTER_DELETED, allowed, domain, filterq, sizeq, all_props)
# With `virtual` set, each returned prefix is added as a (prefix, None) entry.
1013 objects.extend([(p, None) for p in prefixes] if virtual else [])
1014 objects.sort(key=lambda x: x[0])
# Strip the leading "<path>/" from the first element of every entry.
1015 objects = [(x[0][len(cont_prefix):],) + x[1:] for x in objects]
1017 start, limit = self._list_limits([x[0] for x in objects], marker, limit)
1018 return objects[start:start + limit]
1020 # Reporting functions.
def _report_size_change(self, user, account, size, details=None):
    """Queue a 'diskspace' message reporting a size change for `account`.

    The account node is looked up (and created when missing), the sum of
    sizes under it is read from its statistics, and a message tuple is
    appended to self.messages.

    `details` is an optional dict of extra message fields. The keys 'user'
    and 'total' are added to it; a dict supplied by the caller is updated in
    place, as before. `size` is reported as a float.
    """
    # Use a fresh dict per call. A shared `{}` default would be referenced by
    # every queued message and rewritten by each later call.
    if details is None:
        details = {}
    logger.debug("_report_size_change: %s %s %s %s", user, account, size, details)
    account_node = self._lookup_account(account, True)[1]
    # Index 1 of the statistics is the sum of sizes under the node.
    total = self._get_statistics(account_node)[1]
    details.update({'user': user, 'total': total})
    self.messages.append((QUEUE_MESSAGE_KEY_PREFIX % ('resource.diskspace',), account, QUEUE_INSTANCE_ID, 'diskspace', float(size), details))
def _report_object_change(self, user, account, path, details=None):
    """Queue an 'object' message reporting a change to the object at `path`.

    `details` is an optional dict of extra message fields. The key 'user' is
    added to it; a dict supplied by the caller is updated in place, as
    before. The message tuple is appended to self.messages.
    """
    # Use a fresh dict per call. A shared `{}` default would be referenced by
    # every queued message and rewritten by each later call.
    if details is None:
        details = {}
    logger.debug("_report_object_change: %s %s %s %s", user, account, path, details)
    details.update({'user': user})
    self.messages.append((QUEUE_MESSAGE_KEY_PREFIX % ('object',), account, QUEUE_INSTANCE_ID, 'object', path, details))
def _report_sharing_change(self, user, account, path, details=None):
    """Queue a 'sharing' message reporting a sharing change for `path`.

    `details` is an optional dict of extra message fields. The key 'user' is
    added to it; a dict supplied by the caller is updated in place, as
    before. The message tuple is appended to self.messages.
    """
    # Use a fresh dict per call. A shared `{}` default would be referenced by
    # every queued message and rewritten by each later call.
    if details is None:
        details = {}
    # The debug line previously named a different function; it now matches
    # this method so log output can be traced back to it.
    logger.debug("_report_sharing_change: %s %s %s %s", user, account, path, details)
    details.update({'user': user})
    self.messages.append((QUEUE_MESSAGE_KEY_PREFIX % ('sharing',), account, QUEUE_INSTANCE_ID, 'sharing', path, details))
# Validate `policy`, modifying it in place. Visible statements: some keys are
# reset to their default_policy value, one value must convert with int(), and
# 'versioning' is compared against 'auto' / 'none'.
# NOTE(review): the conditions selecting these branches and the statements
# executed on failure are not part of this listing -- confirm in the full file.
1041 def _check_policy(self, policy):
1042 for k in policy.keys():
1044 policy[k] = self.default_policy.get(k)
1045 for k, v in policy.iteritems():
1047 q = int(v) # May raise ValueError.
1050 elif k == 'versioning':
1051 if v not in ['auto', 'none']:
# Store `policy` for `node` through node.policy_set().
# NOTE(review): the handling of `replace` and the body of the loop over
# default_policy are not part of this listing -- confirm in the full file.
1056 def _put_policy(self, node, policy, replace):
1058 for k, v in self.default_policy.iteritems():
1061 self.node.policy_set(node, policy)
# Build the policy for `node`: a copy of default_policy overlaid with whatever
# node.policy_get() returns for the node.
# NOTE(review): the return statement is not part of this listing;
# _apply_versioning subscripts the result with 'versioning'.
1063 def _get_policy(self, node):
1064 policy = self.default_policy.copy()
1065 policy.update(self.node.policy_get(node))
# When the container's 'versioning' policy is anything other than 'auto', the
# given version is removed through node.version_remove() and the hash it
# returns is passed to store.map_delete().
# NOTE(review): the end of the docstring, the statement executed when
# version_id is None, and the return statements are not part of this listing
# -- confirm in the full file.
1068 def _apply_versioning(self, account, container, version_id):
1069 """Delete the provided version if such is the policy.
1070 Return size of object removed.
1073 if version_id is None:
1075 path, node = self._lookup_container(account, container)
1076 versioning = self._get_policy(node)['versioning']
1077 if versioning != 'auto':
1078 hash, size = self.node.version_remove(version_id)
1079 self.store.map_delete(hash)
1083 # Access control functions.
# Hook for validating `groups`. The only body line visible here is a
# commented-out ValueError, so no validation is shown.
# NOTE(review): the rest of the body is not part of this listing.
1085 def _check_groups(self, groups):
1086 # raise ValueError('Bad characters in groups')
# Hook for validating `permissions` for `path`. The only body line visible
# here is a commented-out ValueError, so no validation is shown.
# NOTE(review): the rest of the body is not part of this listing.
1089 def _check_permissions(self, path, permissions):
1090 # raise ValueError('Bad characters in permissions')
# Build (path, match-mode) entries in `formatted` for the given paths.
# NOTE(review): the list initialisation, the loop header, the return statement
# and the nesting of the MATCH_EXACT append are not recoverable from this
# listing -- confirm in the full file.
1093 def _get_formatted_paths(self, paths):
1096 node = self.node.node_lookup(p)
1097 if node is not None:
1098 props = self.node.version_lookup(node, inf, CLUSTER_NORMAL)
1099 if props is not None:
# Compare only the media type: anything after the first ';' is dropped.
1100 if props[self.TYPE].split(';', 1)[0].strip() in ('application/directory', 'application/folder'):
# Directory/folder entries get a prefix entry that ends in exactly one '/'.
1101 formatted.append((p.rstrip('/') + '/', self.MATCH_PREFIX))
1102 formatted.append((p, self.MATCH_EXACT))
# Pick the path whose permissions apply to "<account>/<container>/<name>" from
# the candidates returned by permissions.access_inherit().
# NOTE(review): the statements executed inside the loop's conditions and the
# return statements are not part of this listing -- confirm in the full file.
1105 def _get_permissions_path(self, account, container, name):
1106 path = '/'.join((account, container, name))
1107 permission_paths = self.permissions.access_inherit(path)
# sort() followed by reverse(): candidates are visited in descending order.
1108 permission_paths.sort()
1109 permission_paths.reverse()
1110 for p in permission_paths:
# Fewer than two '/' means the candidate has no object-name component.
1114 if p.count('/') < 2:
1116 node = self.node.node_lookup(p)
1117 if node is not None:
1118 props = self.node.version_lookup(node, inf, CLUSTER_NORMAL)
1119 if props is not None:
# Compare only the media type: anything after the first ';' is dropped.
1120 if props[self.TYPE].split(';', 1)[0].strip() in ('application/directory', 'application/folder'):
# Raise NotAllowedError when `user` may not read the object.
# NOTE(review): the first statements of the method, what happens when
# public_get() returns a value, and the condition guarding the first raise are
# not part of this listing -- confirm in the full file.
1124 def _can_read(self, user, account, container, name):
1127 path = '/'.join((account, container, name))
1128 if self.permissions.public_get(path) is not None:
1130 path = self._get_permissions_path(account, container, name)
1132 raise NotAllowedError
# Either READ or WRITE access on the permissions path is sufficient.
1133 if not self.permissions.access_check(path, self.READ, user) and not self.permissions.access_check(path, self.WRITE, user):
1134 raise NotAllowedError
# Raise NotAllowedError when `user` lacks WRITE access on the permissions path
# of the object.
# NOTE(review): the first statements of the method and the condition guarding
# the first raise are not part of this listing -- confirm in the full file.
1136 def _can_write(self, user, account, container, name):
# NOTE(review): this value is overwritten by the very next statement.
1139 path = '/'.join((account, container, name))
1140 path = self._get_permissions_path(account, container, name)
1142 raise NotAllowedError
1143 if not self.permissions.access_check(path, self.WRITE, user):
1144 raise NotAllowedError
# Return, sorted, the first '/'-separated component of every path returned by
# permissions.access_list_paths(user).
# NOTE(review): the initialisation of `allow` is not part of this listing;
# the .add() calls suggest a set -- confirm in the full file.
1146 def _allowed_accounts(self, user):
1148 for path in self.permissions.access_list_paths(user):
1149 allow.add(path.split('/', 1)[0])
1150 return sorted(allow)
# Return, sorted, the second '/'-separated component of every path returned by
# permissions.access_list_paths(user, account).
# NOTE(review): the initialisation of `allow` is not part of this listing;
# the .add() calls suggest a set -- confirm in the full file.
1152 def _allowed_containers(self, user, account):
1154 for path in self.permissions.access_list_paths(user, account):
1155 allow.add(path.split('/', 2)[1])
1156 return sorted(allow)