@@ -0,0 +1,278 @@
+import logging
+import shutil
+
+from io import BytesIO
+from contextlib import ContextDecorator
+from os import makedirs, path
+from urllib.parse import urldefrag
+
+import lmdb
+import requests
+import yaml
+
+from rdflib import Graph, URIRef
+
+from lakesuperior.dictionaries.namespaces import ns_collection as nsc
+from lakesuperior.env import env
+from lakesuperior.globals import AppGlobals, ROOT_UID
+from lakesuperior.config_parser import parse_config
+from lakesuperior.store.ldp_rs.lmdb_store import TxnManager
+
+
+logger = logging.getLogger(__name__)
+
+
+class StoreWrapper(ContextDecorator):
+    '''
+    Open and close a store.
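+
+    Can be used as a context manager or, being a ``ContextDecorator``
+    subclass, as a function decorator::
+
+        with StoreWrapper(store):
+            ...  # The store is open within this block.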
+    '''
+    def __init__(self, store):
+        self.store = store
+
+    def __enter__(self):
+        self.store.open(
+            env.config['application']['store']['ldp_rs'])
+
+    def __exit__(self, *exc):
+        self.store.close()
+
+
+class Migrator:
+    """
+    Class to handle a database migration.
+
+    This class holds state of progress and shared variables as it crawls
+    through linked resources in an LDP server.
+
+    Since a repository migration can be a very long operation, and the number
+    of resources to gather cannot be known in advance by LDP interaction
+    alone, a progress ticker outputs the number of processed resources at
+    regular intervals.
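+
+    A minimal usage sketch (the source URI and destination path below are
+    hypothetical)::
+
+        >>> from rdflib import URIRef
+        >>> migrator = Migrator(
+        ...     URIRef('http://localhost:8080/fcrepo/rest'),
+        ...     '/tmp/lsup_migration')
+        >>> migrator.migrate(start_pts=('/',))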
+    """
+
+    """
+    LMDB database parameters.
+
+    See :meth:`lmdb.Environment.__init__`
+    """
+    db_params = {
+        'map_size': 1024 ** 4,
+        'metasync': False,
+        'readahead': False,
+        'meminit': False,
+    }
+
+    """List of predicates to ignore when looking for links."""
+    ignored_preds = (
+        nsc['fcrepo'].hasParent,
+        nsc['fcrepo'].hasTransactionProvider,
+        nsc['fcrepo'].hasFixityService,
+    )
+
+
+    def __init__(
+            self, src, dest, zero_binaries=False, compact_uris=False,
+            skip_errors=False):
+        """
+        Set up base paths and clean up existing directories.
+
+        :param src: (URIRef) Webroot of source repository. This must
+        correspond to the LDP root node (for Fedora it can be e.g.
+        ``http://localhost:8080/fcrepo/rest/``) and is used to determine if
+        URIs retrieved are managed by this repository.
+        :param dest: (str) Destination repository path. If the location exists
+        it must be a writable directory. It will be deleted and recreated. If
+        it does not exist, it will be created along with its parents if
+        missing.
+        :param zero_binaries: (bool) Whether binary resources should be
+        written as zero-byte files instead of having their full content
+        copied over.
+        :param compact_uris: (bool) NOT IMPLEMENTED. Whether the process
+        should attempt to compact URIs generated with broken up path segments.
+        If the UID matches a pattern such as ``/12/34/56/123456...`` it is
+        converted to ``/123456...``. This would remove a lot of cruft caused
+        by the pairtree segments. Note that this will change the publicly
+        exposed URIs. If durability is a concern, a rewrite directive can be
+        added to the HTTP server that proxies the WSGI endpoint.
+        :param skip_errors: (bool) Whether HTTP errors from the source
+        repository should be reported and skipped rather than aborting the
+        migration.
+        """
+        # Set up repo folder structure and copy default configuration to
+        # destination file.
+        cur_dir = path.dirname(path.dirname(path.abspath(__file__)))
+        self.dbpath = '{}/data/ldprs_store'.format(dest)
+        self.fpath = '{}/data/ldpnr_store'.format(dest)
+        self.config_dir = '{}/etc'.format(dest)
+
+        shutil.rmtree(dest, ignore_errors=True)
+        shutil.copytree(
+            '{}/etc.defaults'.format(cur_dir), self.config_dir)
+
+        # Modify and overwrite destination configuration.
+        orig_config, _ = parse_config(self.config_dir)
+        orig_config['application']['store']['ldp_rs']['location'] = self.dbpath
+        orig_config['application']['store']['ldp_nr']['path'] = self.fpath
+
+        with open('{}/application.yml'.format(self.config_dir), 'w') \
+                as config_file:
+            config_file.write(yaml.dump(orig_config['application']))
+
+        env.config, _ = parse_config(self.config_dir)
+        env.app_globals = AppGlobals(env.config)
+
+        self.rdfly = env.app_globals.rdfly
+        self.nonrdfly = env.app_globals.nonrdfly
+
+        with TxnManager(env.app_globals.rdf_store, write=True) as txn:
+            self.rdfly.bootstrap()
+            self.rdfly.store.close()
+        env.app_globals.nonrdfly.bootstrap()
+
+        self.src = src.rstrip('/')
+        self.zero_binaries = zero_binaries
+        self.skip_errors = skip_errors
+
+
+
+    def migrate(self, start_pts=None, list_file=None):
+        """
+        Migrate the database.
+
+        This method creates, from an LDP repository, a fully functional and
+        configured LAKEsuperior data set contained in a folder.
+
+        :param tuple|list start_pts: List of starting points to retrieve
+        resources from. It would typically be the repository root in case of a
+        full dump, or one or more resources in the repository for a partial
+        one.
+        :param str list_file: Path to a local file containing a list of URIs,
+        one per line.
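+
+        A partial dump from a list of URIs might look like this (the file
+        path is hypothetical)::
+
+            >>> migrator.migrate(list_file='/tmp/uri_list.txt')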
+        """
+        from lakesuperior.api import resource as rsrc_api
+        self._ct = 0
+        with StoreWrapper(self.rdfly.store):
+            if start_pts:
+                for start in start_pts:
+                    if not start.startswith('/'):
+                        raise ValueError(
+                            'Starting point {} does not begin with a slash.'
+                            .format(start))
+
+                    if start != ROOT_UID:
+                        # Create the full hierarchy with link to the parents.
+                        rsrc_api.create_or_replace(start)
+                    # Then populate the new resource and crawl for more
+                    # relationships.
+                    self._crawl(start)
+            elif list_file:
+                with open(list_file, 'r') as fp:
+                    for uri in fp:
+                        uid = uri.strip().replace(self.src, '')
+                        if uid != ROOT_UID:
+                            rsrc_api.create_or_replace(uid)
+                        self._crawl(uid)
+        logger.info('Dumped {} resources.'.format(self._ct))
+
+        return self._ct
+
+
+    def _crawl(self, uid):
+        """
+        Get the contents of a resource and its relationships recursively.
+
+        This method recurses into itself each time a reference to a resource
+        managed by the repository is encountered.
+
+        :param str uid: The path relative to the source server webroot
+        pointing to the resource to crawl, effectively the resource UID.
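+
+        For example, with ``src`` set to the hypothetical
+        ``http://localhost:8080/fcrepo/rest``, the UID ``/obj1`` maps to the
+        source URI ``http://localhost:8080/fcrepo/rest/obj1``.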
+        """
+        ibase = str(nsc['fcres'])
+        # Public URI of source repo.
+        uri = self.src + uid
+        # Internal URI of destination.
+        iuri = ibase + uid
+
+        rsp = requests.head(uri)
+        if not self.skip_errors:
+            rsp.raise_for_status()
+        elif rsp.status_code > 399:
+            print('Error retrieving resource {} headers: {} {}'.format(
+                uri, rsp.status_code, rsp.text))
+
+        # Determine LDP type.
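+        # LDP servers advertise the interaction model of a resource in
+        # ``Link`` headers, e.g.
+        # ``Link: <http://www.w3.org/ns/ldp#RDFSource>; rel="type"``. If no
+        # RDFSource or Container type link is found, the resource is treated
+        # as a binary (LDP-NR).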
+        ldp_type = 'ldp_nr'
+        try:
+            for link in requests.utils.parse_header_links(
+                    rsp.headers.get('link')):
+                if (
+                        link.get('rel') == 'type'
+                        and (
+                            link.get('url') == str(nsc['ldp'].RDFSource)
+                            or link.get('url') == str(nsc['ldp'].Container))
+                        ):
+                    # Resource is an LDP-RS.
+                    ldp_type = 'ldp_rs'
+                    break
+        except TypeError:
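+            # The response did not carry a parseable Link header; assume an
+            # LDP-RS.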
+            ldp_type = 'ldp_rs'
+            #raise ValueError('URI {} is not an LDP resource.'.format(uri))
+
+        # Get the whole RDF document now because we have to know all outbound
+        # links.
+        get_uri = (
+                uri if ldp_type == 'ldp_rs' else '{}/fcr:metadata'.format(uri))
+        get_rsp = requests.get(get_uri)
+        if not self.skip_errors:
+            get_rsp.raise_for_status()
+        elif get_rsp.status_code > 399:
+            print('Error retrieving resource {} body: {} {}'.format(
+                uri, get_rsp.status_code, get_rsp.text))
+
+        data = get_rsp.content.replace(
+                self.src.encode('utf-8'), ibase.encode('utf-8'))
+        gr = Graph(identifier=iuri).parse(data=data, format='turtle')
+
+        # Store raw graph data. No checks.
+        with TxnManager(self.rdfly.store, True):
+            self.rdfly.modify_rsrc(uid, add_trp=set(gr))
+
+        # Grab binary and set new resource parameters.
+        if ldp_type == 'ldp_nr':
+            provided_imr = gr.resource(URIRef(iuri))
+            if self.zero_binaries:
+                data = b''
+            else:
+                bin_rsp = requests.get(uri)
+                if not self.skip_errors:
+                    bin_rsp.raise_for_status()
+                elif bin_rsp.status_code > 399:
+                    print('Error retrieving resource {} body: {} {}'.format(
+                        uri, bin_rsp.status_code, bin_rsp.text))
+                data = bin_rsp.content
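+            # The message digest URI (e.g. ``urn:sha1:<hex digest>``) yields
+            # the checksum used to derive the file path in the binary store.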
+            uuid = str(gr.value(
+                URIRef(iuri), nsc['premis'].hasMessageDigest)).split(':')[-1]
+            fpath = self.nonrdfly.local_path(
+                    self.nonrdfly.config['path'], uuid)
+            makedirs(path.dirname(fpath), exist_ok=True)
+            with open(fpath, 'wb') as fh:
+                fh.write(data)
+
+        self._ct += 1
+        if self._ct % 10 == 0:
+            print('{} resources processed so far.'.format(self._ct))
+
+        # Now, crawl through outbound links.
+        # LDP-NR fcr:metadata must be checked too.
+        for pred, obj in gr.predicate_objects():
+            obj_uid = obj.replace(ibase, '')
+            with TxnManager(self.rdfly.store, True):
+                conditions = bool(
+                    isinstance(obj, URIRef)
+                    and obj.startswith(iuri)
+                    # Avoid ∞ loop with fragment URIs.
+                    and str(urldefrag(obj).url) != str(iuri)
+                    # Avoid ∞ loop with circular references.
+                    and not self.rdfly.ask_rsrc_exists(obj_uid)
+                    and pred not in self.ignored_preds
+                )
+            if conditions:
+                print('Object {} will be crawled.'.format(obj_uid))
+                self._crawl(urldefrag(obj_uid).url)