Browse Source

Add HTTP Basic authentication in migration tool.

Stefano Cossu 6 năm trước cách đây
mục cha
commit
690a1b0d6a
2 tập tin đã thay đổi với 20 bổ sung11 xóa
  1. 7 2
      lakesuperior/lsup_admin.py
  2. 13 9
      lakesuperior/migrator.py

+ 7 - 2
lakesuperior/lsup_admin.py

@@ -162,6 +162,10 @@ def cleanup():
 @click.command()
 @click.argument('src')
 @click.argument('dest')
+@click.option(
+    '--auth', '-a',
+    help='Colon-separated credentials for HTTP Basic authentication on the '
+    'source repository. E.g. `user:password`.')
 @click.option(
     '--start', '-s', show_default=True,
     help='Starting point for looking for resources in the repository.\n'
@@ -183,7 +187,7 @@ def cleanup():
     'quitting. Other exceptions caused by the application will terminate the '
     'process as usual.')
 @click_log.simple_verbosity_option(logger)
-def migrate(src, dest, start, list_file, zero_binaries, skip_errors):
+def migrate(src, dest, auth, start, list_file, zero_binaries, skip_errors):
     """
     Migrate an LDP repository to Lakesuperior.
 
@@ -199,8 +203,9 @@ def migrate(src, dest, start, list_file, zero_binaries, skip_errors):
     """
     logger.info('Migrating {} into a new repository on {}.'.format(
             src, dest))
+    src_auth = tuple(auth.split(':')) if auth else None
     entries = admin_api.migrate(
-            src, dest, start_pts=start, list_file=list_file,
+        src, dest, src_auth=src_auth, start_pts=start, list_file=list_file,
             zero_binaries=zero_binaries, skip_errors=skip_errors)
     logger.info('Migrated {} resources.'.format(entries))
     logger.info("""Migration complete. To start the new repository, from the

+ 13 - 9
lakesuperior/migrator.py

@@ -68,8 +68,8 @@ class Migrator:
 
 
     def __init__(
-            self, src, dest, clear=False, zero_binaries=False,
-            compact_uris=False, skip_errors=False):
+            self, src, dest, src_auth=(None, None), clear=False,
+            zero_binaries=False, compact_uris=False, skip_errors=False):
         """
         Set up base paths and clean up existing directories.
 
@@ -81,6 +81,8 @@ class Migrator:
             it must be a writable directory. It will be deleted and recreated.
             If it does not exist, it will be created along with its parents if
             missing.
+        :param tuple src_auth: if the source repo needs HTTP authentication,
+            specify here username and password as a 2-tuple of strings.
         :param bool clear: Whether to clear any pre-existing data at the
             locations indicated.
         :param bool zero_binaries: Whether to create zero-byte binary files
@@ -99,6 +101,7 @@ class Migrator:
         self.dbpath = '{}/data/ldprs_store'.format(dest)
         self.fpath = '{}/data/ldpnr_store'.format(dest)
         self.config_dir = '{}/etc'.format(dest)
+        self.auth = src_auth
 
         if clear:
             shutil.rmtree(dest, ignore_errors=True)
@@ -196,9 +199,10 @@ class Migrator:
         iuri = ibase + uid
 
         try:
-            rsp = requests.head(uri)
+            rsp = requests.head(uri, auth=self.auth)
+            rsp.raise_for_status()
         except:
-            logger.warn('Error retrieving resource {}'.format(uri))
+            logger.warn('Error retrieving resource {}: {}'.format(uri, rsp.status_code))
             return
         if rsp:
             if not self.skip_errors:
@@ -211,7 +215,7 @@ class Migrator:
         ldp_type = 'ldp_nr'
         try:
             for link in requests.utils.parse_header_links(
-                    rsp.headers.get('link')):
+                    rsp.headers.get('link', auth=self.auth)):
                 if (
                         link.get('rel') == 'type'
                         and (
@@ -230,7 +234,7 @@ class Migrator:
         get_uri = (
                 uri if ldp_type == 'ldp_rs' else '{}/fcr:metadata'.format(uri))
         try:
-            get_rsp = requests.get(get_uri)
+            get_rsp = requests.get(get_uri, auth=self.auth)
         except:
             logger.warn('Error retrieving resource {}'.format(get_uri))
             return
@@ -246,7 +250,7 @@ class Migrator:
         gr = Graph(identifier=iuri).parse(data=data, format='turtle')
 
         # Store raw graph data. No checks.
-        with self.rdfly.store.txn_mgr(True):
+        with self.rdfly.store.txn_ctx(True):
             self.rdfly.modify_rsrc(uid, add_trp=set(gr))
 
         # Grab binary and set new resource parameters.
@@ -255,7 +259,7 @@ class Migrator:
             if self.zero_binaries:
                 data = b''
             else:
-                bin_rsp = requests.get(uri)
+                bin_rsp = requests.get(uri, auth=self.auth)
                 if not self.skip_errors:
                     bin_rsp.raise_for_status()
                 elif bin_rsp.status_code > 399:
@@ -280,7 +284,7 @@ class Migrator:
         for pred, obj in gr.predicate_objects():
             #import pdb; pdb.set_trace()
             obj_uid = obj.replace(ibase, '')
-            with self.rdfly.store.txn_mgr(True):
+            with self.rdfly.store.txn_ctx(True):
                 conditions = bool(
                     isinstance(obj, URIRef)
                     and obj.startswith(iuri)