Explorar o código

fcr:versions improvements.

* Replace the last SPARQL statement in class with Python functions
* Remove `_parse_construct` method
* Improve performance of `fcr:versions` method (4s > 30ms)
Stefano Cossu %!s(int64=7) %!d(string=hai) anos
pai
achega
e9d54a3099
Modificáronse 1 ficheiros con 57 adicións e 48 borrados
  1. 57 48
      lakesuperior/store/ldp_rs/rsrc_centric_layout.py

+ 57 - 48
lakesuperior/store/ldp_rs/rsrc_centric_layout.py

@@ -77,6 +77,7 @@ class RsrcCentricLayout:
                 nsc['ldp'].membershipResource,
                 nsc['ldp'].hasMemberRelation,
                 nsc['ldp'].insertedContentRelation,
+
                 nsc['iana'].describedBy,
                 nsc['premis'].hasMessageDigest,
                 nsc['premis'].hasSize,
@@ -88,6 +89,7 @@ class RsrcCentricLayout:
                 nsc['fcrepo'].Container,
                 nsc['fcrepo'].Pairtree,
                 nsc['fcrepo'].Resource,
+                nsc['fcrepo'].Version,
                 nsc['fcsystem'].Tombstone,
                 nsc['ldp'].BasicContainer,
                 nsc['ldp'].Container,
@@ -106,13 +108,35 @@ class RsrcCentricLayout:
             }
         },
     }
+    """
+    Human-manageable map of attribute routes.
+
+    This serves as the source for :data:`attr_routes`.
+    """
 
-    # RDF types of graphs by prefix.
     graph_ns_types = {
         nsc['fcadmin']: nsc['fcsystem'].AdminGraph,
         nsc['fcmain']: nsc['fcsystem'].UserProvidedGraph,
         nsc['fcstruct']: nsc['fcsystem'].StructureGraph,
     }
+    """
+    RDF types of graphs by prefix.
+    """
+
+    ignore_vmeta_preds = {
+        nsc['foaf'].primaryTopic,
+    }
+    """
+    Predicates of version metadata to be ignored in output.
+    """
+
+    ignore_vmeta_types = {
+        nsc['fcsystem'].AdminGraph,
+        nsc['fcsystem'].UserProvidedGraph,
+    }
+    """
+    RDF types of version metadata to be ignored in output.
+    """
 
 
     ## MAGIC METHODS ##
@@ -293,6 +317,7 @@ class RsrcCentricLayout:
         Get all the user-provided data.
 
         :param string uid: Resource UID.
+        :rtype: rdflib.Graph
         """
         # *TODO* This only works as long as there is only one user-provided
         # graph. If multiple user-provided graphs will be supported, this
@@ -306,40 +331,39 @@ class RsrcCentricLayout:
     def get_version_info(self, uid, strict=True):
         """
         Get all metadata about a resource's versions.
+
+        :param string uid: Resource UID.
+        :rtype: rdflib.Graph
         """
-        # **Note:** This pretty much bends the ontology—it replaces the graph URI
-        # with the subject URI. But the concepts of data and metadata in Fedora
-        # are quite fluid anyways...
-
-        # WIP—Is it worth to replace SPARQL here?
-        #versions = self.ds.graph(nsc['fcadmin'][uid]).triples(
-        #        (nsc['fcres'][uid], nsc['fcrepo'].hasVersion, None))
-        #for version in versions:
-        #    version_meta = self.ds.graph(HIST_GRAPH_URI).triples(
-        qry = """
-        CONSTRUCT {
-          ?s fcrepo:hasVersion ?v .
-          ?v ?p ?o .
-        } {
-          GRAPH ?ag {
-            ?s fcrepo:hasVersion ?v .
-          }
-          GRAPH ?hg {
-            ?vm foaf:primaryTopic ?v .
-            ?vm  ?p ?o .
-            FILTER (?o != ?v)
-          }
-        }"""
-        gr = self._parse_construct(qry, init_bindings={
-            'ag': nsc['fcadmin'][uid],
-            'hg': HIST_GR_URI,
-            's': nsc['fcres'][uid]})
-        ver_info_gr = Graph(identifier=nsc['fcres'][uid])
-        ver_info_gr += gr
-        if strict:
-            self._check_rsrc_status(ver_info_gr)
+        # **Note:** This pretty much bends the ontology—it replaces the graph
+        # URI with the subject URI. But the concepts of data and metadata in
+        # Fedora are quite fluid anyways...
 
-        return ver_info_gr
+        # Result graph.
+        vmeta_gr = Graph(identifier=nsc['fcres'][uid])
+
+        # Get version meta graphs.
+        v_triples = self.ds.graph(nsc['fcadmin'][uid]).triples(
+                (nsc['fcres'][uid], nsc['fcrepo'].hasVersion, None))
+
+        #import pdb; pdb.set_trace()
+        #Get version graphs proper.
+        for vtrp in v_triples:
+            # While at it, add the hasVersion triple to the result graph.
+            vmeta_gr.add(vtrp)
+            vmeta_uris = self.ds.graph(HIST_GR_URI).subjects(
+                    nsc['foaf'].primaryTopic, vtrp[2])
+            # Get triples in the meta graph filtering out undesired triples.
+            for vmuri in vmeta_uris:
+                for trp in self.ds.graph(HIST_GR_URI).triples(
+                        (vmuri, None, None)):
+                    if (
+                            (trp[1] != nsc['rdf'].type
+                            or trp[2] not in self.ignore_vmeta_types)
+                            and (trp[1] not in self.ignore_vmeta_preds)):
+                        vmeta_gr.add((vtrp[2], trp[1], trp[2]))
+
+        return vmeta_gr
 
 
     def get_inbound_rel(self, subj_uri, full_triple=True):
@@ -594,21 +618,6 @@ class RsrcCentricLayout:
                 gr.value(gr.identifier, nsc['fcrepo'].created))
 
 
-    def _parse_construct(self, qry, init_bindings={}):
-        """
-        Parse a CONSTRUCT query.
-
-        :rtype: rdflib.Graph
-        """
-        try:
-            qres = self.ds.query(qry, initBindings=init_bindings)
-        except ResultException:
-            # RDFlib bug: https://github.com/RDFLib/rdflib/issues/775
-            return Graph()
-        else:
-            return qres.graph
-
-
     def _map_graph_uri(self, t, uid):
         """
         Map a triple to a namespace prefix corresponding to a graph.