ldp_rs.py 5.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180
  1. from flask import current_app, g
  2. from rdflib import Graph
  3. from rdflib.plugins.sparql.algebra import translateUpdate
  4. from rdflib.plugins.sparql.parser import parseUpdate
  5. from lakesuperior.dictionaries.namespaces import ns_collection as nsc
  6. from lakesuperior.model.ldpr import Ldpr
  7. class LdpRs(Ldpr):
  8. '''LDP-RS (LDP RDF source).
  9. Definition: https://www.w3.org/TR/ldp/#ldprs
  10. '''
  11. def __init__(self, uuid, repr_opts={}, handling='lenient', **kwargs):
  12. '''
  13. Extends Ldpr.__init__ by adding LDP-RS specific parameters.
  14. @param handling (string) One of `strict`, `lenient` (the default) or
  15. `none`. `strict` raises an error if a server-managed term is in the
  16. graph. `lenient` removes all sever-managed triples encountered. `none`
  17. skips all server-managed checks. It is used for internal modifications.
  18. '''
  19. super().__init__(uuid, **kwargs)
  20. self.base_types = super().base_types | {
  21. nsc['fcrepo'].Container,
  22. nsc['ldp'].Container,
  23. }
  24. # provided_imr can be empty. If None, it is an outbound resource.
  25. if self.provided_imr is not None:
  26. self.workflow = self.WRKF_INBOUND
  27. else:
  28. self.workflow = self.WRKF_OUTBOUND
  29. self._imr_options = repr_opts
  30. self.handling = handling
  31. ## LDP METHODS ##
  32. def patch(self, update_str):
  33. '''
  34. https://www.w3.org/TR/ldp/#ldpr-HTTP_PATCH
  35. Update an existing resource by applying a SPARQL-UPDATE query.
  36. @param update_str (string) SPARQL-Update staements.
  37. '''
  38. self.handling = 'lenient' # FCREPO does that and Hyrax requires it.
  39. local_update_str = g.tbox.localize_ext_str(update_str, self.urn)
  40. self._logger.debug('Local update string: {}'.format(local_update_str))
  41. return self._sparql_update(local_update_str)
  42. def _sparql_update(self, update_str, notify=True):
  43. '''
  44. Apply a SPARQL update to a resource.
  45. The SPARQL string is validated beforehand to make sure that it does
  46. not contain server-managed terms.
  47. In theory, server-managed terms in DELETE statements are harmless
  48. because the patch is only applied over the user-provided triples, but
  49. at the moment those are also checked.
  50. '''
  51. # Parse the SPARQL update string and validate contents.
  52. qry_struct = translateUpdate(parseUpdate(update_str))
  53. check_ins_gr = Graph()
  54. check_del_gr = Graph()
  55. for stmt in qry_struct:
  56. try:
  57. check_ins_gr += set(stmt.insert.triples)
  58. except AttributeError:
  59. pass
  60. try:
  61. check_del_gr += set(stmt.delete.triples)
  62. except AttributeError:
  63. pass
  64. self._check_mgd_terms(check_ins_gr)
  65. self._check_mgd_terms(check_del_gr)
  66. self.rdfly.patch_rsrc(self.uid, update_str)
  67. if notify and current_app.config.get('messaging'):
  68. self._send_msg(self.RES_UPDATED, check_del_gr, check_ins_gr)
  69. # @FIXME Ugly workaround until we find how to recompose a SPARQL query
  70. # string from a parsed query object.
  71. self.rdfly.clear_smt(self.uid)
  72. return self.RES_UPDATED
  73. #def _sparql_delta(self, q):
  74. # '''
  75. # Calculate the delta obtained by a SPARQL Update operation.
  76. # This is a critical component of the SPARQL update prcess and does a
  77. # couple of things:
  78. # 1. It ensures that no resources outside of the subject of the request
  79. # are modified (e.g. by variable subjects)
  80. # 2. It verifies that none of the terms being modified is server managed.
  81. # This method extracts an in-memory copy of the resource and performs the
  82. # query on that once it has checked if any of the server managed terms is
  83. # in the delta. If it is, it raises an exception.
  84. # NOTE: This only checks if a server-managed term is effectively being
  85. # modified. If a server-managed term is present in the query but does not
  86. # cause any change in the updated resource, no error is raised.
  87. # @return tuple(rdflib.Graph) Remove and add graphs. These can be used
  88. # with `BaseStoreLayout.update_resource` and/or recorded as separate
  89. # events in a provenance tracking system.
  90. # '''
  91. # self._logger.debug('Provided SPARQL query: {}'.format(q))
  92. # pre_gr = self.imr.graph
  93. # post_gr = pre_gr | Graph()
  94. # post_gr.update(q)
  95. # remove_gr, add_gr = self._dedup_deltas(pre_gr, post_gr)
  96. # #self._logger.debug('Removing: {}'.format(
  97. # # remove_gr.serialize(format='turtle').decode('utf8')))
  98. # #self._logger.debug('Adding: {}'.format(
  99. # # add_gr.serialize(format='turtle').decode('utf8')))
  100. # remove_gr = self._check_mgd_terms(remove_gr)
  101. # add_gr = self._check_mgd_terms(add_gr)
  102. # return set(remove_gr), set(add_gr)
  103. class Ldpc(LdpRs):
  104. '''LDPC (LDP Container).'''
  105. def __init__(self, uuid, *args, **kwargs):
  106. super().__init__(uuid, *args, **kwargs)
  107. self.base_types |= {
  108. nsc['fcrepo'].Container,
  109. nsc['ldp'].Container,
  110. }
  111. class LdpBc(Ldpc):
  112. '''LDP-BC (LDP Basic Container).'''
  113. def __init__(self, uuid, *args, **kwargs):
  114. super().__init__(uuid, *args, **kwargs)
  115. self.base_types |= {
  116. nsc['ldp'].BasicContainer,
  117. }
  118. class LdpDc(Ldpc):
  119. '''LDP-DC (LDP Direct Container).'''
  120. def __init__(self, uuid, *args, **kwargs):
  121. super().__init__(uuid, *args, **kwargs)
  122. self.base_types |= {
  123. nsc['ldp'].DirectContainer,
  124. }
  125. class LdpIc(Ldpc):
  126. '''LDP-IC (LDP Indirect Container).'''
  127. def __init__(self, uuid, *args, **kwargs):
  128. super().__init__(uuid, *args, **kwargs)
  129. self.base_types |= {
  130. nsc['ldp'].IndirectContainer,
  131. }