resource.py 10 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313
  1. import logging
  2. from functools import wraps
  3. from itertools import groupby
  4. from multiprocessing import Process
  5. from threading import Lock, Thread
  6. import arrow
  7. from rdflib import Literal
  8. from rdflib.namespace import XSD
  9. from lakesuperior.config_parser import config
  10. from lakesuperior.exceptions import InvalidResourceError
  11. from lakesuperior.env import env
  12. from lakesuperior.globals import RES_DELETED
  13. from lakesuperior.model.ldp_factory import LDP_NR_TYPE, LdpFactory
  14. from lakesuperior.store.ldp_rs.lmdb_store import TxnManager
  15. logger = logging.getLogger(__name__)
  16. app_globals = env.app_globals
  17. __doc__ = '''
  18. Primary API for resource manipulation.
  19. Quickstart:
  20. >>> # First import default configuration and globals—only done once.
  21. >>> import lakesuperior.default_env
  22. >>> from lakesuperior.api import resource
  23. >>> # Get root resource.
  24. >>> rsrc = resource.get('/')
  25. >>> # Dump graph.
  26. >>> set(rsrc.imr())
  27. {(rdflib.term.URIRef('info:fcres/'),
  28. rdflib.term.URIRef('http://purl.org/dc/terms/title'),
  29. rdflib.term.Literal('Repository Root')),
  30. (rdflib.term.URIRef('info:fcres/'),
  31. rdflib.term.URIRef('http://www.w3.org/1999/02/22-rdf-syntax-ns#type'),
  32. rdflib.term.URIRef('http://fedora.info/definitions/v4/repository#Container')),
  33. (rdflib.term.URIRef('info:fcres/'),
  34. rdflib.term.URIRef('http://www.w3.org/1999/02/22-rdf-syntax-ns#type'),
  35. rdflib.term.URIRef('http://fedora.info/definitions/v4/repository#RepositoryRoot')),
  36. (rdflib.term.URIRef('info:fcres/'),
  37. rdflib.term.URIRef('http://www.w3.org/1999/02/22-rdf-syntax-ns#type'),
  38. rdflib.term.URIRef('http://fedora.info/definitions/v4/repository#Resource')),
  39. (rdflib.term.URIRef('info:fcres/'),
  40. rdflib.term.URIRef('http://www.w3.org/1999/02/22-rdf-syntax-ns#type'),
  41. rdflib.term.URIRef('http://www.w3.org/ns/ldp#BasicContainer')),
  42. (rdflib.term.URIRef('info:fcres/'),
  43. rdflib.term.URIRef('http://www.w3.org/1999/02/22-rdf-syntax-ns#type'),
  44. rdflib.term.URIRef('http://www.w3.org/ns/ldp#Container')),
  45. (rdflib.term.URIRef('info:fcres/'),
  46. rdflib.term.URIRef('http://www.w3.org/1999/02/22-rdf-syntax-ns#type'),
  47. rdflib.term.URIRef('http://www.w3.org/ns/ldp#RDFSource'))}
  48. '''
  def transaction(write=False):
      '''
      Handle atomic operations in a store.

      This wrapper ensures that a write operation is performed atomically. It
      also takes care of sending a message for each resource changed in the
      transaction.

      ALL write operations on the LDP-RS and LDP-NR stores go through this
      wrapper.

      @param write (bool) Passed as the `write` argument of the `TxnManager`
      opened around the wrapped call. Default: False.

      @return function A decorator. The decorated function runs inside a
      `TxnManager` context on `app_globals.rdf_store` and its return value is
      passed through unchanged.
      '''
      def _transaction_deco(fn):
          @wraps(fn)
          def _wrapper(*args, **kwargs):
              # Mark transaction begin timestamp. This is used for create and
              # update timestamps on resources.
              env.timestamp = arrow.utcnow()
              env.timestamp_term = Literal(
                  env.timestamp, datatype=XSD.dateTime)
              try:
                  with TxnManager(app_globals.rdf_store, write=write):
                      ret = fn(*args, **kwargs)
                  # Only reached when the transaction block exits without
                  # raising: hand the accumulated changelog to a worker
                  # thread.
                  if app_globals.changelog:
                      Thread(target=process_queue).start()
              finally:
                  # Always drop the timestamps, even when `fn` raises, so a
                  # stale value never outlives its transaction. The guard is
                  # needed because a nested call to another decorated
                  # function will already have removed them.
                  for attr in ('timestamp', 'timestamp_term'):
                      if hasattr(env, attr):
                          delattr(env, attr)
              return ret
          return _wrapper
      return _transaction_deco
  # Shared by every `process_queue` invocation. A lock created inside the
  # function would be private to each call and could never exclude another
  # thread.
  _changelog_lock = Lock()


  def process_queue():
      '''
      Process the message queue on a separate thread.

      Pops entries from the left of `app_globals.changelog` until it is
      empty and passes each one, unpacked, to `send_event_msg`. The whole
      drain runs under a module-level lock, which is released even if
      sending a message raises.
      '''
      with _changelog_lock:
          while app_globals.changelog:
              send_event_msg(*app_globals.changelog.popleft())
  def send_event_msg(remove_trp, add_trp, metadata):
      '''
      Break down delta triples, find subjects and send event message.

      @param remove_trp (iterable) Removed triples. Only the first item of
      each (the subject) is read.
      @param add_trp (iterable) Added triples. Only the first item of each
      (the subject) is read.
      @param metadata Not used by this function at present.
      '''
      # Collect the distinct subjects directly. `itertools.groupby` only
      # merges adjacent items and its per-group iterators are invalidated as
      # soon as the grouping advances, so it is not suitable for unsorted
      # input whose groups are stored for later.
      subjects = (
          {trp[0] for trp in remove_trp} | {trp[0] for trp in add_trp})

      for rsrc_uri in subjects:
          logger.info('subject: {}'.format(rsrc_uri))
          # NOTE(review): this is a bare attribute lookup; nothing is
          # actually sent. The call looks unfinished. TODO confirm the
          # messenger's `send` signature and invoke it.
          app_globals.messenger.send
  96. ### API METHODS ###
  @transaction()
  def get(uid, repr_options=None):
      '''
      Get an LDPR resource.

      The resource comes preloaded with user data and metadata as indicated by
      the `repr_options` argument. Any further handling of this resource is
      done outside of a transaction.

      @param uid (string) Resource UID.
      @param repr_options (dict(bool)) Representation options. This is a dict
      that is unpacked downstream in the process. When omitted (or None), an
      empty dict is used, which results in default values. The accepted dict
      keys are:
      - incl_inbound: include inbound references. Default: False.
      - incl_children: include children URIs. Default: True.
      - embed_children: Embed full graph of all child resources. Default:
        False

      @return The resource object built by `LdpFactory.from_stored`.
      '''
      # Create a fresh dict per call: a `{}` default in the signature would
      # be one object shared by every invocation.
      if repr_options is None:
          repr_options = {}

      rsrc = LdpFactory.from_stored(uid, repr_options)
      # Load graph before leaving the transaction.
      rsrc.imr

      return rsrc
  @transaction()
  def get_version_info(uid):
      '''
      Retrieve the version metadata (fcr:versions) of a resource.

      @param uid (string) Resource UID.

      @return The `version_info` attribute of the stored resource.
      '''
      stored_rsrc = LdpFactory.from_stored(uid)

      return stored_rsrc.version_info
  @transaction()
  def get_version(uid, ver_uid):
      '''
      Retrieve one version of a resource.

      @param uid (string) Resource UID.
      @param ver_uid (string) UID of the version to look up.

      @return Whatever the stored resource's `get_version` method returns
      for `ver_uid`.
      '''
      stored_rsrc = LdpFactory.from_stored(uid)

      return stored_rsrc.get_version(ver_uid)
  @transaction(True)
  def create(parent, slug, **kwargs):
      '''
      Mint a new UID and create a resource under it.

      The UID is derived from the parent UID and a "slug", i.e. a suggested
      path relative to the parent. The suggestion is honored when possible,
      but a different path may be used if it conflicts with an existing
      resource.

      @param parent (string) UID of the parent resource.
      @param slug (string) Tentative path relative to the parent UID.
      @param **kwargs Forwarded to the LdpFactory.from_provided method.
      Please see the documentation for that method for explanation of
      individual parameters.

      @return string UID of the new resource.
      '''
      new_uid = LdpFactory.mint_uid(parent, slug)
      log_msg = 'Minted UID for new resource: {}'.format(new_uid)
      logger.debug(log_msg)

      # `create_only=True`: this entry point only creates a resource.
      LdpFactory.from_provided(new_uid, **kwargs).create_or_replace_rsrc(
          create_only=True)

      return new_uid
  @transaction(True)
  def create_or_replace(uid, stream=None, **kwargs):
      '''
      Create a resource at a given UID, or replace the one already there.

      When the resource exists, all of its user-provided properties are
      deleted before the new content is applied. When the resource exists and
      no content is provided, an exception is raised (not sure why, but that's
      how FCREPO4 handles it).

      @param uid (string) UID of the resource to be created or updated.
      @param stream (BytesIO) Content stream. If empty, an empty container is
      created.
      @param **kwargs Forwarded to the LdpFactory.from_provided method.
      Please see the documentation for that method for explanation of
      individual parameters.

      @return string Event type: whether the resource was created or updated.

      @raise InvalidResourceError If no stream is given and the resource is
      already stored.
      '''
      target = LdpFactory.from_provided(uid, stream=stream, **kwargs)

      if not stream:
          if target.is_stored:
              # The `{}` placeholder is passed through unformatted;
              # presumably the exception class fills it in with the UID.
              # TODO confirm.
              raise InvalidResourceError(
                  target.uid,
                  'Resource {} already exists and no data set was provided.')

      return target.create_or_replace_rsrc()
  @transaction(True)
  def update(uid, update_str, is_metadata=False):
      '''
      Apply a SPARQL-Update string to a resource.

      @param uid (string) Resource UID.
      @param update_str (string) SPARQL-Update statements.
      @param is_metadata (bool) Whether the resource metadata is being
      updated. If False, and the resource being updated is a LDP-NR, an error
      is raised.

      @return The resource object that was patched.

      @raise InvalidResourceError If the resource is a LDP-NR and
      `is_metadata` is False.
      '''
      target = LdpFactory.from_stored(uid)

      if LDP_NR_TYPE not in target.ldp_types:
          target.patch(update_str)
      elif is_metadata:
          # For a LDP-NR only its metadata can be patched.
          target.patch_metadata(update_str)
      else:
          raise InvalidResourceError(uid)

      return target
  @transaction(True)
  def create_version(uid, ver_uid):
      '''
      Create a new version of a resource.

      @param uid (string) Resource UID.
      @param ver_uid (string) Version UID to be appended to the resource URI.
      NOTE: this is a "slug", i.e. the version URI is not guaranteed to be the
      one indicated.

      @return string Version UID.
      '''
      stored_rsrc = LdpFactory.from_stored(uid)

      return stored_rsrc.create_version(ver_uid)
  @transaction(True)
  def delete(uid, leave_tstone=True, inbound=True):
      '''
      Delete a resource and all of its descendants.

      @param uid (string) Resource UID.
      @param leave_tstone (bool) Whether to perform a soft-delete and leave a
      tombstone resource, or wipe any memory of the resource.
      @param inbound (bool) Whether the inbound relationships should be
      deleted as well. If referential integrity is enforced system-wide this
      is forced to True and the option has no effect. Default: True.

      @return The value returned by the resource's `bury_rsrc` method for a
      soft-delete, or `RES_DELETED` for a hard delete.
      '''
      # These two names are not among the module-level imports, so bring
      # them into scope here; otherwise evaluating the `except` clause
      # below would itself fail with a NameError.
      from lakesuperior.exceptions import (
          ResourceNotExistsError, TombstoneError)

      # If referential integrity is enforced, grab all inbound relationships
      # to break them.
      refint = app_globals.rdfly.config['referential_integrity']
      if refint:
          inbound = True
      repr_opts = {'incl_inbound' : True} if refint else {}

      children = app_globals.rdfly.get_descendants(uid)

      if leave_tstone:
          rsrc = LdpFactory.from_stored(uid, repr_opts)
          ret = rsrc.bury_rsrc(inbound)

          for child_uri in children:
              try:
                  child_rsrc = LdpFactory.from_stored(
                      app_globals.rdfly.uri_to_uid(child_uri),
                      repr_opts={'incl_children' : False})
              except (TombstoneError, ResourceNotExistsError):
                  # Child is already buried or gone: nothing to do.
                  continue
              child_rsrc.bury_rsrc(inbound, tstone_pointer=rsrc.uri)
      else:
          # Talk to the store layer directly instead of calling the public
          # `forget` function: that function opens its own transaction, and
          # nesting one inside this one makes the inner wrapper discard the
          # transaction timestamps that the outer one still expects.
          app_globals.rdfly.forget_rsrc(uid, inbound)
          ret = RES_DELETED

          for child_uri in children:
              app_globals.rdfly.forget_rsrc(
                  app_globals.rdfly.uri_to_uid(child_uri), inbound)

      return ret
  @transaction(True)
  def resurrect(uid):
      '''
      Bring back a buried (soft-deleted) resource.

      @param uid (string) Resource UID.

      @return The value returned by the resource's `resurrect_rsrc` method.
      '''
      buried_rsrc = LdpFactory.from_stored(uid)

      return buried_rsrc.resurrect_rsrc()
  @transaction(True)
  def forget(uid, inbound=True):
      '''
      Remove a resource completely, leaving no trace of it.

      @param uid (string) Resource UID.
      @param inbound (bool) Whether the inbound relationships should be
      deleted as well. If referential integrity is checked system-wide inbound
      references are always deleted and this option has no effect.

      @return `RES_DELETED`.
      '''
      enforce_refint = app_globals.rdfly.config['referential_integrity']
      if enforce_refint:
          # Referential integrity overrides the caller's choice.
          inbound = True

      app_globals.rdfly.forget_rsrc(uid, inbound)

      return RES_DELETED