ldp.py 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394
  1. import logging
  2. from collections import defaultdict
  3. from uuid import uuid4
  4. from flask import Blueprint, current_app, g, request, send_file, url_for
  5. from rdflib import Graph
  6. from rdflib.namespace import RDF, XSD
  7. from werkzeug.datastructures import FileStorage
  8. from lakesuperior.dictionaries.namespaces import ns_collection as nsc
  9. from lakesuperior.exceptions import (
  10. InvalidResourceError, ResourceExistsError, ResourceNotExistsError,
  11. ServerManagedTermError, TombstoneError
  12. )
  13. from lakesuperior.model.ldpr import Ldpr
  14. from lakesuperior.model.ldp_nr import LdpNr
  15. from lakesuperior.model.ldp_rs import Ldpc, LdpDc, LdpIc, LdpRs
  16. from lakesuperior.toolbox import Toolbox
  17. logger = logging.getLogger(__name__)
  18. # Blueprint for LDP REST API. This is what is usually found under `/rest/` in
  19. # standard fcrepo4. Here, it is under `/ldp` but initially `/rest` can be kept
  20. # for backward compatibility.
  21. ldp = Blueprint('ldp', __name__)
  22. accept_patch = (
  23. 'application/sparql-update',
  24. )
  25. accept_rdf = (
  26. 'application/ld+json',
  27. 'application/n-triples',
  28. 'application/rdf+xml',
  29. #'application/x-turtle',
  30. #'application/xhtml+xml',
  31. #'application/xml',
  32. #'text/html',
  33. 'text/n3',
  34. #'text/plain',
  35. 'text/rdf+n3',
  36. 'text/turtle',
  37. )
  38. #allow = (
  39. # 'COPY',
  40. # 'DELETE',
  41. # 'GET',
  42. # 'HEAD',
  43. # 'MOVE',
  44. # 'OPTIONS',
  45. # 'PATCH',
  46. # 'POST',
  47. # 'PUT',
  48. #)
  49. std_headers = {
  50. 'Accept-Patch' : ','.join(accept_patch),
  51. 'Accept-Post' : ','.join(accept_rdf),
  52. #'Allow' : ','.join(allow),
  53. }
  54. @ldp.url_defaults
  55. def bp_url_defaults(endpoint, values):
  56. url_prefix = getattr(g, 'url_prefix', None)
  57. if url_prefix is not None:
  58. values.setdefault('url_prefix', url_prefix)
  59. @ldp.url_value_preprocessor
  60. def bp_url_value_preprocessor(endpoint, values):
  61. g.url_prefix = values.pop('url_prefix')
  62. ## REST SERVICES ##
  63. @ldp.route('/<path:uuid>', methods=['GET'])
  64. @ldp.route('/', defaults={'uuid': None}, methods=['GET'], strict_slashes=False)
  65. def get_resource(uuid, force_rdf=False):
  66. '''
  67. Retrieve RDF or binary content.
  68. @param uuid (string) UUID of resource to retrieve.
  69. @param force_rdf (boolean) Whether to retrieve RDF even if the resource is
  70. a LDP-NR. This is not available in the API but is used e.g. by the
  71. `*/fcr:metadata` endpoint. The default is False.
  72. '''
  73. out_headers = std_headers
  74. repr_options = defaultdict(dict)
  75. if 'prefer' in request.headers:
  76. prefer = Toolbox().parse_rfc7240(request.headers['prefer'])
  77. logger.debug('Parsed Prefer header: {}'.format(prefer))
  78. if 'return' in prefer:
  79. repr_options = parse_repr_options(prefer['return'])
  80. try:
  81. rsrc = Ldpr.inst(uuid, repr_options)
  82. except ResourceNotExistsError as e:
  83. return str(e), 404
  84. except TombstoneError as e:
  85. return _tombstone_response(e, uuid)
  86. else:
  87. out_headers.update(rsrc.head())
  88. if isinstance(rsrc, LdpRs) \
  89. or request.headers['accept'] in accept_rdf \
  90. or force_rdf:
  91. return (rsrc.get(), out_headers)
  92. else:
  93. return send_file(rsrc.local_path, as_attachment=True,
  94. attachment_filename=rsrc.filename)
  95. @ldp.route('/<path:uuid>/fcr:metadata', methods=['GET'])
  96. def get_metadata(uuid):
  97. '''
  98. Retrieve RDF metadata of a LDP-NR.
  99. '''
  100. return get_resource(uuid, force_rdf=True)
  101. @ldp.route('/<path:parent>', methods=['POST'])
  102. @ldp.route('/', defaults={'parent': None}, methods=['POST'],
  103. strict_slashes=False)
  104. def post_resource(parent):
  105. '''
  106. Add a new resource in a new URI.
  107. '''
  108. out_headers = std_headers
  109. try:
  110. slug = request.headers['Slug']
  111. except KeyError:
  112. slug = None
  113. handling, disposition = set_post_put_params()
  114. try:
  115. uuid = uuid_for_post(parent, slug)
  116. rsrc = Ldpr.inst_from_client_input(uuid, handling=handling,
  117. disposition=disposition)
  118. except ResourceNotExistsError as e:
  119. return str(e), 404
  120. except InvalidResourceError as e:
  121. return str(e), 409
  122. except TombstoneError as e:
  123. return _tombstone_response(e, uuid)
  124. try:
  125. rsrc.post()
  126. except ServerManagedTermError as e:
  127. return str(e), 412
  128. out_headers.update({
  129. 'Location' : rsrc.uri,
  130. })
  131. return rsrc.uri, 201, out_headers
  132. @ldp.route('/<path:uuid>', methods=['PUT'])
  133. def put_resource(uuid):
  134. '''
  135. Add a new resource at a specified URI.
  136. '''
  137. # Parse headers.
  138. logger.info('Request headers: {}'.format(request.headers))
  139. rsp_headers = std_headers
  140. handling, disposition = set_post_put_params()
  141. try:
  142. rsrc = Ldpr.inst_from_client_input(uuid, handling=handling,
  143. disposition=disposition)
  144. except ServerManagedTermError as e:
  145. return str(e), 412
  146. try:
  147. ret = rsrc.put()
  148. except InvalidResourceError as e:
  149. return str(e), 409
  150. except ResourceExistsError as e:
  151. return str(e), 409
  152. except TombstoneError as e:
  153. return _tombstone_response(e, uuid)
  154. res_code = 201 if ret == Ldpr.RES_CREATED else 204
  155. return '', res_code, rsp_headers
  156. @ldp.route('/<path:uuid>', methods=['PATCH'])
  157. def patch_resource(uuid):
  158. '''
  159. Update an existing resource with a SPARQL-UPDATE payload.
  160. '''
  161. headers = std_headers
  162. rsrc = Ldpc(uuid)
  163. try:
  164. rsrc.patch(request.get_data().decode('utf-8'))
  165. except ResourceNotExistsError as e:
  166. return str(e), 404
  167. except TombstoneError as e:
  168. return _tombstone_response(e, uuid)
  169. except ServerManagedTermError as e:
  170. return str(e), 412
  171. return '', 204, headers
  172. @ldp.route('/<path:uuid>', methods=['DELETE'])
  173. def delete_resource(uuid):
  174. '''
  175. Delete a resource.
  176. '''
  177. headers = std_headers
  178. # If referential integrity is enforced, grab all inbound relationships
  179. # to break them.
  180. repr_opts = {'incl_inbound' : True} \
  181. if current_app.config['store']['ldp_rs']['referential_integrity'] \
  182. else {}
  183. if 'prefer' in request.headers:
  184. prefer = Toolbox().parse_rfc7240(request.headers['prefer'])
  185. leave_tstone = 'no-tombstone' not in prefer
  186. else:
  187. leave_tstone = True
  188. try:
  189. Ldpr.inst(uuid, repr_opts).delete(leave_tstone=leave_tstone)
  190. except ResourceNotExistsError as e:
  191. return str(e), 404
  192. except TombstoneError as e:
  193. return _tombstone_response(e, uuid)
  194. return '', 204, headers
  195. @ldp.route('/<path:uuid>/fcr:tombstone', methods=['GET', 'POST', 'PUT',
  196. 'PATCH', 'DELETE'])
  197. def tombstone(uuid):
  198. '''
  199. Handle all tombstone operations.
  200. The only allowed method is DELETE; any other verb will return a 405.
  201. '''
  202. logger.debug('Deleting tombstone for {}.'.format(uuid))
  203. rsrc = Ldpr(uuid)
  204. try:
  205. imr = rsrc.imr
  206. except TombstoneError as e:
  207. if request.method == 'DELETE':
  208. if e.uuid == uuid:
  209. rsrc.delete_tombstone()
  210. return '', 204
  211. else:
  212. return _tombstone_response(e, uuid)
  213. else:
  214. return 'Method Not Allowed.', 405
  215. except ResourceNotExistsError as e:
  216. return str(e), 404
  217. else:
  218. return '', 404
  219. def uuid_for_post(parent_uuid=None, slug=None):
  220. '''
  221. Validate conditions to perform a POST and return an LDP resource
  222. UUID for using with the `post` method.
  223. This may raise an exception resulting in a 404 if the parent is not
  224. found or a 409 if the parent is not a valid container.
  225. '''
  226. # Shortcut!
  227. if not slug and not parent_uuid:
  228. return str(uuid4())
  229. parent = Ldpr.inst(parent_uuid, repr_opts={'incl_children' : False})
  230. # Set prefix.
  231. if parent_uuid:
  232. parent_types = { t.identifier for t in \
  233. parent.imr.objects(RDF.type) }
  234. logger.debug('Parent types: {}'.format(
  235. parent_types))
  236. if nsc['ldp'].Container not in parent_types:
  237. raise InvalidResourceError('Parent {} is not a container.'
  238. .format(parent_uuid))
  239. pfx = parent_uuid + '/'
  240. else:
  241. pfx = ''
  242. # Create candidate UUID and validate.
  243. if slug:
  244. cnd_uuid = pfx + slug
  245. if current_app.rdfly.ask_rsrc_exists(nsc['fcres'][cnd_uuid]):
  246. uuid = pfx + str(uuid4())
  247. else:
  248. uuid = cnd_uuid
  249. else:
  250. uuid = pfx + str(uuid4())
  251. return uuid
  252. def _get_bitstream(rsrc):
  253. out_headers = std_headers
  254. # @TODO This may change in favor of more low-level handling if the file
  255. # system is not local.
  256. return send_file(rsrc.local_path, as_attachment=True,
  257. attachment_filename=rsrc.filename)
  258. def _tombstone_response(e, uuid):
  259. headers = {
  260. 'Link' : '<{}/fcr:tombstone>; rel="hasTombstone"'.format(request.url),
  261. } if e.uuid == uuid else {}
  262. return str(e), 410, headers
  263. def set_post_put_params():
  264. '''
  265. Sets handling and content disposition for POST and PUT by parsing headers.
  266. '''
  267. handling = None
  268. if 'prefer' in request.headers:
  269. prefer = Toolbox().parse_rfc7240(request.headers['prefer'])
  270. logger.debug('Parsed Prefer header: {}'.format(prefer))
  271. if 'handling' in prefer:
  272. handling = prefer['handling']['value']
  273. try:
  274. disposition = Toolbox().parse_rfc7240(
  275. request.headers['content-disposition'])
  276. except KeyError:
  277. disposition = None
  278. return handling, disposition
  279. def parse_repr_options(retr_opts):
  280. '''
  281. Set options to retrieve IMR.
  282. Ideally, IMR retrieval is done once per request, so all the options
  283. are set once in the `imr()` property.
  284. @param retr_opts (dict): Options parsed from `Prefer` header.
  285. '''
  286. logger.debug('Parsing retrieval options: {}'.format(retr_opts))
  287. imr_options = {}
  288. if retr_opts.setdefault('value') == 'minimal':
  289. imr_options = {
  290. 'embed_children' : False,
  291. 'incl_children' : False,
  292. 'incl_inbound' : False,
  293. 'incl_srv_mgd' : False,
  294. }
  295. else:
  296. # Default.
  297. imr_options = {
  298. 'embed_children' : False,
  299. 'incl_children' : True,
  300. 'incl_inbound' : False,
  301. 'incl_srv_mgd' : True,
  302. }
  303. # Override defaults.
  304. if 'parameters' in retr_opts:
  305. include = retr_opts['parameters']['include'].split(' ') \
  306. if 'include' in retr_opts['parameters'] else []
  307. omit = retr_opts['parameters']['omit'].split(' ') \
  308. if 'omit' in retr_opts['parameters'] else []
  309. logger.debug('Include: {}'.format(include))
  310. logger.debug('Omit: {}'.format(omit))
  311. if str(Ldpr.EMBED_CHILD_RES_URI) in include:
  312. imr_options['embed_children'] = True
  313. if str(Ldpr.RETURN_CHILD_RES_URI) in omit:
  314. imr_options['incl_children'] = False
  315. if str(Ldpr.RETURN_INBOUND_REF_URI) in include:
  316. imr_options['incl_inbound'] = True
  317. if str(Ldpr.RETURN_SRV_MGD_RES_URI) in omit:
  318. imr_options['incl_srv_mgd'] = False
  319. logger.debug('Retrieval options: {}'.format(imr_options))
  320. return imr_options