ldp.py 10 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350
  1. import logging
  2. from collections import defaultdict
  3. from uuid import uuid4
  4. from flask import Blueprint, current_app, g, request, send_file, url_for
  5. from rdflib import Graph
  6. from werkzeug.datastructures import FileStorage
  7. from lakesuperior.exceptions import (
  8. InvalidResourceError, ResourceExistsError, ResourceNotExistsError,
  9. ServerManagedTermError, TombstoneError
  10. )
  11. from lakesuperior.model.ldpr import Ldpr
  12. from lakesuperior.model.ldp_nr import LdpNr
  13. from lakesuperior.model.ldp_rs import Ldpc, LdpDc, LdpIc, LdpRs
  14. from lakesuperior.toolbox import Toolbox
  15. logger = logging.getLogger(__name__)
  16. # Blueprint for LDP REST API. This is what is usually found under `/rest/` in
  17. # standard fcrepo4. Here, it is under `/ldp` but initially `/rest` can be kept
  18. # for backward compatibility.
  19. ldp = Blueprint('ldp', __name__)
  20. accept_patch = (
  21. 'application/sparql-update',
  22. )
  23. accept_rdf = (
  24. 'application/ld+json',
  25. 'application/n-triples',
  26. 'application/rdf+xml',
  27. #'application/x-turtle',
  28. #'application/xhtml+xml',
  29. #'application/xml',
  30. #'text/html',
  31. 'text/n3',
  32. #'text/plain',
  33. 'text/rdf+n3',
  34. 'text/turtle',
  35. )
  36. #allow = (
  37. # 'COPY',
  38. # 'DELETE',
  39. # 'GET',
  40. # 'HEAD',
  41. # 'MOVE',
  42. # 'OPTIONS',
  43. # 'PATCH',
  44. # 'POST',
  45. # 'PUT',
  46. #)
  47. std_headers = {
  48. 'Accept-Patch' : ','.join(accept_patch),
  49. 'Accept-Post' : ','.join(accept_rdf),
  50. #'Allow' : ','.join(allow),
  51. }
  52. @ldp.url_defaults
  53. def bp_url_defaults(endpoint, values):
  54. url_prefix = getattr(g, 'url_prefix', None)
  55. if url_prefix is not None:
  56. values.setdefault('url_prefix', url_prefix)
  57. @ldp.url_value_preprocessor
  58. def bp_url_value_preprocessor(endpoint, values):
  59. g.url_prefix = values.pop('url_prefix')
  60. ## REST SERVICES ##
  61. @ldp.route('/<path:uuid>', methods=['GET'])
  62. @ldp.route('/', defaults={'uuid': None}, methods=['GET'], strict_slashes=False)
  63. def get_resource(uuid, force_rdf=False):
  64. '''
  65. Retrieve RDF or binary content.
  66. @param uuid (string) UUID of resource to retrieve.
  67. @param force_rdf (boolean) Whether to retrieve RDF even if the resource is
  68. a LDP-NR. This is not available in the API but is used e.g. by the
  69. `*/fcr:metadata` endpoint. The default is False.
  70. '''
  71. out_headers = std_headers
  72. repr_options = defaultdict(dict)
  73. if 'prefer' in request.headers:
  74. prefer = Toolbox().parse_rfc7240(request.headers['prefer'])
  75. logger.debug('Parsed Prefer header: {}'.format(prefer))
  76. if 'return' in prefer:
  77. repr_options = prefer['return']
  78. try:
  79. rsrc = Ldpr.inst(uuid, repr_options)
  80. except ResourceNotExistsError as e:
  81. return str(e), 404
  82. except TombstoneError as e:
  83. return _tombstone_response(e, uuid)
  84. else:
  85. out_headers.update(rsrc.head())
  86. if isinstance(rsrc, LdpRs) \
  87. or request.headers['accept'] in accept_rdf \
  88. or force_rdf:
  89. return (rsrc.out_graph.serialize(format='turtle'), out_headers)
  90. else:
  91. return send_file(rsrc.local_path, as_attachment=True,
  92. attachment_filename=rsrc.filename)
  93. @ldp.route('/<path:uuid>/fcr:metadata', methods=['GET'])
  94. def get_metadata(uuid):
  95. '''
  96. Retrieve RDF metadata of a LDP-NR.
  97. '''
  98. return get_resource(uuid, force_rdf=True)
  99. @ldp.route('/<path:parent>', methods=['POST'])
  100. @ldp.route('/', defaults={'parent': None}, methods=['POST'],
  101. strict_slashes=False)
  102. def post_resource(parent):
  103. '''
  104. Add a new resource in a new URI.
  105. '''
  106. out_headers = std_headers
  107. try:
  108. slug = request.headers['Slug']
  109. except KeyError:
  110. slug = None
  111. cls, data = class_from_req_body()
  112. try:
  113. rsrc = cls.inst_for_post(parent, slug)
  114. except ResourceNotExistsError as e:
  115. return str(e), 404
  116. except InvalidResourceError as e:
  117. return str(e), 409
  118. except TombstoneError as e:
  119. return _tombstone_response(e, uuid)
  120. if cls == LdpNr:
  121. try:
  122. cont_disp = Toolbox().parse_rfc7240(
  123. request.headers['content-disposition'])
  124. except KeyError:
  125. cont_disp = None
  126. rsrc.post(data, mimetype=request.content_type, disposition=cont_disp)
  127. else:
  128. try:
  129. rsrc.post(data)
  130. except ServerManagedTermError as e:
  131. return str(e), 412
  132. out_headers.update({
  133. 'Location' : rsrc.uri,
  134. })
  135. return rsrc.uri, 201, out_headers
  136. @ldp.route('/<path:uuid>', methods=['PUT'])
  137. def put_resource(uuid):
  138. '''
  139. Add a new resource at a specified URI.
  140. '''
  141. logger.info('Request headers: {}'.format(request.headers))
  142. rsp_headers = std_headers
  143. cls, data = class_from_req_body()
  144. rsrc = cls(uuid)
  145. # Parse headers.
  146. pref_handling = None
  147. if cls == LdpNr:
  148. try:
  149. logger.debug('Headers: {}'.format(request.headers))
  150. cont_disp = Toolbox().parse_rfc7240(
  151. request.headers['content-disposition'])
  152. except KeyError:
  153. cont_disp = None
  154. try:
  155. ret = rsrc.put(data, disposition=cont_disp,
  156. mimetype=request.content_type)
  157. except InvalidResourceError as e:
  158. return str(e), 409
  159. except ResourceExistsError as e:
  160. return str(e), 409
  161. except TombstoneError as e:
  162. return _tombstone_response(e, uuid)
  163. else:
  164. if 'prefer' in request.headers:
  165. prefer = Toolbox().parse_rfc7240(request.headers['prefer'])
  166. logger.debug('Parsed Prefer header: {}'.format(prefer))
  167. if 'handling' in prefer:
  168. pref_handling = prefer['handling']['value']
  169. try:
  170. ret = rsrc.put(data, handling=pref_handling)
  171. except InvalidResourceError as e:
  172. return str(e), 409
  173. except ResourceExistsError as e:
  174. return str(e), 409
  175. except TombstoneError as e:
  176. return _tombstone_response(e, uuid)
  177. except ServerManagedTermError as e:
  178. return str(e), 412
  179. res_code = 201 if ret == Ldpr.RES_CREATED else 204
  180. return '', res_code, rsp_headers
  181. @ldp.route('/<path:uuid>', methods=['PATCH'])
  182. def patch_resource(uuid):
  183. '''
  184. Update an existing resource with a SPARQL-UPDATE payload.
  185. '''
  186. headers = std_headers
  187. rsrc = Ldpc(uuid)
  188. try:
  189. rsrc.patch(request.get_data().decode('utf-8'))
  190. except ResourceNotExistsError as e:
  191. return str(e), 404
  192. except TombstoneError as e:
  193. return _tombstone_response(e, uuid)
  194. except ServerManagedTermError as e:
  195. return str(e), 412
  196. return '', 204, headers
  197. @ldp.route('/<path:uuid>', methods=['DELETE'])
  198. def delete_resource(uuid):
  199. '''
  200. Delete a resource.
  201. '''
  202. headers = std_headers
  203. # If referential integrity is enforced, grab all inbound relationships
  204. # to break them.
  205. repr_opts = {'parameters' : {'include' : Ldpr.RETURN_INBOUND_REF_URI}} \
  206. if current_app.config['store']['ldp_rs']['referential_integrity'] \
  207. else None
  208. if 'prefer' in request.headers:
  209. prefer = Toolbox().parse_rfc7240(request.headers['prefer'])
  210. leave_tstone = 'no-tombstone' not in prefer
  211. else:
  212. leave_tstone = True
  213. try:
  214. Ldpr.inst(uuid, repr_opts).delete(leave_tstone=leave_tstone)
  215. except ResourceNotExistsError as e:
  216. return str(e), 404
  217. except TombstoneError as e:
  218. return _tombstone_response(e, uuid)
  219. return '', 204, headers
  220. @ldp.route('/<path:uuid>/fcr:tombstone', methods=['GET', 'POST', 'PUT',
  221. 'PATCH', 'DELETE'])
  222. def tombstone(uuid):
  223. '''
  224. Handle all tombstone operations.
  225. The only allowed method is DELETE; any other verb will return a 405.
  226. '''
  227. logger.debug('Deleting tombstone for {}.'.format(uuid))
  228. rsrc = Ldpr(uuid, repr_opts={'value' : 'minimal'})
  229. try:
  230. imr = rsrc.imr
  231. except TombstoneError as e:
  232. if request.method == 'DELETE':
  233. if e.uuid == uuid:
  234. rsrc.delete_tombstone()
  235. return '', 204
  236. else:
  237. return _tombstone_response(e, uuid)
  238. else:
  239. return 'Method Not Allowed.', 405
  240. except ResourceNotExistsError as e:
  241. return str(e), 404
  242. else:
  243. return '', 404
  244. def class_from_req_body():
  245. '''
  246. Determine LDP type (and instance class) from the provided RDF body.
  247. '''
  248. logger.debug('Content type: {}'.format(request.mimetype))
  249. logger.debug('files: {}'.format(request.files))
  250. logger.debug('stream: {}'.format(request.stream))
  251. # LDP-NR types
  252. if not request.content_length:
  253. logger.debug('No data received in body.')
  254. cls = Ldpc
  255. data = None
  256. elif request.mimetype in accept_rdf:
  257. # Parse out the RDF string.
  258. data = request.data.decode('utf-8')
  259. g = Graph().parse(data=data, format=request.mimetype)
  260. if Ldpr.MBR_RSRC_URI in g.predicates() and \
  261. Ldpr.MBR_REL_URI in g.predicates():
  262. if Ldpr.INS_CNT_REL_URI in g.predicates():
  263. cls = LdpIc
  264. else:
  265. cls = LdpDc
  266. else:
  267. cls = Ldpc
  268. else:
  269. cls = LdpNr
  270. if request.mimetype == 'multipart/form-data':
  271. # This seems the "right" way to upload a binary file, with a
  272. # multipart/form-data MIME type and the file in the `file`
  273. # field. This however is not supported by FCREPO4.
  274. data = request.files.get('file').stream
  275. else:
  276. # This is a less clean way, with the file in the form body and
  277. # the request as application/x-www-form-urlencoded.
  278. # This is how FCREPO4 accepts binary uploads.
  279. data = request.stream
  280. logger.info('Creating resource of type: {}'.format(cls.__name__))
  281. return cls, data
  282. def _get_bitstream(rsrc):
  283. out_headers = std_headers
  284. # @TODO This may change in favor of more low-level handling if the file
  285. # system is not local.
  286. return send_file(rsrc.local_path, as_attachment=True,
  287. attachment_filename=rsrc.filename)
  288. def _tombstone_response(e, uuid):
  289. headers = {
  290. 'Link' : '<{}/fcr:tombstone>; rel="hasTombstone"'.format(request.url),
  291. } if e.uuid == uuid else {}
  292. return str(e), 410, headers