test_ldp.py 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347
  1. import pytest
  2. import uuid
  3. from hashlib import sha1
  4. from flask import url_for
  5. from rdflib import Graph
  6. from rdflib.namespace import RDF
  7. from rdflib.term import Literal, URIRef
  8. from lakesuperior.dictionaries.namespaces import ns_collection as nsc
  9. from lakesuperior.model.ldpr import Ldpr
  10. from lakesuperior.toolbox import Toolbox
  11. @pytest.fixture(scope='module')
  12. def random_uuid():
  13. return str(uuid.uuid4())
  14. @pytest.mark.usefixtures('client_class')
  15. @pytest.mark.usefixtures('db')
  16. class TestLdp:
  17. '''
  18. Test HTTP interaction with LDP endpoint.
  19. '''
  20. def test_get_root_node(self):
  21. '''
  22. Get the root node from two different endpoints.
  23. The test triplestore must be initialized, hence the `db` fixture.
  24. '''
  25. ldp_resp = self.client.get('/ldp')
  26. rest_resp = self.client.get('/rest')
  27. assert ldp_resp.status_code == 200
  28. assert rest_resp.status_code == 200
  29. #assert ldp_resp.data == rest_resp.data
  30. def test_post_resource(self, client):
  31. '''
  32. Check response headers for a POST operation with empty payload.
  33. '''
  34. res = self.client.post('/ldp/')
  35. assert res.status_code == 201
  36. assert 'Location' in res.headers
  37. def test_put_empty_resource(self, random_uuid):
  38. '''
  39. Check response headers for a PUT operation with empty payload.
  40. '''
  41. res = self.client.put('/ldp/{}'.format(random_uuid))
  42. assert res.status_code == 201
  43. def test_put_existing_resource(self, random_uuid):
  44. '''
  45. Trying to PUT an existing resource should return a 204 if the payload
  46. is empty.
  47. '''
  48. path = '/ldp/nonidempotent01'
  49. assert self.client.put(path).status_code == 201
  50. assert self.client.get(path).status_code == 200
  51. assert self.client.put(path).status_code == 204
  52. def test_put_ldp_rs(self, client):
  53. '''
  54. PUT a resource with RDF payload and verify.
  55. '''
  56. with open('tests/data/marcel_duchamp_single_subject.ttl', 'rb') as f:
  57. self.client.put('/ldp/ldprs01', data=f, content_type='text/turtle')
  58. resp = self.client.get('/ldp/ldprs01', headers={'accept' : 'text/turtle'})
  59. assert resp.status_code == 200
  60. g = Graph().parse(data=resp.data, format='text/turtle')
  61. assert URIRef('http://vocab.getty.edu/ontology#Subject') in \
  62. g.objects(None, RDF.type)
  63. def test_put_ldp_nr(self, rnd_img):
  64. '''
  65. PUT a resource with binary payload and verify checksums.
  66. '''
  67. rnd_img['content'].seek(0)
  68. self.client.put('/ldp/ldpnr01', data=rnd_img['content'], headers={
  69. 'Content-Disposition' : 'attachment; filename={}'.format(
  70. rnd_img['filename'])})
  71. resp = self.client.get('/ldp/ldpnr01', headers={'accept' : 'image/png'})
  72. assert resp.status_code == 200
  73. assert sha1(resp.data).hexdigest() == rnd_img['hash']
  74. def test_post_slug(self):
  75. '''
  76. Verify that a POST with slug results in the expected URI only if the
  77. resource does not exist already.
  78. '''
  79. slug01_resp = self.client.post('/ldp', headers={'slug' : 'slug01'})
  80. assert slug01_resp.status_code == 201
  81. assert slug01_resp.headers['location'] == \
  82. Toolbox().base_url + '/slug01'
  83. slug02_resp = self.client.post('/ldp', headers={'slug' : 'slug01'})
  84. assert slug02_resp.status_code == 201
  85. assert slug02_resp.headers['location'] != \
  86. Toolbox().base_url + '/slug01'
  87. def test_post_404(self):
  88. '''
  89. Verify that a POST to a non-existing parent results in a 404.
  90. '''
  91. assert self.client.post('/ldp/{}'.format(uuid.uuid4()))\
  92. .status_code == 404
  93. def test_post_409(self, rnd_img):
  94. '''
  95. Verify that you cannot POST to a binary resource.
  96. '''
  97. rnd_img['content'].seek(0)
  98. self.client.put('/ldp/post_409', data=rnd_img['content'], headers={
  99. 'Content-Disposition' : 'attachment; filename={}'.format(
  100. rnd_img['filename'])})
  101. assert self.client.post('/ldp/post_409').status_code == 409
  102. def test_delete(self):
  103. create_resp = self.client.put('/ldp/test_delete01')
  104. delete_resp = self.client.delete('/ldp/test_delete01')
  105. assert delete_resp.status_code == 204
  106. def test_tombstone(self):
  107. tstone_resp = self.client.get('/ldp/test_delete01')
  108. assert tstone_resp.status_code == 410
  109. assert tstone_resp.headers['Link'] == \
  110. '<{}/test_delete01/fcr:tombstone>; rel="hasTombstone"'\
  111. .format(Toolbox().base_url)
  112. tstone_path = '/ldp/test_delete01/fcr:tombstone'
  113. assert self.client.get(tstone_path).status_code == 405
  114. assert self.client.put(tstone_path).status_code == 405
  115. assert self.client.post(tstone_path).status_code == 405
  116. assert self.client.delete(tstone_path).status_code == 204
  117. assert self.client.get('/ldp/test_delete01').status_code == 404
  118. @pytest.mark.usefixtures('client_class')
  119. @pytest.mark.usefixtures('db')
  120. class TestPrefHeader:
  121. '''
  122. Test various combinations of `Prefer` header.
  123. '''
  124. @pytest.fixture(scope='class')
  125. def cont_structure(self):
  126. '''
  127. Create a container structure to be used for subsequent requests.
  128. '''
  129. parent_path = '/ldp/test_parent'
  130. self.client.put(parent_path)
  131. self.client.put(parent_path + '/child1')
  132. self.client.put(parent_path + '/child2')
  133. self.client.put(parent_path + '/child3')
  134. return {
  135. 'path' : parent_path,
  136. 'response' : self.client.get(parent_path),
  137. 'subject' : URIRef(Toolbox().base_url + '/test_parent')
  138. }
  139. def test_put_prefer_handling(self, random_uuid):
  140. '''
  141. Trying to PUT an existing resource should:
  142. - Return a 204 if the payload is empty
  143. - Return a 204 if the payload is RDF, server-managed triples are
  144. included and the 'Prefer' header is set to 'handling=lenient'
  145. - Return a 412 (ServerManagedTermError) if the payload is RDF,
  146. server-managed triples are included and handling is set to 'strict'
  147. '''
  148. path = '/ldp/put_pref_header01'
  149. assert self.client.put(path).status_code == 201
  150. assert self.client.get(path).status_code == 200
  151. assert self.client.put(path).status_code == 204
  152. with open('tests/data/rdf_payload_w_srv_mgd_trp.ttl', 'rb') as f:
  153. rsp_len = self.client.put(
  154. '/ldp/{}'.format(random_uuid),
  155. headers={
  156. 'Prefer' : 'handling=lenient',
  157. 'Content-Type' : 'text/turtle',
  158. },
  159. data=f
  160. )
  161. assert rsp_len.status_code == 204
  162. with open('tests/data/rdf_payload_w_srv_mgd_trp.ttl', 'rb') as f:
  163. rsp_strict = self.client.put(
  164. path,
  165. headers={
  166. 'Prefer' : 'handling=strict',
  167. 'Content-Type' : 'text/turtle',
  168. },
  169. data=f
  170. )
  171. assert rsp_strict.status_code == 412
  172. def test_embed_children(self, cont_structure):
  173. '''
  174. verify the "embed children" prefer header.
  175. '''
  176. parent_path = cont_structure['path']
  177. cont_resp = cont_structure['response']
  178. cont_subject = cont_structure['subject']
  179. minimal_resp = self.client.get(parent_path, headers={
  180. 'Prefer' : 'return=minimal',
  181. })
  182. incl_embed_children_resp = self.client.get(parent_path, headers={
  183. 'Prefer' : 'return=representation; include={}'\
  184. .format(Ldpr.EMBED_CHILD_RES_URI),
  185. })
  186. omit_embed_children_resp = self.client.get(parent_path, headers={
  187. 'Prefer' : 'return=representation; omit={}'\
  188. .format(Ldpr.EMBED_CHILD_RES_URI),
  189. })
  190. assert omit_embed_children_resp.data == cont_resp.data
  191. incl_g = Graph().parse(
  192. data=incl_embed_children_resp.data, format='turtle')
  193. omit_g = Graph().parse(
  194. data=omit_embed_children_resp.data, format='turtle')
  195. children = set(incl_g[cont_subject : nsc['ldp'].contains])
  196. assert len(children) == 3
  197. children = set(incl_g[cont_subject : nsc['ldp'].contains])
  198. for child_uri in children:
  199. assert set(incl_g[ child_uri : : ])
  200. assert not set(omit_g[ child_uri : : ])
  201. def test_return_children(self, cont_structure):
  202. '''
  203. verify the "return children" prefer header.
  204. '''
  205. parent_path = cont_structure['path']
  206. cont_resp = cont_structure['response']
  207. cont_subject = cont_structure['subject']
  208. incl_children_resp = self.client.get(parent_path, headers={
  209. 'Prefer' : 'return=representation; include={}'\
  210. .format(Ldpr.RETURN_CHILD_RES_URI),
  211. })
  212. omit_children_resp = self.client.get(parent_path, headers={
  213. 'Prefer' : 'return=representation; omit={}'\
  214. .format(Ldpr.RETURN_CHILD_RES_URI),
  215. })
  216. assert incl_children_resp.data == cont_resp.data
  217. incl_g = Graph().parse(data=incl_children_resp.data, format='turtle')
  218. omit_g = Graph().parse(data=omit_children_resp.data, format='turtle')
  219. children = incl_g[cont_subject : nsc['ldp'].contains]
  220. for child_uri in children:
  221. assert not omit_g[ cont_subject : nsc['ldp'].contains : child_uri ]
  222. def test_inbound_rel(self, cont_structure):
  223. '''
  224. verify the "inboud relationships" prefer header.
  225. '''
  226. parent_path = cont_structure['path']
  227. cont_resp = cont_structure['response']
  228. cont_subject = cont_structure['subject']
  229. incl_inbound_resp = self.client.get(parent_path, headers={
  230. 'Prefer' : 'return=representation; include={}'\
  231. .format(Ldpr.RETURN_INBOUND_REF_URI),
  232. })
  233. omit_inbound_resp = self.client.get(parent_path, headers={
  234. 'Prefer' : 'return=representation; omit={}'\
  235. .format(Ldpr.RETURN_INBOUND_REF_URI),
  236. })
  237. assert omit_inbound_resp.data == cont_resp.data
  238. incl_g = Graph().parse(data=incl_inbound_resp.data, format='turtle')
  239. omit_g = Graph().parse(data=omit_inbound_resp.data, format='turtle')
  240. assert set(incl_g[ : : cont_subject ])
  241. assert not set(omit_g[ : : cont_subject ])
  242. def test_srv_mgd_triples(self, cont_structure):
  243. '''
  244. verify the "server managed triples" prefer header.
  245. '''
  246. parent_path = cont_structure['path']
  247. cont_resp = cont_structure['response']
  248. cont_subject = cont_structure['subject']
  249. incl_srv_mgd_resp = self.client.get(parent_path, headers={
  250. 'Prefer' : 'return=representation; include={}'\
  251. .format(Ldpr.RETURN_SRV_MGD_RES_URI),
  252. })
  253. omit_srv_mgd_resp = self.client.get(parent_path, headers={
  254. 'Prefer' : 'return=representation; omit={}'\
  255. .format(Ldpr.RETURN_SRV_MGD_RES_URI),
  256. })
  257. assert incl_srv_mgd_resp.data == cont_resp.data
  258. incl_g = Graph().parse(data=incl_srv_mgd_resp.data, format='turtle')
  259. omit_g = Graph().parse(data=omit_srv_mgd_resp.data, format='turtle')
  260. for pred in {
  261. nsc['fcrepo'].created,
  262. nsc['fcrepo'].createdBy,
  263. nsc['fcrepo'].lastModified,
  264. nsc['fcrepo'].lastModifiedBy,
  265. nsc['ldp'].contains,
  266. }:
  267. assert set(incl_g[ cont_subject : pred : ])
  268. assert not set(omit_g[ cont_subject : pred : ])
  269. for type in {
  270. nsc['fcrepo'].Resource,
  271. nsc['ldp'].Container,
  272. nsc['ldp'].Resource,
  273. }:
  274. assert incl_g[ cont_subject : RDF.type : type ]
  275. assert not omit_g[ cont_subject : RDF.type : type ]