test_ldp.py 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467
  1. import pytest
  2. import uuid
  3. from hashlib import sha1
  4. from flask import url_for
  5. from rdflib import Graph
  6. from rdflib.namespace import RDF
  7. from rdflib.term import Literal, URIRef
  8. from lakesuperior.dictionaries.namespaces import ns_collection as nsc
  9. from lakesuperior.model.ldpr import Ldpr
  10. from lakesuperior.toolbox import Toolbox
  11. @pytest.fixture(scope='module')
  12. def random_uuid():
  13. return str(uuid.uuid4())
  14. @pytest.mark.usefixtures('client_class')
  15. @pytest.mark.usefixtures('db')
  16. class TestLdp:
  17. '''
  18. Test HTTP interaction with LDP endpoint.
  19. '''
  20. def test_get_root_node(self):
  21. '''
  22. Get the root node from two different endpoints.
  23. The test triplestore must be initialized, hence the `db` fixture.
  24. '''
  25. ldp_resp = self.client.get('/ldp')
  26. rest_resp = self.client.get('/rest')
  27. assert ldp_resp.status_code == 200
  28. assert rest_resp.status_code == 200
  29. #assert ldp_resp.data == rest_resp.data
  30. def test_put_empty_resource(self, random_uuid):
  31. '''
  32. Check response headers for a PUT operation with empty payload.
  33. '''
  34. res = self.client.put('/ldp/{}'.format(random_uuid))
  35. assert res.status_code == 201
  36. def test_put_existing_resource(self, random_uuid):
  37. '''
  38. Trying to PUT an existing resource should return a 204 if the payload
  39. is empty.
  40. '''
  41. path = '/ldp/nonidempotent01'
  42. assert self.client.put(path).status_code == 201
  43. assert self.client.get(path).status_code == 200
  44. assert self.client.put(path).status_code == 204
  45. def test_put_ldp_rs(self, client):
  46. '''
  47. PUT a resource with RDF payload and verify.
  48. '''
  49. with open('tests/data/marcel_duchamp_single_subject.ttl', 'rb') as f:
  50. self.client.put('/ldp/ldprs01', data=f, content_type='text/turtle')
  51. resp = self.client.get('/ldp/ldprs01',
  52. headers={'accept' : 'text/turtle'})
  53. assert resp.status_code == 200
  54. g = Graph().parse(data=resp.data, format='text/turtle')
  55. assert URIRef('http://vocab.getty.edu/ontology#Subject') in \
  56. g.objects(None, RDF.type)
  57. def test_put_ldp_nr(self, rnd_img):
  58. '''
  59. PUT a resource with binary payload and verify checksums.
  60. '''
  61. rnd_img['content'].seek(0)
  62. resp = self.client.put('/ldp/ldpnr01', data=rnd_img['content'],
  63. headers={
  64. 'Content-Disposition' : 'attachment; filename={}'.format(
  65. rnd_img['filename'])})
  66. assert resp.status_code == 201
  67. resp = self.client.get('/ldp/ldpnr01', headers={'accept' : 'image/png'})
  68. assert resp.status_code == 200
  69. assert sha1(resp.data).hexdigest() == rnd_img['hash']
  70. def test_put_mismatched_ldp_rs(self, rnd_img):
  71. '''
  72. Verify MIME type / LDP mismatch.
  73. PUT a LDP-RS, then PUT a LDP-NR on the same location and verify it
  74. fails.
  75. '''
  76. path = '/ldp/' + str(uuid.uuid4())
  77. rnd_img['content'].seek(0)
  78. ldp_nr_resp = self.client.put(path, data=rnd_img['content'],
  79. headers={
  80. 'Content-Disposition' : 'attachment; filename={}'.format(
  81. rnd_img['filename'])})
  82. assert ldp_nr_resp.status_code == 201
  83. with open('tests/data/marcel_duchamp_single_subject.ttl', 'rb') as f:
  84. ldp_rs_resp = self.client.put(path, data=f,
  85. content_type='text/turtle')
  86. assert ldp_rs_resp.status_code == 415
  87. def test_put_mismatched_ldp_nr(self, rnd_img):
  88. '''
  89. Verify MIME type / LDP mismatch.
  90. PUT a LDP-NR, then PUT a LDP-RS on the same location and verify it
  91. fails.
  92. '''
  93. path = '/ldp/' + str(uuid.uuid4())
  94. with open('tests/data/marcel_duchamp_single_subject.ttl', 'rb') as f:
  95. ldp_rs_resp = self.client.put(path, data=f,
  96. content_type='text/turtle')
  97. assert ldp_rs_resp.status_code == 201
  98. rnd_img['content'].seek(0)
  99. ldp_nr_resp = self.client.put(path, data=rnd_img['content'],
  100. headers={
  101. 'Content-Disposition' : 'attachment; filename={}'.format(
  102. rnd_img['filename'])})
  103. assert ldp_nr_resp.status_code == 415
  104. def test_post_resource(self, client):
  105. '''
  106. Check response headers for a POST operation with empty payload.
  107. '''
  108. res = self.client.post('/ldp/')
  109. assert res.status_code == 201
  110. assert 'Location' in res.headers
  111. def test_post_slug(self):
  112. '''
  113. Verify that a POST with slug results in the expected URI only if the
  114. resource does not exist already.
  115. '''
  116. slug01_resp = self.client.post('/ldp', headers={'slug' : 'slug01'})
  117. assert slug01_resp.status_code == 201
  118. assert slug01_resp.headers['location'] == \
  119. Toolbox().base_url + '/slug01'
  120. slug02_resp = self.client.post('/ldp', headers={'slug' : 'slug01'})
  121. assert slug02_resp.status_code == 201
  122. assert slug02_resp.headers['location'] != \
  123. Toolbox().base_url + '/slug01'
  124. def test_post_404(self):
  125. '''
  126. Verify that a POST to a non-existing parent results in a 404.
  127. '''
  128. assert self.client.post('/ldp/{}'.format(uuid.uuid4()))\
  129. .status_code == 404
  130. def test_post_409(self, rnd_img):
  131. '''
  132. Verify that you cannot POST to a binary resource.
  133. '''
  134. rnd_img['content'].seek(0)
  135. self.client.put('/ldp/post_409', data=rnd_img['content'], headers={
  136. 'Content-Disposition' : 'attachment; filename={}'.format(
  137. rnd_img['filename'])})
  138. assert self.client.post('/ldp/post_409').status_code == 409
  139. def test_patch(self):
  140. '''
  141. Test patching a resource.
  142. '''
  143. path = '/ldp/test_patch01'
  144. self.client.put(path)
  145. uri = Toolbox().base_url + '/test_patch01'
  146. self.client.patch(path,
  147. data=open('tests/data/sparql_update/simple_insert.sparql'),
  148. headers={'content-type' : 'application/sparql-update'})
  149. resp = self.client.get(path)
  150. g = Graph().parse(data=resp.data, format='text/turtle')
  151. print('Triples after first PATCH: {}'.format(set(g)))
  152. assert g[ URIRef(uri) : nsc['dc'].title : Literal('Hello') ]
  153. self.client.patch(path,
  154. data=open('tests/data/sparql_update/delete+insert+where.sparql'),
  155. headers={'content-type' : 'application/sparql-update'})
  156. resp = self.client.get(path)
  157. g = Graph().parse(data=resp.data, format='text/turtle')
  158. assert g[ URIRef(uri) : nsc['dc'].title : Literal('Ciao') ]
  159. def test_delete(self):
  160. '''
  161. Test delete response codes.
  162. '''
  163. create_resp = self.client.put('/ldp/test_delete01')
  164. delete_resp = self.client.delete('/ldp/test_delete01')
  165. assert delete_resp.status_code == 204
  166. bogus_delete_resp = self.client.delete('/ldp/test_delete101')
  167. assert bogus_delete_resp.status_code == 404
  168. def test_tombstone(self):
  169. '''
  170. Test tombstone behaviors.
  171. '''
  172. tstone_resp = self.client.get('/ldp/test_delete01')
  173. assert tstone_resp.status_code == 410
  174. assert tstone_resp.headers['Link'] == \
  175. '<{}/test_delete01/fcr:tombstone>; rel="hasTombstone"'\
  176. .format(Toolbox().base_url)
  177. tstone_path = '/ldp/test_delete01/fcr:tombstone'
  178. assert self.client.get(tstone_path).status_code == 405
  179. assert self.client.put(tstone_path).status_code == 405
  180. assert self.client.post(tstone_path).status_code == 405
  181. assert self.client.delete(tstone_path).status_code == 204
  182. assert self.client.get('/ldp/test_delete01').status_code == 404
  183. def test_delete_recursive(self):
  184. '''
  185. Test response codes for resources deleted recursively and their
  186. tombstones.
  187. '''
  188. self.client.put('/ldp/test_delete_recursive01')
  189. self.client.put('/ldp/test_delete_recursive01/a')
  190. self.client.delete('/ldp/test_delete_recursive01')
  191. tstone_resp = self.client.get('/ldp/test_delete_recursive01')
  192. assert tstone_resp.status_code == 410
  193. assert tstone_resp.headers['Link'] == \
  194. '<{}/test_delete_recursive01/fcr:tombstone>; rel="hasTombstone"'\
  195. .format(Toolbox().base_url)
  196. child_tstone_resp = self.client.get('/ldp/test_delete_recursive01/a')
  197. assert child_tstone_resp.status_code == tstone_resp.status_code
  198. assert 'Link' not in child_tstone_resp.headers.keys()
  199. @pytest.mark.usefixtures('client_class')
  200. @pytest.mark.usefixtures('db')
  201. class TestPrefHeader:
  202. '''
  203. Test various combinations of `Prefer` header.
  204. '''
  205. @pytest.fixture(scope='class')
  206. def cont_structure(self):
  207. '''
  208. Create a container structure to be used for subsequent requests.
  209. '''
  210. parent_path = '/ldp/test_parent'
  211. self.client.put(parent_path)
  212. self.client.put(parent_path + '/child1')
  213. self.client.put(parent_path + '/child2')
  214. self.client.put(parent_path + '/child3')
  215. return {
  216. 'path' : parent_path,
  217. 'response' : self.client.get(parent_path),
  218. 'subject' : URIRef(Toolbox().base_url + '/test_parent')
  219. }
  220. def test_put_prefer_handling(self, random_uuid):
  221. '''
  222. Trying to PUT an existing resource should:
  223. - Return a 204 if the payload is empty
  224. - Return a 204 if the payload is RDF, server-managed triples are
  225. included and the 'Prefer' header is set to 'handling=lenient'
  226. - Return a 412 (ServerManagedTermError) if the payload is RDF,
  227. server-managed triples are included and handling is set to 'strict'
  228. '''
  229. path = '/ldp/put_pref_header01'
  230. assert self.client.put(path).status_code == 201
  231. assert self.client.get(path).status_code == 200
  232. assert self.client.put(path).status_code == 204
  233. with open('tests/data/rdf_payload_w_srv_mgd_trp.ttl', 'rb') as f:
  234. rsp_len = self.client.put(
  235. path,
  236. headers={
  237. 'Prefer' : 'handling=lenient',
  238. 'Content-Type' : 'text/turtle',
  239. },
  240. data=f
  241. )
  242. assert rsp_len.status_code == 204
  243. with open('tests/data/rdf_payload_w_srv_mgd_trp.ttl', 'rb') as f:
  244. rsp_strict = self.client.put(
  245. path,
  246. headers={
  247. 'Prefer' : 'handling=strict',
  248. 'Content-Type' : 'text/turtle',
  249. },
  250. data=f
  251. )
  252. assert rsp_strict.status_code == 412
  253. def test_embed_children(self, cont_structure):
  254. '''
  255. verify the "embed children" prefer header.
  256. '''
  257. parent_path = cont_structure['path']
  258. cont_resp = cont_structure['response']
  259. cont_subject = cont_structure['subject']
  260. minimal_resp = self.client.get(parent_path, headers={
  261. 'Prefer' : 'return=minimal',
  262. })
  263. incl_embed_children_resp = self.client.get(parent_path, headers={
  264. 'Prefer' : 'return=representation; include={}'\
  265. .format(Ldpr.EMBED_CHILD_RES_URI),
  266. })
  267. omit_embed_children_resp = self.client.get(parent_path, headers={
  268. 'Prefer' : 'return=representation; omit={}'\
  269. .format(Ldpr.EMBED_CHILD_RES_URI),
  270. })
  271. assert omit_embed_children_resp.data == cont_resp.data
  272. incl_g = Graph().parse(
  273. data=incl_embed_children_resp.data, format='turtle')
  274. omit_g = Graph().parse(
  275. data=omit_embed_children_resp.data, format='turtle')
  276. children = set(incl_g[cont_subject : nsc['ldp'].contains])
  277. assert len(children) == 3
  278. children = set(incl_g[cont_subject : nsc['ldp'].contains])
  279. for child_uri in children:
  280. assert set(incl_g[ child_uri : : ])
  281. assert not set(omit_g[ child_uri : : ])
  282. def test_return_children(self, cont_structure):
  283. '''
  284. verify the "return children" prefer header.
  285. '''
  286. parent_path = cont_structure['path']
  287. cont_resp = cont_structure['response']
  288. cont_subject = cont_structure['subject']
  289. incl_children_resp = self.client.get(parent_path, headers={
  290. 'Prefer' : 'return=representation; include={}'\
  291. .format(Ldpr.RETURN_CHILD_RES_URI),
  292. })
  293. omit_children_resp = self.client.get(parent_path, headers={
  294. 'Prefer' : 'return=representation; omit={}'\
  295. .format(Ldpr.RETURN_CHILD_RES_URI),
  296. })
  297. assert incl_children_resp.data == cont_resp.data
  298. incl_g = Graph().parse(data=incl_children_resp.data, format='turtle')
  299. omit_g = Graph().parse(data=omit_children_resp.data, format='turtle')
  300. children = incl_g[cont_subject : nsc['ldp'].contains]
  301. for child_uri in children:
  302. assert not omit_g[ cont_subject : nsc['ldp'].contains : child_uri ]
  303. def test_inbound_rel(self, cont_structure):
  304. '''
  305. verify the "inboud relationships" prefer header.
  306. '''
  307. parent_path = cont_structure['path']
  308. cont_resp = cont_structure['response']
  309. cont_subject = cont_structure['subject']
  310. incl_inbound_resp = self.client.get(parent_path, headers={
  311. 'Prefer' : 'return=representation; include={}'\
  312. .format(Ldpr.RETURN_INBOUND_REF_URI),
  313. })
  314. omit_inbound_resp = self.client.get(parent_path, headers={
  315. 'Prefer' : 'return=representation; omit={}'\
  316. .format(Ldpr.RETURN_INBOUND_REF_URI),
  317. })
  318. assert omit_inbound_resp.data == cont_resp.data
  319. incl_g = Graph().parse(data=incl_inbound_resp.data, format='turtle')
  320. omit_g = Graph().parse(data=omit_inbound_resp.data, format='turtle')
  321. assert set(incl_g[ : : cont_subject ])
  322. assert not set(omit_g[ : : cont_subject ])
  323. def test_srv_mgd_triples(self, cont_structure):
  324. '''
  325. verify the "server managed triples" prefer header.
  326. '''
  327. parent_path = cont_structure['path']
  328. cont_resp = cont_structure['response']
  329. cont_subject = cont_structure['subject']
  330. incl_srv_mgd_resp = self.client.get(parent_path, headers={
  331. 'Prefer' : 'return=representation; include={}'\
  332. .format(Ldpr.RETURN_SRV_MGD_RES_URI),
  333. })
  334. omit_srv_mgd_resp = self.client.get(parent_path, headers={
  335. 'Prefer' : 'return=representation; omit={}'\
  336. .format(Ldpr.RETURN_SRV_MGD_RES_URI),
  337. })
  338. assert incl_srv_mgd_resp.data == cont_resp.data
  339. incl_g = Graph().parse(data=incl_srv_mgd_resp.data, format='turtle')
  340. omit_g = Graph().parse(data=omit_srv_mgd_resp.data, format='turtle')
  341. for pred in {
  342. nsc['fcrepo'].created,
  343. nsc['fcrepo'].createdBy,
  344. nsc['fcrepo'].lastModified,
  345. nsc['fcrepo'].lastModifiedBy,
  346. nsc['ldp'].contains,
  347. }:
  348. assert set(incl_g[ cont_subject : pred : ])
  349. assert not set(omit_g[ cont_subject : pred : ])
  350. for type in {
  351. nsc['fcrepo'].Resource,
  352. nsc['ldp'].Container,
  353. nsc['ldp'].Resource,
  354. }:
  355. assert incl_g[ cont_subject : RDF.type : type ]
  356. assert not omit_g[ cont_subject : RDF.type : type ]
  357. def test_delete_no_tstone(self):
  358. '''
  359. Test the `no-tombstone` Prefer option.
  360. '''
  361. self.client.put('/ldp/test_delete_no_tstone01')
  362. self.client.put('/ldp/test_delete_no_tstone01/a')
  363. self.client.delete('/ldp/test_delete_no_tstone01', headers={
  364. 'prefer' : 'no-tombstone'})
  365. resp = self.client.get('/ldp/test_delete_no_tstone01')
  366. assert resp.status_code == 404
  367. child_resp = self.client.get('/ldp/test_delete_no_tstone01/a')
  368. assert child_resp.status_code == 404