test_ldp.py 19 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556
  1. import pytest
  2. import uuid
  3. from hashlib import sha1
  4. from flask import url_for
  5. from rdflib import Graph
  6. from rdflib.namespace import RDF
  7. from rdflib.term import Literal, URIRef
  8. from lakesuperior.dictionaries.namespaces import ns_collection as nsc
  9. from lakesuperior.model.ldpr import Ldpr
  10. from lakesuperior.toolbox import Toolbox
  11. @pytest.fixture(scope='module')
  12. def random_uuid():
  13. return str(uuid.uuid4())
  14. @pytest.mark.usefixtures('client_class')
  15. @pytest.mark.usefixtures('db')
  16. class TestLdp:
  17. '''
  18. Test HTTP interaction with LDP endpoint.
  19. '''
  20. def test_get_root_node(self):
  21. '''
  22. Get the root node from two different endpoints.
  23. The test triplestore must be initialized, hence the `db` fixture.
  24. '''
  25. ldp_resp = self.client.get('/ldp')
  26. rest_resp = self.client.get('/rest')
  27. assert ldp_resp.status_code == 200
  28. assert rest_resp.status_code == 200
  29. #assert ldp_resp.data == rest_resp.data
  30. def test_put_empty_resource(self, random_uuid):
  31. '''
  32. Check response headers for a PUT operation with empty payload.
  33. '''
  34. res = self.client.put('/ldp/{}'.format(random_uuid))
  35. assert res.status_code == 201
  36. def test_put_existing_resource(self, random_uuid):
  37. '''
  38. Trying to PUT an existing resource should return a 204 if the payload
  39. is empty.
  40. '''
  41. path = '/ldp/nonidempotent01'
  42. assert self.client.put(path).status_code == 201
  43. assert self.client.get(path).status_code == 200
  44. assert self.client.put(path).status_code == 204
  45. def test_put_tree(self, client):
  46. '''
  47. PUT a resource with several path segments.
  48. The test should create intermediate path segments that are not
  49. accessible to PUT but allow POST.
  50. '''
  51. path = '/ldp/test_tree/a/b/c/d/e/f/g'
  52. self.client.put(path)
  53. assert self.client.get(path).resp.status_code == 200
  54. def test_put_nested_tree(self, client):
  55. '''
  56. Verify that containment is set correctly in nested hierarchies.
  57. First put a new hierarchy and verify that the root node is its
  58. container; then put another hierarchy under it and verify that the
  59. first hierarchy is the container of the second one.
  60. '''
  61. uuid1 = 'test_nested_tree/a/b/c/d'
  62. uuid2 = uuid1 + '/e/f/g'
  63. path1 = '/ldp/' + uuid1
  64. path2 = '/ldp/' + uuid2
  65. self.client.put(path1)
  66. cont1_data = self.client.get('/ldp').data
  67. g1 = Graph().parse(data=cont1_data, format='turtle')
  68. assert g1[ URIRef(Toolbox().base_url + '/') : nsc['ldp'].contains : \
  69. URIRef(Toolbox().base_url + '/' + uuid1) ]
  70. self.client.put(path2)
  71. cont2_data = self.client.get(path1).data
  72. g1 = Graph().parse(data=cont2_data, format='turtle')
  73. assert g1[ URIRef(Toolbox().base_url + '/' + uuid1) : \
  74. nsc['ldp'].contains : \
  75. URIRef(Toolbox().base_url + '/' + uuid2) ]
  76. def test_put_ldp_rs(self, client):
  77. '''
  78. PUT a resource with RDF payload and verify.
  79. '''
  80. with open('tests/data/marcel_duchamp_single_subject.ttl', 'rb') as f:
  81. self.client.put('/ldp/ldprs01', data=f, content_type='text/turtle')
  82. resp = self.client.get('/ldp/ldprs01',
  83. headers={'accept' : 'text/turtle'})
  84. assert resp.status_code == 200
  85. g = Graph().parse(data=resp.data, format='text/turtle')
  86. assert URIRef('http://vocab.getty.edu/ontology#Subject') in \
  87. g.objects(None, RDF.type)
  88. def test_put_ldp_nr(self, rnd_img):
  89. '''
  90. PUT a resource with binary payload and verify checksums.
  91. '''
  92. rnd_img['content'].seek(0)
  93. resp = self.client.put('/ldp/ldpnr01', data=rnd_img['content'],
  94. headers={
  95. 'Content-Disposition' : 'attachment; filename={}'.format(
  96. rnd_img['filename'])})
  97. assert resp.status_code == 201
  98. resp = self.client.get('/ldp/ldpnr01', headers={'accept' : 'image/png'})
  99. assert resp.status_code == 200
  100. assert sha1(resp.data).hexdigest() == rnd_img['hash']
  101. def test_put_mismatched_ldp_rs(self, rnd_img):
  102. '''
  103. Verify MIME type / LDP mismatch.
  104. PUT a LDP-RS, then PUT a LDP-NR on the same location and verify it
  105. fails.
  106. '''
  107. path = '/ldp/' + str(uuid.uuid4())
  108. rnd_img['content'].seek(0)
  109. ldp_nr_resp = self.client.put(path, data=rnd_img['content'],
  110. headers={
  111. 'Content-Disposition' : 'attachment; filename={}'.format(
  112. rnd_img['filename'])})
  113. assert ldp_nr_resp.status_code == 201
  114. with open('tests/data/marcel_duchamp_single_subject.ttl', 'rb') as f:
  115. ldp_rs_resp = self.client.put(path, data=f,
  116. content_type='text/turtle')
  117. assert ldp_rs_resp.status_code == 415
  118. def test_put_mismatched_ldp_nr(self, rnd_img):
  119. '''
  120. Verify MIME type / LDP mismatch.
  121. PUT a LDP-NR, then PUT a LDP-RS on the same location and verify it
  122. fails.
  123. '''
  124. path = '/ldp/' + str(uuid.uuid4())
  125. with open('tests/data/marcel_duchamp_single_subject.ttl', 'rb') as f:
  126. ldp_rs_resp = self.client.put(path, data=f,
  127. content_type='text/turtle')
  128. assert ldp_rs_resp.status_code == 201
  129. rnd_img['content'].seek(0)
  130. ldp_nr_resp = self.client.put(path, data=rnd_img['content'],
  131. headers={
  132. 'Content-Disposition' : 'attachment; filename={}'.format(
  133. rnd_img['filename'])})
  134. assert ldp_nr_resp.status_code == 415
  135. def test_post_resource(self, client):
  136. '''
  137. Check response headers for a POST operation with empty payload.
  138. '''
  139. res = self.client.post('/ldp/')
  140. assert res.status_code == 201
  141. assert 'Location' in res.headers
  142. def test_post_slug(self):
  143. '''
  144. Verify that a POST with slug results in the expected URI only if the
  145. resource does not exist already.
  146. '''
  147. slug01_resp = self.client.post('/ldp', headers={'slug' : 'slug01'})
  148. assert slug01_resp.status_code == 201
  149. assert slug01_resp.headers['location'] == \
  150. Toolbox().base_url + '/slug01'
  151. slug02_resp = self.client.post('/ldp', headers={'slug' : 'slug01'})
  152. assert slug02_resp.status_code == 201
  153. assert slug02_resp.headers['location'] != \
  154. Toolbox().base_url + '/slug01'
  155. def test_post_404(self):
  156. '''
  157. Verify that a POST to a non-existing parent results in a 404.
  158. '''
  159. assert self.client.post('/ldp/{}'.format(uuid.uuid4()))\
  160. .status_code == 404
  161. def test_post_409(self, rnd_img):
  162. '''
  163. Verify that you cannot POST to a binary resource.
  164. '''
  165. rnd_img['content'].seek(0)
  166. self.client.put('/ldp/post_409', data=rnd_img['content'], headers={
  167. 'Content-Disposition' : 'attachment; filename={}'.format(
  168. rnd_img['filename'])})
  169. assert self.client.post('/ldp/post_409').status_code == 409
  170. def test_patch(self):
  171. '''
  172. Test patching a resource.
  173. '''
  174. path = '/ldp/test_patch01'
  175. self.client.put(path)
  176. uri = Toolbox().base_url + '/test_patch01'
  177. with open('tests/data/sparql_update/simple_insert.sparql') as data:
  178. resp = self.client.patch(path,
  179. data=data,
  180. headers={'content-type' : 'application/sparql-update'})
  181. assert resp.status_code == 204
  182. resp = self.client.get(path)
  183. g = Graph().parse(data=resp.data, format='text/turtle')
  184. assert g[ URIRef(uri) : nsc['dc'].title : Literal('Hello') ]
  185. self.client.patch(path,
  186. data=open('tests/data/sparql_update/delete+insert+where.sparql'),
  187. headers={'content-type' : 'application/sparql-update'})
  188. resp = self.client.get(path)
  189. g = Graph().parse(data=resp.data, format='text/turtle')
  190. assert g[ URIRef(uri) : nsc['dc'].title : Literal('Ciao') ]
  191. def test_patch_ldp_nr_metadata(self):
  192. '''
  193. Test patching a LDP-NR metadata resource, both from the fcr:metadata
  194. and the resource URIs.
  195. '''
  196. path = '/ldp/ldpnr01'
  197. with open('tests/data/sparql_update/simple_insert.sparql') as data:
  198. self.client.patch(path + '/fcr:metadata',
  199. data=data,
  200. headers={'content-type' : 'application/sparql-update'})
  201. resp = self.client.get(path + '/fcr:metadata')
  202. assert resp.status_code == 200
  203. uri = Toolbox().base_url + '/ldpnr01'
  204. g = Graph().parse(data=resp.data, format='text/turtle')
  205. assert g[ URIRef(uri) : nsc['dc'].title : Literal('Hello') ]
  206. with open(
  207. 'tests/data/sparql_update/delete+insert+where.sparql') as data:
  208. patch_resp = self.client.patch(path,
  209. data=data,
  210. headers={'content-type' : 'application/sparql-update'})
  211. assert patch_resp.status_code == 204
  212. resp = self.client.get(path + '/fcr:metadata')
  213. assert resp.status_code == 200
  214. g = Graph().parse(data=resp.data, format='text/turtle')
  215. assert g[ URIRef(uri) : nsc['dc'].title : Literal('Ciao') ]
  216. def test_patch_ldp_nr(self, rnd_img):
  217. '''
  218. Verify that a PATCH using anything other than an
  219. `application/sparql-update` MIME type results in an error.
  220. '''
  221. rnd_img['content'].seek(0)
  222. resp = self.client.patch('/ldp/ldpnr01/fcr:metadata',
  223. data=rnd_img,
  224. headers={'content-type' : 'image/jpeg'})
  225. assert resp.status_code == 415
  226. def test_delete(self):
  227. '''
  228. Test delete response codes.
  229. '''
  230. create_resp = self.client.put('/ldp/test_delete01')
  231. delete_resp = self.client.delete('/ldp/test_delete01')
  232. assert delete_resp.status_code == 204
  233. bogus_delete_resp = self.client.delete('/ldp/test_delete101')
  234. assert bogus_delete_resp.status_code == 404
  235. def test_tombstone(self):
  236. '''
  237. Test tombstone behaviors.
  238. '''
  239. tstone_resp = self.client.get('/ldp/test_delete01')
  240. assert tstone_resp.status_code == 410
  241. assert tstone_resp.headers['Link'] == \
  242. '<{}/test_delete01/fcr:tombstone>; rel="hasTombstone"'\
  243. .format(Toolbox().base_url)
  244. tstone_path = '/ldp/test_delete01/fcr:tombstone'
  245. assert self.client.get(tstone_path).status_code == 405
  246. assert self.client.put(tstone_path).status_code == 405
  247. assert self.client.post(tstone_path).status_code == 405
  248. assert self.client.delete(tstone_path).status_code == 204
  249. assert self.client.get('/ldp/test_delete01').status_code == 404
  250. def test_delete_recursive(self):
  251. '''
  252. Test response codes for resources deleted recursively and their
  253. tombstones.
  254. '''
  255. self.client.put('/ldp/test_delete_recursive01')
  256. self.client.put('/ldp/test_delete_recursive01/a')
  257. self.client.delete('/ldp/test_delete_recursive01')
  258. tstone_resp = self.client.get('/ldp/test_delete_recursive01')
  259. assert tstone_resp.status_code == 410
  260. assert tstone_resp.headers['Link'] == \
  261. '<{}/test_delete_recursive01/fcr:tombstone>; rel="hasTombstone"'\
  262. .format(Toolbox().base_url)
  263. child_tstone_resp = self.client.get('/ldp/test_delete_recursive01/a')
  264. assert child_tstone_resp.status_code == tstone_resp.status_code
  265. assert 'Link' not in child_tstone_resp.headers.keys()
  266. @pytest.mark.usefixtures('client_class')
  267. @pytest.mark.usefixtures('db')
  268. class TestPrefHeader:
  269. '''
  270. Test various combinations of `Prefer` header.
  271. '''
  272. @pytest.fixture(scope='class')
  273. def cont_structure(self):
  274. '''
  275. Create a container structure to be used for subsequent requests.
  276. '''
  277. parent_path = '/ldp/test_parent'
  278. self.client.put(parent_path)
  279. self.client.put(parent_path + '/child1')
  280. self.client.put(parent_path + '/child2')
  281. self.client.put(parent_path + '/child3')
  282. return {
  283. 'path' : parent_path,
  284. 'response' : self.client.get(parent_path),
  285. 'subject' : URIRef(Toolbox().base_url + '/test_parent')
  286. }
  287. def test_put_prefer_handling(self, random_uuid):
  288. '''
  289. Trying to PUT an existing resource should:
  290. - Return a 204 if the payload is empty
  291. - Return a 204 if the payload is RDF, server-managed triples are
  292. included and the 'Prefer' header is set to 'handling=lenient'
  293. - Return a 412 (ServerManagedTermError) if the payload is RDF,
  294. server-managed triples are included and handling is set to 'strict'
  295. '''
  296. path = '/ldp/put_pref_header01'
  297. assert self.client.put(path).status_code == 201
  298. assert self.client.get(path).status_code == 200
  299. assert self.client.put(path).status_code == 204
  300. with open('tests/data/rdf_payload_w_srv_mgd_trp.ttl', 'rb') as f:
  301. rsp_len = self.client.put(
  302. path,
  303. headers={
  304. 'Prefer' : 'handling=lenient',
  305. 'Content-Type' : 'text/turtle',
  306. },
  307. data=f
  308. )
  309. assert rsp_len.status_code == 204
  310. with open('tests/data/rdf_payload_w_srv_mgd_trp.ttl', 'rb') as f:
  311. rsp_strict = self.client.put(
  312. path,
  313. headers={
  314. 'Prefer' : 'handling=strict',
  315. 'Content-Type' : 'text/turtle',
  316. },
  317. data=f
  318. )
  319. assert rsp_strict.status_code == 412
  320. def test_embed_children(self, cont_structure):
  321. '''
  322. verify the "embed children" prefer header.
  323. '''
  324. parent_path = cont_structure['path']
  325. cont_resp = cont_structure['response']
  326. cont_subject = cont_structure['subject']
  327. minimal_resp = self.client.get(parent_path, headers={
  328. 'Prefer' : 'return=minimal',
  329. })
  330. incl_embed_children_resp = self.client.get(parent_path, headers={
  331. 'Prefer' : 'return=representation; include={}'\
  332. .format(Ldpr.EMBED_CHILD_RES_URI),
  333. })
  334. omit_embed_children_resp = self.client.get(parent_path, headers={
  335. 'Prefer' : 'return=representation; omit={}'\
  336. .format(Ldpr.EMBED_CHILD_RES_URI),
  337. })
  338. assert omit_embed_children_resp.data == cont_resp.data
  339. incl_g = Graph().parse(
  340. data=incl_embed_children_resp.data, format='turtle')
  341. omit_g = Graph().parse(
  342. data=omit_embed_children_resp.data, format='turtle')
  343. children = set(incl_g[cont_subject : nsc['ldp'].contains])
  344. assert len(children) == 3
  345. children = set(incl_g[cont_subject : nsc['ldp'].contains])
  346. for child_uri in children:
  347. assert set(incl_g[ child_uri : : ])
  348. assert not set(omit_g[ child_uri : : ])
  349. def test_return_children(self, cont_structure):
  350. '''
  351. verify the "return children" prefer header.
  352. '''
  353. parent_path = cont_structure['path']
  354. cont_resp = cont_structure['response']
  355. cont_subject = cont_structure['subject']
  356. incl_children_resp = self.client.get(parent_path, headers={
  357. 'Prefer' : 'return=representation; include={}'\
  358. .format(Ldpr.RETURN_CHILD_RES_URI),
  359. })
  360. omit_children_resp = self.client.get(parent_path, headers={
  361. 'Prefer' : 'return=representation; omit={}'\
  362. .format(Ldpr.RETURN_CHILD_RES_URI),
  363. })
  364. assert incl_children_resp.data == cont_resp.data
  365. incl_g = Graph().parse(data=incl_children_resp.data, format='turtle')
  366. omit_g = Graph().parse(data=omit_children_resp.data, format='turtle')
  367. children = incl_g[cont_subject : nsc['ldp'].contains]
  368. for child_uri in children:
  369. assert not omit_g[ cont_subject : nsc['ldp'].contains : child_uri ]
  370. def test_inbound_rel(self, cont_structure):
  371. '''
  372. verify the "inboud relationships" prefer header.
  373. '''
  374. parent_path = cont_structure['path']
  375. cont_resp = cont_structure['response']
  376. cont_subject = cont_structure['subject']
  377. incl_inbound_resp = self.client.get(parent_path, headers={
  378. 'Prefer' : 'return=representation; include={}'\
  379. .format(Ldpr.RETURN_INBOUND_REF_URI),
  380. })
  381. omit_inbound_resp = self.client.get(parent_path, headers={
  382. 'Prefer' : 'return=representation; omit={}'\
  383. .format(Ldpr.RETURN_INBOUND_REF_URI),
  384. })
  385. assert omit_inbound_resp.data == cont_resp.data
  386. incl_g = Graph().parse(data=incl_inbound_resp.data, format='turtle')
  387. omit_g = Graph().parse(data=omit_inbound_resp.data, format='turtle')
  388. assert set(incl_g[ : : cont_subject ])
  389. assert not set(omit_g[ : : cont_subject ])
  390. def test_srv_mgd_triples(self, cont_structure):
  391. '''
  392. verify the "server managed triples" prefer header.
  393. '''
  394. parent_path = cont_structure['path']
  395. cont_resp = cont_structure['response']
  396. cont_subject = cont_structure['subject']
  397. incl_srv_mgd_resp = self.client.get(parent_path, headers={
  398. 'Prefer' : 'return=representation; include={}'\
  399. .format(Ldpr.RETURN_SRV_MGD_RES_URI),
  400. })
  401. omit_srv_mgd_resp = self.client.get(parent_path, headers={
  402. 'Prefer' : 'return=representation; omit={}'\
  403. .format(Ldpr.RETURN_SRV_MGD_RES_URI),
  404. })
  405. assert incl_srv_mgd_resp.data == cont_resp.data
  406. incl_g = Graph().parse(data=incl_srv_mgd_resp.data, format='turtle')
  407. omit_g = Graph().parse(data=omit_srv_mgd_resp.data, format='turtle')
  408. for pred in {
  409. nsc['fcrepo'].created,
  410. nsc['fcrepo'].createdBy,
  411. nsc['fcrepo'].lastModified,
  412. nsc['fcrepo'].lastModifiedBy,
  413. nsc['ldp'].contains,
  414. }:
  415. assert set(incl_g[ cont_subject : pred : ])
  416. assert not set(omit_g[ cont_subject : pred : ])
  417. for type in {
  418. nsc['fcrepo'].Resource,
  419. nsc['ldp'].Container,
  420. nsc['ldp'].Resource,
  421. }:
  422. assert incl_g[ cont_subject : RDF.type : type ]
  423. assert not omit_g[ cont_subject : RDF.type : type ]
  424. def test_delete_no_tstone(self):
  425. '''
  426. Test the `no-tombstone` Prefer option.
  427. '''
  428. self.client.put('/ldp/test_delete_no_tstone01')
  429. self.client.put('/ldp/test_delete_no_tstone01/a')
  430. self.client.delete('/ldp/test_delete_no_tstone01', headers={
  431. 'prefer' : 'no-tombstone'})
  432. resp = self.client.get('/ldp/test_delete_no_tstone01')
  433. assert resp.status_code == 404
  434. child_resp = self.client.get('/ldp/test_delete_no_tstone01/a')
  435. assert child_resp.status_code == 404