test_ldp.py 19 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567
  1. import pytest
  2. import uuid
  3. from hashlib import sha1
  4. from flask import url_for
  5. from rdflib import Graph
  6. from rdflib.namespace import RDF
  7. from rdflib.term import Literal, URIRef
  8. from lakesuperior.dictionaries.namespaces import ns_collection as nsc
  9. from lakesuperior.model.ldpr import Ldpr
  10. from lakesuperior.toolbox import Toolbox
  11. @pytest.fixture(scope='module')
  12. def random_uuid():
  13. return str(uuid.uuid4())
  14. @pytest.mark.usefixtures('client_class')
  15. @pytest.mark.usefixtures('db')
  16. class TestLdp:
  17. '''
  18. Test HTTP interaction with LDP endpoint.
  19. '''
  20. def test_get_root_node(self):
  21. '''
  22. Get the root node from two different endpoints.
  23. The test triplestore must be initialized, hence the `db` fixture.
  24. '''
  25. ldp_resp = self.client.get('/ldp')
  26. rest_resp = self.client.get('/rest')
  27. assert ldp_resp.status_code == 200
  28. assert rest_resp.status_code == 200
  29. #assert ldp_resp.data == rest_resp.data
  30. def test_put_empty_resource(self, random_uuid):
  31. '''
  32. Check response headers for a PUT operation with empty payload.
  33. '''
  34. resp = self.client.put('/ldp/new_resource')
  35. assert resp.status_code == 201
  36. assert resp.data == bytes(
  37. '{}/new_resource'.format(Toolbox().base_url), 'utf-8')
  38. def test_put_existing_resource(self, random_uuid):
  39. '''
  40. Trying to PUT an existing resource should return a 204 if the payload
  41. is empty.
  42. '''
  43. path = '/ldp/nonidempotent01'
  44. put1_resp = self.client.put(path)
  45. assert put1_resp.status_code == 201
  46. assert self.client.get(path).status_code == 200
  47. put2_resp = self.client.put(path)
  48. assert put2_resp.status_code == 204
  49. assert put2_resp.data == b''
  50. def test_put_tree(self, client):
  51. '''
  52. PUT a resource with several path segments.
  53. The test should create intermediate path segments that are not
  54. accessible to PUT or POST.
  55. '''
  56. path = '/ldp/test_tree/a/b/c/d/e/f/g'
  57. self.client.put(path)
  58. assert self.client.get(path).status_code == 200
  59. assert self.client.put('/ldp/test_tree/a').status_code == 409
  60. assert self.client.post('/ldp/test_tree/a').status_code == 409
  61. def test_put_nested_tree(self, client):
  62. '''
  63. Verify that containment is set correctly in nested hierarchies.
  64. First put a new hierarchy and verify that the root node is its
  65. container; then put another hierarchy under it and verify that the
  66. first hierarchy is the container of the second one.
  67. '''
  68. uuid1 = 'test_nested_tree/a/b/c/d'
  69. uuid2 = uuid1 + '/e/f/g'
  70. path1 = '/ldp/' + uuid1
  71. path2 = '/ldp/' + uuid2
  72. self.client.put(path1)
  73. cont1_data = self.client.get('/ldp').data
  74. g1 = Graph().parse(data=cont1_data, format='turtle')
  75. assert g1[ URIRef(Toolbox().base_url + '/') : nsc['ldp'].contains : \
  76. URIRef(Toolbox().base_url + '/' + uuid1) ]
  77. self.client.put(path2)
  78. cont2_data = self.client.get(path1).data
  79. g1 = Graph().parse(data=cont2_data, format='turtle')
  80. assert g1[ URIRef(Toolbox().base_url + '/' + uuid1) : \
  81. nsc['ldp'].contains : \
  82. URIRef(Toolbox().base_url + '/' + uuid2) ]
  83. def test_put_ldp_rs(self, client):
  84. '''
  85. PUT a resource with RDF payload and verify.
  86. '''
  87. with open('tests/data/marcel_duchamp_single_subject.ttl', 'rb') as f:
  88. self.client.put('/ldp/ldprs01', data=f, content_type='text/turtle')
  89. resp = self.client.get('/ldp/ldprs01',
  90. headers={'accept' : 'text/turtle'})
  91. assert resp.status_code == 200
  92. g = Graph().parse(data=resp.data, format='text/turtle')
  93. assert URIRef('http://vocab.getty.edu/ontology#Subject') in \
  94. g.objects(None, RDF.type)
  95. def test_put_ldp_nr(self, rnd_img):
  96. '''
  97. PUT a resource with binary payload and verify checksums.
  98. '''
  99. rnd_img['content'].seek(0)
  100. resp = self.client.put('/ldp/ldpnr01', data=rnd_img['content'],
  101. headers={
  102. 'Content-Disposition' : 'attachment; filename={}'.format(
  103. rnd_img['filename'])})
  104. assert resp.status_code == 201
  105. resp = self.client.get('/ldp/ldpnr01', headers={'accept' : 'image/png'})
  106. assert resp.status_code == 200
  107. assert sha1(resp.data).hexdigest() == rnd_img['hash']
  108. def test_put_mismatched_ldp_rs(self, rnd_img):
  109. '''
  110. Verify MIME type / LDP mismatch.
  111. PUT a LDP-RS, then PUT a LDP-NR on the same location and verify it
  112. fails.
  113. '''
  114. path = '/ldp/' + str(uuid.uuid4())
  115. rnd_img['content'].seek(0)
  116. ldp_nr_resp = self.client.put(path, data=rnd_img['content'],
  117. headers={
  118. 'Content-Disposition' : 'attachment; filename={}'.format(
  119. rnd_img['filename'])})
  120. assert ldp_nr_resp.status_code == 201
  121. with open('tests/data/marcel_duchamp_single_subject.ttl', 'rb') as f:
  122. ldp_rs_resp = self.client.put(path, data=f,
  123. content_type='text/turtle')
  124. assert ldp_rs_resp.status_code == 415
  125. def test_put_mismatched_ldp_nr(self, rnd_img):
  126. '''
  127. Verify MIME type / LDP mismatch.
  128. PUT a LDP-NR, then PUT a LDP-RS on the same location and verify it
  129. fails.
  130. '''
  131. path = '/ldp/' + str(uuid.uuid4())
  132. with open('tests/data/marcel_duchamp_single_subject.ttl', 'rb') as f:
  133. ldp_rs_resp = self.client.put(path, data=f,
  134. content_type='text/turtle')
  135. assert ldp_rs_resp.status_code == 201
  136. rnd_img['content'].seek(0)
  137. ldp_nr_resp = self.client.put(path, data=rnd_img['content'],
  138. headers={
  139. 'Content-Disposition' : 'attachment; filename={}'.format(
  140. rnd_img['filename'])})
  141. assert ldp_nr_resp.status_code == 415
  142. def test_post_resource(self, client):
  143. '''
  144. Check response headers for a POST operation with empty payload.
  145. '''
  146. res = self.client.post('/ldp/')
  147. assert res.status_code == 201
  148. assert 'Location' in res.headers
  149. def test_post_slug(self):
  150. '''
  151. Verify that a POST with slug results in the expected URI only if the
  152. resource does not exist already.
  153. '''
  154. slug01_resp = self.client.post('/ldp', headers={'slug' : 'slug01'})
  155. assert slug01_resp.status_code == 201
  156. assert slug01_resp.headers['location'] == \
  157. Toolbox().base_url + '/slug01'
  158. slug02_resp = self.client.post('/ldp', headers={'slug' : 'slug01'})
  159. assert slug02_resp.status_code == 201
  160. assert slug02_resp.headers['location'] != \
  161. Toolbox().base_url + '/slug01'
  162. def test_post_404(self):
  163. '''
  164. Verify that a POST to a non-existing parent results in a 404.
  165. '''
  166. assert self.client.post('/ldp/{}'.format(uuid.uuid4()))\
  167. .status_code == 404
  168. def test_post_409(self, rnd_img):
  169. '''
  170. Verify that you cannot POST to a binary resource.
  171. '''
  172. rnd_img['content'].seek(0)
  173. self.client.put('/ldp/post_409', data=rnd_img['content'], headers={
  174. 'Content-Disposition' : 'attachment; filename={}'.format(
  175. rnd_img['filename'])})
  176. assert self.client.post('/ldp/post_409').status_code == 409
  177. def test_patch(self):
  178. '''
  179. Test patching a resource.
  180. '''
  181. path = '/ldp/test_patch01'
  182. self.client.put(path)
  183. uri = Toolbox().base_url + '/test_patch01'
  184. with open('tests/data/sparql_update/simple_insert.sparql') as data:
  185. resp = self.client.patch(path,
  186. data=data,
  187. headers={'content-type' : 'application/sparql-update'})
  188. assert resp.status_code == 204
  189. resp = self.client.get(path)
  190. g = Graph().parse(data=resp.data, format='text/turtle')
  191. assert g[ URIRef(uri) : nsc['dc'].title : Literal('Hello') ]
  192. self.client.patch(path,
  193. data=open('tests/data/sparql_update/delete+insert+where.sparql'),
  194. headers={'content-type' : 'application/sparql-update'})
  195. resp = self.client.get(path)
  196. g = Graph().parse(data=resp.data, format='text/turtle')
  197. assert g[ URIRef(uri) : nsc['dc'].title : Literal('Ciao') ]
  198. def test_patch_ldp_nr_metadata(self):
  199. '''
  200. Test patching a LDP-NR metadata resource, both from the fcr:metadata
  201. and the resource URIs.
  202. '''
  203. path = '/ldp/ldpnr01'
  204. with open('tests/data/sparql_update/simple_insert.sparql') as data:
  205. self.client.patch(path + '/fcr:metadata',
  206. data=data,
  207. headers={'content-type' : 'application/sparql-update'})
  208. resp = self.client.get(path + '/fcr:metadata')
  209. assert resp.status_code == 200
  210. uri = Toolbox().base_url + '/ldpnr01'
  211. g = Graph().parse(data=resp.data, format='text/turtle')
  212. assert g[ URIRef(uri) : nsc['dc'].title : Literal('Hello') ]
  213. with open(
  214. 'tests/data/sparql_update/delete+insert+where.sparql') as data:
  215. patch_resp = self.client.patch(path,
  216. data=data,
  217. headers={'content-type' : 'application/sparql-update'})
  218. assert patch_resp.status_code == 204
  219. resp = self.client.get(path + '/fcr:metadata')
  220. assert resp.status_code == 200
  221. g = Graph().parse(data=resp.data, format='text/turtle')
  222. assert g[ URIRef(uri) : nsc['dc'].title : Literal('Ciao') ]
  223. def test_patch_ldp_nr(self, rnd_img):
  224. '''
  225. Verify that a PATCH using anything other than an
  226. `application/sparql-update` MIME type results in an error.
  227. '''
  228. rnd_img['content'].seek(0)
  229. resp = self.client.patch('/ldp/ldpnr01/fcr:metadata',
  230. data=rnd_img,
  231. headers={'content-type' : 'image/jpeg'})
  232. assert resp.status_code == 415
  233. def test_delete(self):
  234. '''
  235. Test delete response codes.
  236. '''
  237. create_resp = self.client.put('/ldp/test_delete01')
  238. delete_resp = self.client.delete('/ldp/test_delete01')
  239. assert delete_resp.status_code == 204
  240. bogus_delete_resp = self.client.delete('/ldp/test_delete101')
  241. assert bogus_delete_resp.status_code == 404
  242. def test_tombstone(self):
  243. '''
  244. Test tombstone behaviors.
  245. '''
  246. tstone_resp = self.client.get('/ldp/test_delete01')
  247. assert tstone_resp.status_code == 410
  248. assert tstone_resp.headers['Link'] == \
  249. '<{}/test_delete01/fcr:tombstone>; rel="hasTombstone"'\
  250. .format(Toolbox().base_url)
  251. tstone_path = '/ldp/test_delete01/fcr:tombstone'
  252. assert self.client.get(tstone_path).status_code == 405
  253. assert self.client.put(tstone_path).status_code == 405
  254. assert self.client.post(tstone_path).status_code == 405
  255. assert self.client.delete(tstone_path).status_code == 204
  256. assert self.client.get('/ldp/test_delete01').status_code == 404
  257. def test_delete_recursive(self):
  258. '''
  259. Test response codes for resources deleted recursively and their
  260. tombstones.
  261. '''
  262. self.client.put('/ldp/test_delete_recursive01')
  263. self.client.put('/ldp/test_delete_recursive01/a')
  264. self.client.delete('/ldp/test_delete_recursive01')
  265. tstone_resp = self.client.get('/ldp/test_delete_recursive01')
  266. assert tstone_resp.status_code == 410
  267. assert tstone_resp.headers['Link'] == \
  268. '<{}/test_delete_recursive01/fcr:tombstone>; rel="hasTombstone"'\
  269. .format(Toolbox().base_url)
  270. child_tstone_resp = self.client.get('/ldp/test_delete_recursive01/a')
  271. assert child_tstone_resp.status_code == tstone_resp.status_code
  272. assert 'Link' not in child_tstone_resp.headers.keys()
  273. @pytest.mark.usefixtures('client_class')
  274. @pytest.mark.usefixtures('db')
  275. class TestPrefHeader:
  276. '''
  277. Test various combinations of `Prefer` header.
  278. '''
  279. @pytest.fixture(scope='class')
  280. def cont_structure(self):
  281. '''
  282. Create a container structure to be used for subsequent requests.
  283. '''
  284. parent_path = '/ldp/test_parent'
  285. self.client.put(parent_path)
  286. self.client.put(parent_path + '/child1')
  287. self.client.put(parent_path + '/child2')
  288. self.client.put(parent_path + '/child3')
  289. return {
  290. 'path' : parent_path,
  291. 'response' : self.client.get(parent_path),
  292. 'subject' : URIRef(Toolbox().base_url + '/test_parent')
  293. }
  294. def test_put_prefer_handling(self, random_uuid):
  295. '''
  296. Trying to PUT an existing resource should:
  297. - Return a 204 if the payload is empty
  298. - Return a 204 if the payload is RDF, server-managed triples are
  299. included and the 'Prefer' header is set to 'handling=lenient'
  300. - Return a 412 (ServerManagedTermError) if the payload is RDF,
  301. server-managed triples are included and handling is set to 'strict'
  302. '''
  303. path = '/ldp/put_pref_header01'
  304. assert self.client.put(path).status_code == 201
  305. assert self.client.get(path).status_code == 200
  306. assert self.client.put(path).status_code == 204
  307. with open('tests/data/rdf_payload_w_srv_mgd_trp.ttl', 'rb') as f:
  308. rsp_len = self.client.put(
  309. path,
  310. headers={
  311. 'Prefer' : 'handling=lenient',
  312. 'Content-Type' : 'text/turtle',
  313. },
  314. data=f
  315. )
  316. assert rsp_len.status_code == 204
  317. with open('tests/data/rdf_payload_w_srv_mgd_trp.ttl', 'rb') as f:
  318. rsp_strict = self.client.put(
  319. path,
  320. headers={
  321. 'Prefer' : 'handling=strict',
  322. 'Content-Type' : 'text/turtle',
  323. },
  324. data=f
  325. )
  326. assert rsp_strict.status_code == 412
  327. def test_embed_children(self, cont_structure):
  328. '''
  329. verify the "embed children" prefer header.
  330. '''
  331. parent_path = cont_structure['path']
  332. cont_resp = cont_structure['response']
  333. cont_subject = cont_structure['subject']
  334. minimal_resp = self.client.get(parent_path, headers={
  335. 'Prefer' : 'return=minimal',
  336. })
  337. incl_embed_children_resp = self.client.get(parent_path, headers={
  338. 'Prefer' : 'return=representation; include={}'\
  339. .format(Ldpr.EMBED_CHILD_RES_URI),
  340. })
  341. omit_embed_children_resp = self.client.get(parent_path, headers={
  342. 'Prefer' : 'return=representation; omit={}'\
  343. .format(Ldpr.EMBED_CHILD_RES_URI),
  344. })
  345. assert omit_embed_children_resp.data == cont_resp.data
  346. incl_g = Graph().parse(
  347. data=incl_embed_children_resp.data, format='turtle')
  348. omit_g = Graph().parse(
  349. data=omit_embed_children_resp.data, format='turtle')
  350. children = set(incl_g[cont_subject : nsc['ldp'].contains])
  351. assert len(children) == 3
  352. children = set(incl_g[cont_subject : nsc['ldp'].contains])
  353. for child_uri in children:
  354. assert set(incl_g[ child_uri : : ])
  355. assert not set(omit_g[ child_uri : : ])
  356. def test_return_children(self, cont_structure):
  357. '''
  358. verify the "return children" prefer header.
  359. '''
  360. parent_path = cont_structure['path']
  361. cont_resp = cont_structure['response']
  362. cont_subject = cont_structure['subject']
  363. incl_children_resp = self.client.get(parent_path, headers={
  364. 'Prefer' : 'return=representation; include={}'\
  365. .format(Ldpr.RETURN_CHILD_RES_URI),
  366. })
  367. omit_children_resp = self.client.get(parent_path, headers={
  368. 'Prefer' : 'return=representation; omit={}'\
  369. .format(Ldpr.RETURN_CHILD_RES_URI),
  370. })
  371. assert incl_children_resp.data == cont_resp.data
  372. incl_g = Graph().parse(data=incl_children_resp.data, format='turtle')
  373. omit_g = Graph().parse(data=omit_children_resp.data, format='turtle')
  374. children = incl_g[cont_subject : nsc['ldp'].contains]
  375. for child_uri in children:
  376. assert not omit_g[ cont_subject : nsc['ldp'].contains : child_uri ]
  377. def test_inbound_rel(self, cont_structure):
  378. '''
  379. verify the "inboud relationships" prefer header.
  380. '''
  381. parent_path = cont_structure['path']
  382. cont_resp = cont_structure['response']
  383. cont_subject = cont_structure['subject']
  384. incl_inbound_resp = self.client.get(parent_path, headers={
  385. 'Prefer' : 'return=representation; include={}'\
  386. .format(Ldpr.RETURN_INBOUND_REF_URI),
  387. })
  388. omit_inbound_resp = self.client.get(parent_path, headers={
  389. 'Prefer' : 'return=representation; omit={}'\
  390. .format(Ldpr.RETURN_INBOUND_REF_URI),
  391. })
  392. assert omit_inbound_resp.data == cont_resp.data
  393. incl_g = Graph().parse(data=incl_inbound_resp.data, format='turtle')
  394. omit_g = Graph().parse(data=omit_inbound_resp.data, format='turtle')
  395. assert set(incl_g[ : : cont_subject ])
  396. assert not set(omit_g[ : : cont_subject ])
  397. def test_srv_mgd_triples(self, cont_structure):
  398. '''
  399. verify the "server managed triples" prefer header.
  400. '''
  401. parent_path = cont_structure['path']
  402. cont_resp = cont_structure['response']
  403. cont_subject = cont_structure['subject']
  404. incl_srv_mgd_resp = self.client.get(parent_path, headers={
  405. 'Prefer' : 'return=representation; include={}'\
  406. .format(Ldpr.RETURN_SRV_MGD_RES_URI),
  407. })
  408. omit_srv_mgd_resp = self.client.get(parent_path, headers={
  409. 'Prefer' : 'return=representation; omit={}'\
  410. .format(Ldpr.RETURN_SRV_MGD_RES_URI),
  411. })
  412. assert incl_srv_mgd_resp.data == cont_resp.data
  413. incl_g = Graph().parse(data=incl_srv_mgd_resp.data, format='turtle')
  414. omit_g = Graph().parse(data=omit_srv_mgd_resp.data, format='turtle')
  415. for pred in {
  416. nsc['fcrepo'].created,
  417. nsc['fcrepo'].createdBy,
  418. nsc['fcrepo'].lastModified,
  419. nsc['fcrepo'].lastModifiedBy,
  420. nsc['ldp'].contains,
  421. }:
  422. assert set(incl_g[ cont_subject : pred : ])
  423. assert not set(omit_g[ cont_subject : pred : ])
  424. for type in {
  425. nsc['fcrepo'].Resource,
  426. nsc['ldp'].Container,
  427. nsc['ldp'].Resource,
  428. }:
  429. assert incl_g[ cont_subject : RDF.type : type ]
  430. assert not omit_g[ cont_subject : RDF.type : type ]
  431. def test_delete_no_tstone(self):
  432. '''
  433. Test the `no-tombstone` Prefer option.
  434. '''
  435. self.client.put('/ldp/test_delete_no_tstone01')
  436. self.client.put('/ldp/test_delete_no_tstone01/a')
  437. self.client.delete('/ldp/test_delete_no_tstone01', headers={
  438. 'prefer' : 'no-tombstone'})
  439. resp = self.client.get('/ldp/test_delete_no_tstone01')
  440. assert resp.status_code == 404
  441. child_resp = self.client.get('/ldp/test_delete_no_tstone01/a')
  442. assert child_resp.status_code == 404