test_ldp.py 19 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567
  1. import pytest
  2. import uuid
  3. from hashlib import sha1
  4. from flask import g
  5. from rdflib import Graph
  6. from rdflib.namespace import RDF
  7. from rdflib.term import Literal, URIRef
  8. from lakesuperior.dictionaries.namespaces import ns_collection as nsc
  9. from lakesuperior.model.ldpr import Ldpr
  10. @pytest.fixture(scope='module')
  11. def random_uuid():
  12. return str(uuid.uuid4())
  13. @pytest.mark.usefixtures('client_class')
  14. @pytest.mark.usefixtures('db')
  15. class TestLdp:
  16. '''
  17. Test HTTP interaction with LDP endpoint.
  18. '''
  19. def test_get_root_node(self):
  20. '''
  21. Get the root node from two different endpoints.
  22. The test triplestore must be initialized, hence the `db` fixture.
  23. '''
  24. ldp_resp = self.client.get('/ldp')
  25. rest_resp = self.client.get('/rest')
  26. assert ldp_resp.status_code == 200
  27. assert rest_resp.status_code == 200
  28. #assert ldp_resp.data == rest_resp.data
  29. def test_put_empty_resource(self, random_uuid):
  30. '''
  31. Check response headers for a PUT operation with empty payload.
  32. '''
  33. resp = self.client.put('/ldp/new_resource')
  34. assert resp.status_code == 201
  35. assert resp.data == bytes(
  36. '{}/new_resource'.format(g.webroot), 'utf-8')
  37. def test_put_existing_resource(self, random_uuid):
  38. '''
  39. Trying to PUT an existing resource should return a 204 if the payload
  40. is empty.
  41. '''
  42. path = '/ldp/nonidempotent01'
  43. put1_resp = self.client.put(path)
  44. assert put1_resp.status_code == 201
  45. assert self.client.get(path).status_code == 200
  46. put2_resp = self.client.put(path)
  47. assert put2_resp.status_code == 204
  48. assert put2_resp.data == b''
  49. def test_put_tree(self, client):
  50. '''
  51. PUT a resource with several path segments.
  52. The test should create intermediate path segments that are not
  53. accessible to PUT or POST.
  54. '''
  55. path = '/ldp/test_tree/a/b/c/d/e/f/g'
  56. self.client.put(path)
  57. assert self.client.get(path).status_code == 200
  58. assert self.client.put('/ldp/test_tree/a').status_code == 409
  59. assert self.client.post('/ldp/test_tree/a').status_code == 409
  60. def test_put_nested_tree(self, client):
  61. '''
  62. Verify that containment is set correctly in nested hierarchies.
  63. First put a new hierarchy and verify that the root node is its
  64. container; then put another hierarchy under it and verify that the
  65. first hierarchy is the container of the second one.
  66. '''
  67. uuid1 = 'test_nested_tree/a/b/c/d'
  68. uuid2 = uuid1 + '/e/f/g'
  69. path1 = '/ldp/' + uuid1
  70. path2 = '/ldp/' + uuid2
  71. self.client.put(path1)
  72. cont1_data = self.client.get('/ldp').data
  73. g1 = Graph().parse(data=cont1_data, format='turtle')
  74. assert g1[ URIRef(g.webroot + '/') : nsc['ldp'].contains : \
  75. URIRef(g.webroot + '/' + uuid1) ]
  76. self.client.put(path2)
  77. cont2_data = self.client.get(path1).data
  78. g1 = Graph().parse(data=cont2_data, format='turtle')
  79. assert g1[ URIRef(g.webroot + '/' + uuid1) : \
  80. nsc['ldp'].contains : \
  81. URIRef(g.webroot + '/' + uuid2) ]
  82. def test_put_ldp_rs(self, client):
  83. '''
  84. PUT a resource with RDF payload and verify.
  85. '''
  86. with open('tests/data/marcel_duchamp_single_subject.ttl', 'rb') as f:
  87. self.client.put('/ldp/ldprs01', data=f, content_type='text/turtle')
  88. resp = self.client.get('/ldp/ldprs01',
  89. headers={'accept' : 'text/turtle'})
  90. assert resp.status_code == 200
  91. gr = Graph().parse(data=resp.data, format='text/turtle')
  92. assert URIRef('http://vocab.getty.edu/ontology#Subject') in \
  93. gr.objects(None, RDF.type)
  94. def test_put_ldp_nr(self, rnd_img):
  95. '''
  96. PUT a resource with binary payload and verify checksums.
  97. '''
  98. rnd_img['content'].seek(0)
  99. resp = self.client.put('/ldp/ldpnr01', data=rnd_img['content'],
  100. headers={
  101. 'Content-Disposition' : 'attachment; filename={}'.format(
  102. rnd_img['filename'])})
  103. assert resp.status_code == 201
  104. resp = self.client.get('/ldp/ldpnr01', headers={'accept' : 'image/png'})
  105. assert resp.status_code == 200
  106. assert sha1(resp.data).hexdigest() == rnd_img['hash']
  107. def test_put_mismatched_ldp_rs(self, rnd_img):
  108. '''
  109. Verify MIME type / LDP mismatch.
  110. PUT a LDP-RS, then PUT a LDP-NR on the same location and verify it
  111. fails.
  112. '''
  113. path = '/ldp/' + str(uuid.uuid4())
  114. rnd_img['content'].seek(0)
  115. ldp_nr_resp = self.client.put(path, data=rnd_img['content'],
  116. headers={
  117. 'Content-Disposition' : 'attachment; filename={}'.format(
  118. rnd_img['filename'])})
  119. assert ldp_nr_resp.status_code == 201
  120. with open('tests/data/marcel_duchamp_single_subject.ttl', 'rb') as f:
  121. ldp_rs_resp = self.client.put(path, data=f,
  122. content_type='text/turtle')
  123. assert ldp_rs_resp.status_code == 415
  124. def test_put_mismatched_ldp_nr(self, rnd_img):
  125. '''
  126. Verify MIME type / LDP mismatch.
  127. PUT a LDP-NR, then PUT a LDP-RS on the same location and verify it
  128. fails.
  129. '''
  130. path = '/ldp/' + str(uuid.uuid4())
  131. with open('tests/data/marcel_duchamp_single_subject.ttl', 'rb') as f:
  132. ldp_rs_resp = self.client.put(path, data=f,
  133. content_type='text/turtle')
  134. assert ldp_rs_resp.status_code == 201
  135. rnd_img['content'].seek(0)
  136. ldp_nr_resp = self.client.put(path, data=rnd_img['content'],
  137. headers={
  138. 'Content-Disposition' : 'attachment; filename={}'.format(
  139. rnd_img['filename'])})
  140. assert ldp_nr_resp.status_code == 415
  141. def test_post_resource(self, client):
  142. '''
  143. Check response headers for a POST operation with empty payload.
  144. '''
  145. res = self.client.post('/ldp/')
  146. assert res.status_code == 201
  147. assert 'Location' in res.headers
  148. def test_post_slug(self):
  149. '''
  150. Verify that a POST with slug results in the expected URI only if the
  151. resource does not exist already.
  152. '''
  153. slug01_resp = self.client.post('/ldp', headers={'slug' : 'slug01'})
  154. assert slug01_resp.status_code == 201
  155. assert slug01_resp.headers['location'] == \
  156. g.webroot + '/slug01'
  157. slug02_resp = self.client.post('/ldp', headers={'slug' : 'slug01'})
  158. assert slug02_resp.status_code == 201
  159. assert slug02_resp.headers['location'] != \
  160. g.webroot + '/slug01'
  161. def test_post_404(self):
  162. '''
  163. Verify that a POST to a non-existing parent results in a 404.
  164. '''
  165. assert self.client.post('/ldp/{}'.format(uuid.uuid4()))\
  166. .status_code == 404
  167. def test_post_409(self, rnd_img):
  168. '''
  169. Verify that you cannot POST to a binary resource.
  170. '''
  171. rnd_img['content'].seek(0)
  172. self.client.put('/ldp/post_409', data=rnd_img['content'], headers={
  173. 'Content-Disposition' : 'attachment; filename={}'.format(
  174. rnd_img['filename'])})
  175. assert self.client.post('/ldp/post_409').status_code == 409
  176. def test_patch(self):
  177. '''
  178. Test patching a resource.
  179. '''
  180. path = '/ldp/test_patch01'
  181. self.client.put(path)
  182. uri = g.webroot + '/test_patch01'
  183. with open('tests/data/sparql_update/simple_insert.sparql') as data:
  184. resp = self.client.patch(path,
  185. data=data,
  186. headers={'content-type' : 'application/sparql-update'})
  187. assert resp.status_code == 204
  188. resp = self.client.get(path)
  189. gr = Graph().parse(data=resp.data, format='text/turtle')
  190. assert gr[ URIRef(uri) : nsc['dc'].title : Literal('Hello') ]
  191. self.client.patch(path,
  192. data=open('tests/data/sparql_update/delete+insert+where.sparql'),
  193. headers={'content-type' : 'application/sparql-update'})
  194. resp = self.client.get(path)
  195. gr = Graph().parse(data=resp.data, format='text/turtle')
  196. assert gr[ URIRef(uri) : nsc['dc'].title : Literal('Ciao') ]
  197. def test_patch_ldp_nr_metadata(self):
  198. '''
  199. Test patching a LDP-NR metadata resource, both from the fcr:metadata
  200. and the resource URIs.
  201. '''
  202. path = '/ldp/ldpnr01'
  203. with open('tests/data/sparql_update/simple_insert.sparql') as data:
  204. self.client.patch(path + '/fcr:metadata',
  205. data=data,
  206. headers={'content-type' : 'application/sparql-update'})
  207. resp = self.client.get(path + '/fcr:metadata')
  208. assert resp.status_code == 200
  209. uri = g.webroot + '/ldpnr01'
  210. gr = Graph().parse(data=resp.data, format='text/turtle')
  211. assert gr[ URIRef(uri) : nsc['dc'].title : Literal('Hello') ]
  212. with open(
  213. 'tests/data/sparql_update/delete+insert+where.sparql') as data:
  214. patch_resp = self.client.patch(path,
  215. data=data,
  216. headers={'content-type' : 'application/sparql-update'})
  217. assert patch_resp.status_code == 204
  218. resp = self.client.get(path + '/fcr:metadata')
  219. assert resp.status_code == 200
  220. gr = Graph().parse(data=resp.data, format='text/turtle')
  221. assert gr[ URIRef(uri) : nsc['dc'].title : Literal('Ciao') ]
  222. def test_patch_ldp_nr(self, rnd_img):
  223. '''
  224. Verify that a PATCH using anything other than an
  225. `application/sparql-update` MIME type results in an error.
  226. '''
  227. rnd_img['content'].seek(0)
  228. resp = self.client.patch('/ldp/ldpnr01/fcr:metadata',
  229. data=rnd_img,
  230. headers={'content-type' : 'image/jpeg'})
  231. assert resp.status_code == 415
  232. def test_delete(self):
  233. '''
  234. Test delete response codes.
  235. '''
  236. create_resp = self.client.put('/ldp/test_delete01')
  237. delete_resp = self.client.delete('/ldp/test_delete01')
  238. assert delete_resp.status_code == 204
  239. bogus_delete_resp = self.client.delete('/ldp/test_delete101')
  240. assert bogus_delete_resp.status_code == 404
  241. def test_tombstone(self):
  242. '''
  243. Test tombstone behaviors.
  244. '''
  245. tstone_resp = self.client.get('/ldp/test_delete01')
  246. assert tstone_resp.status_code == 410
  247. assert tstone_resp.headers['Link'] == \
  248. '<{}/test_delete01/fcr:tombstone>; rel="hasTombstone"'\
  249. .format(g.webroot)
  250. tstone_path = '/ldp/test_delete01/fcr:tombstone'
  251. assert self.client.get(tstone_path).status_code == 405
  252. assert self.client.put(tstone_path).status_code == 405
  253. assert self.client.post(tstone_path).status_code == 405
  254. assert self.client.delete(tstone_path).status_code == 204
  255. assert self.client.get('/ldp/test_delete01').status_code == 404
  256. def test_delete_recursive(self):
  257. '''
  258. Test response codes for resources deleted recursively and their
  259. tombstones.
  260. '''
  261. self.client.put('/ldp/test_delete_recursive01')
  262. self.client.put('/ldp/test_delete_recursive01/a')
  263. self.client.delete('/ldp/test_delete_recursive01')
  264. tstone_resp = self.client.get('/ldp/test_delete_recursive01')
  265. assert tstone_resp.status_code == 410
  266. assert tstone_resp.headers['Link'] == \
  267. '<{}/test_delete_recursive01/fcr:tombstone>; rel="hasTombstone"'\
  268. .format(g.webroot)
  269. child_tstone_resp = self.client.get('/ldp/test_delete_recursive01/a')
  270. assert child_tstone_resp.status_code == tstone_resp.status_code
  271. assert 'Link' not in child_tstone_resp.headers.keys()
  272. @pytest.mark.usefixtures('client_class')
  273. @pytest.mark.usefixtures('db')
  274. class TestPrefHeader:
  275. '''
  276. Test various combinations of `Prefer` header.
  277. '''
  278. @pytest.fixture(scope='class')
  279. def cont_structure(self):
  280. '''
  281. Create a container structure to be used for subsequent requests.
  282. '''
  283. parent_path = '/ldp/test_parent'
  284. self.client.put(parent_path)
  285. self.client.put(parent_path + '/child1')
  286. self.client.put(parent_path + '/child2')
  287. self.client.put(parent_path + '/child3')
  288. return {
  289. 'path' : parent_path,
  290. 'response' : self.client.get(parent_path),
  291. 'subject' : URIRef(g.webroot + '/test_parent')
  292. }
  293. def test_put_prefer_handling(self, random_uuid):
  294. '''
  295. Trying to PUT an existing resource should:
  296. - Return a 204 if the payload is empty
  297. - Return a 204 if the payload is RDF, server-managed triples are
  298. included and the 'Prefer' header is set to 'handling=lenient'
  299. - Return a 412 (ServerManagedTermError) if the payload is RDF,
  300. server-managed triples are included and handling is set to 'strict'
  301. '''
  302. path = '/ldp/put_pref_header01'
  303. assert self.client.put(path).status_code == 201
  304. assert self.client.get(path).status_code == 200
  305. assert self.client.put(path).status_code == 204
  306. with open('tests/data/rdf_payload_w_srv_mgd_trp.ttl', 'rb') as f:
  307. rsp_len = self.client.put(
  308. path,
  309. headers={
  310. 'Prefer' : 'handling=lenient',
  311. 'Content-Type' : 'text/turtle',
  312. },
  313. data=f
  314. )
  315. assert rsp_len.status_code == 204
  316. with open('tests/data/rdf_payload_w_srv_mgd_trp.ttl', 'rb') as f:
  317. rsp_strict = self.client.put(
  318. path,
  319. headers={
  320. 'Prefer' : 'handling=strict',
  321. 'Content-Type' : 'text/turtle',
  322. },
  323. data=f
  324. )
  325. assert rsp_strict.status_code == 412
  326. def test_embed_children(self, cont_structure):
  327. '''
  328. verify the "embed children" prefer header.
  329. '''
  330. parent_path = cont_structure['path']
  331. cont_resp = cont_structure['response']
  332. cont_subject = cont_structure['subject']
  333. minimal_resp = self.client.get(parent_path, headers={
  334. 'Prefer' : 'return=minimal',
  335. })
  336. incl_embed_children_resp = self.client.get(parent_path, headers={
  337. 'Prefer' : 'return=representation; include={}'\
  338. .format(Ldpr.EMBED_CHILD_RES_URI),
  339. })
  340. omit_embed_children_resp = self.client.get(parent_path, headers={
  341. 'Prefer' : 'return=representation; omit={}'\
  342. .format(Ldpr.EMBED_CHILD_RES_URI),
  343. })
  344. assert omit_embed_children_resp.data == cont_resp.data
  345. incl_gr = Graph().parse(
  346. data=incl_embed_children_resp.data, format='turtle')
  347. omit_gr = Graph().parse(
  348. data=omit_embed_children_resp.data, format='turtle')
  349. children = set(incl_gr[cont_subject : nsc['ldp'].contains])
  350. assert len(children) == 3
  351. children = set(incl_gr[cont_subject : nsc['ldp'].contains])
  352. for child_uri in children:
  353. assert set(incl_gr[ child_uri : : ])
  354. assert not set(omit_gr[ child_uri : : ])
  355. def test_return_children(self, cont_structure):
  356. '''
  357. verify the "return children" prefer header.
  358. '''
  359. parent_path = cont_structure['path']
  360. cont_resp = cont_structure['response']
  361. cont_subject = cont_structure['subject']
  362. incl_children_resp = self.client.get(parent_path, headers={
  363. 'Prefer' : 'return=representation; include={}'\
  364. .format(Ldpr.RETURN_CHILD_RES_URI),
  365. })
  366. omit_children_resp = self.client.get(parent_path, headers={
  367. 'Prefer' : 'return=representation; omit={}'\
  368. .format(Ldpr.RETURN_CHILD_RES_URI),
  369. })
  370. assert incl_children_resp.data == cont_resp.data
  371. incl_gr = Graph().parse(data=incl_children_resp.data, format='turtle')
  372. omit_gr = Graph().parse(data=omit_children_resp.data, format='turtle')
  373. children = incl_gr[cont_subject : nsc['ldp'].contains]
  374. for child_uri in children:
  375. assert not omit_gr[ cont_subject : nsc['ldp'].contains : child_uri ]
  376. def test_inbound_rel(self, cont_structure):
  377. '''
  378. verify the "inboud relationships" prefer header.
  379. '''
  380. parent_path = cont_structure['path']
  381. cont_resp = cont_structure['response']
  382. cont_subject = cont_structure['subject']
  383. incl_inbound_resp = self.client.get(parent_path, headers={
  384. 'Prefer' : 'return=representation; include={}'\
  385. .format(Ldpr.RETURN_INBOUND_REF_URI),
  386. })
  387. omit_inbound_resp = self.client.get(parent_path, headers={
  388. 'Prefer' : 'return=representation; omit={}'\
  389. .format(Ldpr.RETURN_INBOUND_REF_URI),
  390. })
  391. assert omit_inbound_resp.data == cont_resp.data
  392. incl_gr = Graph().parse(data=incl_inbound_resp.data, format='turtle')
  393. omit_gr = Graph().parse(data=omit_inbound_resp.data, format='turtle')
  394. assert set(incl_gr[ : : cont_subject ])
  395. assert not set(omit_gr[ : : cont_subject ])
  396. def test_srv_mgd_triples(self, cont_structure):
  397. '''
  398. verify the "server managed triples" prefer header.
  399. '''
  400. parent_path = cont_structure['path']
  401. cont_resp = cont_structure['response']
  402. cont_subject = cont_structure['subject']
  403. incl_srv_mgd_resp = self.client.get(parent_path, headers={
  404. 'Prefer' : 'return=representation; include={}'\
  405. .format(Ldpr.RETURN_SRV_MGD_RES_URI),
  406. })
  407. omit_srv_mgd_resp = self.client.get(parent_path, headers={
  408. 'Prefer' : 'return=representation; omit={}'\
  409. .format(Ldpr.RETURN_SRV_MGD_RES_URI),
  410. })
  411. assert incl_srv_mgd_resp.data == cont_resp.data
  412. incl_gr = Graph().parse(data=incl_srv_mgd_resp.data, format='turtle')
  413. omit_gr = Graph().parse(data=omit_srv_mgd_resp.data, format='turtle')
  414. for pred in {
  415. nsc['fcrepo'].created,
  416. nsc['fcrepo'].createdBy,
  417. nsc['fcrepo'].lastModified,
  418. nsc['fcrepo'].lastModifiedBy,
  419. nsc['ldp'].contains,
  420. }:
  421. assert set(incl_gr[ cont_subject : pred : ])
  422. assert not set(omit_gr[ cont_subject : pred : ])
  423. for type in {
  424. nsc['fcrepo'].Resource,
  425. nsc['ldp'].Container,
  426. nsc['ldp'].Resource,
  427. }:
  428. assert incl_gr[ cont_subject : RDF.type : type ]
  429. assert not omit_gr[ cont_subject : RDF.type : type ]
  430. def test_delete_no_tstone(self):
  431. '''
  432. Test the `no-tombstone` Prefer option.
  433. '''
  434. self.client.put('/ldp/test_delete_no_tstone01')
  435. self.client.put('/ldp/test_delete_no_tstone01/a')
  436. self.client.delete('/ldp/test_delete_no_tstone01', headers={
  437. 'prefer' : 'no-tombstone'})
  438. resp = self.client.get('/ldp/test_delete_no_tstone01')
  439. assert resp.status_code == 404
  440. child_resp = self.client.get('/ldp/test_delete_no_tstone01/a')
  441. assert child_resp.status_code == 404