test_ldp.py 19 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566
  1. import pytest
  2. import uuid
  3. from hashlib import sha1
  4. from flask import g
  5. from rdflib import Graph
  6. from rdflib.namespace import RDF
  7. from rdflib.term import Literal, URIRef
  8. from lakesuperior.dictionaries.namespaces import ns_collection as nsc
  9. from lakesuperior.model.ldpr import Ldpr
  10. @pytest.fixture(scope='module')
  11. def random_uuid():
  12. return str(uuid.uuid4())
  13. @pytest.mark.usefixtures('client_class')
  14. @pytest.mark.usefixtures('db')
  15. class TestLdp:
  16. '''
  17. Test HTTP interaction with LDP endpoint.
  18. '''
  19. def test_get_root_node(self):
  20. '''
  21. Get the root node from two different endpoints.
  22. The test triplestore must be initialized, hence the `db` fixture.
  23. '''
  24. ldp_resp = self.client.get('/ldp')
  25. rest_resp = self.client.get('/rest')
  26. assert ldp_resp.status_code == 200
  27. assert rest_resp.status_code == 200
  28. def test_put_empty_resource(self, random_uuid):
  29. '''
  30. Check response headers for a PUT operation with empty payload.
  31. '''
  32. resp = self.client.put('/ldp/new_resource')
  33. assert resp.status_code == 201
  34. assert resp.data == bytes(
  35. '{}/new_resource'.format(g.webroot), 'utf-8')
  36. def test_put_existing_resource(self, random_uuid):
  37. '''
  38. Trying to PUT an existing resource should return a 204 if the payload
  39. is empty.
  40. '''
  41. path = '/ldp/nonidempotent01'
  42. put1_resp = self.client.put(path)
  43. assert put1_resp.status_code == 201
  44. assert self.client.get(path).status_code == 200
  45. put2_resp = self.client.put(path)
  46. assert put2_resp.status_code == 204
  47. assert put2_resp.data == b''
  48. def test_put_tree(self, client):
  49. '''
  50. PUT a resource with several path segments.
  51. The test should create intermediate path segments that are not
  52. accessible to PUT or POST.
  53. '''
  54. path = '/ldp/test_tree/a/b/c/d/e/f/g'
  55. self.client.put(path)
  56. assert self.client.get(path).status_code == 200
  57. assert self.client.put('/ldp/test_tree/a').status_code == 409
  58. assert self.client.post('/ldp/test_tree/a').status_code == 409
  59. def test_put_nested_tree(self, client):
  60. '''
  61. Verify that containment is set correctly in nested hierarchies.
  62. First put a new hierarchy and verify that the root node is its
  63. container; then put another hierarchy under it and verify that the
  64. first hierarchy is the container of the second one.
  65. '''
  66. uuid1 = 'test_nested_tree/a/b/c/d'
  67. uuid2 = uuid1 + '/e/f/g'
  68. path1 = '/ldp/' + uuid1
  69. path2 = '/ldp/' + uuid2
  70. self.client.put(path1)
  71. cont1_data = self.client.get('/ldp').data
  72. gr1 = Graph().parse(data=cont1_data, format='turtle')
  73. assert gr1[ URIRef(g.webroot + '/') : nsc['ldp'].contains : \
  74. URIRef(g.webroot + '/' + uuid1) ]
  75. self.client.put(path2)
  76. cont2_data = self.client.get(path1).data
  77. gr2 = Graph().parse(data=cont2_data, format='turtle')
  78. assert gr2[ URIRef(g.webroot + '/' + uuid1) : \
  79. nsc['ldp'].contains : \
  80. URIRef(g.webroot + '/' + uuid2) ]
  81. def test_put_ldp_rs(self, client):
  82. '''
  83. PUT a resource with RDF payload and verify.
  84. '''
  85. with open('tests/data/marcel_duchamp_single_subject.ttl', 'rb') as f:
  86. self.client.put('/ldp/ldprs01', data=f, content_type='text/turtle')
  87. resp = self.client.get('/ldp/ldprs01',
  88. headers={'accept' : 'text/turtle'})
  89. assert resp.status_code == 200
  90. gr = Graph().parse(data=resp.data, format='text/turtle')
  91. assert URIRef('http://vocab.getty.edu/ontology#Subject') in \
  92. gr.objects(None, RDF.type)
  93. def test_put_ldp_nr(self, rnd_img):
  94. '''
  95. PUT a resource with binary payload and verify checksums.
  96. '''
  97. rnd_img['content'].seek(0)
  98. resp = self.client.put('/ldp/ldpnr01', data=rnd_img['content'],
  99. headers={
  100. 'Content-Disposition' : 'attachment; filename={}'.format(
  101. rnd_img['filename'])})
  102. assert resp.status_code == 201
  103. resp = self.client.get('/ldp/ldpnr01', headers={'accept' : 'image/png'})
  104. assert resp.status_code == 200
  105. assert sha1(resp.data).hexdigest() == rnd_img['hash']
  106. def test_put_mismatched_ldp_rs(self, rnd_img):
  107. '''
  108. Verify MIME type / LDP mismatch.
  109. PUT a LDP-RS, then PUT a LDP-NR on the same location and verify it
  110. fails.
  111. '''
  112. path = '/ldp/' + str(uuid.uuid4())
  113. rnd_img['content'].seek(0)
  114. ldp_nr_resp = self.client.put(path, data=rnd_img['content'],
  115. headers={
  116. 'Content-Disposition' : 'attachment; filename={}'.format(
  117. rnd_img['filename'])})
  118. assert ldp_nr_resp.status_code == 201
  119. with open('tests/data/marcel_duchamp_single_subject.ttl', 'rb') as f:
  120. ldp_rs_resp = self.client.put(path, data=f,
  121. content_type='text/turtle')
  122. assert ldp_rs_resp.status_code == 415
  123. def test_put_mismatched_ldp_nr(self, rnd_img):
  124. '''
  125. Verify MIME type / LDP mismatch.
  126. PUT a LDP-NR, then PUT a LDP-RS on the same location and verify it
  127. fails.
  128. '''
  129. path = '/ldp/' + str(uuid.uuid4())
  130. with open('tests/data/marcel_duchamp_single_subject.ttl', 'rb') as f:
  131. ldp_rs_resp = self.client.put(path, data=f,
  132. content_type='text/turtle')
  133. assert ldp_rs_resp.status_code == 201
  134. rnd_img['content'].seek(0)
  135. ldp_nr_resp = self.client.put(path, data=rnd_img['content'],
  136. headers={
  137. 'Content-Disposition' : 'attachment; filename={}'.format(
  138. rnd_img['filename'])})
  139. assert ldp_nr_resp.status_code == 415
  140. def test_post_resource(self, client):
  141. '''
  142. Check response headers for a POST operation with empty payload.
  143. '''
  144. res = self.client.post('/ldp/')
  145. assert res.status_code == 201
  146. assert 'Location' in res.headers
  147. def test_post_slug(self):
  148. '''
  149. Verify that a POST with slug results in the expected URI only if the
  150. resource does not exist already.
  151. '''
  152. slug01_resp = self.client.post('/ldp', headers={'slug' : 'slug01'})
  153. assert slug01_resp.status_code == 201
  154. assert slug01_resp.headers['location'] == \
  155. g.webroot + '/slug01'
  156. slug02_resp = self.client.post('/ldp', headers={'slug' : 'slug01'})
  157. assert slug02_resp.status_code == 201
  158. assert slug02_resp.headers['location'] != \
  159. g.webroot + '/slug01'
  160. def test_post_404(self):
  161. '''
  162. Verify that a POST to a non-existing parent results in a 404.
  163. '''
  164. assert self.client.post('/ldp/{}'.format(uuid.uuid4()))\
  165. .status_code == 404
  166. def test_post_409(self, rnd_img):
  167. '''
  168. Verify that you cannot POST to a binary resource.
  169. '''
  170. rnd_img['content'].seek(0)
  171. self.client.put('/ldp/post_409', data=rnd_img['content'], headers={
  172. 'Content-Disposition' : 'attachment; filename={}'.format(
  173. rnd_img['filename'])})
  174. assert self.client.post('/ldp/post_409').status_code == 409
  175. def test_patch(self):
  176. '''
  177. Test patching a resource.
  178. '''
  179. path = '/ldp/test_patch01'
  180. self.client.put(path)
  181. uri = g.webroot + '/test_patch01'
  182. with open('tests/data/sparql_update/simple_insert.sparql') as data:
  183. resp = self.client.patch(path,
  184. data=data,
  185. headers={'content-type' : 'application/sparql-update'})
  186. assert resp.status_code == 204
  187. resp = self.client.get(path)
  188. gr = Graph().parse(data=resp.data, format='text/turtle')
  189. assert gr[ URIRef(uri) : nsc['dc'].title : Literal('Hello') ]
  190. self.client.patch(path,
  191. data=open('tests/data/sparql_update/delete+insert+where.sparql'),
  192. headers={'content-type' : 'application/sparql-update'})
  193. resp = self.client.get(path)
  194. gr = Graph().parse(data=resp.data, format='text/turtle')
  195. assert gr[ URIRef(uri) : nsc['dc'].title : Literal('Ciao') ]
  196. def test_patch_ldp_nr_metadata(self):
  197. '''
  198. Test patching a LDP-NR metadata resource, both from the fcr:metadata
  199. and the resource URIs.
  200. '''
  201. path = '/ldp/ldpnr01'
  202. with open('tests/data/sparql_update/simple_insert.sparql') as data:
  203. self.client.patch(path + '/fcr:metadata',
  204. data=data,
  205. headers={'content-type' : 'application/sparql-update'})
  206. resp = self.client.get(path + '/fcr:metadata')
  207. assert resp.status_code == 200
  208. uri = g.webroot + '/ldpnr01'
  209. gr = Graph().parse(data=resp.data, format='text/turtle')
  210. assert gr[ URIRef(uri) : nsc['dc'].title : Literal('Hello') ]
  211. with open(
  212. 'tests/data/sparql_update/delete+insert+where.sparql') as data:
  213. patch_resp = self.client.patch(path,
  214. data=data,
  215. headers={'content-type' : 'application/sparql-update'})
  216. assert patch_resp.status_code == 204
  217. resp = self.client.get(path + '/fcr:metadata')
  218. assert resp.status_code == 200
  219. gr = Graph().parse(data=resp.data, format='text/turtle')
  220. assert gr[ URIRef(uri) : nsc['dc'].title : Literal('Ciao') ]
  221. def test_patch_ldp_nr(self, rnd_img):
  222. '''
  223. Verify that a PATCH using anything other than an
  224. `application/sparql-update` MIME type results in an error.
  225. '''
  226. rnd_img['content'].seek(0)
  227. resp = self.client.patch('/ldp/ldpnr01/fcr:metadata',
  228. data=rnd_img,
  229. headers={'content-type' : 'image/jpeg'})
  230. assert resp.status_code == 415
  231. def test_delete(self):
  232. '''
  233. Test delete response codes.
  234. '''
  235. create_resp = self.client.put('/ldp/test_delete01')
  236. delete_resp = self.client.delete('/ldp/test_delete01')
  237. assert delete_resp.status_code == 204
  238. bogus_delete_resp = self.client.delete('/ldp/test_delete101')
  239. assert bogus_delete_resp.status_code == 404
  240. def test_tombstone(self):
  241. '''
  242. Test tombstone behaviors.
  243. '''
  244. tstone_resp = self.client.get('/ldp/test_delete01')
  245. assert tstone_resp.status_code == 410
  246. assert tstone_resp.headers['Link'] == \
  247. '<{}/test_delete01/fcr:tombstone>; rel="hasTombstone"'\
  248. .format(g.webroot)
  249. tstone_path = '/ldp/test_delete01/fcr:tombstone'
  250. assert self.client.get(tstone_path).status_code == 405
  251. assert self.client.put(tstone_path).status_code == 405
  252. assert self.client.post(tstone_path).status_code == 405
  253. assert self.client.delete(tstone_path).status_code == 204
  254. assert self.client.get('/ldp/test_delete01').status_code == 404
  255. def test_delete_recursive(self):
  256. '''
  257. Test response codes for resources deleted recursively and their
  258. tombstones.
  259. '''
  260. self.client.put('/ldp/test_delete_recursive01')
  261. self.client.put('/ldp/test_delete_recursive01/a')
  262. self.client.delete('/ldp/test_delete_recursive01')
  263. tstone_resp = self.client.get('/ldp/test_delete_recursive01')
  264. assert tstone_resp.status_code == 410
  265. assert tstone_resp.headers['Link'] == \
  266. '<{}/test_delete_recursive01/fcr:tombstone>; rel="hasTombstone"'\
  267. .format(g.webroot)
  268. child_tstone_resp = self.client.get('/ldp/test_delete_recursive01/a')
  269. assert child_tstone_resp.status_code == tstone_resp.status_code
  270. assert 'Link' not in child_tstone_resp.headers.keys()
  271. @pytest.mark.usefixtures('client_class')
  272. @pytest.mark.usefixtures('db')
  273. class TestPrefHeader:
  274. '''
  275. Test various combinations of `Prefer` header.
  276. '''
  277. @pytest.fixture(scope='class')
  278. def cont_structure(self):
  279. '''
  280. Create a container structure to be used for subsequent requests.
  281. '''
  282. parent_path = '/ldp/test_parent'
  283. self.client.put(parent_path)
  284. self.client.put(parent_path + '/child1')
  285. self.client.put(parent_path + '/child2')
  286. self.client.put(parent_path + '/child3')
  287. return {
  288. 'path' : parent_path,
  289. 'response' : self.client.get(parent_path),
  290. 'subject' : URIRef(g.webroot + '/test_parent')
  291. }
  292. def test_put_prefer_handling(self, random_uuid):
  293. '''
  294. Trying to PUT an existing resource should:
  295. - Return a 204 if the payload is empty
  296. - Return a 204 if the payload is RDF, server-managed triples are
  297. included and the 'Prefer' header is set to 'handling=lenient'
  298. - Return a 412 (ServerManagedTermError) if the payload is RDF,
  299. server-managed triples are included and handling is set to 'strict'
  300. '''
  301. path = '/ldp/put_pref_header01'
  302. assert self.client.put(path).status_code == 201
  303. assert self.client.get(path).status_code == 200
  304. assert self.client.put(path).status_code == 204
  305. with open('tests/data/rdf_payload_w_srv_mgd_trp.ttl', 'rb') as f:
  306. rsp_len = self.client.put(
  307. path,
  308. headers={
  309. 'Prefer' : 'handling=lenient',
  310. 'Content-Type' : 'text/turtle',
  311. },
  312. data=f
  313. )
  314. assert rsp_len.status_code == 204
  315. with open('tests/data/rdf_payload_w_srv_mgd_trp.ttl', 'rb') as f:
  316. rsp_strict = self.client.put(
  317. path,
  318. headers={
  319. 'Prefer' : 'handling=strict',
  320. 'Content-Type' : 'text/turtle',
  321. },
  322. data=f
  323. )
  324. assert rsp_strict.status_code == 412
  325. def test_embed_children(self, cont_structure):
  326. '''
  327. verify the "embed children" prefer header.
  328. '''
  329. parent_path = cont_structure['path']
  330. cont_resp = cont_structure['response']
  331. cont_subject = cont_structure['subject']
  332. minimal_resp = self.client.get(parent_path, headers={
  333. 'Prefer' : 'return=minimal',
  334. })
  335. incl_embed_children_resp = self.client.get(parent_path, headers={
  336. 'Prefer' : 'return=representation; include={}'\
  337. .format(Ldpr.EMBED_CHILD_RES_URI),
  338. })
  339. omit_embed_children_resp = self.client.get(parent_path, headers={
  340. 'Prefer' : 'return=representation; omit={}'\
  341. .format(Ldpr.EMBED_CHILD_RES_URI),
  342. })
  343. assert omit_embed_children_resp.data == cont_resp.data
  344. incl_gr = Graph().parse(
  345. data=incl_embed_children_resp.data, format='turtle')
  346. omit_gr = Graph().parse(
  347. data=omit_embed_children_resp.data, format='turtle')
  348. children = set(incl_gr[cont_subject : nsc['ldp'].contains])
  349. assert len(children) == 3
  350. children = set(incl_gr[cont_subject : nsc['ldp'].contains])
  351. for child_uri in children:
  352. assert set(incl_gr[ child_uri : : ])
  353. assert not set(omit_gr[ child_uri : : ])
  354. def test_return_children(self, cont_structure):
  355. '''
  356. verify the "return children" prefer header.
  357. '''
  358. parent_path = cont_structure['path']
  359. cont_resp = cont_structure['response']
  360. cont_subject = cont_structure['subject']
  361. incl_children_resp = self.client.get(parent_path, headers={
  362. 'Prefer' : 'return=representation; include={}'\
  363. .format(Ldpr.RETURN_CHILD_RES_URI),
  364. })
  365. omit_children_resp = self.client.get(parent_path, headers={
  366. 'Prefer' : 'return=representation; omit={}'\
  367. .format(Ldpr.RETURN_CHILD_RES_URI),
  368. })
  369. assert incl_children_resp.data == cont_resp.data
  370. incl_gr = Graph().parse(data=incl_children_resp.data, format='turtle')
  371. omit_gr = Graph().parse(data=omit_children_resp.data, format='turtle')
  372. children = incl_gr[cont_subject : nsc['ldp'].contains]
  373. for child_uri in children:
  374. assert not omit_gr[ cont_subject : nsc['ldp'].contains : child_uri ]
  375. def test_inbound_rel(self, cont_structure):
  376. '''
  377. verify the "inboud relationships" prefer header.
  378. '''
  379. parent_path = cont_structure['path']
  380. cont_resp = cont_structure['response']
  381. cont_subject = cont_structure['subject']
  382. incl_inbound_resp = self.client.get(parent_path, headers={
  383. 'Prefer' : 'return=representation; include={}'\
  384. .format(Ldpr.RETURN_INBOUND_REF_URI),
  385. })
  386. omit_inbound_resp = self.client.get(parent_path, headers={
  387. 'Prefer' : 'return=representation; omit={}'\
  388. .format(Ldpr.RETURN_INBOUND_REF_URI),
  389. })
  390. assert omit_inbound_resp.data == cont_resp.data
  391. incl_gr = Graph().parse(data=incl_inbound_resp.data, format='turtle')
  392. omit_gr = Graph().parse(data=omit_inbound_resp.data, format='turtle')
  393. assert set(incl_gr[ : : cont_subject ])
  394. assert not set(omit_gr[ : : cont_subject ])
  395. def test_srv_mgd_triples(self, cont_structure):
  396. '''
  397. verify the "server managed triples" prefer header.
  398. '''
  399. parent_path = cont_structure['path']
  400. cont_resp = cont_structure['response']
  401. cont_subject = cont_structure['subject']
  402. incl_srv_mgd_resp = self.client.get(parent_path, headers={
  403. 'Prefer' : 'return=representation; include={}'\
  404. .format(Ldpr.RETURN_SRV_MGD_RES_URI),
  405. })
  406. omit_srv_mgd_resp = self.client.get(parent_path, headers={
  407. 'Prefer' : 'return=representation; omit={}'\
  408. .format(Ldpr.RETURN_SRV_MGD_RES_URI),
  409. })
  410. assert incl_srv_mgd_resp.data == cont_resp.data
  411. incl_gr = Graph().parse(data=incl_srv_mgd_resp.data, format='turtle')
  412. omit_gr = Graph().parse(data=omit_srv_mgd_resp.data, format='turtle')
  413. for pred in {
  414. nsc['fcrepo'].created,
  415. nsc['fcrepo'].createdBy,
  416. nsc['fcrepo'].lastModified,
  417. nsc['fcrepo'].lastModifiedBy,
  418. nsc['ldp'].contains,
  419. }:
  420. assert set(incl_gr[ cont_subject : pred : ])
  421. assert not set(omit_gr[ cont_subject : pred : ])
  422. for type in {
  423. nsc['fcrepo'].Resource,
  424. nsc['ldp'].Container,
  425. nsc['ldp'].Resource,
  426. }:
  427. assert incl_gr[ cont_subject : RDF.type : type ]
  428. assert not omit_gr[ cont_subject : RDF.type : type ]
  429. def test_delete_no_tstone(self):
  430. '''
  431. Test the `no-tombstone` Prefer option.
  432. '''
  433. self.client.put('/ldp/test_delete_no_tstone01')
  434. self.client.put('/ldp/test_delete_no_tstone01/a')
  435. self.client.delete('/ldp/test_delete_no_tstone01', headers={
  436. 'prefer' : 'no-tombstone'})
  437. resp = self.client.get('/ldp/test_delete_no_tstone01')
  438. assert resp.status_code == 404
  439. child_resp = self.client.get('/ldp/test_delete_no_tstone01/a')
  440. assert child_resp.status_code == 404