test_ldp.py 58 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690
  1. import pdb
  2. import pytest
  3. from base64 import b64encode
  4. from datetime import timedelta
  5. from hashlib import sha1
  6. from uuid import uuid4
  7. from werkzeug.http import http_date
  8. import arrow
  9. from flask import g
  10. from rdflib import Graph
  11. from rdflib.compare import isomorphic
  12. from rdflib.namespace import RDF
  13. from rdflib.term import Literal, URIRef
  14. from lakesuperior.dictionaries.namespaces import ns_collection as nsc
  15. from lakesuperior.model.ldpr import Ldpr
  16. @pytest.fixture(scope='module')
  17. def random_uuid():
  18. return str(uuid4())
  19. @pytest.mark.usefixtures('client_class')
  20. @pytest.mark.usefixtures('db')
  21. class TestLdp:
  22. """
  23. Test HTTP interaction with LDP endpoint.
  24. """
  25. def test_get_root_node(self):
  26. """
  27. Get the root node from two different endpoints.
  28. The test triplestore must be initialized, hence the `db` fixture.
  29. """
  30. ldp_resp = self.client.get('/ldp')
  31. rest_resp = self.client.get('/rest')
  32. assert ldp_resp.status_code == 200
  33. assert rest_resp.status_code == 200
  34. def test_put_empty_resource(self, random_uuid):
  35. """
  36. Check response headers for a PUT operation with empty payload.
  37. """
  38. resp = self.client.put('/ldp/new_resource')
  39. assert resp.status_code == 201
  40. assert resp.data == bytes(
  41. '{}/new_resource'.format(g.webroot), 'utf-8')
  42. def test_put_existing_resource(self, random_uuid):
  43. """
  44. Trying to PUT an existing resource should return a 204 if the payload
  45. is empty.
  46. """
  47. path = '/ldp/nonidempotent01'
  48. put1_resp = self.client.put(path)
  49. assert put1_resp.status_code == 201
  50. assert self.client.get(path).status_code == 200
  51. put2_resp = self.client.put(path)
  52. with open('tests/data/marcel_duchamp_single_subject.ttl', 'rb') as f:
  53. put2_resp = self.client.put(
  54. path, data=f, content_type='text/turtle')
  55. assert put2_resp.status_code == 204
  56. put2_resp = self.client.put(path)
  57. assert put2_resp.status_code == 204
  58. def test_put_tree(self, client):
  59. """
  60. PUT a resource with several path segments.
  61. The test should create intermediate path segments that are LDPCs,
  62. accessible to PUT or POST.
  63. """
  64. path = '/ldp/test_tree/a/b/c/d/e/f/g'
  65. self.client.put(path)
  66. assert self.client.get(path).status_code == 200
  67. assert self.client.get('/ldp/test_tree/a/b/c').status_code == 200
  68. assert self.client.post('/ldp/test_tree/a/b').status_code == 201
  69. with open('tests/data/marcel_duchamp_single_subject.ttl', 'rb') as f:
  70. put_int_resp = self.client.put(
  71. 'ldp/test_tree/a', data=f, content_type='text/turtle')
  72. assert put_int_resp.status_code == 204
  73. # @TODO More thorough testing of contents
  74. def test_put_nested_tree(self, client):
  75. """
  76. Verify that containment is set correctly in nested hierarchies.
  77. First put a new hierarchy and verify that the root node is its
  78. container; then put another hierarchy under it and verify that the
  79. first hierarchy is the container of the second one.
  80. """
  81. uuid1 = 'test_nested_tree/a/b/c/d'
  82. uuid2 = uuid1 + '/e/f/g'
  83. path1 = '/ldp/' + uuid1
  84. path2 = '/ldp/' + uuid2
  85. self.client.put(path1)
  86. cont1_data = self.client.get('/ldp').data
  87. gr1 = Graph().parse(data=cont1_data, format='turtle')
  88. assert gr1[ URIRef(g.webroot + '/') : nsc['ldp'].contains : \
  89. URIRef(g.webroot + '/test_nested_tree') ]
  90. self.client.put(path2)
  91. cont2_data = self.client.get(path1).data
  92. gr2 = Graph().parse(data=cont2_data, format='turtle')
  93. assert gr2[ URIRef(g.webroot + '/' + uuid1) : \
  94. nsc['ldp'].contains : \
  95. URIRef(g.webroot + '/' + uuid1 + '/e') ]
  96. def test_put_ldp_rs(self, client):
  97. """
  98. PUT a resource with RDF payload and verify.
  99. """
  100. with open('tests/data/marcel_duchamp_single_subject.ttl', 'rb') as f:
  101. self.client.put('/ldp/ldprs01', data=f, content_type='text/turtle')
  102. resp = self.client.get('/ldp/ldprs01',
  103. headers={'accept' : 'text/turtle'})
  104. assert resp.status_code == 200
  105. gr = Graph().parse(data=resp.data, format='text/turtle')
  106. assert URIRef('http://vocab.getty.edu/ontology#Subject') in \
  107. gr.objects(None, RDF.type)
  108. def test_put_ldp_nr(self, rnd_img):
  109. """
  110. PUT a resource with binary payload and verify checksums.
  111. """
  112. rnd_img['content'].seek(0)
  113. resp = self.client.put('/ldp/ldpnr01', data=rnd_img['content'],
  114. headers={
  115. 'Content-Type': 'image/png',
  116. 'Content-Disposition' : 'attachment; filename={}'.format(
  117. rnd_img['filename'])})
  118. assert resp.status_code == 201
  119. resp = self.client.get(
  120. '/ldp/ldpnr01', headers={'accept' : 'image/png'})
  121. assert resp.status_code == 200
  122. assert sha1(resp.data).hexdigest() == rnd_img['hash']
  123. def test_put_ldp_nr_multipart(self, rnd_img):
  124. """
  125. PUT a resource with a multipart/form-data payload.
  126. """
  127. rnd_img['content'].seek(0)
  128. resp = self.client.put(
  129. '/ldp/ldpnr02',
  130. data={
  131. 'file': (
  132. rnd_img['content'], rnd_img['filename'],
  133. 'image/png',
  134. )
  135. }
  136. )
  137. assert resp.status_code == 201
  138. resp = self.client.get(
  139. '/ldp/ldpnr02', headers={'accept' : 'image/png'})
  140. assert resp.status_code == 200
  141. assert sha1(resp.data).hexdigest() == rnd_img['hash']
  142. def test_get_ldp_nr(self, rnd_img):
  143. """
  144. PUT a resource with binary payload and test various retieval methods.
  145. """
  146. uid = '/ldpnr03'
  147. path = '/ldp' + uid
  148. content = b'This is some exciting content.'
  149. resp = self.client.put(path, data=content,
  150. headers={
  151. 'Content-Type': 'text/plain',
  152. 'Content-Disposition' : 'attachment; filename=exciting.txt'})
  153. assert resp.status_code == 201
  154. uri = g.webroot + uid
  155. # Content retrieval methods.
  156. resp_bin1 = self.client.get(path)
  157. assert resp_bin1.status_code == 200
  158. assert resp_bin1.data == content
  159. resp_bin2 = self.client.get(path, headers={'accept' : 'text/plain'})
  160. assert resp_bin2.status_code == 200
  161. assert resp_bin2.data == content
  162. resp_bin3 = self.client.get(path + '/fcr:content')
  163. assert resp_bin3.status_code == 200
  164. assert resp_bin3.data == content
  165. # Metadata retrieval methods.
  166. resp_md1 = self.client.get(path, headers={'accept' : 'text/turtle'})
  167. assert resp_md1.status_code == 200
  168. gr1 = Graph().parse(data=resp_md1.data, format='text/turtle')
  169. assert gr1[ URIRef(uri) : nsc['rdf'].type : nsc['ldp'].Resource]
  170. resp_md2 = self.client.get(path + '/fcr:metadata')
  171. assert resp_md2.status_code == 200
  172. gr2 = Graph().parse(data=resp_md2.data, format='text/turtle')
  173. assert isomorphic(gr1, gr2)
  174. def test_put_mismatched_ldp_rs(self, rnd_img):
  175. """
  176. Verify MIME type / LDP mismatch.
  177. PUT a LDP-RS, then PUT a LDP-NR on the same location and verify it
  178. fails.
  179. """
  180. path = '/ldp/' + str(uuid4())
  181. rnd_img['content'].seek(0)
  182. ldp_nr_resp = self.client.put(path, data=rnd_img['content'],
  183. headers={
  184. 'Content-Disposition' : 'attachment; filename={}'.format(
  185. rnd_img['filename'])})
  186. assert ldp_nr_resp.status_code == 201
  187. with open('tests/data/marcel_duchamp_single_subject.ttl', 'rb') as f:
  188. ldp_rs_resp = self.client.put(path, data=f,
  189. content_type='text/turtle')
  190. assert ldp_rs_resp.status_code == 415
  191. def test_put_mismatched_ldp_nr(self, rnd_img):
  192. """
  193. Verify MIME type / LDP mismatch.
  194. PUT a LDP-NR, then PUT a LDP-RS on the same location and verify it
  195. fails.
  196. """
  197. path = '/ldp/' + str(uuid4())
  198. with open('tests/data/marcel_duchamp_single_subject.ttl', 'rb') as f:
  199. ldp_rs_resp = self.client.put(path, data=f,
  200. content_type='text/turtle')
  201. assert ldp_rs_resp.status_code == 201
  202. rnd_img['content'].seek(0)
  203. ldp_nr_resp = self.client.put(path, data=rnd_img['content'],
  204. headers={
  205. 'Content-Disposition' : 'attachment; filename={}'.format(
  206. rnd_img['filename'])})
  207. assert ldp_nr_resp.status_code == 415
  208. def test_missing_reference(self, client):
  209. """
  210. PUT a resource with RDF payload referencing a non-existing in-repo
  211. resource.
  212. """
  213. self.client.get('/ldp')
  214. data = '''
  215. PREFIX ns: <http://example.org#>
  216. PREFIX res: <http://example-source.org/res/>
  217. <> ns:p1 res:bogus ;
  218. ns:p2 <{0}> ;
  219. ns:p3 <{0}/> ;
  220. ns:p4 <{0}/nonexistent> .
  221. '''.format(g.webroot)
  222. put_rsp = self.client.put('/ldp/test_missing_ref', data=data, headers={
  223. 'content-type': 'text/turtle'})
  224. assert put_rsp.status_code == 201
  225. resp = self.client.get('/ldp/test_missing_ref',
  226. headers={'accept' : 'text/turtle'})
  227. assert resp.status_code == 200
  228. gr = Graph().parse(data=resp.data, format='text/turtle')
  229. assert URIRef('http://example-source.org/res/bogus') in \
  230. gr.objects(None, URIRef('http://example.org#p1'))
  231. assert URIRef(g.webroot + '/') in (
  232. gr.objects(None, URIRef('http://example.org#p2')))
  233. assert URIRef(g.webroot + '/') in (
  234. gr.objects(None, URIRef('http://example.org#p3')))
  235. assert URIRef(g.webroot + '/nonexistent') not in (
  236. gr.objects(None, URIRef('http://example.org#p4')))
  237. def test_post_resource(self, client):
  238. """
  239. Check response headers for a POST operation with empty payload.
  240. """
  241. res = self.client.post('/ldp/')
  242. assert res.status_code == 201
  243. assert 'Location' in res.headers
  244. def test_post_ldp_nr(self, rnd_img):
  245. """
  246. POST a resource with binary payload and verify checksums.
  247. """
  248. rnd_img['content'].seek(0)
  249. resp = self.client.post('/ldp/', data=rnd_img['content'],
  250. headers={
  251. 'slug': 'ldpnr04',
  252. 'Content-Type': 'image/png',
  253. 'Content-Disposition' : 'attachment; filename={}'.format(
  254. rnd_img['filename'])})
  255. assert resp.status_code == 201
  256. resp = self.client.get(
  257. '/ldp/ldpnr04', headers={'accept' : 'image/png'})
  258. assert resp.status_code == 200
  259. assert sha1(resp.data).hexdigest() == rnd_img['hash']
  260. def test_post_slug(self):
  261. """
  262. Verify that a POST with slug results in the expected URI only if the
  263. resource does not exist already.
  264. """
  265. slug01_resp = self.client.post('/ldp', headers={'slug' : 'slug01'})
  266. assert slug01_resp.status_code == 201
  267. assert slug01_resp.headers['location'] == \
  268. g.webroot + '/slug01'
  269. slug02_resp = self.client.post('/ldp', headers={'slug' : 'slug01'})
  270. assert slug02_resp.status_code == 201
  271. assert slug02_resp.headers['location'] != \
  272. g.webroot + '/slug01'
  273. def test_post_404(self):
  274. """
  275. Verify that a POST to a non-existing parent results in a 404.
  276. """
  277. assert self.client.post('/ldp/{}'.format(uuid4()))\
  278. .status_code == 404
  279. def test_post_409(self, rnd_img):
  280. """
  281. Verify that you cannot POST to a binary resource.
  282. """
  283. rnd_img['content'].seek(0)
  284. self.client.put('/ldp/post_409', data=rnd_img['content'], headers={
  285. 'Content-Disposition' : 'attachment; filename={}'.format(
  286. rnd_img['filename'])})
  287. assert self.client.post('/ldp/post_409').status_code == 409
  288. def test_patch_root(self):
  289. """
  290. Test patching root node.
  291. """
  292. path = '/ldp/'
  293. self.client.get(path)
  294. uri = g.webroot + '/'
  295. with open('tests/data/sparql_update/simple_insert.sparql') as data:
  296. resp = self.client.patch(path,
  297. data=data,
  298. headers={'content-type' : 'application/sparql-update'})
  299. assert resp.status_code == 204
  300. resp = self.client.get(path)
  301. gr = Graph().parse(data=resp.data, format='text/turtle')
  302. assert gr[ URIRef(uri) : nsc['dc'].title : Literal('Hello') ]
  303. def test_patch(self):
  304. """
  305. Test patching a resource.
  306. """
  307. path = '/ldp/test_patch01'
  308. self.client.put(path)
  309. uri = g.webroot + '/test_patch01'
  310. with open('tests/data/sparql_update/simple_insert.sparql') as data:
  311. resp = self.client.patch(path,
  312. data=data,
  313. headers={'content-type' : 'application/sparql-update'})
  314. assert resp.status_code == 204
  315. resp = self.client.get(path)
  316. gr = Graph().parse(data=resp.data, format='text/turtle')
  317. assert gr[ URIRef(uri) : nsc['dc'].title : Literal('Hello') ]
  318. self.client.patch(path,
  319. data=open('tests/data/sparql_update/delete+insert+where.sparql'),
  320. headers={'content-type' : 'application/sparql-update'})
  321. resp = self.client.get(path)
  322. gr = Graph().parse(data=resp.data, format='text/turtle')
  323. assert gr[ URIRef(uri) : nsc['dc'].title : Literal('Ciao') ]
  324. def test_patch_ssr(self):
  325. """
  326. Test patching a resource violating the single-subject rule.
  327. """
  328. path = '/ldp/test_patch_ssr'
  329. self.client.put(path)
  330. uri = g.webroot + '/test_patch_ssr'
  331. nossr_qry = 'INSERT { <http://bogus.org> a <urn:ns:A> . } WHERE {}'
  332. abs_qry = 'INSERT {{ <{}> a <urn:ns:A> . }} WHERE {{}}'.format(uri)
  333. frag_qry = 'INSERT {{ <{}#frag> a <urn:ns:A> . }} WHERE {{}}'\
  334. .format(uri)
  335. # @TODO Leave commented until a decision is made about SSR.
  336. assert self.client.patch(
  337. path, data=nossr_qry,
  338. headers={'content-type': 'application/sparql-update'}
  339. ).status_code == 204
  340. assert self.client.patch(
  341. path, data=abs_qry,
  342. headers={'content-type': 'application/sparql-update'}
  343. ).status_code == 204
  344. assert self.client.patch(
  345. path, data=frag_qry,
  346. headers={'content-type': 'application/sparql-update'}
  347. ).status_code == 204
  348. def test_patch_ldp_nr_metadata(self):
  349. """
  350. Test patching a LDP-NR metadata resource from the fcr:metadata URI.
  351. """
  352. path = '/ldp/ldpnr01'
  353. with open('tests/data/sparql_update/simple_insert.sparql') as data:
  354. self.client.patch(path + '/fcr:metadata',
  355. data=data,
  356. headers={'content-type' : 'application/sparql-update'})
  357. resp = self.client.get(path + '/fcr:metadata')
  358. assert resp.status_code == 200
  359. uri = g.webroot + '/ldpnr01'
  360. gr = Graph().parse(data=resp.data, format='text/turtle')
  361. assert gr[URIRef(uri) : nsc['dc'].title : Literal('Hello')]
  362. with open(
  363. 'tests/data/sparql_update/delete+insert+where.sparql') as data:
  364. patch_resp = self.client.patch(path + '/fcr:metadata',
  365. data=data,
  366. headers={'content-type' : 'application/sparql-update'})
  367. assert patch_resp.status_code == 204
  368. resp = self.client.get(path + '/fcr:metadata')
  369. assert resp.status_code == 200
  370. gr = Graph().parse(data=resp.data, format='text/turtle')
  371. assert gr[ URIRef(uri) : nsc['dc'].title : Literal('Ciao') ]
  372. def test_patch_ldpnr(self):
  373. """
  374. Verify that a direct PATCH to a LDP-NR results in a 415.
  375. """
  376. with open(
  377. 'tests/data/sparql_update/delete+insert+where.sparql') as data:
  378. patch_resp = self.client.patch('/ldp/ldpnr01',
  379. data=data,
  380. headers={'content-type': 'application/sparql-update'})
  381. assert patch_resp.status_code == 415
  382. def test_patch_invalid_mimetype(self, rnd_img):
  383. """
  384. Verify that a PATCH using anything other than an
  385. `application/sparql-update` MIME type results in an error.
  386. """
  387. self.client.put('/ldp/test_patch_invalid_mimetype')
  388. rnd_img['content'].seek(0)
  389. ldpnr_resp = self.client.patch('/ldp/ldpnr01/fcr:metadata',
  390. data=rnd_img,
  391. headers={'content-type' : 'image/jpeg'})
  392. ldprs_resp = self.client.patch('/ldp/test_patch_invalid_mimetype',
  393. data=b'Hello, I\'m not a SPARQL update.',
  394. headers={'content-type' : 'text/plain'})
  395. assert ldprs_resp.status_code == ldpnr_resp.status_code == 415
  396. def test_delete(self):
  397. """
  398. Test delete response codes.
  399. """
  400. self.client.put('/ldp/test_delete01')
  401. delete_resp = self.client.delete('/ldp/test_delete01')
  402. assert delete_resp.status_code == 204
  403. bogus_delete_resp = self.client.delete('/ldp/test_delete101')
  404. assert bogus_delete_resp.status_code == 404
  405. def test_tombstone(self):
  406. """
  407. Test tombstone behaviors.
  408. For POST on a tombstone, check `test_resurrection`.
  409. """
  410. tstone_resp = self.client.get('/ldp/test_delete01')
  411. assert tstone_resp.status_code == 410
  412. assert tstone_resp.headers['Link'] == \
  413. '<{}/test_delete01/fcr:tombstone>; rel="hasTombstone"'\
  414. .format(g.webroot)
  415. tstone_path = '/ldp/test_delete01/fcr:tombstone'
  416. assert self.client.get(tstone_path).status_code == 405
  417. assert self.client.put(tstone_path).status_code == 405
  418. assert self.client.delete(tstone_path).status_code == 204
  419. assert self.client.get('/ldp/test_delete01').status_code == 404
  420. def test_delete_recursive(self):
  421. """
  422. Test response codes for resources deleted recursively and their
  423. tombstones.
  424. """
  425. child_suffixes = ('a', 'a/b', 'a/b/c', 'a1', 'a1/b1')
  426. self.client.put('/ldp/test_delete_recursive01')
  427. for cs in child_suffixes:
  428. self.client.put('/ldp/test_delete_recursive01/{}'.format(cs))
  429. assert self.client.delete(
  430. '/ldp/test_delete_recursive01').status_code == 204
  431. tstone_resp = self.client.get('/ldp/test_delete_recursive01')
  432. assert tstone_resp.status_code == 410
  433. assert tstone_resp.headers['Link'] == \
  434. '<{}/test_delete_recursive01/fcr:tombstone>; rel="hasTombstone"'\
  435. .format(g.webroot)
  436. for cs in child_suffixes:
  437. child_tstone_resp = self.client.get(
  438. '/ldp/test_delete_recursive01/{}'.format(cs))
  439. assert child_tstone_resp.status_code == tstone_resp.status_code
  440. assert 'Link' not in child_tstone_resp.headers.keys()
  441. def test_put_fragments(self):
  442. """
  443. Test the correct handling of fragment URIs on PUT and GET.
  444. """
  445. with open('tests/data/fragments.ttl', 'rb') as f:
  446. self.client.put(
  447. '/ldp/test_fragment01',
  448. headers={
  449. 'Content-Type' : 'text/turtle',
  450. },
  451. data=f
  452. )
  453. rsp = self.client.get('/ldp/test_fragment01')
  454. gr = Graph().parse(data=rsp.data, format='text/turtle')
  455. assert gr[
  456. URIRef(g.webroot + '/test_fragment01#hash1')
  457. : URIRef('http://ex.org/p2') : URIRef('http://ex.org/o2')]
  458. def test_patch_fragments(self):
  459. """
  460. Test the correct handling of fragment URIs on PATCH.
  461. """
  462. self.client.put('/ldp/test_fragment_patch')
  463. with open('tests/data/fragments_insert.sparql', 'rb') as f:
  464. self.client.patch(
  465. '/ldp/test_fragment_patch',
  466. headers={
  467. 'Content-Type' : 'application/sparql-update',
  468. },
  469. data=f
  470. )
  471. ins_rsp = self.client.get('/ldp/test_fragment_patch')
  472. ins_gr = Graph().parse(data=ins_rsp.data, format='text/turtle')
  473. assert ins_gr[
  474. URIRef(g.webroot + '/test_fragment_patch#hash1234')
  475. : URIRef('http://ex.org/p3') : URIRef('http://ex.org/o3')]
  476. with open('tests/data/fragments_delete.sparql', 'rb') as f:
  477. self.client.patch(
  478. '/ldp/test_fragment_patch',
  479. headers={
  480. 'Content-Type' : 'application/sparql-update',
  481. },
  482. data=f
  483. )
  484. del_rsp = self.client.get('/ldp/test_fragment_patch')
  485. del_gr = Graph().parse(data=del_rsp.data, format='text/turtle')
  486. assert not del_gr[
  487. URIRef(g.webroot + '/test_fragment_patch#hash1234')
  488. : URIRef('http://ex.org/p3') : URIRef('http://ex.org/o3')]
  489. @pytest.mark.usefixtures('client_class')
  490. @pytest.mark.usefixtures('db')
  491. class TestMimeType:
  492. """
  493. Test ``Accept`` headers and input & output formats.
  494. """
  495. def test_accept(self):
  496. """
  497. Verify the default serialization method.
  498. """
  499. accept_list = {
  500. ('', 'text/turtle'),
  501. ('text/turtle', 'text/turtle'),
  502. ('application/rdf+xml', 'application/rdf+xml'),
  503. ('application/n-triples', 'application/n-triples'),
  504. ('application/bogus', 'text/turtle'),
  505. (
  506. 'application/rdf+xml;q=0.5,application/n-triples;q=0.7',
  507. 'application/n-triples'),
  508. (
  509. 'application/rdf+xml;q=0.5,application/bogus;q=0.7',
  510. 'application/rdf+xml'),
  511. ('application/rdf+xml;q=0.5,text/n3;q=0.7', 'text/n3'),
  512. (
  513. 'application/rdf+xml;q=0.5,application/ld+json;q=0.7',
  514. 'application/ld+json'),
  515. }
  516. for mimetype, fmt in accept_list:
  517. rsp = self.client.get('/ldp', headers={'Accept': mimetype})
  518. assert rsp.mimetype == fmt
  519. gr = Graph(identifier=g.webroot + '/').parse(
  520. data=rsp.data, format=fmt)
  521. assert nsc['fcrepo'].RepositoryRoot in set(gr.objects())
  522. def test_provided_rdf(self):
  523. """
  524. Test several input RDF serialiation formats.
  525. """
  526. self.client.get('/ldp')
  527. gr = Graph()
  528. gr.add((
  529. URIRef(g.webroot + '/test_mimetype'),
  530. nsc['dcterms'].title, Literal('Test MIME type.')))
  531. test_list = {
  532. 'application/n-triples',
  533. 'application/rdf+xml',
  534. 'text/n3',
  535. 'text/turtle',
  536. 'application/ld+json',
  537. }
  538. for mimetype in test_list:
  539. rdf_data = gr.serialize(format=mimetype)
  540. self.client.put('/ldp/test_mimetype', data=rdf_data, headers={
  541. 'content-type': mimetype})
  542. rsp = self.client.get('/ldp/test_mimetype')
  543. rsp_gr = Graph(identifier=g.webroot + '/test_mimetype').parse(
  544. data=rsp.data, format='text/turtle')
  545. assert (
  546. URIRef(g.webroot + '/test_mimetype'),
  547. nsc['dcterms'].title, Literal('Test MIME type.')) in rsp_gr
  548. @pytest.mark.usefixtures('client_class')
  549. class TestDigestHeaders:
  550. """
  551. Test Digest and ETag headers.
  552. """
  553. def test_etag_digest(self):
  554. """
  555. Verify ETag and Digest headers on creation.
  556. The headers must correspond to the SHA1 checksum of the binary content.
  557. """
  558. uid = '/test_etag1'
  559. path = '/ldp' + uid
  560. content = uuid4().bytes
  561. content_cksum = sha1(content)
  562. put_rsp = self.client.put(
  563. path, data=content, headers={'content-type': 'text/plain'})
  564. assert content_cksum.hexdigest() in \
  565. put_rsp.headers.get('etag').split(',')
  566. assert put_rsp.headers.get('digest') == \
  567. 'SHA1=' + b64encode(content_cksum.digest()).decode()
  568. get_rsp = self.client.get(path)
  569. assert content_cksum.hexdigest() in \
  570. put_rsp.headers.get('etag').split(',')
  571. assert get_rsp.headers.get('digest') == \
  572. 'SHA1=' + b64encode(content_cksum.digest()).decode()
  573. def test_etag_ident(self):
  574. """
  575. Verify that two resources with the same content yield identical ETags.
  576. """
  577. path1 = f'/ldp/{uuid4()}'
  578. path2 = f'/ldp/{uuid4()}'
  579. content = uuid4().bytes
  580. content_cksum = sha1(content)
  581. self.client.put(
  582. path1, data=content, headers={'content-type': 'text/plain'})
  583. self.client.put(
  584. path2, data=content, headers={'content-type': 'text/plain'})
  585. get_rsp1 = self.client.get(path1)
  586. get_rsp2 = self.client.get(path2)
  587. assert get_rsp1.headers.get('etag') == get_rsp2.headers.get('etag')
  588. assert get_rsp1.headers.get('digest') == get_rsp2.headers.get('digest')
  589. def test_etag_diff(self):
  590. """
  591. Verify that two resources with different content yield different ETags.
  592. """
  593. path1 = f'/ldp/{uuid4()}'
  594. path2 = f'/ldp/{uuid4()}'
  595. content1 = b'some interesting content.'
  596. content_cksum1 = sha1(content1)
  597. content2 = b'Some great content.'
  598. content_cksum2 = sha1(content2)
  599. self.client.put(
  600. path1, data=content1, headers={'content-type': 'text/plain'})
  601. self.client.put(
  602. path2, data=content2, headers={'content-type': 'text/plain'})
  603. get_rsp1 = self.client.get(path1)
  604. get_rsp2 = self.client.get(path2)
  605. assert get_rsp1.headers.get('etag') != get_rsp2.headers.get('etag')
  606. assert get_rsp1.headers.get('digest') != get_rsp2.headers.get('digest')
  607. def test_etag_update(self):
  608. """
  609. Verify that ETag and digest change when the resource is updated.
  610. The headers should NOT change if the same binary content is
  611. re-submitted.
  612. """
  613. path = f'/ldp/{uuid4()}'
  614. content1 = uuid4().bytes
  615. content_cksum1 = sha1(content1)
  616. content2 = uuid4().bytes
  617. content_cksum2 = sha1(content2)
  618. self.client.put(
  619. path, data=content1, headers={'content-type': 'text/plain'})
  620. get_rsp = self.client.get(path)
  621. assert content_cksum1.hexdigest() == \
  622. get_rsp.headers.get('etag').strip('"')
  623. assert get_rsp.headers.get('digest') == \
  624. 'SHA1=' + b64encode(content_cksum1.digest()).decode()
  625. put_rsp = self.client.put(
  626. path, data=content2, headers={'content-type': 'text/plain'})
  627. assert content_cksum2.hexdigest() == \
  628. put_rsp.headers.get('etag').strip('"')
  629. assert put_rsp.headers.get('digest') == \
  630. 'SHA1=' + b64encode(content_cksum2.digest()).decode()
  631. get_rsp = self.client.get(path)
  632. assert content_cksum2.hexdigest() == \
  633. get_rsp.headers.get('etag').strip('"')
  634. assert get_rsp.headers.get('digest') == \
  635. 'SHA1=' + b64encode(content_cksum2.digest()).decode()
  636. def test_etag_rdf(self):
  637. """
  638. Verify that LDP-RS resources don't get an ETag.
  639. TODO This is by design for now; when a reliable hashing method
  640. for a graph is devised, this test should change.
  641. """
  642. path = '/ldp/test_etag_rdf1'
  643. put_rsp = self.client.put(path)
  644. assert not put_rsp.headers.get('etag')
  645. assert not put_rsp.headers.get('digest')
  646. get_rsp = self.client.get(path)
  647. assert not get_rsp.headers.get('etag')
  648. assert not get_rsp.headers.get('digest')
  649. @pytest.mark.usefixtures('client_class')
  650. class TestETagCondHeaders:
  651. """
  652. Test Digest and ETag headers.
  653. """
  654. def test_if_match_get(self):
  655. """
  656. Test the If-Match header on GET requests.
  657. Test providing single and multiple ETags.
  658. """
  659. path = '/ldp/test_if_match1'
  660. content = uuid4().bytes
  661. content_cksum = sha1(content).hexdigest()
  662. bogus_cksum = uuid4().hex
  663. self.client.put(
  664. path, data=content, headers={'content-type': 'text/plain'})
  665. get_rsp = self.client.get(path, headers={
  666. 'if-match': f'"{content_cksum}"'})
  667. assert get_rsp.status_code == 200
  668. get_rsp = self.client.get(path, headers={
  669. 'if-match': f'"{bogus_cksum}"'})
  670. assert get_rsp.status_code == 412
  671. get_rsp = self.client.get(path, headers={
  672. 'if-match': f'"{content_cksum}", "{bogus_cksum}"'})
  673. assert get_rsp.status_code == 200
  674. def test_if_match_put(self):
  675. """
  676. Test the If-Match header on PUT requests.
  677. Test providing single and multiple ETags.
  678. """
  679. path = '/ldp/test_if_match1'
  680. content = uuid4().bytes
  681. content_cksum = sha1(content).hexdigest()
  682. bogus_cksum = uuid4().hex
  683. get_rsp = self.client.get(path)
  684. old_cksum = get_rsp.headers.get('etag')
  685. put_rsp = self.client.put(path, data=content, headers={
  686. 'if-match': f'"{content_cksum}"'})
  687. assert put_rsp.status_code == 412
  688. put_rsp = self.client.put(path, data=content, headers={
  689. 'if-match': f'"{content_cksum}", "{bogus_cksum}"'})
  690. assert put_rsp.status_code == 412
  691. put_rsp = self.client.put(path, data=content, headers={
  692. 'if-match': f'"{old_cksum}", "{bogus_cksum}"'})
  693. assert put_rsp.status_code == 204
  694. # Now contents have changed.
  695. put_rsp = self.client.put(path, data=content, headers={
  696. 'if-match': f'"{old_cksum}"'})
  697. assert put_rsp.status_code == 412
  698. put_rsp = self.client.put(path, data=content, headers={
  699. 'if-match': f'"{content_cksum}"'})
  700. assert put_rsp.status_code == 204
  701. # Exactly the same content was uploaded, so the ETag should not have
  702. # changed.
  703. put_rsp = self.client.put(path, data=content, headers={
  704. 'if-match': f'"{content_cksum}"'})
  705. assert put_rsp.status_code == 204
  706. # Catch-all: Proceed if resource exists at the given location.
  707. put_rsp = self.client.put(path, data=content, headers={
  708. 'if-match': '*'})
  709. assert put_rsp.status_code == 204
  710. # This is wrong syntax. It will not update because the literal asterisk
  711. # won't match.
  712. put_rsp = self.client.put(path, data=content, headers={
  713. 'if-match': '"*"'})
  714. assert put_rsp.status_code == 412
  715. # Test delete.
  716. del_rsp = self.client.delete(path, headers={
  717. 'if-match': f'"{old_cksum}"', 'Prefer': 'no-tombstone'})
  718. assert del_rsp.status_code == 412
  719. del_rsp = self.client.delete(path, headers={
  720. 'if-match': f'"{content_cksum}"', 'Prefer': 'no-tombstone'})
  721. assert del_rsp.status_code == 204
  722. put_rsp = self.client.put(path, data=content, headers={
  723. 'if-match': '*'})
  724. assert put_rsp.status_code == 412
  725. def test_if_none_match_get(self):
  726. """
  727. Test the If-None-Match header on GET requests.
  728. Test providing single and multiple ETags.
  729. """
  730. path = '/ldp/test_if_none_match1'
  731. content = uuid4().bytes
  732. content_cksum = sha1(content).hexdigest()
  733. bogus_cksum = uuid4().hex
  734. self.client.put(
  735. path, data=content, headers={'content-type': 'text/plain'})
  736. get_rsp1 = self.client.get(path, headers={
  737. 'if-none-match': f'"{content_cksum}"'})
  738. assert get_rsp1.status_code == 304
  739. get_rsp2 = self.client.get(path, headers={
  740. 'if-none-match': f'"{bogus_cksum}"'})
  741. assert get_rsp2.status_code == 200
  742. get_rsp3 = self.client.get(path, headers={
  743. 'if-none-match': f'"{content_cksum}", "{bogus_cksum}"'})
  744. assert get_rsp3.status_code == 304
  745. # 404 has precedence on ETag handling.
  746. get_rsp = self.client.get('/ldp/bogus', headers={
  747. 'if-none-match': f'"{bogus_cksum}"'})
  748. assert get_rsp.status_code == 404
  749. get_rsp = self.client.get('/ldp/bogus', headers={
  750. 'if-none-match': f'"{content_cksum}"'})
  751. assert get_rsp.status_code == 404
  752. def test_if_none_match_put(self):
  753. """
  754. Test the If-None-Match header on PUT requests.
  755. Test providing single and multiple ETags.
  756. Uses a previously created resource.
  757. """
  758. path = '/ldp/test_if_none_match1'
  759. content = uuid4().bytes
  760. content_cksum = sha1(content).hexdigest()
  761. bogus_cksum = uuid4().hex
  762. get_rsp = self.client.get(path)
  763. old_cksum = get_rsp.headers.get('etag')
  764. put_rsp = self.client.put(path, data=content, headers={
  765. 'if-none-match': f'"{old_cksum}"'})
  766. assert put_rsp.status_code == 412
  767. put_rsp = self.client.put(path, data=content, headers={
  768. 'if-none-match': f'"{old_cksum}", "{bogus_cksum}"'})
  769. assert put_rsp.status_code == 412
  770. put_rsp = self.client.put(path, data=content, headers={
  771. 'if-none-match': f'"{bogus_cksum}"'})
  772. assert put_rsp.status_code == 204
  773. # Now contents have changed.
  774. put_rsp = self.client.put(path, data=content, headers={
  775. 'if-none-match': f'"{content_cksum}"'})
  776. assert put_rsp.status_code == 412
  777. put_rsp = self.client.put(path, data=content, headers={
  778. 'if-none-match': f'"{old_cksum}"'})
  779. assert put_rsp.status_code == 204
  780. # Catch-all: fail if any resource exists at the given location.
  781. put_rsp = self.client.put(path, data=content, headers={
  782. 'if-none-match': '*'})
  783. assert put_rsp.status_code == 412
  784. # Test delete.
  785. del_rsp = self.client.delete(path, headers={
  786. 'if-none-match': f'"{content_cksum}"', 'Prefer': 'no-tombstone'})
  787. assert del_rsp.status_code == 412
  788. del_rsp = self.client.delete(path, headers={
  789. 'if-none-match': f'"{bogus_cksum}"', 'Prefer': 'no-tombstone'})
  790. assert del_rsp.status_code == 204
  791. put_rsp = self.client.put(path, data=content, headers={
  792. 'if-none-match': '*'})
  793. assert put_rsp.status_code == 201
  794. # This is wrong syntax. It will update because the literal asterisk
  795. # won't match.
  796. put_rsp = self.client.put(path, data=content, headers={
  797. 'if-none-match': '"*"'})
  798. assert put_rsp.status_code == 204
  799. def test_etag_notfound(self):
  800. """
  801. Verify that 404 and 410 have precedence on ETag handling.
  802. """
  803. path = f'/ldp/{uuid4()}'
  804. bogus_cksum = uuid4().hex
  805. get_rsp = self.client.get(path, headers={
  806. 'if-match': f'"{bogus_cksum}"'})
  807. assert get_rsp.status_code == 404
  808. get_rsp = self.client.get(path, headers={
  809. 'if-match': '*'})
  810. assert get_rsp.status_code == 404
  811. get_rsp = self.client.get(path, headers={
  812. 'if-none-match': f'"{bogus_cksum}"'})
  813. assert get_rsp.status_code == 404
  814. self.client.put(path)
  815. self.client.delete(path)
  816. get_rsp = self.client.get(path, headers={
  817. 'if-match': f'"{bogus_cksum}"'})
  818. assert get_rsp.status_code == 410
  819. get_rsp = self.client.get(path, headers={
  820. 'if-none-match': f'"{bogus_cksum}"'})
  821. assert get_rsp.status_code == 410
  822. get_rsp = self.client.get(path, headers={
  823. 'if-match': '*'})
  824. assert get_rsp.status_code == 410
  825. @pytest.mark.usefixtures('client_class')
  826. class TestModifyTimeCondHeaders:
  827. """
  828. Test time-related conditional headers.
  829. """
  830. @pytest.fixture(scope='class')
  831. def timeframe(self):
  832. """
  833. Times used in these tests: UTC midnight of today, yesterday, tomorrow.
  834. """
  835. today = arrow.utcnow().floor('day')
  836. yesterday = today.shift(days=-1)
  837. tomorrow = today.shift(days=1)
  838. path = f'/ldp/{uuid4()}'
  839. self.client.put(path)
  840. return path, today, yesterday, tomorrow
  841. def test_nothing(self):
  842. """
  843. For some reason, without this the fixture won't initialize properly.
  844. """
  845. self.client.get('/')
  846. def test_if_modified_since(self, timeframe):
  847. """
  848. Test various uses of the If-Modified-Since header.
  849. """
  850. path, today, yesterday, tomorrow = timeframe
  851. assert self.client.head(
  852. path, headers={'if-modified-since': http_date(today.timestamp)}
  853. ).status_code == 200
  854. assert self.client.get(
  855. path, headers={'if-modified-since': http_date(today.timestamp)}
  856. ).status_code == 200
  857. assert self.client.head(
  858. path, headers={'if-modified-since': http_date(yesterday.timestamp)}
  859. ).status_code == 200
  860. assert self.client.get(
  861. path, headers={'if-modified-since': http_date(yesterday.timestamp)}
  862. ).status_code == 200
  863. assert self.client.head(
  864. path, headers={'if-modified-since': http_date(tomorrow.timestamp)}
  865. ).status_code == 304
  866. assert self.client.get(
  867. path, headers={'if-modified-since': http_date(tomorrow.timestamp)}
  868. ).status_code == 304
  869. def test_if_unmodified_since(self, timeframe):
  870. """
  871. Test various uses of the If-Unmodified-Since header.
  872. """
  873. path, today, yesterday, tomorrow = timeframe
  874. assert self.client.head(
  875. path, headers={'if-unmodified-since': http_date(today.timestamp)}
  876. ).status_code == 304
  877. assert self.client.get(
  878. path, headers={'if-unmodified-since': http_date(today.timestamp)}
  879. ).status_code == 304
  880. assert self.client.head(
  881. path, headers={'if-unmodified-since': http_date(yesterday.timestamp)}
  882. ).status_code == 304
  883. assert self.client.get(
  884. path, headers={'if-unmodified-since': http_date(yesterday.timestamp)}
  885. ).status_code == 304
  886. assert self.client.head(
  887. path, headers={'if-unmodified-since': http_date(tomorrow.timestamp)}
  888. ).status_code == 200
  889. assert self.client.get(
  890. path, headers={'if-unmodified-since': http_date(tomorrow.timestamp)}
  891. ).status_code == 200
  892. def test_time_range(self, timeframe):
  893. """
  894. Test conditions inside and outside of a time range.
  895. """
  896. path, today, yesterday, tomorrow = timeframe
  897. # Send me the resource if it has been modified between yesterday
  898. # and tomorrow.
  899. assert self.client.get(path, headers={
  900. 'if-modified-since': http_date(yesterday.timestamp),
  901. 'if-unmodified-since': http_date(tomorrow.timestamp),
  902. }).status_code == 200
  903. # Send me the resource if it has been modified between today
  904. # and tomorrow.
  905. assert self.client.get(path, headers={
  906. 'if-modified-since': http_date(today.timestamp),
  907. 'if-unmodified-since': http_date(tomorrow.timestamp),
  908. }).status_code == 200
  909. # Send me the resource if it has been modified between yesterday
  910. # and today.
  911. assert self.client.get(path, headers={
  912. 'if-modified-since': http_date(yesterday.timestamp),
  913. 'if-unmodified-since': http_date(today.timestamp),
  914. }).status_code == 304
  915. # Send me the resource if it has been modified between two days ago
  916. # and yesterday.
  917. assert self.client.get(path, headers={
  918. 'if-modified-since': http_date(yesterday.shift(days=-1).timestamp),
  919. 'if-unmodified-since': http_date(yesterday.timestamp),
  920. }).status_code == 304
  921. # Send me the resource if it has been modified between tomorrow
  922. # and two days from today.
  923. assert self.client.get(path, headers={
  924. 'if-modified-since': http_date(tomorrow.timestamp),
  925. 'if-unmodified-since': http_date(tomorrow.shift(days=1).timestamp),
  926. }).status_code == 304
  927. def test_time_etag_combo(self, timeframe):
  928. """
  929. Test evaluation priorities among ETag and time headers.
  930. """
  931. _, today, yesterday, tomorrow = timeframe
  932. path = f'/ldp/{uuid4()}'
  933. content = uuid4().bytes
  934. content_cksum = sha1(content).hexdigest()
  935. bogus_cksum = uuid4().hex
  936. self.client.put(
  937. path, data=content, headers={'content-type': 'text/plain'})
  938. # Negative ETag match wins.
  939. assert self.client.get(path, headers={
  940. 'if-match': f'"{bogus_cksum}"',
  941. 'if-modified-since': http_date(yesterday.timestamp),
  942. }).status_code == 412
  943. assert self.client.get(path, headers={
  944. 'if-match': f'"{bogus_cksum}"',
  945. 'if-unmodified-since': http_date(tomorrow.timestamp),
  946. }).status_code == 412
  947. assert self.client.get(path, headers={
  948. 'if-none-match': f'"{content_cksum}"',
  949. 'if-modified-since': http_date(yesterday.timestamp),
  950. }).status_code == 304
  951. assert self.client.get(path, headers={
  952. 'if-none-match': f'"{content_cksum}"',
  953. 'if-unmodified-since': http_date(tomorrow.timestamp),
  954. }).status_code == 304
  955. # Positive ETag match wins.
  956. assert self.client.get(path, headers={
  957. 'if-match': f'"{content_cksum}"',
  958. 'if-unmodified-since': http_date(yesterday.timestamp),
  959. }).status_code == 200
  960. assert self.client.get(path, headers={
  961. 'if-match': f'"{content_cksum}"',
  962. 'if-modified-since': http_date(tomorrow.timestamp),
  963. }).status_code == 200
  964. assert self.client.get(path, headers={
  965. 'if-none-match': f'"{bogus_cksum}"',
  966. 'if-unmodified-since': http_date(yesterday.timestamp),
  967. }).status_code == 200
  968. assert self.client.get(path, headers={
  969. 'if-none-match': f'"{bogus_cksum}"',
  970. 'if-modified-since': http_date(tomorrow.timestamp),
  971. }).status_code == 200
  972. @pytest.mark.usefixtures('client_class')
  973. class TestPrefHeader:
  974. """
  975. Test various combinations of `Prefer` header.
  976. """
  977. @pytest.fixture(scope='class')
  978. def cont_structure(self):
  979. """
  980. Create a container structure to be used for subsequent requests.
  981. """
  982. parent_path = '/ldp/test_parent'
  983. self.client.put(parent_path)
  984. self.client.put(parent_path + '/child1')
  985. self.client.put(parent_path + '/child2')
  986. self.client.put(parent_path + '/child3')
  987. return {
  988. 'path' : parent_path,
  989. 'response' : self.client.get(parent_path),
  990. }
  991. def test_put_prefer_handling(self, random_uuid):
  992. """
  993. Trying to PUT an existing resource should:
  994. - Return a 204 if the payload is empty
  995. - Return a 204 if the payload is RDF, server-managed triples are
  996. included and the 'Prefer' header is set to 'handling=lenient'
  997. - Return a 412 (ServerManagedTermError) if the payload is RDF,
  998. server-managed triples are included and handling is set to 'strict',
  999. or not set.
  1000. """
  1001. path = '/ldp/put_pref_header01'
  1002. assert self.client.put(path).status_code == 201
  1003. assert self.client.get(path).status_code == 200
  1004. assert self.client.put(path).status_code == 204
  1005. # Default handling is strict.
  1006. with open('tests/data/rdf_payload_w_srv_mgd_trp.ttl', 'rb') as f:
  1007. rsp_default = self.client.put(
  1008. path,
  1009. headers={
  1010. 'Content-Type' : 'text/turtle',
  1011. },
  1012. data=f
  1013. )
  1014. assert rsp_default.status_code == 412
  1015. with open('tests/data/rdf_payload_w_srv_mgd_trp.ttl', 'rb') as f:
  1016. rsp_len = self.client.put(
  1017. path,
  1018. headers={
  1019. 'Prefer' : 'handling=lenient',
  1020. 'Content-Type' : 'text/turtle',
  1021. },
  1022. data=f
  1023. )
  1024. assert rsp_len.status_code == 204
  1025. with open('tests/data/rdf_payload_w_srv_mgd_trp.ttl', 'rb') as f:
  1026. rsp_strict = self.client.put(
  1027. path,
  1028. headers={
  1029. 'Prefer' : 'handling=strict',
  1030. 'Content-Type' : 'text/turtle',
  1031. },
  1032. data=f
  1033. )
  1034. assert rsp_strict.status_code == 412
  1035. # @HOLD Embed children is debated.
  1036. def _disabled_test_embed_children(self, cont_structure):
  1037. """
  1038. verify the "embed children" prefer header.
  1039. """
  1040. self.client.get('/ldp')
  1041. parent_path = cont_structure['path']
  1042. cont_resp = cont_structure['response']
  1043. cont_subject = URIRef(g.webroot + '/test_parent')
  1044. #minimal_resp = self.client.get(parent_path, headers={
  1045. # 'Prefer' : 'return=minimal',
  1046. #})
  1047. incl_embed_children_resp = self.client.get(parent_path, headers={
  1048. 'Prefer' : 'return=representation; include={}'\
  1049. .format(Ldpr.EMBED_CHILD_RES_URI),
  1050. })
  1051. omit_embed_children_resp = self.client.get(parent_path, headers={
  1052. 'Prefer' : 'return=representation; omit={}'\
  1053. .format(Ldpr.EMBED_CHILD_RES_URI),
  1054. })
  1055. default_gr = Graph().parse(data=cont_resp.data, format='turtle')
  1056. incl_gr = Graph().parse(
  1057. data=incl_embed_children_resp.data, format='turtle')
  1058. omit_gr = Graph().parse(
  1059. data=omit_embed_children_resp.data, format='turtle')
  1060. assert isomorphic(omit_gr, default_gr)
  1061. children = set(incl_gr[cont_subject : nsc['ldp'].contains])
  1062. assert len(children) == 3
  1063. children = set(incl_gr[cont_subject : nsc['ldp'].contains])
  1064. for child_uri in children:
  1065. assert set(incl_gr[ child_uri : : ])
  1066. assert not set(omit_gr[ child_uri : : ])
  1067. def test_return_children(self, cont_structure):
  1068. """
  1069. verify the "return children" prefer header.
  1070. """
  1071. self.client.get('/ldp')
  1072. parent_path = cont_structure['path']
  1073. cont_resp = cont_structure['response']
  1074. cont_subject = URIRef(g.webroot + '/test_parent')
  1075. incl_children_resp = self.client.get(parent_path, headers={
  1076. 'Prefer' : 'return=representation; include={}'\
  1077. .format(Ldpr.RETURN_CHILD_RES_URI),
  1078. })
  1079. omit_children_resp = self.client.get(parent_path, headers={
  1080. 'Prefer' : 'return=representation; omit={}'\
  1081. .format(Ldpr.RETURN_CHILD_RES_URI),
  1082. })
  1083. default_gr = Graph().parse(data=cont_resp.data, format='turtle')
  1084. incl_gr = Graph().parse(data=incl_children_resp.data, format='turtle')
  1085. omit_gr = Graph().parse(data=omit_children_resp.data, format='turtle')
  1086. assert isomorphic(incl_gr, default_gr)
  1087. children = incl_gr[cont_subject : nsc['ldp'].contains]
  1088. for child_uri in children:
  1089. assert not omit_gr[cont_subject : nsc['ldp'].contains : child_uri]
  1090. def test_inbound_rel(self, cont_structure):
  1091. """
  1092. verify the "inbound relationships" prefer header.
  1093. """
  1094. self.client.put('/ldp/test_target')
  1095. data = '<> <http://ex.org/ns#shoots> <{}> .'.format(
  1096. g.webroot + '/test_target')
  1097. self.client.put('/ldp/test_shooter', data=data,
  1098. headers={'Content-Type': 'text/turtle'})
  1099. cont_resp = self.client.get('/ldp/test_target')
  1100. incl_inbound_resp = self.client.get('/ldp/test_target', headers={
  1101. 'Prefer' : 'return=representation; include="{}"'\
  1102. .format(Ldpr.RETURN_INBOUND_REF_URI),
  1103. })
  1104. omit_inbound_resp = self.client.get('/ldp/test_target', headers={
  1105. 'Prefer' : 'return=representation; omit="{}"'\
  1106. .format(Ldpr.RETURN_INBOUND_REF_URI),
  1107. })
  1108. default_gr = Graph().parse(data=cont_resp.data, format='turtle')
  1109. incl_gr = Graph().parse(data=incl_inbound_resp.data, format='turtle')
  1110. omit_gr = Graph().parse(data=omit_inbound_resp.data, format='turtle')
  1111. subject = URIRef(g.webroot + '/test_target')
  1112. inbd_subject = URIRef(g.webroot + '/test_shooter')
  1113. assert isomorphic(omit_gr, default_gr)
  1114. assert len(set(incl_gr[inbd_subject : : ])) == 1
  1115. assert incl_gr[
  1116. inbd_subject : URIRef('http://ex.org/ns#shoots') : subject]
  1117. assert not len(set(omit_gr[inbd_subject : :]))
  1118. def test_srv_mgd_triples(self, cont_structure):
  1119. """
  1120. verify the "server managed triples" prefer header.
  1121. """
  1122. self.client.get('/ldp')
  1123. parent_path = cont_structure['path']
  1124. cont_resp = cont_structure['response']
  1125. cont_subject = URIRef(g.webroot + '/test_parent')
  1126. incl_srv_mgd_resp = self.client.get(parent_path, headers={
  1127. 'Prefer' : 'return=representation; include={}'\
  1128. .format(Ldpr.RETURN_SRV_MGD_RES_URI),
  1129. })
  1130. omit_srv_mgd_resp = self.client.get(parent_path, headers={
  1131. 'Prefer' : 'return=representation; omit={}'\
  1132. .format(Ldpr.RETURN_SRV_MGD_RES_URI),
  1133. })
  1134. default_gr = Graph().parse(data=cont_resp.data, format='turtle')
  1135. incl_gr = Graph().parse(data=incl_srv_mgd_resp.data, format='turtle')
  1136. omit_gr = Graph().parse(data=omit_srv_mgd_resp.data, format='turtle')
  1137. assert isomorphic(incl_gr, default_gr)
  1138. for pred in {
  1139. nsc['fcrepo'].created,
  1140. nsc['fcrepo'].createdBy,
  1141. nsc['fcrepo'].lastModified,
  1142. nsc['fcrepo'].lastModifiedBy,
  1143. nsc['ldp'].contains,
  1144. }:
  1145. assert set(incl_gr[ cont_subject : pred : ])
  1146. assert not set(omit_gr[ cont_subject : pred : ])
  1147. for type in {
  1148. nsc['fcrepo'].Resource,
  1149. nsc['ldp'].Container,
  1150. nsc['ldp'].Resource,
  1151. }:
  1152. assert incl_gr[ cont_subject : RDF.type : type ]
  1153. assert not omit_gr[ cont_subject : RDF.type : type ]
  1154. def test_delete_no_tstone(self):
  1155. """
  1156. Test the `no-tombstone` Prefer option.
  1157. """
  1158. self.client.put('/ldp/test_delete_no_tstone01')
  1159. self.client.put('/ldp/test_delete_no_tstone01/a')
  1160. self.client.delete('/ldp/test_delete_no_tstone01', headers={
  1161. 'prefer' : 'no-tombstone'})
  1162. resp = self.client.get('/ldp/test_delete_no_tstone01')
  1163. assert resp.status_code == 404
  1164. child_resp = self.client.get('/ldp/test_delete_no_tstone01/a')
  1165. assert child_resp.status_code == 404
  1166. #@pytest.mark.usefixtures('client_class')
  1167. #@pytest.mark.usefixtures('db')
  1168. #class TestDigest:
  1169. # """
  1170. # Test digest and ETag handling.
  1171. # """
  1172. # @pytest.mark.skip(reason='TODO Need to implement async digest queue')
  1173. # def test_digest_post(self):
  1174. # """
  1175. # Test ``Digest`` and ``ETag`` headers on resource POST.
  1176. # """
  1177. # resp = self.client.post('/ldp/')
  1178. # assert 'Digest' in resp.headers
  1179. # assert 'ETag' in resp.headers
  1180. # assert (
  1181. # b64encode(bytes.fromhex(
  1182. # resp.headers['ETag'].replace('W/', '')
  1183. # )).decode('ascii') ==
  1184. # resp.headers['Digest'].replace('SHA256=', ''))
  1185. #
  1186. #
  1187. # @pytest.mark.skip(reason='TODO Need to implement async digest queue')
  1188. # def test_digest_put(self):
  1189. # """
  1190. # Test ``Digest`` and ``ETag`` headers on resource PUT.
  1191. # """
  1192. # resp_put = self.client.put('/ldp/test_digest_put')
  1193. # assert 'Digest' in resp_put.headers
  1194. # assert 'ETag' in resp_put.headers
  1195. # assert (
  1196. # b64encode(bytes.fromhex(
  1197. # resp_put.headers['ETag'].replace('W/', '')
  1198. # )).decode('ascii') ==
  1199. # resp_put.headers['Digest'].replace('SHA256=', ''))
  1200. #
  1201. # resp_get = self.client.get('/ldp/test_digest_put')
  1202. # assert 'Digest' in resp_get.headers
  1203. # assert 'ETag' in resp_get.headers
  1204. # assert (
  1205. # b64encode(bytes.fromhex(
  1206. # resp_get.headers['ETag'].replace('W/', '')
  1207. # )).decode('ascii') ==
  1208. # resp_get.headers['Digest'].replace('SHA256=', ''))
  1209. #
  1210. #
  1211. # @pytest.mark.skip(reason='TODO Need to implement async digest queue')
  1212. # def test_digest_patch(self):
  1213. # """
  1214. # Verify that the digest and ETag change on resource change.
  1215. # """
  1216. # path = '/ldp/test_digest_patch'
  1217. # self.client.put(path)
  1218. # rsp1 = self.client.get(path)
  1219. #
  1220. # self.client.patch(
  1221. # path, data=b'DELETE {} INSERT {<> a <http://ex.org/Test> .} '
  1222. # b'WHERE {}',
  1223. # headers={'Content-Type': 'application/sparql-update'})
  1224. # rsp2 = self.client.get(path)
  1225. #
  1226. # assert rsp1.headers['ETag'] != rsp2.headers['ETag']
  1227. # assert rsp1.headers['Digest'] != rsp2.headers['Digest']
  1228. @pytest.mark.usefixtures('client_class')
  1229. @pytest.mark.usefixtures('db')
  1230. class TestVersion:
  1231. """
  1232. Test version creation, retrieval and deletion.
  1233. """
  1234. def test_create_versions(self):
  1235. """
  1236. Test that POSTing multiple times to fcr:versions creates the
  1237. 'hasVersions' triple and yields multiple version snapshots.
  1238. """
  1239. self.client.put('/ldp/test_version')
  1240. create_rsp = self.client.post('/ldp/test_version/fcr:versions')
  1241. assert create_rsp.status_code == 201
  1242. rsrc_rsp = self.client.get('/ldp/test_version')
  1243. rsrc_gr = Graph().parse(data=rsrc_rsp.data, format='turtle')
  1244. assert len(set(rsrc_gr[: nsc['fcrepo'].hasVersions :])) == 1
  1245. info_rsp = self.client.get('/ldp/test_version/fcr:versions')
  1246. assert info_rsp.status_code == 200
  1247. info_gr = Graph().parse(data=info_rsp.data, format='turtle')
  1248. assert len(set(info_gr[: nsc['fcrepo'].hasVersion :])) == 1
  1249. self.client.post('/ldp/test_version/fcr:versions')
  1250. info2_rsp = self.client.get('/ldp/test_version/fcr:versions')
  1251. info2_gr = Graph().parse(data=info2_rsp.data, format='turtle')
  1252. assert len(set(info2_gr[: nsc['fcrepo'].hasVersion :])) == 2
  1253. def test_version_with_slug(self):
  1254. """
  1255. Test a version with a slug.
  1256. """
  1257. self.client.put('/ldp/test_version_slug')
  1258. create_rsp = self.client.post('/ldp/test_version_slug/fcr:versions',
  1259. headers={'slug' : 'v1'})
  1260. new_ver_uri = create_rsp.headers['Location']
  1261. assert new_ver_uri == g.webroot + '/test_version_slug/fcr:versions/v1'
  1262. info_rsp = self.client.get('/ldp/test_version_slug/fcr:versions')
  1263. info_gr = Graph().parse(data=info_rsp.data, format='turtle')
  1264. assert info_gr[
  1265. URIRef(new_ver_uri) :
  1266. nsc['fcrepo'].hasVersionLabel :
  1267. Literal('v1')]
  1268. def test_dupl_version(self):
  1269. """
  1270. Make sure that two POSTs with the same slug result in two different
  1271. versions.
  1272. """
  1273. path = '/ldp/test_duplicate_slug'
  1274. self.client.put(path)
  1275. v1_rsp = self.client.post(path + '/fcr:versions',
  1276. headers={'slug' : 'v1'})
  1277. v1_uri = v1_rsp.headers['Location']
  1278. dup_rsp = self.client.post(path + '/fcr:versions',
  1279. headers={'slug' : 'v1'})
  1280. dup_uri = dup_rsp.headers['Location']
  1281. assert v1_uri != dup_uri
  1282. def test_revert_version(self):
  1283. """
  1284. Take a version snapshot, update a resource, and then revert to the
  1285. previous vresion.
  1286. """
  1287. rsrc_path = '/ldp/test_revert_version'
  1288. payload1 = '<> <urn:demo:p1> <urn:demo:o1> .'
  1289. payload2 = '<> <urn:demo:p1> <urn:demo:o2> .'
  1290. self.client.put(rsrc_path, headers={
  1291. 'content-type': 'text/turtle'}, data=payload1)
  1292. self.client.post(
  1293. rsrc_path + '/fcr:versions', headers={'slug': 'v1'})
  1294. v1_rsp = self.client.get(rsrc_path)
  1295. v1_gr = Graph().parse(data=v1_rsp.data, format='turtle')
  1296. assert v1_gr[
  1297. URIRef(g.webroot + '/test_revert_version')
  1298. : URIRef('urn:demo:p1')
  1299. : URIRef('urn:demo:o1')
  1300. ]
  1301. self.client.put(rsrc_path, headers={
  1302. 'content-type': 'text/turtle'}, data=payload2)
  1303. v2_rsp = self.client.get(rsrc_path)
  1304. v2_gr = Graph().parse(data=v2_rsp.data, format='turtle')
  1305. assert v2_gr[
  1306. URIRef(g.webroot + '/test_revert_version')
  1307. : URIRef('urn:demo:p1')
  1308. : URIRef('urn:demo:o2')
  1309. ]
  1310. self.client.patch(rsrc_path + '/fcr:versions/v1')
  1311. revert_rsp = self.client.get(rsrc_path)
  1312. revert_gr = Graph().parse(data=revert_rsp.data, format='turtle')
  1313. assert revert_gr[
  1314. URIRef(g.webroot + '/test_revert_version')
  1315. : URIRef('urn:demo:p1')
  1316. : URIRef('urn:demo:o1')
  1317. ]
  1318. def test_resurrection(self):
  1319. """
  1320. Delete and then resurrect a resource.
  1321. Make sure that the resource is resurrected to the latest version.
  1322. """
  1323. path = '/ldp/test_lazarus'
  1324. self.client.put(path)
  1325. self.client.post(path + '/fcr:versions', headers={'slug': 'v1'})
  1326. self.client.put(
  1327. path, headers={'content-type': 'text/turtle'},
  1328. data=b'<> <urn:demo:p1> <urn:demo:o1> .')
  1329. self.client.post(path + '/fcr:versions', headers={'slug': 'v2'})
  1330. self.client.put(
  1331. path, headers={'content-type': 'text/turtle'},
  1332. data=b'<> <urn:demo:p1> <urn:demo:o2> .')
  1333. self.client.delete(path)
  1334. assert self.client.get(path).status_code == 410
  1335. self.client.post(path + '/fcr:tombstone')
  1336. laz_data = self.client.get(path).data
  1337. laz_gr = Graph().parse(data=laz_data, format='turtle')
  1338. assert laz_gr[
  1339. URIRef(g.webroot + '/test_lazarus')
  1340. : URIRef('urn:demo:p1')
  1341. : URIRef('urn:demo:o2')
  1342. ]