test_ldp.py 9.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287
  1. import pytest
  2. import uuid
  3. from hashlib import sha1
  4. from flask import url_for
  5. from rdflib import Graph
  6. from rdflib.namespace import RDF
  7. from rdflib.term import Literal, URIRef
  8. from lakesuperior.dictionaries.namespaces import ns_collection as nsc
  9. from lakesuperior.model.ldpr import Ldpr
  10. from lakesuperior.toolbox import Toolbox
  11. @pytest.fixture(scope='module')
  12. def random_uuid():
  13. return str(uuid.uuid4())
  14. @pytest.mark.usefixtures('client_class')
  15. @pytest.mark.usefixtures('db')
  16. class TestLdp:
  17. '''
  18. Test HTTP interaction with LDP endpoint.
  19. '''
  20. def test_get_root_node(self):
  21. '''
  22. Get the root node from two different endpoints.
  23. The test triplestore must be initialized, hence the `db` fixture.
  24. '''
  25. ldp_resp = self.client.get('/ldp')
  26. rest_resp = self.client.get('/rest')
  27. assert ldp_resp.status_code == 200
  28. assert rest_resp.status_code == 200
  29. #assert ldp_resp.data == rest_resp.data
  30. def test_post_resource(self, client):
  31. '''
  32. Check response headers for a POST operation with empty payload.
  33. '''
  34. res = self.client.post('/ldp/')
  35. assert res.status_code == 201
  36. assert 'Location' in res.headers
  37. def test_put_empty_resource(self, random_uuid):
  38. '''
  39. Check response headers for a PUT operation with empty payload.
  40. '''
  41. res = self.client.put('/ldp/{}'.format(random_uuid))
  42. assert res.status_code == 201
  43. def test_put_existing_resource(self, random_uuid):
  44. '''
  45. Trying to PUT an existing resource should return a 204 if the payload
  46. is empty.
  47. '''
  48. path = '/ldp/nonidempotent01'
  49. assert self.client.put(path).status_code == 201
  50. assert self.client.get(path).status_code == 200
  51. assert self.client.put(path).status_code == 204
  52. def test_put_ldp_rs(self, client):
  53. '''
  54. PUT a resource with RDF payload and verify.
  55. '''
  56. with open('tests/data/marcel_duchamp_single_subject.ttl', 'rb') as f:
  57. self.client.put('/ldp/ldprs01', data=f, content_type='text/turtle')
  58. resp = self.client.get('/ldp/ldprs01', headers={'accept' : 'text/turtle'})
  59. assert resp.status_code == 200
  60. g = Graph().parse(data=resp.data, format='text/turtle')
  61. assert URIRef('http://vocab.getty.edu/ontology#Subject') in \
  62. g.objects(None, RDF.type)
  63. def test_put_ldp_nr(self, rnd_img):
  64. '''
  65. PUT a resource with binary payload and verify checksums.
  66. '''
  67. rnd_img['content'].seek(0)
  68. self.client.put('/ldp/ldpnr01', data=rnd_img['content'], headers={
  69. 'Content-Disposition' : 'attachment; filename={}'.format(
  70. rnd_img['filename'])})
  71. resp = self.client.get('/ldp/ldpnr01', headers={'accept' : 'image/png'})
  72. assert resp.status_code == 200
  73. assert sha1(resp.data).hexdigest() == rnd_img['hash']
  74. @pytest.mark.usefixtures('client_class')
  75. @pytest.mark.usefixtures('db')
  76. class TestPrefHeader:
  77. '''
  78. Test various combinations of `Prefer` header.
  79. '''
  80. @pytest.fixture(scope='class')
  81. def cont_structure(self):
  82. '''
  83. Create a container structure to be used for subsequent requests.
  84. '''
  85. parent_path = '/ldp/test_parent'
  86. self.client.put(parent_path)
  87. self.client.put(parent_path + '/child1')
  88. self.client.put(parent_path + '/child2')
  89. self.client.put(parent_path + '/child3')
  90. return {
  91. 'path' : parent_path,
  92. 'response' : self.client.get(parent_path),
  93. 'subject' : URIRef(Toolbox().base_url + '/test_parent')
  94. }
  95. def test_put_prefer_handling(self, random_uuid):
  96. '''
  97. Trying to PUT an existing resource should:
  98. - Return a 204 if the payload is empty
  99. - Return a 204 if the payload is RDF, server-managed triples are
  100. included and the 'Prefer' header is set to 'handling=lenient'
  101. - Return a 412 (ServerManagedTermError) if the payload is RDF,
  102. server-managed triples are included and handling is set to 'strict'
  103. '''
  104. path = '/ldp/put_pref_header01'
  105. assert self.client.put(path).status_code == 201
  106. assert self.client.get(path).status_code == 200
  107. assert self.client.put(path).status_code == 204
  108. with open('tests/data/rdf_payload_w_srv_mgd_trp.ttl', 'rb') as f:
  109. rsp_len = self.client.put(
  110. '/ldp/{}'.format(random_uuid),
  111. headers={
  112. 'Prefer' : 'handling=lenient',
  113. 'Content-Type' : 'text/turtle',
  114. },
  115. data=f
  116. )
  117. assert rsp_len.status_code == 204
  118. with open('tests/data/rdf_payload_w_srv_mgd_trp.ttl', 'rb') as f:
  119. rsp_strict = self.client.put(
  120. path,
  121. headers={
  122. 'Prefer' : 'handling=strict',
  123. 'Content-Type' : 'text/turtle',
  124. },
  125. data=f
  126. )
  127. assert rsp_strict.status_code == 412
  128. def test_embed_children(self, cont_structure):
  129. '''
  130. verify the "embed children" prefer header.
  131. '''
  132. parent_path = cont_structure['path']
  133. cont_resp = cont_structure['response']
  134. cont_subject = cont_structure['subject']
  135. minimal_resp = self.client.get(parent_path, headers={
  136. 'Prefer' : 'return=minimal',
  137. })
  138. incl_embed_children_resp = self.client.get(parent_path, headers={
  139. 'Prefer' : 'return=representation; include={}'\
  140. .format(Ldpr.EMBED_CHILD_RES_URI),
  141. })
  142. omit_embed_children_resp = self.client.get(parent_path, headers={
  143. 'Prefer' : 'return=representation; omit={}'\
  144. .format(Ldpr.EMBED_CHILD_RES_URI),
  145. })
  146. assert omit_embed_children_resp.data == cont_resp.data
  147. incl_g = Graph().parse(
  148. data=incl_embed_children_resp.data, format='turtle')
  149. omit_g = Graph().parse(
  150. data=omit_embed_children_resp.data, format='turtle')
  151. children = set(incl_g[cont_subject : nsc['ldp'].contains])
  152. assert len(children) == 3
  153. children = set(incl_g[cont_subject : nsc['ldp'].contains])
  154. for child_uri in children:
  155. assert set(incl_g[ child_uri : : ])
  156. assert not set(omit_g[ child_uri : : ])
  157. def test_return_children(self, cont_structure):
  158. '''
  159. verify the "return children" prefer header.
  160. '''
  161. parent_path = cont_structure['path']
  162. cont_resp = cont_structure['response']
  163. cont_subject = cont_structure['subject']
  164. incl_children_resp = self.client.get(parent_path, headers={
  165. 'Prefer' : 'return=representation; include={}'\
  166. .format(Ldpr.RETURN_CHILD_RES_URI),
  167. })
  168. omit_children_resp = self.client.get(parent_path, headers={
  169. 'Prefer' : 'return=representation; omit={}'\
  170. .format(Ldpr.RETURN_CHILD_RES_URI),
  171. })
  172. assert incl_children_resp.data == cont_resp.data
  173. incl_g = Graph().parse(data=incl_children_resp.data, format='turtle')
  174. omit_g = Graph().parse(data=omit_children_resp.data, format='turtle')
  175. children = incl_g[cont_subject : nsc['ldp'].contains]
  176. for child_uri in children:
  177. assert not omit_g[ cont_subject : nsc['ldp'].contains : child_uri ]
  178. def test_inbound_rel(self, cont_structure):
  179. '''
  180. verify the "inboud relationships" prefer header.
  181. '''
  182. parent_path = cont_structure['path']
  183. cont_resp = cont_structure['response']
  184. cont_subject = cont_structure['subject']
  185. incl_inbound_resp = self.client.get(parent_path, headers={
  186. 'Prefer' : 'return=representation; include={}'\
  187. .format(Ldpr.RETURN_INBOUND_REF_URI),
  188. })
  189. omit_inbound_resp = self.client.get(parent_path, headers={
  190. 'Prefer' : 'return=representation; omit={}'\
  191. .format(Ldpr.RETURN_INBOUND_REF_URI),
  192. })
  193. assert omit_inbound_resp.data == cont_resp.data
  194. incl_g = Graph().parse(data=incl_inbound_resp.data, format='turtle')
  195. omit_g = Graph().parse(data=omit_inbound_resp.data, format='turtle')
  196. assert set(incl_g[ : : cont_subject ])
  197. assert not set(omit_g[ : : cont_subject ])
  198. def test_srv_mgd_triples(self, cont_structure):
  199. '''
  200. verify the "server managed triples" prefer header.
  201. '''
  202. parent_path = cont_structure['path']
  203. cont_resp = cont_structure['response']
  204. cont_subject = cont_structure['subject']
  205. incl_srv_mgd_resp = self.client.get(parent_path, headers={
  206. 'Prefer' : 'return=representation; include={}'\
  207. .format(Ldpr.RETURN_SRV_MGD_RES_URI),
  208. })
  209. omit_srv_mgd_resp = self.client.get(parent_path, headers={
  210. 'Prefer' : 'return=representation; omit={}'\
  211. .format(Ldpr.RETURN_SRV_MGD_RES_URI),
  212. })
  213. assert incl_srv_mgd_resp.data == cont_resp.data
  214. incl_g = Graph().parse(data=incl_srv_mgd_resp.data, format='turtle')
  215. omit_g = Graph().parse(data=omit_srv_mgd_resp.data, format='turtle')
  216. for pred in {
  217. nsc['fcrepo'].created,
  218. nsc['fcrepo'].createdBy,
  219. nsc['fcrepo'].lastModified,
  220. nsc['fcrepo'].lastModifiedBy,
  221. nsc['ldp'].contains,
  222. }:
  223. assert set(incl_g[ cont_subject : pred : ])
  224. assert not set(omit_g[ cont_subject : pred : ])
  225. for type in {
  226. nsc['fcrepo'].Resource,
  227. nsc['ldp'].Container,
  228. nsc['ldp'].Resource,
  229. }:
  230. assert incl_g[ cont_subject : RDF.type : type ]
  231. assert not omit_g[ cont_subject : RDF.type : type ]