ldp_factory.py 8.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243
  1. import logging
  2. from pprint import pformat
  3. from uuid import uuid4
  4. from rdflib import Graph, parser, plugin, serializer
  5. from rdflib.resource import Resource
  6. from rdflib.namespace import RDF
  7. from lakesuperior.model.ldpr import Ldpr
  8. from lakesuperior.model.ldp_nr import LdpNr
  9. from lakesuperior.model.ldp_rs import LdpRs, Ldpc, LdpDc, LdpIc
  10. from lakesuperior.config_parser import config
  11. from lakesuperior.env import env
  12. from lakesuperior.dictionaries.namespaces import ns_collection as nsc
  13. from lakesuperior.exceptions import (
  14. IncompatibleLdpTypeError, InvalidResourceError, ResourceExistsError,
  15. ResourceNotExistsError, TombstoneError)
  16. LDP_NR_TYPE = nsc['ldp'].NonRDFSource
  17. LDP_RS_TYPE = nsc['ldp'].RDFSource
  18. rdfly = env.app_globals.rdfly
  19. logger = logging.getLogger(__name__)
  20. class LdpFactory:
  21. """
  22. Generate LDP instances.
  23. The instance classes are based on provided client data or on stored data.
  24. """
  25. @staticmethod
  26. def new_container(uid):
  27. if not uid.startswith('/') or uid == '/':
  28. raise InvalidResourceError(uid)
  29. if rdfly.ask_rsrc_exists(uid):
  30. raise ResourceExistsError(uid)
  31. rsrc = Ldpc(uid, provided_imr=Graph(identifier=nsc['fcres'][uid]))
  32. return rsrc
  33. @staticmethod
  34. def from_stored(uid, repr_opts={}, **kwargs):
  35. """
  36. Create an instance for retrieval purposes.
  37. This factory method creates and returns an instance of an LDPR subclass
  38. based on information that needs to be queried from the underlying
  39. graph store.
  40. N.B. The resource must exist.
  41. :param uid: UID of the instance.
  42. """
  43. #logger.info('Retrieving stored resource: {}'.format(uid))
  44. imr_urn = nsc['fcres'][uid]
  45. rsrc_meta = rdfly.get_metadata(uid)
  46. #logger.debug('Extracted metadata: {}'.format(
  47. # pformat(set(rsrc_meta))))
  48. rdf_types = set(rsrc_meta[imr_urn : RDF.type])
  49. if LDP_NR_TYPE in rdf_types:
  50. logger.info('Resource is a LDP-NR.')
  51. rsrc = LdpNr(uid, repr_opts, **kwargs)
  52. elif LDP_RS_TYPE in rdf_types:
  53. logger.info('Resource is a LDP-RS.')
  54. rsrc = LdpRs(uid, repr_opts, **kwargs)
  55. else:
  56. raise ResourceNotExistsError(uid)
  57. # Sneak in the already extracted metadata to save a query.
  58. rsrc._metadata = rsrc_meta
  59. return rsrc
  60. @staticmethod
  61. def from_provided(
  62. uid, mimetype=None, stream=None, init_gr=None, **kwargs):
  63. r"""
  64. Create and LDPR instance from provided data.
  65. the LDP class (LDP-RS, LDP_NR, etc.) is determined by the contents
  66. passed.
  67. :param str uid: UID of the resource to be created or updated.
  68. :param str mimetype: The provided content MIME type.
  69. :param stream: The provided data stream. This can be
  70. RDF or non-RDF content, or None. In the latter case, an empty
  71. container is created.
  72. :type stream: IOStream or None
  73. :param rdflib.Graph init_gr: Initial graph to populate the
  74. resource with, alternatively to ``stream``. This can be
  75. used for LDP-RS and LDP-NR types alike.
  76. :param \*\*kwargs: Arguments passed to the LDP class constructor.
  77. """
  78. uri = nsc['fcres'][uid]
  79. # If no content or MIME type is passed, create an empty LDPC.
  80. if not any((stream, mimetype, init_gr)):
  81. logger.info('No data received in request. '
  82. 'Creating empty container.')
  83. inst = Ldpc(uid, provided_imr=Graph(identifier=uri), **kwargs)
  84. # Make sure we are not updating an LDP-NR with an LDP-RS.
  85. if inst.is_stored and LDP_NR_TYPE in inst.ldp_types:
  86. raise IncompatibleLdpTypeError(uid, mimetype)
  87. # Otherwise, determine LDP type from provided content.
  88. else:
  89. # If the stream is RDF, or an IMR is provided, create a container
  90. # and populate it with provided RDF data.
  91. provided_imr = Graph(identifier=uri)
  92. # Provided RDF stream overrides provided IMR.
  93. if __class__.is_rdf_parsable(mimetype) :
  94. provided_imr.parse(
  95. data=stream.read(), format=mimetype, publicID=uri)
  96. elif init_gr:
  97. provided_imr += init_gr
  98. #logger.debug('Provided graph: {}'.format(
  99. # pformat(set(provided_imr))))
  100. if not mimetype or __class__.is_rdf_parsable(mimetype):
  101. # Determine whether it is a basic, direct or indirect
  102. # container.
  103. if Ldpr.MBR_RSRC_URI in provided_imr.predicates() and \
  104. Ldpr.MBR_REL_URI in provided_imr.predicates():
  105. if Ldpr.INS_CNT_REL_URI in provided_imr.predicates():
  106. cls = LdpIc
  107. else:
  108. cls = LdpDc
  109. else:
  110. cls = Ldpc
  111. inst = cls(uid, provided_imr=provided_imr, **kwargs)
  112. # Make sure we are not updating an LDP-NR with an LDP-RS.
  113. if inst.is_stored and LDP_NR_TYPE in inst.ldp_types:
  114. raise IncompatibleLdpTypeError(uid, mimetype)
  115. if kwargs.get('handling', 'strict') != 'none':
  116. inst._check_mgd_terms(inst.provided_imr)
  117. else:
  118. # Create a LDP-NR and equip it with the binary file provided.
  119. inst = LdpNr(uid, stream=stream, mimetype=mimetype,
  120. provided_imr=provided_imr, **kwargs)
  121. # Make sure we are not updating an LDP-RS with an LDP-NR.
  122. if inst.is_stored and LDP_RS_TYPE in inst.ldp_types:
  123. raise IncompatibleLdpTypeError(uid, mimetype)
  124. logger.info('Creating resource of type: {}'.format(
  125. inst.__class__.__name__))
  126. try:
  127. types = inst.types
  128. except (TombstoneError, ResourceNotExistsError):
  129. types = set()
  130. return inst
  131. @staticmethod
  132. def is_rdf_parsable(mimetype):
  133. """
  134. Checks whether a MIME type support RDF parsing by a RDFLib plugin.
  135. :param str mimetype: MIME type to check.
  136. """
  137. try:
  138. plugin.get(mimetype, parser.Parser)
  139. except plugin.PluginException:
  140. return False
  141. else:
  142. return True
  143. @staticmethod
  144. def is_rdf_serializable(mimetype):
  145. """
  146. Checks whether a MIME type support RDF serialization by a RDFLib plugin
  147. :param str mimetype: MIME type to check.
  148. """
  149. try:
  150. plugin.get(mimetype, serializer.Serializer)
  151. except plugin.PluginException:
  152. return False
  153. else:
  154. return True
  155. @staticmethod
  156. def mint_uid(parent_uid, path=None):
  157. """
  158. Mint a new resource UID based on client directives.
  159. This method takes a parent ID and a tentative path and returns an LDP
  160. resource UID.
  161. This may raise an exception resulting in a 404 if the parent is not
  162. found or a 409 if the parent is not a valid container.
  163. :param str parent_uid: UID of the parent resource. It must be an
  164. existing LDPC.
  165. :param str path: path to the resource, relative to the parent.
  166. :rtype: str
  167. :return: The confirmed resource UID. This may be different from
  168. what has been indicated.
  169. """
  170. def split_if_legacy(uid):
  171. if config['application']['store']['ldp_rs']['legacy_ptree_split']:
  172. uid = tbox.split_uuid(uid)
  173. return uid
  174. if path and path.startswith('/'):
  175. raise ValueError('Slug cannot start with a slash.')
  176. # Shortcut!
  177. if not path and parent_uid == '/':
  178. return '/' + split_if_legacy(str(uuid4()))
  179. if not parent_uid.startswith('/'):
  180. raise ValueError('Invalid parent UID: {}'.format(parent_uid))
  181. parent = LdpFactory.from_stored(parent_uid)
  182. if nsc['ldp'].Container not in parent.types:
  183. raise InvalidResourceError(parent_uid,
  184. 'Parent {} is not a container.')
  185. pfx = parent_uid.rstrip('/') + '/'
  186. if path:
  187. cnd_uid = pfx + path
  188. if not rdfly.ask_rsrc_exists(cnd_uid):
  189. return cnd_uid
  190. return pfx + split_if_legacy(str(uuid4()))