store_interface.h 19 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538
  1. /** @file store_interface.h
  2. *
  3. * @brief Common store back end interfaces.
  4. *
  5. * Code using the store interface should NOT include this header, but rather
  6. * `store.h`.
  7. *
  8. * This header is included by all back end implementations, which are in
  9. * turn included by `store.h`.
  10. *
  11. * The basic interfaces for store and store iterator implementations are
  12. * defined here. New store implementations should include this header and
  13. * implement three basic elements:
  14. *
  15. * - A structure representing the store back end. This structure will be
  16. * opaque to all downstream code and its layout is entirely up to the
  17. * implementer.
  18. *
  19. * - A structure representing a store iterator state, also opaque.
  20. *
  21. * - The LSUP_StoreInt interface with all the functions defined in the
  22. * interface necessary to interact with the store.
  23. *
  24. * See the `store_htable.{c,h}` and `store_mdb.{c,h}` files for examples of
  25. * fully functioning implementations.
  26. *
  27. * The #LSUP_StoreInt structure defines a store interface for raw buffer
  28. * triples. Nothing in the store functions' signatures should hint at RDF
  29. * triples—they should accept and produce exclusively raw byte buffers
  30. * (#LSUP_Buffer). A store interface may have any of the `LSUP_STORE_*` feature
  31. * flags which should be reflected in the way its members are implemented.
  32. */
  33. #ifndef _LSUP_STORE_INTERFACE_H
  34. #define _LSUP_STORE_INTERFACE_H
  35. #include "environment.h"
  36. /*
  37. * Store feature flags. Each flag is a distinct bit, so flags can be OR-ed.
  38. *
  39. * NOTE: LSUP_STORE_PERM need only be set by an implementation based on whether
  40. * its path is on a default temporary dir (e.g. LSUP_MDB_RAMDISK_PATH). If this
  41. * flag is not set, it means the data will be cleared before the next execution
  42. * of the program. However, its being set does not guarantee the persistence of
  43. * the medium (e.g. a "permanent" store may have been created ad hoc on a
  44. * tmpfs).
  45. */
  46. typedef enum {
  47. LSUP_STORE_PERM = 1<<0, ///< Store is on a permanent support.
  48. LSUP_STORE_CTX = 1<<1, ///< Store supports contexts (quads).
  49. LSUP_STORE_IDX = 1<<2, ///< Store is fully SPO(C)-indexed.
  50. LSUP_STORE_TXN = 1<<3, ///< Supports transaction handling.
  51. LSUP_STORE_COW = 1<<4, ///< Copy on write. @sa #iter_next_fn_t()
  52. //LSUP_STORE_NET = 1<<5, ///< (Disabled) Store is over a network protocol.
  53. } LSUP_StoreFeature;
  54. /*
  55. * Store function types.
  56. */
  57. /** @brief Prototype: create any environment necessary for the store to work.
  58. *
  59. * This function should be idempotent on separate calls to the same `id`,
  60. * unless the `clear` option is set to `true`.
  61. *
  62. * @param[in] id Identifier to use for the store. This should be
  63. * a URI that uniquely identifies a back end for the implementation using it,
  64. * e.g. a SQL connection string, file path for an embedded store, the URL of a
  65. * REST API endpoint, etc. It may also be NULL, in which case the default
  66. * identifier set by the implementation is used. The pointer is passed by value
  67. * and never updated; the ID of an existing store is read via #store_id_fn_t .
  68. *
  69. * @param[in] clear Whether to remove an existing environment with the same ID.
  70. */
  71. typedef LSUP_rc (*store_setup_fn_t)(const char *id, bool clear);
  72. /** @brief Prototype: create a new store.
  73. *
  74. * @param[in] id Identifier for the new store. How this is interpreted, and
  75. * whether it is even used, depends on the implementation, which should
  76. * provide documentation on how to pass and interpret this parameter.
  77. *
  78. * @param[in] size Initial size for the store. It may be 0. Only meaningful
  79. * for stores that may preallocate memory, such as #HTStore.
  80. *
  81. * @return New store handle, opaque to callers. Free with #store_free_fn_t.
  82. */
  83. typedef void * (*store_new_fn_t)(const char *id, size_t size);
  84. /** @brief Prototype: free store handle.
  85. *
  86. * @param[in] store Store handle, as returned by #store_new_fn_t. It must not
  87. * be used again after this call.
  88. */
  89. typedef void (*store_free_fn_t)(void *store);
  90. /** @brief Prototype: get the store ID.
  91. *
  92. * @param[in] store Store handle. It is not modified.
  93. *
  94. * @return Store ID string. This is a copy: the caller should free it after use.
  95. */
  96. typedef char * (*store_id_fn_t)(const void *store);
  97. /** @brief Prototype: get store size.
  98. *
  99. * @param[in] store The store to calculate the size of. It is not modified.
  100. *
  101. * @return Number of stored SPO triples (across all contexts if supported).
  102. */
  103. typedef size_t (*store_size_fn_t)(const void *store);
  104. #if 0
  105. /** @brief Prototype: print stats about a store (disabled by `#if 0`).
  106. *
  107. * TODO Define the type and direction of `stat`; it is not documented yet.
  108. *
  109. * @param[in] store The store to get stats for.
  110. */
  111. typedef LSUP_rc (*store_stat_fn_t)(void *store, void *stat);
  112. #endif
  113. /** @brief Prototype: begin a transaction.
  114. *
  115. * Only for LSUP_STORE_TXN stores.
  116. *
  117. * The transaction handle is managed by the store implementation and can be any
  118. * data type. See also #store_txn_commit_fn_t and #store_txn_abort_fn_t.
  119. *
  120. * @param[in] store Store handle.
  121. *
  122. * @param[in] flags Transaction flags. These vary with each implementation.
  123. *
  124. * @param[out] txn Will point to the new open transaction on success, or to
  125. * undefined content on failure.
  126. *
  127. * @return LSUP_OK if the transaction started successfully, <0 on error.
  128. */
  129. typedef LSUP_rc (*store_txn_begin_fn_t)(void *store, int flags, void **txn);
  130. /** @brief Prototype: commit a transaction.
  131. *
  132. * Only for LSUP_STORE_TXN stores.
  133. *
  134. * @param[in] store Store handle. No transaction handle is passed: presumably
  135. * the store tracks the transaction opened via #store_txn_begin_fn_t - TODO
  136. * confirm, since the signature has no `txn` parameter.
  137. *
  138. * @return LSUP_OK if the transaction was committed successfully, <0 on error.
  139. */
  140. typedef LSUP_rc (*store_txn_commit_fn_t)(void *store);
  141. /** @brief Prototype: abort a transaction.
  142. *
  143. * Only for LSUP_STORE_TXN stores.
  144. *
  145. * @param[in] store Store handle. No transaction handle is passed: presumably
  146. * the store tracks the transaction opened via #store_txn_begin_fn_t - TODO
  147. * confirm, since the signature has no `txn` parameter.
  148. */
  149. typedef void (*store_txn_abort_fn_t)(void *store);
  150. /** @brief Prototype: initialize bulk triple load.
  151. *
  152. * This is the first step of a bulk load. It is best used when the data at hand
  153. * need to be pre-processed, which can be done in the same loop as the next
  154. * step to keep memory usage low.
  155. *
  156. * @param[in] store The store to add to.
  157. *
  158. * @param[in] sc Context as a serialized term. If this is NULL, and the
  159. * default context is not NULL, triples will be added to the default context
  160. * for the store. If the default context for the store is NULL, regardless of
  161. * the value of sc, triples will be added with no context. Only meaningful
  162. * for stores with the LSUP_STORE_CTX feature.
  163. *
  164. * @param[in] udata User data. Consult individual store implementations for
  165. * how this is interpreted.
  166. *
  167. * @return Iterator handle to be passed to the following load steps.
  168. */
  169. typedef void * (*store_add_init_fn_t)(
  170. void *store, const LSUP_Buffer *sc, void *udata);
  171. /** @brief Prototype: add one triple into the store.
  172. *
  173. * This must be called after #store_add_init_fn_t, using the iterator
  174. * yielded by that function. It may be called multiple times and must be
  175. * followed by #store_add_done_fn_t or #store_add_abort_fn_t (if supported).
  176. *
  177. * @param[in] it Iterator obtained by #store_add_init_fn_t. It is opaque to
  178. * callers; in some implementations `it->i` stores the total number of
  179. * records inserted (TODO confirm which ones).
  180. *
  181. * @param[in] sspo Serialized triple to be added.
  182. *
  183. * @return LSUP_OK if the triple was inserted; LSUP_NOACTION if the triple
  184. * already existed; LSUP_DB_ERR if a back end (e.g. MDB) error occurred.
  185. */
  186. typedef LSUP_rc (*store_add_iter_fn_t)(
  187. void *it, const LSUP_BufferTriple * sspo);
  188. /** @brief Prototype: abort an add loop and free iterator.
  189. *
  190. * Usually called on an irrecoverable error from #store_add_iter_fn_t. None of
  191. * the successful inserts in the same loop is retained.
  192. *
  193. * @param[in] it Iterator obtained by #store_add_init_fn_t.
  194. */
  195. typedef void (*store_add_abort_fn_t)(void *it);
  196. /*
  197. * Iterator function types.
  198. */
  199. /** @brief Prototype: get iterator active transaction handle.
  200. *
  201. * This function is used to get an active transaction during an iteration loop
  202. * in order to perform an action using the store state within that loop. Some
  203. * stores (e.g. MDB) only support one R/W open transaction per thread, so this
  204. * is also the only way to perform anything other than iterating or committing
  205. * while a loop is open.
  206. *
  207. * @param[in] it Iterator handle to get the transaction from.
  208. *
  209. * @return Transaction handle. DO NOT close this transaction directly.
  210. */
  211. typedef void * (*iter_txn_fn_t)(void *it);
  212. /** @brief Prototype: finalize an add loop and free iterator.
  213. *
  214. * This must be called after the last #store_add_iter_fn_t call of the loop.
  215. *
  216. * @param[in] it Iterator obtained by #store_add_init_fn_t.
  217. * @return #LSUP_rc status code; its values are not specified here (TODO). */
  218. typedef LSUP_rc (*store_add_done_fn_t)(void *it);
  219. /** @brief Prototype: add a single term to the store.
  220. *
  221. * @param[in] store Store handle.
  222. * @param[in] sterm Serialized term to store. It is not modified.
  223. * @param[in] udata User data; its interpretation is up to each implementation.
  224. */
  225. typedef LSUP_rc (*store_add_term_fn_t)(
  226. void *store, const LSUP_Buffer *sterm, void *udata);
  227. /** @brief Prototype: look up triples by pattern matching.
  228. *
  229. * This function may return a count of matches and/or an iterator of results as
  230. * serialized triples.
  231. *
  232. * For stores with #LSUP_STORE_TXN, this opens a read-only transaction. The
  233. * transaction handle is held in the iterator structure and is closed when the
  234. * iterator is freed with #iter_free_fn_t().
  235. *
  236. * Any and all of the terms may be NULL, which indicates an unbound query
  237. * term. Stores without context support will always ignore sc.
  238. *
  239. * @param[in] store The store to be queried.
  240. *
  241. * @param[in] ss Serialized s term.
  242. *
  243. * @param[in] sp Serialized p term.
  244. *
  245. * @param[in] so Serialized o term.
  246. *
  247. * @param[in] sc Serialized context to limit search to. It may be NULL, in
  248. * which case search is done in all contexts. Note that triples inserted
  249. * without context are assigned the *default* context for the store.
  250. *
  251. * @param[in] udata User data. Consult individual store implementations for
  252. * how this is interpreted.
  253. *
  254. * @param[out] ct If not NULL, this will be populated with the number of
  255. * entries found. It is very inexpensive to set for lookups without context,
  256. * much less so for 1-bound and 2-bound context lookups, in which cases it
  257. * should be set only if needed.
  258. *
  259. * @return Iterator handle that will be populated with a result iterator. This
  260. * is always created even if no matches are found and must be freed with
  261. * #iter_free_fn_t() after use. If matches are found, the iterator points to
  262. * the first result which can be retrieved with #iter_next_fn_t().
  263. */
  264. typedef void * (*store_lookup_fn_t)(
  265. void *store,
  266. const LSUP_Buffer *ss, const LSUP_Buffer *sp, const LSUP_Buffer *so,
  267. const LSUP_Buffer *sc, void *udata, size_t *ct);
  268. /** @brief Prototype: check for existence of a triple (T/F).
  269. *
  270. * @param[in] store Store to be queried.
  271. *
  272. * @param[in] sspo Triple to look up. None of its members may be NULL.
  273. *
  274. * @param[in] sc Optional context to look into. It may be NULL. It is
  275. * disregarded by stores without the LSUP_STORE_CTX feature.
  276. *
  277. * @return Whether the triple exists in the store (/context).
  278. */
  279. typedef bool (*store_trp_exist_fn_t)(
  280. void *store, const LSUP_BufferTriple *sspo, const LSUP_Buffer *sc);
  281. /** @brief Prototype: delete triples by pattern matching.
  282. *
  283. * The ss, sp, so, sc terms act as a matching pattern as documented in
  284. * #store_lookup_fn_t. If not NULL, ct yields the number of triples actually
  285. * deleted.
  286. *
  287. * @param[in] udata User data. Consult individual store implementations for
  288. * how this is interpreted.
  289. */
  290. typedef LSUP_rc (*store_remove_fn_t)(
  291. void *store,
  292. const LSUP_Buffer *ss, const LSUP_Buffer *sp, const LSUP_Buffer *so,
  293. const LSUP_Buffer *sc, void *udata, size_t *ct);
  294. /** @brief Prototype: put an in-memory namespace map into a permanent back end.
  295. *
  296. * This is only available in stores with the LSUP_STORE_PERM feature (but see
  297. * #LSUP_StoreInt, which ties `nsm_put_fn` to #LSUP_STORE_IDX - TODO reconcile).
  298. *
  299. * Existing prefixes and namespaces are not updated. If these are already stored:
  300. *
  301. * ns1: <urn:ns:a#>
  302. * ns2: <urn:ns:b#>
  303. *
  304. * Neither of the following will be inserted:
  305. *
  306. * ns3: <urn:ns:a#>
  307. * ns2: <urn:ns:c#>
  308. *
  309. * @param[in] store Store to update.
  310. *
  311. * @param[in] nsm Namespace map handle to store. It is not modified.
  312. *
  313. * @param[in] udata User-defined data. Consult individual implementations for
  314. * details.
  315. *
  316. * @return LSUP_OK if all terms were updated; LSUP_CONFLICT if one or more
  317. * namespaces or terms were not updated because they already existed; <0 if
  318. * an error occurred.
  319. */
  320. typedef LSUP_rc (*store_nsm_put_fn_t)(
  321. void *store, const LSUP_NSMap * nsm, void *udata);
  322. /** @brief Prototype: get the store's namespace prefix map.
  323. *
  324. * @param[in] store Store to query.
  325. *
  326. * @return NS map or NULL on error. TODO: document who owns (frees) the map.
  327. */
  328. typedef LSUP_NSMap * (*store_nsm_get_fn_t)(void *store);
  329. /** @brief Prototype: yield the matching triples and advance the iterator.
  330. *
  331. * NOTE: Iterators keep transactions open. Don't hold on to them longer than
  332. * necessary.
  333. *
  334. * NOTE: If the store interface has the LSUP_STORE_COW feature, the memory
  335. * buffer referenced by the #LSUP_Buffer handle is owned by the database. It
  336. * must not be written to or freed. To modify the data or use them beyond the
  337. * caller's scope, this memory must be copied. Note that the #LSUP_Buffer
  338. * handle must still be freed (with a plain `free()`), but not the underlying
  339. * data buffer, since only the latter is owned by the back end. For stores
  340. * without the LSUP_STORE_COW feature, data are copied on retrieval and the
  341. * resulting buffers can be freed with #LSUP_buffer_free() or analogous methods.
  342. *
  343. * @param[in] it Opaque iterator handle obtained with #store_lookup_fn_t.
  344. *
  345. * @param[out] sspo #LSUP_BufferTriple to be populated with three serialized
  346. * terms if found. It may be NULL, in which case it is not populated.
  347. *
  348. * @param[out] ctx If not NULL, it is populated with a NULL-terminated array of
  349. * LSUP_Buffer structs, one for each context associated with the matching
  350. * triple. These contexts are the same regardless of the context filter used
  351. * in the lookup. The array is freed with a simple `free()`. This parameter
  352. * is ignored by implementations without the LSUP_STORE_CTX feature.
  353. *
  354. * To iterate over the array (`ctx` below is the caller's `LSUP_Buffer *`):
  355. *
  356. *     size_t i = 0;
  357. *     while (ctx[i].addr)  // The last element has a NULL `addr`.
  358. *         do_something(ctx + (i++));
  359. *
  360. * @return LSUP_OK if results were found; LSUP_END if no (more) results were
  361. * found; LSUP_DB_ERR if a backend error occurred.
  362. */
  363. typedef LSUP_rc (*iter_next_fn_t)(
  364. void *it, LSUP_BufferTriple *sspo, LSUP_Buffer **ctx);
  365. /** @brief Prototype: free an iterator allocated by a lookup.
  366. *
  367. * @param[in] it Iterator handle. It is passed by value, so the caller's own
  368. * pointer is not reset to NULL; do not use it after this call. */
  369. typedef void (*iter_free_fn_t)(void * it);
  370. /*
  371. * Interface type definitions.
  372. */
  373. /** @brief Store interface.
  374. *
  375. * New store implementations should define a static structure with the relevant
  376. * members filled in. Some members are only relevant to certain types of stores
  377. * and may be set to NULL.
  378. *
  379. * #setup_fn may be optionally defined and MUST cause an idempotent action,
  380. * unless the `clear` argument is set to `true`. Callers should check if this
  381. * member is NULL and if it is not, call it at the beginning of the
  382. * interaction with the store.
  383. *
  384. * Transaction control members are only applicable to stores with the
  385. * #LSUP_STORE_TXN feature.
  386. */
  387. typedef struct store_if_t {
  388. // Basic properties.
  389. char name[16]; ///< Store type name (up to 15 chars plus terminator).
  390. LSUP_StoreFeature features; ///< Feature flags (OR-ed LSUP_STORE_* values).
  391. // Allocation, setup and deallocation.
  392. store_setup_fn_t setup_fn; ///< Called before #new_fn. Optional.
  393. store_new_fn_t new_fn; ///< Create a new store instance.
  394. store_free_fn_t free_fn; ///< Free the store.
  395. // Metadata.
  396. store_size_fn_t size_fn; ///< Number of triples in the store.
  397. store_id_fn_t id_fn; ///< Get store ID.
  398. // Transaction control.
  399. store_txn_begin_fn_t txn_begin_fn; ///< Begin transaction.
  400. store_txn_commit_fn_t txn_commit_fn; ///< Commit transaction.
  401. store_txn_abort_fn_t txn_abort_fn; ///< Abort transaction.
  402. iter_txn_fn_t iter_txn_fn; ///< Get iterator's transaction.
  403. // Addition.
  404. store_add_init_fn_t add_init_fn; ///< Initialize add iteration.
  405. store_add_iter_fn_t add_iter_fn; ///< Add one triple.
  406. store_add_abort_fn_t add_abort_fn; /**< Abort (roll back) the add process.
  407. *
  408. * Only available in
  409. * stores with #LSUP_STORE_TXN
  410. * feature. Optional.
  411. */
  412. store_add_done_fn_t add_done_fn; ///< Complete the add process.
  413. store_add_term_fn_t add_term_fn; /**< Add (index) a term to the store.
  414. *
  415. * Only available in stores with
  416. * #LSUP_STORE_IDX feature. Optional.
  417. */
  418. // Look up.
  419. store_lookup_fn_t lookup_fn; ///< Look up triples by pattern.
  420. //store_trp_exist_fn_t exist_fn; ///< (Disabled) Check if a triple exists.
  421. iter_next_fn_t lu_next_fn; ///< Advance the lookup iterator.
  422. iter_free_fn_t lu_free_fn; ///< Free the lookup iterator.
  423. // Removal.
  424. store_remove_fn_t remove_fn; ///< Remove triples by pattern.
  425. // Namespace prefix mapping.
  426. store_nsm_put_fn_t nsm_put_fn; /**< Store a namespace prefix map.
  427. *
  428. * Only available (and mandatory) in stores with the
  429. * #LSUP_STORE_IDX feature. NOTE(review): #store_nsm_put_fn_t
  430. * names LSUP_STORE_PERM instead - TODO reconcile.
  431. */
  432. store_nsm_get_fn_t nsm_get_fn; /**< Get the store's namespace prefix map.
  433. *
  434. * Only available (and mandatory)
  435. * in stores with the
  436. * #LSUP_STORE_IDX feature.
  437. */
  438. } LSUP_StoreInt;
  439. /*
  440. * Template for a new store and iterator implementation.
  441. * These should be placed in the .c file where the interface functions are
  442. * defined, and declared as `extern` in the related .h file.
  443. const LSUP_StoreInt my_store_int = {
  444. .name = "My Store", // Truncated to 15 chars.
  445. .features = LSUP_STORE_PERM | LSUP_STORE_IDX,
  446. .setup_fn = my_setup_fn,
  447. .new_fn = my_new_fn,
  448. .free_fn = my_free_fn,
  449. .size_fn = my_size_fn,
  450. .id_fn = my_id_fn,
  451. .txn_begin_fn = my_txn_begin_fn,
  452. .txn_commit_fn = my_txn_commit_fn,
  453. .txn_abort_fn = my_txn_abort_fn,
  454. .add_init_fn = my_init_fn,
  455. .add_iter_fn = my_iter_fn,
  456. .add_abort_fn = my_add_abort_fn,
  457. .add_done_fn = my_add_done_fn,
  458. .add_term_fn = my_add_term_fn,
  459. .lookup_fn = my_lookup_fn,
  460. .lu_next_fn = my_iter_next_fn,
  461. .lu_free_fn = my_iter_free_fn,
  462. .remove_fn = my_remove_fn,
  463. .nsm_put_fn = my_nsm_put_fn,
  464. .nsm_get_fn = my_nsm_get_fn,
  465. };
  466. */
  467. #endif /* _LSUP_STORE_INTERFACE_H */