keyset.pyx 4.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159
  1. from cpython.mem cimport PyMem_Malloc, PyMem_Realloc, PyMem_Free
  2. cdef class Keyset:
  3. """
  4. Pre-allocated result set.
  5. Data in the set are stored as a 1D contiguous array of characters.
  6. Access to elements at an arbitrary index position is achieved by using the
  7. ``itemsize`` property multiplied by the index number.
  8. Key properties:
  9. ``ct``: number of elements in the set.
  10. ``itemsize``: size of each element, in bytes. All elements have the same
  11. size.
  12. ``size``: Total size, in bytes, of the data set. This is the product of
  13. ``itemsize`` and ``ct``.
  14. """
  15. def __cinit__(self, size_t ct, unsigned char itemsize):
  16. """
  17. Initialize and allocate memory for the data set.
  18. :param size_t ct: Number of elements to be accounted for.
  19. :param unsigned char itemsize: Size of an individual item.
  20. Note that the ``itemsize`` is an unsigned char,
  21. i.e. an item can be at most 255 bytes. This is for economy reasons,
  22. since many multiplications are done between ``itemsize`` and other
  23. char variables.
  24. """
  25. self.ct = ct
  26. self.itemsize = itemsize
  27. self.size = self.itemsize * self.ct
  28. self._cur = 0
  29. #logger.debug('Got malloc sizes: {}, {}'.format(ct, itemsize))
  30. #logger.debug(
  31. # 'Allocating {0} ({1}x{2}) bytes of Keyset data...'.format(
  32. # self.size, self.ct, self.itemsize))
  33. self.data = <unsigned char *>PyMem_Malloc(ct * itemsize)
  34. if not self.data:
  35. raise MemoryError()
  36. #logger.debug('...done allocating @ {0:x}.'.format(
  37. # <unsigned long>self.data))
  38. def __dealloc__(self):
  39. """
  40. Free the memory.
  41. This is called when the Python instance is garbage collected, which
  42. makes it handy to safely pass a Keyset instance across functions.
  43. """
  44. #logger.debug(
  45. # 'Releasing {0} ({1}x{2}) bytes of Keyset @ {3:x}...'.format(
  46. # self.size, self.ct, self.itemsize,
  47. # <unsigned long>self.data))
  48. PyMem_Free(self.data)
  49. #logger.debug('...done releasing.')
  50. cdef void resize(self, size_t ct) except *:
  51. """
  52. Resize the result set. Uses ``PyMem_Realloc``.
  53. Note that resizing to a smaller size does not copy or reallocate the
  54. data, resizing to a larger size does.
  55. Also, note that only the number of items can be changed, the item size
  56. cannot.
  57. :param size_t ct: Number of items in the result set.
  58. """
  59. cdef unsigned char *tmp
  60. self.ct = ct
  61. self.size = self.itemsize * self.ct
  62. #logger.debug(
  63. # 'Resizing Keyset to {0} ({1}x{2}) bytes @ {3:x}...'.format(
  64. # self.itemsize * ct, ct, self.itemsize,
  65. # <unsigned long>self.data))
  66. tmp = <unsigned char *>PyMem_Realloc(self.data, ct * self.itemsize)
  67. if not tmp:
  68. raise MemoryError()
  69. #logger.debug('...done resizing.')
  70. self.data = tmp
  71. # Access methods.
  72. def to_tuple(self):
  73. """
  74. Return the data set as a Python tuple.
  75. :rtype: tuple
  76. """
  77. return tuple(
  78. self.data[i: i + self.itemsize]
  79. for i in range(0, self.size, self.itemsize))
  80. def get_item_obj(self, i):
  81. """
  82. Get an item at a given index position.
  83. :rtype: bytes
  84. """
  85. if i >= self.ct:
  86. raise ValueError(f'Index {i} out of range.')
  87. return self.get_item(i)[: self.itemsize]
  88. def reset(self):
  89. """
  90. Reset the cursor to the initial position.
  91. """
  92. self._cur = 0
  93. def tell(self):
  94. """
  95. Tell the position of the cursor in the keyset.
  96. """
  97. return self._cur
  98. cdef unsigned char *get_item(self, i):
  99. """
  100. Get an item at a given index position. Cython-level method.
  101. The item size is known by the ``itemsize`` property of the object.
  102. :rtype: unsigned char*
  103. """
  104. self._cur = i
  105. return self.data + self.itemsize * i
  106. cdef bint next(self, void *val):
  107. """
  108. Populate the current value and advance the cursor by 1.
  109. :param void *val: Addres of value returned. It is NULL if
  110. the end of the buffer was reached.
  111. :rtype: bint
  112. :return: True if a value was found, False if the end of the buffer
  113. has been reached.
  114. """
  115. if self._cur >= self.ct:
  116. val = NULL
  117. return False
  118. val = self.data + self.itemsize * self._cur
  119. self._cur += 1
  120. return True