keyset.pyx 3.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122
  1. from cpython.mem cimport PyMem_Malloc, PyMem_Realloc, PyMem_Free
  2. cdef class Keyset:
  3. """
  4. Pre-allocated result set.
  5. Data in the set are stored as a 1D contiguous array of characters.
  6. Access to elements at an arbitrary index position is achieved by using the
  7. ``itemsize`` property multiplied by the index number.
  8. Key properties:
  9. ``ct``: number of elements in the set.
  10. ``itemsize``: size of each element, in bytes. All elements have the same
  11. size.
  12. ``size``: Total size, in bytes, of the data set. This is the product of
  13. ``itemsize`` and ``ct``.
  14. """
  15. def __cinit__(self, size_t ct, unsigned char itemsize):
  16. """
  17. Initialize and allocate memory for the data set.
  18. :param size_t ct: Number of elements to be accounted for.
  19. :param unsigned char itemsize: Size of an individual item.
  20. Note that the ``itemsize`` is an unsigned char,
  21. i.e. an item can be at most 255 bytes. This is for economy reasons,
  22. since many multiplications are done between ``itemsize`` and other
  23. char variables.
  24. """
  25. self.ct = ct
  26. self.itemsize = itemsize
  27. self.size = self.itemsize * self.ct
  28. #logger.debug('Got malloc sizes: {}, {}'.format(ct, itemsize))
  29. #logger.debug(
  30. # 'Allocating {0} ({1}x{2}) bytes of Keyset data...'.format(
  31. # self.size, self.ct, self.itemsize))
  32. self.data = <unsigned char *>PyMem_Malloc(ct * itemsize)
  33. if not self.data:
  34. raise MemoryError()
  35. #logger.debug('...done allocating @ {0:x}.'.format(
  36. # <unsigned long>self.data))
  37. def __dealloc__(self):
  38. """
  39. Free the memory.
  40. This is called when the Python instance is garbage collected, which
  41. makes it handy to safely pass a Keyset instance across functions.
  42. """
  43. #logger.debug(
  44. # 'Releasing {0} ({1}x{2}) bytes of Keyset @ {3:x}...'.format(
  45. # self.size, self.ct, self.itemsize,
  46. # <unsigned long>self.data))
  47. PyMem_Free(self.data)
  48. #logger.debug('...done releasing.')
  49. cdef void resize(self, size_t ct) except *:
  50. """
  51. Resize the result set. Uses ``PyMem_Realloc``.
  52. Note that resizing to a smaller size does not copy or reallocate the
  53. data, resizing to a larger size does.
  54. Also, note that only the number of items can be changed, the item size
  55. cannot.
  56. :param size_t ct: Number of items in the result set.
  57. """
  58. cdef unsigned char *tmp
  59. self.ct = ct
  60. self.size = self.itemsize * self.ct
  61. #logger.debug(
  62. # 'Resizing Keyset to {0} ({1}x{2}) bytes @ {3:x}...'.format(
  63. # self.itemsize * ct, ct, self.itemsize,
  64. # <unsigned long>self.data))
  65. tmp = <unsigned char *>PyMem_Realloc(self.data, ct * self.itemsize)
  66. if not tmp:
  67. raise MemoryError()
  68. #logger.debug('...done resizing.')
  69. self.data = tmp
  70. # Access methods.
  71. def to_tuple(self):
  72. """
  73. Return the data set as a Python tuple.
  74. :rtype: tuple
  75. """
  76. return tuple(
  77. self.data[i: i + self.itemsize]
  78. for i in range(0, self.size, self.itemsize))
  79. def get_item_obj(self, i):
  80. """
  81. Get an item at a given index position.
  82. :rtype: bytes
  83. """
  84. return self.get_item(i)[: self.itemsize]
  85. cdef unsigned char *get_item(self, i):
  86. """
  87. Get an item at a given index position. Cython-level method.
  88. The item size is known by the ``itemsize`` property of the object.
  89. :rtype: unsigned char*
  90. """
  91. return self.data + self.itemsize * i