test_subclassing.py 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469
  1. """Tests suite for MaskedArray & subclassing.
  2. :author: Pierre Gerard-Marchant
  3. :contact: pierregm_at_uga_dot_edu
  4. """
  5. import numpy as np
  6. from numpy.lib.mixins import NDArrayOperatorsMixin
  7. from numpy.ma.core import (
  8. MaskedArray,
  9. add,
  10. arange,
  11. array,
  12. asanyarray,
  13. asarray,
  14. divide,
  15. hypot,
  16. log,
  17. masked,
  18. masked_array,
  19. nomask,
  20. )
  21. from numpy.ma.testutils import assert_equal
  22. from numpy.testing import assert_, assert_raises
  23. # from numpy.ma.core import (
  24. def assert_startswith(a, b):
  25. # produces a better error message than assert_(a.startswith(b))
  26. assert_equal(a[:len(b)], b)
  27. class SubArray(np.ndarray):
  28. # Defines a generic np.ndarray subclass, that stores some metadata
  29. # in the dictionary `info`.
  30. def __new__(cls, arr, info={}):
  31. x = np.asanyarray(arr).view(cls)
  32. x.info = info.copy()
  33. return x
  34. def __array_finalize__(self, obj):
  35. super().__array_finalize__(obj)
  36. self.info = getattr(obj, 'info', {}).copy()
  37. def __add__(self, other):
  38. result = super().__add__(other)
  39. result.info['added'] = result.info.get('added', 0) + 1
  40. return result
  41. def __iadd__(self, other):
  42. result = super().__iadd__(other)
  43. result.info['iadded'] = result.info.get('iadded', 0) + 1
  44. return result
  45. subarray = SubArray
  46. class SubMaskedArray(MaskedArray):
  47. """Pure subclass of MaskedArray, keeping some info on subclass."""
  48. def __new__(cls, info=None, **kwargs):
  49. obj = super().__new__(cls, **kwargs)
  50. obj._optinfo['info'] = info
  51. return obj
  52. class MSubArray(SubArray, MaskedArray):
  53. def __new__(cls, data, info={}, mask=nomask):
  54. subarr = SubArray(data, info)
  55. _data = MaskedArray.__new__(cls, data=subarr, mask=mask)
  56. _data.info = subarr.info
  57. return _data
  58. @property
  59. def _series(self):
  60. _view = self.view(MaskedArray)
  61. _view._sharedmask = False
  62. return _view
  63. msubarray = MSubArray
  64. # Also a subclass that overrides __str__, __repr__ and __setitem__, disallowing
  65. # setting to non-class values (and thus np.ma.core.masked_print_option)
  66. # and overrides __array_wrap__, updating the info dict, to check that this
  67. # doesn't get destroyed by MaskedArray._update_from. But this one also needs
  68. # its own iterator...
  69. class CSAIterator:
  70. """
  71. Flat iterator object that uses its own setter/getter
  72. (works around ndarray.flat not propagating subclass setters/getters
  73. see https://github.com/numpy/numpy/issues/4564)
  74. roughly following MaskedIterator
  75. """
  76. def __init__(self, a):
  77. self._original = a
  78. self._dataiter = a.view(np.ndarray).flat
  79. def __iter__(self):
  80. return self
  81. def __getitem__(self, indx):
  82. out = self._dataiter.__getitem__(indx)
  83. if not isinstance(out, np.ndarray):
  84. out = out.__array__()
  85. out = out.view(type(self._original))
  86. return out
  87. def __setitem__(self, index, value):
  88. self._dataiter[index] = self._original._validate_input(value)
  89. def __next__(self):
  90. return next(self._dataiter).__array__().view(type(self._original))
  91. class ComplicatedSubArray(SubArray):
  92. def __str__(self):
  93. return f'myprefix {self.view(SubArray)} mypostfix'
  94. def __repr__(self):
  95. # Return a repr that does not start with 'name('
  96. return f'<{self.__class__.__name__} {self}>'
  97. def _validate_input(self, value):
  98. if not isinstance(value, ComplicatedSubArray):
  99. raise ValueError("Can only set to MySubArray values")
  100. return value
  101. def __setitem__(self, item, value):
  102. # validation ensures direct assignment with ndarray or
  103. # masked_print_option will fail
  104. super().__setitem__(item, self._validate_input(value))
  105. def __getitem__(self, item):
  106. # ensure getter returns our own class also for scalars
  107. value = super().__getitem__(item)
  108. if not isinstance(value, np.ndarray): # scalar
  109. value = value.__array__().view(ComplicatedSubArray)
  110. return value
  111. @property
  112. def flat(self):
  113. return CSAIterator(self)
  114. @flat.setter
  115. def flat(self, value):
  116. y = self.ravel()
  117. y[:] = value
  118. def __array_wrap__(self, obj, context=None, return_scalar=False):
  119. obj = super().__array_wrap__(obj, context, return_scalar)
  120. if context is not None and context[0] is np.multiply:
  121. obj.info['multiplied'] = obj.info.get('multiplied', 0) + 1
  122. return obj
  123. class WrappedArray(NDArrayOperatorsMixin):
  124. """
  125. Wrapping a MaskedArray rather than subclassing to test that
  126. ufunc deferrals are commutative.
  127. See: https://github.com/numpy/numpy/issues/15200)
  128. """
  129. __slots__ = ('_array', 'attrs')
  130. __array_priority__ = 20
  131. def __init__(self, array, **attrs):
  132. self._array = array
  133. self.attrs = attrs
  134. def __repr__(self):
  135. return f"{self.__class__.__name__}(\n{self._array}\n{self.attrs}\n)"
  136. def __array__(self, dtype=None, copy=None):
  137. return np.asarray(self._array)
  138. def __array_ufunc__(self, ufunc, method, *inputs, **kwargs):
  139. if method == '__call__':
  140. inputs = [arg._array if isinstance(arg, self.__class__) else arg
  141. for arg in inputs]
  142. return self.__class__(ufunc(*inputs, **kwargs), **self.attrs)
  143. else:
  144. return NotImplemented
  145. class TestSubclassing:
  146. # Test suite for masked subclasses of ndarray.
  147. def _create_data(self):
  148. x = np.arange(5, dtype='float')
  149. mx = msubarray(x, mask=[0, 1, 0, 0, 0])
  150. return x, mx
  151. def test_data_subclassing(self):
  152. # Tests whether the subclass is kept.
  153. x = np.arange(5)
  154. m = [0, 0, 1, 0, 0]
  155. xsub = SubArray(x)
  156. xmsub = masked_array(xsub, mask=m)
  157. assert_(isinstance(xmsub, MaskedArray))
  158. assert_equal(xmsub._data, xsub)
  159. assert_(isinstance(xmsub._data, SubArray))
  160. def test_maskedarray_subclassing(self):
  161. # Tests subclassing MaskedArray
  162. mx = self._create_data()[1]
  163. assert_(isinstance(mx._data, subarray))
  164. def test_masked_unary_operations(self):
  165. # Tests masked_unary_operation
  166. x, mx = self._create_data()
  167. with np.errstate(divide='ignore'):
  168. assert_(isinstance(log(mx), msubarray))
  169. assert_equal(log(x), np.log(x))
  170. def test_masked_binary_operations(self):
  171. # Tests masked_binary_operation
  172. x, mx = self._create_data()
  173. # Result should be a msubarray
  174. assert_(isinstance(add(mx, mx), msubarray))
  175. assert_(isinstance(add(mx, x), msubarray))
  176. # Result should work
  177. assert_equal(add(mx, x), mx + x)
  178. assert_(isinstance(add(mx, mx)._data, subarray))
  179. assert_(isinstance(add.outer(mx, mx), msubarray))
  180. assert_(isinstance(hypot(mx, mx), msubarray))
  181. assert_(isinstance(hypot(mx, x), msubarray))
  182. def test_masked_binary_operations2(self):
  183. # Tests domained_masked_binary_operation
  184. x, mx = self._create_data()
  185. xmx = masked_array(mx.data.__array__(), mask=mx.mask)
  186. assert_(isinstance(divide(mx, mx), msubarray))
  187. assert_(isinstance(divide(mx, x), msubarray))
  188. assert_equal(divide(mx, mx), divide(xmx, xmx))
  189. def test_attributepropagation(self):
  190. x = array(arange(5), mask=[0] + [1] * 4)
  191. my = masked_array(subarray(x))
  192. ym = msubarray(x)
  193. #
  194. z = (my + 1)
  195. assert_(isinstance(z, MaskedArray))
  196. assert_(not isinstance(z, MSubArray))
  197. assert_(isinstance(z._data, SubArray))
  198. assert_equal(z._data.info, {})
  199. #
  200. z = (ym + 1)
  201. assert_(isinstance(z, MaskedArray))
  202. assert_(isinstance(z, MSubArray))
  203. assert_(isinstance(z._data, SubArray))
  204. assert_(z._data.info['added'] > 0)
  205. # Test that inplace methods from data get used (gh-4617)
  206. ym += 1
  207. assert_(isinstance(ym, MaskedArray))
  208. assert_(isinstance(ym, MSubArray))
  209. assert_(isinstance(ym._data, SubArray))
  210. assert_(ym._data.info['iadded'] > 0)
  211. #
  212. ym._set_mask([1, 0, 0, 0, 1])
  213. assert_equal(ym._mask, [1, 0, 0, 0, 1])
  214. ym._series._set_mask([0, 0, 0, 0, 1])
  215. assert_equal(ym._mask, [0, 0, 0, 0, 1])
  216. #
  217. xsub = subarray(x, info={'name': 'x'})
  218. mxsub = masked_array(xsub)
  219. assert_(hasattr(mxsub, 'info'))
  220. assert_equal(mxsub.info, xsub.info)
  221. def test_subclasspreservation(self):
  222. # Checks that masked_array(...,subok=True) preserves the class.
  223. x = np.arange(5)
  224. m = [0, 0, 1, 0, 0]
  225. xinfo = list(zip(x, m))
  226. xsub = MSubArray(x, mask=m, info={'xsub': xinfo})
  227. #
  228. mxsub = masked_array(xsub, subok=False)
  229. assert_(not isinstance(mxsub, MSubArray))
  230. assert_(isinstance(mxsub, MaskedArray))
  231. assert_equal(mxsub._mask, m)
  232. #
  233. mxsub = asarray(xsub)
  234. assert_(not isinstance(mxsub, MSubArray))
  235. assert_(isinstance(mxsub, MaskedArray))
  236. assert_equal(mxsub._mask, m)
  237. #
  238. mxsub = masked_array(xsub, subok=True)
  239. assert_(isinstance(mxsub, MSubArray))
  240. assert_equal(mxsub.info, xsub.info)
  241. assert_equal(mxsub._mask, xsub._mask)
  242. #
  243. mxsub = asanyarray(xsub)
  244. assert_(isinstance(mxsub, MSubArray))
  245. assert_equal(mxsub.info, xsub.info)
  246. assert_equal(mxsub._mask, m)
  247. def test_subclass_items(self):
  248. """test that getter and setter go via baseclass"""
  249. x = np.arange(5)
  250. xcsub = ComplicatedSubArray(x)
  251. mxcsub = masked_array(xcsub, mask=[True, False, True, False, False])
  252. # getter should return a ComplicatedSubArray, even for single item
  253. # first check we wrote ComplicatedSubArray correctly
  254. assert_(isinstance(xcsub[1], ComplicatedSubArray))
  255. assert_(isinstance(xcsub[1, ...], ComplicatedSubArray))
  256. assert_(isinstance(xcsub[1:4], ComplicatedSubArray))
  257. # now that it propagates inside the MaskedArray
  258. assert_(isinstance(mxcsub[1], ComplicatedSubArray))
  259. assert_(isinstance(mxcsub[1, ...].data, ComplicatedSubArray))
  260. assert_(mxcsub[0] is masked)
  261. assert_(isinstance(mxcsub[0, ...].data, ComplicatedSubArray))
  262. assert_(isinstance(mxcsub[1:4].data, ComplicatedSubArray))
  263. # also for flattened version (which goes via MaskedIterator)
  264. assert_(isinstance(mxcsub.flat[1].data, ComplicatedSubArray))
  265. assert_(mxcsub.flat[0] is masked)
  266. assert_(isinstance(mxcsub.flat[1:4].base, ComplicatedSubArray))
  267. # setter should only work with ComplicatedSubArray input
  268. # first check we wrote ComplicatedSubArray correctly
  269. assert_raises(ValueError, xcsub.__setitem__, 1, x[4])
  270. # now that it propagates inside the MaskedArray
  271. assert_raises(ValueError, mxcsub.__setitem__, 1, x[4])
  272. assert_raises(ValueError, mxcsub.__setitem__, slice(1, 4), x[1:4])
  273. mxcsub[1] = xcsub[4]
  274. mxcsub[1:4] = xcsub[1:4]
  275. # also for flattened version (which goes via MaskedIterator)
  276. assert_raises(ValueError, mxcsub.flat.__setitem__, 1, x[4])
  277. assert_raises(ValueError, mxcsub.flat.__setitem__, slice(1, 4), x[1:4])
  278. mxcsub.flat[1] = xcsub[4]
  279. mxcsub.flat[1:4] = xcsub[1:4]
  280. def test_subclass_nomask_items(self):
  281. x = np.arange(5)
  282. xcsub = ComplicatedSubArray(x)
  283. mxcsub_nomask = masked_array(xcsub)
  284. assert_(isinstance(mxcsub_nomask[1, ...].data, ComplicatedSubArray))
  285. assert_(isinstance(mxcsub_nomask[0, ...].data, ComplicatedSubArray))
  286. assert_(isinstance(mxcsub_nomask[1], ComplicatedSubArray))
  287. assert_(isinstance(mxcsub_nomask[0], ComplicatedSubArray))
  288. def test_subclass_repr(self):
  289. """test that repr uses the name of the subclass
  290. and 'array' for np.ndarray"""
  291. x = np.arange(5)
  292. mx = masked_array(x, mask=[True, False, True, False, False])
  293. assert_startswith(repr(mx), 'masked_array')
  294. xsub = SubArray(x)
  295. mxsub = masked_array(xsub, mask=[True, False, True, False, False])
  296. assert_startswith(repr(mxsub),
  297. f'masked_{SubArray.__name__}(data=[--, 1, --, 3, 4]')
  298. def test_subclass_str(self):
  299. """test str with subclass that has overridden str, setitem"""
  300. # first without override
  301. x = np.arange(5)
  302. xsub = SubArray(x)
  303. mxsub = masked_array(xsub, mask=[True, False, True, False, False])
  304. assert_equal(str(mxsub), '[-- 1 -- 3 4]')
  305. xcsub = ComplicatedSubArray(x)
  306. assert_raises(ValueError, xcsub.__setitem__, 0,
  307. np.ma.core.masked_print_option)
  308. mxcsub = masked_array(xcsub, mask=[True, False, True, False, False])
  309. assert_equal(str(mxcsub), 'myprefix [-- 1 -- 3 4] mypostfix')
  310. def test_pure_subclass_info_preservation(self):
  311. # Test that ufuncs and methods conserve extra information consistently;
  312. # see gh-7122.
  313. arr1 = SubMaskedArray('test', data=[1, 2, 3, 4, 5, 6])
  314. arr2 = SubMaskedArray(data=[0, 1, 2, 3, 4, 5])
  315. diff1 = np.subtract(arr1, arr2)
  316. assert_('info' in diff1._optinfo)
  317. assert_(diff1._optinfo['info'] == 'test')
  318. diff2 = arr1 - arr2
  319. assert_('info' in diff2._optinfo)
  320. assert_(diff2._optinfo['info'] == 'test')
  321. class ArrayNoInheritance:
  322. """Quantity-like class that does not inherit from ndarray"""
  323. def __init__(self, data, units):
  324. self.magnitude = data
  325. self.units = units
  326. def __getattr__(self, attr):
  327. return getattr(self.magnitude, attr)
  328. def test_array_no_inheritance():
  329. data_masked = np.ma.array([1, 2, 3], mask=[True, False, True])
  330. data_masked_units = ArrayNoInheritance(data_masked, 'meters')
  331. # Get the masked representation of the Quantity-like class
  332. new_array = np.ma.array(data_masked_units)
  333. assert_equal(data_masked.data, new_array.data)
  334. assert_equal(data_masked.mask, new_array.mask)
  335. # Test sharing the mask
  336. data_masked.mask = [True, False, False]
  337. assert_equal(data_masked.mask, new_array.mask)
  338. assert_(new_array.sharedmask)
  339. # Get the masked representation of the Quantity-like class
  340. new_array = np.ma.array(data_masked_units, copy=True)
  341. assert_equal(data_masked.data, new_array.data)
  342. assert_equal(data_masked.mask, new_array.mask)
  343. # Test that the mask is not shared when copy=True
  344. data_masked.mask = [True, False, True]
  345. assert_equal([True, False, False], new_array.mask)
  346. assert_(not new_array.sharedmask)
  347. # Get the masked representation of the Quantity-like class
  348. new_array = np.ma.array(data_masked_units, keep_mask=False)
  349. assert_equal(data_masked.data, new_array.data)
  350. # The change did not affect the original mask
  351. assert_equal(data_masked.mask, [True, False, True])
  352. # Test that the mask is False and not shared when keep_mask=False
  353. assert_(not new_array.mask)
  354. assert_(not new_array.sharedmask)
  355. class TestClassWrapping:
  356. # Test suite for classes that wrap MaskedArrays
  357. def _create_data(self):
  358. m = np.ma.masked_array([1, 3, 5], mask=[False, True, False])
  359. wm = WrappedArray(m)
  360. return m, wm
  361. def test_masked_unary_operations(self):
  362. # Tests masked_unary_operation
  363. wm = self._create_data()[1]
  364. with np.errstate(divide='ignore'):
  365. assert_(isinstance(np.log(wm), WrappedArray))
  366. def test_masked_binary_operations(self):
  367. # Tests masked_binary_operation
  368. m, wm = self._create_data()
  369. # Result should be a WrappedArray
  370. assert_(isinstance(np.add(wm, wm), WrappedArray))
  371. assert_(isinstance(np.add(m, wm), WrappedArray))
  372. assert_(isinstance(np.add(wm, m), WrappedArray))
  373. # add and '+' should call the same ufunc
  374. assert_equal(np.add(m, wm), m + wm)
  375. assert_(isinstance(np.hypot(m, wm), WrappedArray))
  376. assert_(isinstance(np.hypot(wm, m), WrappedArray))
  377. # Test domained binary operations
  378. assert_(isinstance(np.divide(wm, m), WrappedArray))
  379. assert_(isinstance(np.divide(m, wm), WrappedArray))
  380. assert_equal(np.divide(wm, m) * m, np.divide(m, m) * wm)
  381. # Test broadcasting
  382. m2 = np.stack([m, m])
  383. assert_(isinstance(np.divide(wm, m2), WrappedArray))
  384. assert_(isinstance(np.divide(m2, wm), WrappedArray))
  385. assert_equal(np.divide(m2, wm), np.divide(wm, m2))
  386. def test_mixins_have_slots(self):
  387. mixin = NDArrayOperatorsMixin()
  388. # Should raise an error
  389. assert_raises(AttributeError, mixin.__setattr__, "not_a_real_attr", 1)
  390. m = np.ma.masked_array([1, 3, 5], mask=[False, True, False])
  391. wm = WrappedArray(m)
  392. assert_raises(AttributeError, wm.__setattr__, "not_an_attr", 2)