Skip to content
1 change: 1 addition & 0 deletions doc/source/whatsnew/v0.23.0.txt
Original file line number Diff line number Diff line change
Expand Up @@ -589,3 +589,4 @@ Other
^^^^^

- Improved error message when attempting to use a Python keyword as an identifier in a ``numexpr`` backed query (:issue:`18221`)
- Bug in ``Series.memory_usage`` which assumed the series would always have more than one element (:issue:`19368`)
26 changes: 16 additions & 10 deletions pandas/_libs/lib.pyx
Original file line number Diff line number Diff line change
Expand Up @@ -59,8 +59,14 @@ def memory_usage_of_objects(ndarray[object, ndim=1] arr):
cdef Py_ssize_t i, n
cdef int64_t s = 0

# The problem here is that...
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

comments are not necessary

# A SparseArray of size 1 that has fill_value = the only value
# will cause this

# n = 1
#
n = len(arr)
for i from 0 <= i < n:
for i in range(n):
s += arr[i].__sizeof__()
return s

Expand Down Expand Up @@ -131,10 +137,10 @@ def fast_unique_multiple(list arrays):
dict table = {}
object val, stub = 0

for i from 0 <= i < k:
for i in range(k):
buf = arrays[i]
n = len(buf)
for j from 0 <= j < n:
for j in range(n):
val = buf[j]
if val not in table:
table[val] = stub
Expand All @@ -158,10 +164,10 @@ def fast_unique_multiple_list(list lists):
dict table = {}
object val, stub = 0

for i from 0 <= i < k:
for i in range(k):
buf = lists[i]
n = len(buf)
for j from 0 <= j < n:
for j in range(n):
val = buf[j]
if val not in table:
table[val] = stub
Expand Down Expand Up @@ -200,7 +206,7 @@ def fast_unique_multiple_list_gen(object gen, bint sort=True):

for buf in gen:
n = len(buf)
for j from 0 <= j < n:
for j in range(n):
val = buf[j]
if val not in table:
table[val] = stub
Expand Down Expand Up @@ -830,15 +836,15 @@ def count_level_2d(ndarray[uint8_t, ndim=2, cast=True] mask,
if axis == 0:
counts = np.zeros((max_bin, k), dtype='i8')
with nogil:
for i from 0 <= i < n:
for j from 0 <= j < k:
for i in range(n):
for j in range(k):
counts[labels[i], j] += mask[i, j]

else: # axis == 1
counts = np.zeros((n, max_bin), dtype='i8')
with nogil:
for i from 0 <= i < n:
for j from 0 <= j < k:
for i in range(n):
for j in range(k):
counts[i, labels[j]] += mask[i, j]

return counts
Expand Down
14 changes: 10 additions & 4 deletions pandas/core/base.py
Original file line number Diff line number Diff line change
Expand Up @@ -1069,12 +1069,18 @@ def memory_usage(self, deep=False):
--------
numpy.ndarray.nbytes
"""
if hasattr(self.values, 'memory_usage'):
return self.values.memory_usage(deep=deep)
# Use sparse values if they exist for memory consumption
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I would rather override this in SparseSeries/SparseArray

if hasattr(self.values, 'sp_values'):
values = self.values.sp_values
else:
values = self.values

if hasattr(values, 'memory_usage'):
return values.memory_usage(deep=deep)

v = self.values.nbytes
v = values.nbytes
if deep and is_object_dtype(self) and not PYPY:
v += lib.memory_usage_of_objects(self.values)
v += lib.memory_usage_of_objects(values)
return v

def factorize(self, sort=False, na_sentinel=-1):
Expand Down
13 changes: 13 additions & 0 deletions pandas/tests/sparse/series/test_series.py
Original file line number Diff line number Diff line change
Expand Up @@ -23,6 +23,8 @@
from pandas.core.sparse.api import SparseSeries
from pandas.tests.series.test_api import SharedWithSparse

from itertools import product


def _test_data1():
# nan-based
Expand Down Expand Up @@ -971,6 +973,17 @@ def test_combine_first(self):
tm.assert_sp_series_equal(result, result2)
tm.assert_sp_series_equal(result, expected)

@pytest.mark.parametrize('deep,fill_values', [([True, False],
[0, 1, np.nan, None])])
def test_memory_usage_deep(self, deep, fill_values):
for deep, fill_value in product(deep, fill_values):
sparse_series = SparseSeries(fill_values, fill_value=fill_value)
dense_series = Series(fill_values)
sparse_usage = sparse_series.memory_usage(deep=deep)
dense_usage = dense_series.memory_usage(deep=deep)

assert sparse_usage < dense_usage


class TestSparseHandlingMultiIndexes(object):

Expand Down