MAINT: Extract helper function for last-bound-inclusive search_sorted

Also avoids `r_`, and construction of arrays from lists
author: Eric Wieser <wieser.eric@gmail.com> 2017-12-27 10:07:54 +0000
committer: Eric Wieser <wieser.eric@gmail.com> 2017-12-27 10:08:22 +0000
commit: 0953c4d9543bd5e3c007f1013cf93779314ca327 (patch)
tree: d746c5c06e35c2315e645555d292cb35cc0ca139 /numpy/lib
parent: a4c995577505ed4c5480f3229537eeabd728f598 (diff)
download: numpy-0953c4d9543bd5e3c007f1013cf93779314ca327.tar.gz
1 files changed, 16 insertions, 6 deletions
diff --git a/numpy/lib/histograms.py b/numpy/lib/histograms.py
index a19ff07d8..ec2d0fe81 100644
--- a/numpy/lib/histograms.py
+++ b/numpy/lib/histograms.py
@@ -326,6 +326,18 @@ def _get_bin_edges(a, bins, range, weights):
         return bin_edges, None
 
 
+def _search_sorted_inclusive(a, v):
+    """
+    Like `searchsorted`, but where the last item in `v` is placed on the right.
+
+    In the context of a histogram, this makes the last bin edge inclusive
+    """
+    return np.concatenate((
+        a.searchsorted(v[:-1], 'left'),
+        a.searchsorted(v[-1:], 'right')
+    ))
+
+
 def histogram(a, bins=10, range=None, normed=False, weights=None,
               density=None):
     r"""
@@ -626,19 +638,17 @@ def histogram(a, bins=10, range=None, normed=False, weights=None,
         if weights is None:
             for i in np.arange(0, len(a), BLOCK):
                 sa = np.sort(a[i:i+BLOCK])
-                cum_n += np.r_[sa.searchsorted(bin_edges[:-1], 'left'),
-                               sa.searchsorted(bin_edges[-1], 'right')]
+                cum_n += _search_sorted_inclusive(sa, bin_edges)
         else:
-            zero = np.array(0, dtype=ntype)
+            zero = np.zeros(1, dtype=ntype)
             for i in np.arange(0, len(a), BLOCK):
                 tmp_a = a[i:i+BLOCK]
                 tmp_w = weights[i:i+BLOCK]
                 sorting_index = np.argsort(tmp_a)
                 sa = tmp_a[sorting_index]
                 sw = tmp_w[sorting_index]
-                cw = np.concatenate(([zero], sw.cumsum()))
-                bin_index = np.r_[sa.searchsorted(bin_edges[:-1], 'left'),
-                                  sa.searchsorted(bin_edges[-1], 'right')]
+                cw = np.concatenate((zero, sw.cumsum()))
+                bin_index = _search_sorted_inclusive(sa, bin_edges)
                 cum_n += cw[bin_index]
 
         n = np.diff(cum_n)
author	Eric Wieser <wieser.eric@gmail.com>	2017-12-27 10:07:54 +0000
committer	Eric Wieser <wieser.eric@gmail.com>	2017-12-27 10:08:22 +0000
commit	0953c4d9543bd5e3c007f1013cf93779314ca327 (patch)
tree	d746c5c06e35c2315e645555d292cb35cc0ca139 /numpy/lib
parent	a4c995577505ed4c5480f3229537eeabd728f598 (diff)
download	numpy-0953c4d9543bd5e3c007f1013cf93779314ca327.tar.gz