Adding fill parameters to pairwise and windowed (#350)

* first cut at adding fill parameters to pairwise and windowed, with tests and doc updates
* rename 'fill' to 'end' on pairwise per discussion in PR
2023-10-31 11:31:12 -07:00 · 2023-10-31 11:31:12 -07:00 · 3bbb9487aa
parent 4815fc8dd1
commit 3bbb9487aa
2 changed files with 87 additions and 25 deletions
--- a/boltons/iterutils.py
+++ b/boltons/iterutils.py
@ -64,7 +64,7 @@ except ImportError:
 try:
    from future_builtins import filter
-    from itertools import izip
+    from itertools import izip, izip_longest as zip_longest
    _IS_PY3 = False
 except ImportError:
    # Python 3 compat
@ -72,6 +72,7 @@ except ImportError:
    basestring = (str, bytes)
    unicode = str
    izip, xrange = zip, range
    from itertools import zip_longest
 def is_iterable(obj):
@ -424,7 +425,7 @@ def chunk_ranges(input_size, chunk_size, input_offset=0, overlap_size=0, align=F
            return
-def pairwise(src):
+def pairwise(src, end=_UNSET):
    """Convenience function for calling :func:`windowed` on *src*, with
    *size* set to 2.
@ -433,14 +434,22 @@ def pairwise(src):
    >>> pairwise([])
    []
-    The number of pairs is always one less than the number of elements
+    Unless *end* is set, the number of pairs is always one less than 
-    in the iterable passed in, except on empty inputs, which returns
+    the number of elements in the iterable passed in, except on an empty input, 
-    an empty list.
+    which will return an empty list.
    With *end* set, a number of pairs equal to the length of *src* is returned,
    with the last item of the last pair being equal to *end*.
    >>> list(pairwise(range(3), end=None))
    [(0, 1), (1, 2), (2, None)]
    This way, *end* values can be useful as sentinels to signal the end of the iterable.
    """
-    return windowed(src, 2)
+    return windowed(src, 2, fill=end)
-def pairwise_iter(src):
+def pairwise_iter(src, end=_UNSET):
    """Convenience function for calling :func:`windowed_iter` on *src*,
    with *size* set to 2.
@ -449,43 +458,70 @@ def pairwise_iter(src):
    >>> list(pairwise_iter([]))
    []
-    The number of pairs is always one less than the number of elements
+    Unless *end* is set, the number of pairs is always one less 
-    in the iterable passed in, or zero, when *src* is empty.
+    than the number of elements in the iterable passed in, 
    or zero, when *src* is empty.
    With *end* set, a number of pairs equal to the length of *src* is returned,
    with the last item of the last pair being equal to *end*. 
    >>> list(pairwise_iter(range(3), end=None))
    [(0, 1), (1, 2), (2, None)]    
    This way, *end* values can be useful as sentinels to signal the end
    of the iterable. For infinite iterators, setting *end* has no effect.
    """
-    return windowed_iter(src, 2)
+    return windowed_iter(src, 2, fill=end)
-def windowed(src, size):
+def windowed(src, size, fill=_UNSET):
-    """Returns tuples with exactly length *size*. If the iterable is
+    """Returns tuples with exactly length *size*. If *fill* is unset 
-    too short to make a window of length *size*, no tuples are
+    and the iterable is too short to make a window of length *size*, 
-    returned. See :func:`windowed_iter` for more.
+    no tuples are returned. See :func:`windowed_iter` for more.
    """
-    return list(windowed_iter(src, size))
+    return list(windowed_iter(src, size, fill=fill))
-def windowed_iter(src, size):
+def windowed_iter(src, size, fill=_UNSET):
    """Returns tuples with length *size* which represent a sliding
    window over iterable *src*.
    >>> list(windowed_iter(range(7), 3))
    [(0, 1, 2), (1, 2, 3), (2, 3, 4), (3, 4, 5), (4, 5, 6)]
-    If the iterable is too short to make a window of length *size*,
+    If *fill* is unset, and the iterable is too short to make a window 
-    then no window tuples are returned.
+    of length *size*, then no window tuples are returned.
    >>> list(windowed_iter(range(3), 5))
    []
    With *fill* set, the iterator always yields a number of windows
    equal to the length of the *src* iterable.
    >>> windowed(range(4), 3, fill=None)
    [(0, 1, 2), (1, 2, 3), (2, 3, None), (3, None, None)]
    This way, *fill* values can be useful to signal the end of the iterable.
    For infinite iterators, setting *fill* has no effect.
    """
    # TODO: lists? (for consistency)
    tees = itertools.tee(src, size)
-    try:
+    if fill is _UNSET:
-        for i, t in enumerate(tees):
+        try:
-            for _ in xrange(i):
+            for i, t in enumerate(tees):
                for _ in range(i):
                    next(t)
        except StopIteration:
            return zip([])
        return zip(*tees)
    for i, t in enumerate(tees):
        for _ in range(i):  
            try:
                next(t)
-    except StopIteration:
+            except StopIteration:
-        return izip([])
+                continue
-    return izip(*tees)
+    return zip_longest(*tees, fillvalue=fill)
 def xfrange(stop, start=None, step=1.0):
--- a/tests/test_iterutils.py
+++ b/tests/test_iterutils.py
@ -5,6 +5,10 @@ import pytest
 from boltons.dictutils import OMD
 from boltons.iterutils import (first,
                               pairwise,
                               pairwise_iter,
                               windowed,
                               windowed_iter,
                               remap,
                               research,
                               default_enter,
@ -551,3 +555,25 @@ def test_strip():
    assert strip([0,0,0,1,0,2,0,3,0,0,0],0) == [1,0,2,0,3]
    assert strip([]) == []
 def test_pairwise_filled():
    assert pairwise(range(4)) == [(0, 1), (1, 2), (2, 3)]
    assert pairwise(range(4), end=None) == [(0, 1), (1, 2), (2, 3), (3, None)]
    assert pairwise([]) == []
    assert pairwise([1], end=None) == [(1, None)]
    assert list(pairwise_iter(range(4))) == [(0, 1), (1, 2), (2, 3)]
    assert list(pairwise_iter(range(4), end=None)) == [(0, 1), (1, 2), (2, 3), (3, None)]
 def test_windowed_filled():
    assert windowed(range(4), 3) == [(0, 1, 2), (1, 2, 3)]
    assert windowed(range(4), 3, fill=None) == [(0, 1, 2), (1, 2, 3), (2, 3, None), (3, None, None)]
    assert windowed([], 3) == []
    assert windowed([], 3, fill=None) == []
    assert windowed([1, 2], 3, fill=None) == [(1, 2, None), (2, None, None)]
    assert list(windowed_iter(range(4), 3)) == [(0, 1, 2), (1, 2, 3)]
    assert list(windowed_iter(range(4), 3, fill=None)) == [(0, 1, 2), (1, 2, 3), (2, 3, None), (3, None, None)]