summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorRaymond Hettinger <python@rcn.com>2006-03-26 01:33:11 (GMT)
committerRaymond Hettinger <python@rcn.com>2006-03-26 01:33:11 (GMT)
commitee43b6c0d1583976334233c967a0b2c65b92ba84 (patch)
treebac32caab61e88989d9985db6ac228c4ad66458f
parentaf7bb8e95a1d7b1b2d35d3abdc9fe38786478161 (diff)
downloadcpython-ee43b6c0d1583976334233c967a0b2c65b92ba84.zip
cpython-ee43b6c0d1583976334233c967a0b2c65b92ba84.tar.gz
cpython-ee43b6c0d1583976334233c967a0b2c65b92ba84.tar.bz2
Guarantee evaluation order for izip(). Document its creative uses and its limitations.
-rw-r--r--Doc/lib/libitertools.tex26
1 files changed, 24 insertions, 2 deletions
diff --git a/Doc/lib/libitertools.tex b/Doc/lib/libitertools.tex
index b62bd87..88639dc 100644
--- a/Doc/lib/libitertools.tex
+++ b/Doc/lib/libitertools.tex
@@ -271,12 +271,29 @@ by functions or loops that truncate the stream.
def izip(*iterables):
iterables = map(iter, iterables)
while iterables:
- result = [i.next() for i in iterables]
+ result = [it.next() for it in iterables]
yield tuple(result)
\end{verbatim}
\versionchanged[When no iterables are specified, returns a zero length
- iterator instead of raising a TypeError exception]{2.4}
+ iterator instead of raising a TypeError exception]{2.4}
+
+ Note, the left-to-right evaluation order of the iterables is guaranteed.
+ This makes possible an idiom for clustering a data series into n-length
+ groups using \samp{izip(*[iter(s)]*n)}. For data that doesn't fit
+ n-length groups exactly, the last tuple can be pre-padded with fill
+ values using \samp{izip(*[chain(s, [None]*(n-1))]*n)}.
+
+ Note, when \function{izip()} is used with unequal length inputs, subsequent
+ iteration over the longer iterables cannot reliably be continued after
+ \function{izip()} terminates. Potentially, up to one entry will be missing
+ from each of the left-over iterables. This occurs because a value is fetched
+ from each iterator in turn, but the process ends when one of the iterators
+ terminates. This leaves the last fetched values in limbo (they cannot be
+ returned in a final, incomplete tuple and they cannot be pushed back
+ into the iterator for retrieval with \code{it.next()}). In general,
+ \function{izip()} should only be used with unequal length inputs when you
+ don't care about trailing, unmatched values from the longer iterables.
\end{funcdesc}
\begin{funcdesc}{repeat}{object\optional{, times}}
@@ -512,4 +529,9 @@ def pairwise(iterable):
pass
return izip(a, b)
+def grouper(n, iterable, padvalue=None):
+ "grouper(3, 'abcdefg', 'x') --> ('a','b','c'), ('d','e','f'), ('g','x','x')"
+ return izip(*[chain(iterable, repeat(padvalue, n-1))]*n)
+
+
\end{verbatim}