new BatchIterator utility class for more control when retrieving objects from an iterator or generator
This commit is contained in:
parent
6815364dec
commit
ba7cf1311f
3 changed files with 110 additions and 0 deletions
55
util/iterate.py
Normal file
55
util/iterate.py
Normal file
|
@ -0,0 +1,55 @@
|
||||||
|
#
|
||||||
|
# Copyright (c) 2012 Helmut Merz helmutm@cy55.de
|
||||||
|
#
|
||||||
|
# This program is free software; you can redistribute it and/or modify
|
||||||
|
# it under the terms of the GNU General Public License as published by
|
||||||
|
# the Free Software Foundation; either version 2 of the License, or
|
||||||
|
# (at your option) any later version.
|
||||||
|
#
|
||||||
|
# This program is distributed in the hope that it will be useful,
|
||||||
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||||
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||||
|
# GNU General Public License for more details.
|
||||||
|
#
|
||||||
|
# You should have received a copy of the GNU General Public License
|
||||||
|
# along with this program; if not, write to the Free Software
|
||||||
|
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
|
||||||
|
#
|
||||||
|
|
||||||
|
"""
|
||||||
|
Iterator and generator utilities.
|
||||||
|
"""
|
||||||
|
|
||||||
|
from itertools import islice
|
||||||
|
|
||||||
|
|
||||||
|
class BatchIterator(object):
|
||||||
|
|
||||||
|
def __init__(self, data, limit=20, start=0):
|
||||||
|
self.data = iter(data)
|
||||||
|
self.limit = limit
|
||||||
|
self.start = start
|
||||||
|
self.count = 0
|
||||||
|
self.batch = 0
|
||||||
|
self.exhausted = False
|
||||||
|
|
||||||
|
def __iter__(self):
|
||||||
|
return self
|
||||||
|
|
||||||
|
def next(self):
|
||||||
|
if self.count >= (self.batch + 1) * self.limit:
|
||||||
|
raise StopIteration
|
||||||
|
if self.start:
|
||||||
|
for i in islice(self.data, 0, self.start*self.limit):
|
||||||
|
pass
|
||||||
|
self.start = 0
|
||||||
|
self.count += 1
|
||||||
|
try:
|
||||||
|
return self.data.next()
|
||||||
|
except StopIteration:
|
||||||
|
self.exhausted = True
|
||||||
|
raise
|
||||||
|
|
||||||
|
def advance(self, batches=1):
|
||||||
|
self.batch += batches
|
||||||
|
return not self.exhausted
|
54
util/iterate.txt
Normal file
54
util/iterate.txt
Normal file
|
@ -0,0 +1,54 @@
|
||||||
|
================================
|
||||||
|
Iterator and Generator Utilities
|
||||||
|
================================
|
||||||
|
|
||||||
|
|
||||||
|
Batch Iterator
|
||||||
|
==============
|
||||||
|
|
||||||
|
A batch iterator only provides a limited number of items in one
|
||||||
|
series of access steps.
|
||||||
|
|
||||||
|
>>> from cybertools.util.iterate import BatchIterator
|
||||||
|
|
||||||
|
We create a BatchIterator upon a base iterator. The BatchIterator
|
||||||
|
only gives us a limited portion of the values provided by the base
|
||||||
|
iterator.
|
||||||
|
|
||||||
|
>>> it = BatchIterator(xrange(30))
|
||||||
|
>>> list(it)
|
||||||
|
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19]
|
||||||
|
>>> list(it)
|
||||||
|
[]
|
||||||
|
|
||||||
|
Now we advance to the next batch. The return value tells us that the
|
||||||
|
base iterator is not exhausted yet.
|
||||||
|
|
||||||
|
>>> it.advance()
|
||||||
|
True
|
||||||
|
>>> list(it)
|
||||||
|
[20, 21, 22, 23, 24, 25, 26, 27, 28, 29]
|
||||||
|
|
||||||
|
Advancing would not help if the base iterator is exhausted.
|
||||||
|
|
||||||
|
>>> it.advance()
|
||||||
|
False
|
||||||
|
>>> list(it)
|
||||||
|
[]
|
||||||
|
|
||||||
|
We can also immediately start at the second batch by providing the ``start``
|
||||||
|
argument to the BatchIterator constructor.
|
||||||
|
|
||||||
|
>>> it = BatchIterator(xrange(30), start=1)
|
||||||
|
>>> list(it)
|
||||||
|
[20, 21, 22, 23, 24, 25, 26, 27, 28, 29]
|
||||||
|
|
||||||
|
We can use another limit (i.e. the batch size) via the BatchIterator constructor.
|
||||||
|
|
||||||
|
>>> it = BatchIterator(xrange(30), start=1, limit=8)
|
||||||
|
>>> list(it)
|
||||||
|
[8, 9, 10, 11, 12, 13, 14, 15]
|
||||||
|
>>> it.advance()
|
||||||
|
True
|
||||||
|
>>> list(it)
|
||||||
|
[16, 17, 18, 19, 20, 21, 22, 23]
|
|
@ -25,6 +25,7 @@ def test_suite():
|
||||||
doctest.DocFileSuite('defer.txt', optionflags=flags),
|
doctest.DocFileSuite('defer.txt', optionflags=flags),
|
||||||
doctest.DocFileSuite('format.txt', optionflags=flags),
|
doctest.DocFileSuite('format.txt', optionflags=flags),
|
||||||
doctest.DocFileSuite('html.txt', optionflags=flags),
|
doctest.DocFileSuite('html.txt', optionflags=flags),
|
||||||
|
doctest.DocFileSuite('iterate.txt', optionflags=flags),
|
||||||
doctest.DocFileSuite('multikey.txt', optionflags=flags),
|
doctest.DocFileSuite('multikey.txt', optionflags=flags),
|
||||||
doctest.DocFileSuite('property.txt', optionflags=flags),
|
doctest.DocFileSuite('property.txt', optionflags=flags),
|
||||||
doctest.DocFileSuite('json.txt', optionflags=flags),
|
doctest.DocFileSuite('json.txt', optionflags=flags),
|
||||||
|
|
Loading…
Add table
Reference in a new issue