# 迭代器与生成器

In [1]:
import re
import reprlib

# Raw string: \w must reach the regex engine untouched instead of being
# parsed as an (invalid) string escape sequence.
RE_WORD = re.compile(r'\w+')


class Sentence:
    """A sentence exposed as a sequence of its words.

    Only ``__getitem__`` and ``__len__`` are defined (no ``__iter__``), so
    iterating an instance relies on the sequence protocol: ``iter()`` falls
    back to calling ``__getitem__`` with 0, 1, 2, ... until ``IndexError``.
    """

    def __init__(self, text):
        """Store ``text`` and eagerly extract the list of its words."""
        self.text = text
        self.words = RE_WORD.findall(text)

    def __getitem__(self, index):
        """Return the word at ``index`` (delegates to the word list)."""
        return self.words[index]

    def __len__(self):
        """Return the number of words found in the text."""
        return len(self.words)

    def __repr__(self):
        # reprlib.repr abbreviates long strings with '...'.
        return 'Sentence(%s)' % reprlib.repr(self.text)

In [2]:
s = Sentence('"The time has come," the Walrus said,')
s

Sentence('"The time ha... Walrus said,')

In [3]:
for word in s:
    print(word)

The
time
has
come
the
Walrus
said


In [4]:
list(s)

['The', 'time', 'has', 'come', 'the', 'Walrus', 'said']

In [5]:
s[0]

'The'

In [6]:
s[5]

'Walrus'

In [7]:
s[-1]

'said'

In [8]:
Sentence.__dict__

mappingproxy({'__module__': '__main__',
              '__init__': <function __main__.Sentence.__init__(self, text)>,
              '__getitem__': <function __main__.Sentence.__getitem__(self, index)>,
              '__len__': <function __main__.Sentence.__len__(self)>,
              '__repr__': <function __main__.Sentence.__repr__(self)>,
              '__dict__': <attribute '__dict__' of 'Sentence' objects>,
              '__weakref__': <attribute '__weakref__' of 'Sentence' objects>,
              '__doc__': None})

In [9]:
class Foo:
    """Minimal class whose only member is an ``__iter__`` method."""

    def __iter__(self):
        # Stub: no iterator is actually built, the method just returns None.
        return None

In [10]:
from collections import abc

issubclass(Foo, abc.Iterable)

True

In [11]:
f = Foo()
isinstance(f, abc.Iterable)

True

In [12]:
issubclass(Sentence, abc.Iterable)

False

In [13]:
isinstance(s, abc.Iterable)

False

In [14]:
s = 'ABC'

for char in s:
    print(char)

A
B
C


In [15]:
it = iter(s)

while True:
    try:
        print(next(it))
    except StopIteration:
        del it
        break

A
B
C


In [16]:
s3 = Sentence('Pig and Pepper')
it = iter(s3)
it

<iterator at 0x7f7f40e57220>

In [17]:
next(it)

'Pig'

In [18]:
next(it)

'and'

In [19]:
next(it)

'Pepper'

In [20]:
next(it)

StopIteration: 

In [22]:
list(it)

[]

In [23]:
list(iter(s3))

['Pig', 'and', 'Pepper']

In [24]:
import re
import reprlib

# Raw string: \w must reach the regex engine untouched instead of being
# parsed as an (invalid) string escape sequence.
RE_WORD = re.compile(r'\w+')


class Sentence:
    """An iterable sentence that hands out a separate iterator object.

    ``__iter__`` builds a new ``SentenceIterator`` over the word list on
    every call, so each iteration keeps its own position.
    """

    def __init__(self, text):
        """Store ``text`` and eagerly extract the list of its words."""
        self.text = text
        self.words = RE_WORD.findall(text)

    def __repr__(self):
        # reprlib.repr abbreviates long strings with '...'.
        return 'Sentence(%s)' % reprlib.repr(self.text)

    def __iter__(self):
        """Return a fresh ``SentenceIterator`` over the words."""
        return SentenceIterator(self.words)
    

class SentenceIterator:
    """Iterator over a list of words that tracks its own position."""

    def __init__(self, words):
        """Keep a reference to ``words`` and start at index 0."""
        self.words = words
        self.index = 0

    def __iter__(self):
        """Return the iterator itself."""
        return self

    def __next__(self):
        """Return the next word, raising ``StopIteration`` past the end."""
        position = self.index
        try:
            current = self.words[position]
        except IndexError:
            # Running off the end of the list marks exhaustion.
            raise StopIteration
        # Advance only after a successful lookup.
        self.index = position + 1
        return current

## Sentence类第3版：生成器函数

In [25]:
import re
import reprlib

# Raw string: \w must reach the regex engine untouched instead of being
# parsed as an (invalid) string escape sequence.
RE_WORD = re.compile(r'\w+')


class Sentence:
    """An iterable sentence whose ``__iter__`` is a generator function."""

    def __init__(self, text):
        """Store ``text`` and eagerly extract the list of its words."""
        self.text = text
        self.words = RE_WORD.findall(text)

    def __repr__(self):
        # reprlib.repr abbreviates long strings with '...'.
        return 'Sentence(%s)' % reprlib.repr(self.text)

    def __iter__(self):
        """Yield the words one by one.

        Because the body contains ``yield``, calling this method returns a
        generator object, which is itself an iterator. No explicit
        ``return`` is needed: the generator finishes when the loop ends.
        """
        for word in self.words:
            yield word

In [26]:
s = Sentence('"The time has come," the Walrus said,')
s

Sentence('"The time ha... Walrus said,')

In [27]:
for word in s:
    print(word)

The
time
has
come
the
Walrus
said


In [28]:
def gen_123():
    """Generator function producing 1, 2 and 3, in that order."""
    yield from (1, 2, 3)

In [29]:
gen_123

<function __main__.gen_123()>

In [30]:
gen_123()

<generator object gen_123 at 0x7f7f40dcbb30>

In [31]:
for i in gen_123():
    print(i)

1
2
3


In [32]:
g = gen_123()

In [33]:
next(g)

1

In [34]:
next(g)

2

In [35]:
next(g)

3

In [36]:
next(g)

StopIteration: 

In [38]:
def gen_AB():
    """Yield 'A' then 'B', printing a trace line before each step.

    Prints 'start' before yielding 'A', 'continue' before yielding 'B',
    and 'end.' once the consumer asks for a third item.
    """
    steps = (('start', 'A'), ('continue', 'B'))
    for message, letter in steps:
        print(message)
        yield letter
    print('end.')

In [39]:
for c in gen_AB():
    print('-->', c)

start
--> A
continue
--> B
end.


In [40]:
import re
import reprlib

# Raw string: \w must reach the regex engine untouched instead of being
# parsed as an (invalid) string escape sequence.
RE_WORD = re.compile(r'\w+')


class Sentence:
    """A lazy iterable sentence: words are matched only while iterating.

    No word list is stored; every iteration scans ``text`` again with
    ``RE_WORD.finditer``.
    """

    def __init__(self, text):
        """Store ``text``; no matching happens here."""
        self.text = text

    def __repr__(self):
        # reprlib.repr abbreviates long strings with '...'.
        return 'Sentence(%s)' % reprlib.repr(self.text)

    def __iter__(self):
        """Yield each word as the regex finds it in the text."""
        for match in RE_WORD.finditer(self.text):
            # match.group() is the matched text of the current word.
            yield match.group()

In [41]:
def gen_AB():
    """Yield 'A' then 'B', printing a trace line before each step.

    Output order: 'start', (yield 'A'), 'continue', (yield 'B'), 'end.'.
    """
    for banner, item in zip(('start', 'continue'), 'AB'):
        print(banner)
        yield item
    # Reached only when the consumer requests an item after 'B'.
    print('end.')


res1 = [x*3 for x in gen_AB()]

start
continue
end.


In [42]:
for i in res1:
    print('-->', i)

--> AAA
--> BBB


In [43]:
res2 = (x*3 for x in gen_AB())
res2

<generator object <genexpr> at 0x7f7f40de15f0>

In [44]:
for i in res2:
    print('-->', i)

start
--> AAA
continue
--> BBB
end.


In [45]:
import re
import reprlib

# Raw string: \w must reach the regex engine untouched instead of being
# parsed as an (invalid) string escape sequence.
RE_WORD = re.compile(r'\w+')


class Sentence:
    """A lazy iterable sentence built on a generator expression."""

    def __init__(self, text):
        """Store ``text``; no matching happens here."""
        self.text = text

    def __repr__(self):
        # reprlib.repr abbreviates long strings with '...'.
        return 'Sentence(%s)' % reprlib.repr(self.text)

    def __iter__(self):
        """Return a generator producing each word found in the text.

        This method is not a generator function (it has no ``yield``); it
        returns the generator object created by the generator expression.
        """
        return (match.group() for match in RE_WORD.finditer(self.text))

In [46]:
class ArithmeticProgression:
    """Iterable arithmetic progression: begin, begin + step, begin + 2*step, ...

    Items are produced while they are strictly less than ``end``; when
    ``end`` is None the progression never stops.
    """

    def __init__(self, begin, step, end=None):
        """Record the first term, the common difference and the bound."""
        self.begin = begin
        self.step = step
        self.end = end    # None -> infinite series

    def __iter__(self):
        """Yield the terms of the progression, one per request."""
        unbounded = self.end is None
        # Coerce the first term to the type that begin + step produces, so
        # it has the same numeric type as the terms that follow.
        term = type(self.begin + self.step)(self.begin)
        count = 0
        while unbounded or term < self.end:
            yield term
            count += 1
            # Each term is recomputed from begin as begin + step * count
            # rather than by adding step to the previous term.
            term = self.begin + self.step * count

In [47]:
ap = ArithmeticProgression(0, 1, 3)
list(ap)

[0, 1, 2]

In [48]:
ap = ArithmeticProgression(1, .5, 3)
list(ap)

[1.0, 1.5, 2.0, 2.5]

In [49]:
ap = ArithmeticProgression(0, 1/3, 1)
list(ap)

[0.0, 0.3333333333333333, 0.6666666666666666]

In [50]:
from fractions import Fraction

ap = ArithmeticProgression(0, Fraction(1, 3), 1)
list(ap)

[Fraction(0, 1), Fraction(1, 3), Fraction(2, 3)]

In [51]:
from decimal import Decimal

ap = ArithmeticProgression(0, Decimal('.1'), .3)
list(ap)

[Decimal('0'), Decimal('0.1'), Decimal('0.2')]

In [52]:
def aritprog_gen(begin, step, end=None):
    """Generate the arithmetic progression begin, begin + step, ...

    Terms are yielded while they are strictly less than ``end``; with
    ``end=None`` the generator never finishes on its own.
    """
    unbounded = end is None
    # Coerce the first term to the type that begin + step produces.
    term = type(begin + step)(begin)
    count = 0
    while True:
        if not (unbounded or term < end):
            return
        yield term
        count += 1
        # Recompute from begin each time instead of accumulating step.
        term = begin + step * count

In [53]:
import itertools

gen = itertools.count(1, .5)

In [54]:
next(gen)

1

In [55]:
next(gen)

1.5

In [56]:
next(gen)

2.0

In [57]:
next(gen)

2.5

In [58]:
gen = itertools.takewhile(lambda n: n < 3, itertools.count(1, .5))
list(gen)

[1, 1.5, 2.0, 2.5]

In [59]:
import itertools


def aritprog_gen(begin, step, end=None):
    """Return a lazy iterator over begin, begin + step, begin + 2*step, ...

    This is not a generator function (there is no ``yield``); it is a
    factory that assembles and returns an ``itertools`` iterator. Items are
    produced while they are strictly less than ``end``; with ``end=None``
    the iterator is infinite.
    """
    # Coerce the first term to the type that begin + step produces, and
    # start counting from it so the first item has the same numeric type
    # as the ones that follow.
    first = type(begin + step)(begin)
    ap_gen = itertools.count(first, step)
    if end is not None:
        ap_gen = itertools.takewhile(lambda n: n < end, ap_gen)
    return ap_gen

### 用于过滤的生成器函数

In [60]:
def vowel(c):
    """Return True if the single character ``c`` is an ASCII vowel.

    The check is case-insensitive. Membership is tested against a set of
    individual letters rather than the string 'aeiou', so the empty string
    and multi-character substrings such as 'ae' are not reported as vowels.
    """
    return c.lower() in {'a', 'e', 'i', 'o', 'u'}

In [61]:
list(filter(vowel, 'Aardvark'))

['A', 'a', 'a']

In [62]:
import itertools

list(itertools.filterfalse(vowel, 'Aardvark'))

['r', 'd', 'v', 'r', 'k']

In [100]:
list(itertools.dropwhile(vowel, 'Aardvark'))

['r', 'd', 'v', 'a', 'r', 'k']

In [98]:
list(itertools.takewhile(vowel, 'Aardvark'))

['A', 'a']

In [65]:
list(itertools.compress('Aardvark', (1,0,1,1,0,1)))

['A', 'r', 'd', 'a']

In [66]:
list(itertools.islice('Aardvark', 4))

['A', 'a', 'r', 'd']

In [67]:
list(itertools.islice('Aardvark', 4, 7))

['v', 'a', 'r']

In [68]:
list(itertools.islice('Aardvark', 1, 7, 2))

['a', 'd', 'a']

### 用于映射的生成器函数

In [69]:
sample = [5, 4, 2, 8, 7, 6, 3, 0, 9, 1]

In [70]:
import itertools

list(itertools.accumulate(sample))

[5, 9, 11, 19, 26, 32, 35, 35, 44, 45]

In [71]:
list(itertools.accumulate(sample, min))

[5, 4, 2, 2, 2, 2, 2, 0, 0, 0]

In [72]:
list(itertools.accumulate(sample, max))

[5, 5, 5, 8, 8, 8, 8, 8, 9, 9]

In [73]:
import operator

list(itertools.accumulate(sample, operator.mul))

[5, 20, 40, 320, 2240, 13440, 40320, 0, 0, 0]

In [74]:
list(itertools.accumulate(range(1, 11), operator.mul))

[1, 2, 6, 24, 120, 720, 5040, 40320, 362880, 3628800]

In [75]:
list(enumerate('albatroz', 1))

[(1, 'a'),
 (2, 'l'),
 (3, 'b'),
 (4, 'a'),
 (5, 't'),
 (6, 'r'),
 (7, 'o'),
 (8, 'z')]

In [76]:
list(map(operator.mul, range(11), range(11)))

[0, 1, 4, 9, 16, 25, 36, 49, 64, 81, 100]

In [77]:
list(map(operator.mul, range(11), [2, 4, 8]))

[0, 4, 16]

In [78]:
list(map(lambda a, b: (a, b), range(11), [2, 4, 8]))

[(0, 2), (1, 4), (2, 8)]

In [79]:
list(itertools.starmap(operator.mul, enumerate('albatroz', 1)))

['a', 'll', 'bbb', 'aaaa', 'ttttt', 'rrrrrr', 'ooooooo', 'zzzzzzzz']

In [80]:
list(itertools.starmap(lambda a, b: b/a, enumerate(itertools.accumulate(sample), 1)))

[5.0,
 4.5,
 3.6666666666666665,
 4.75,
 5.2,
 5.333333333333333,
 5.0,
 4.375,
 4.888888888888889,
 4.5]

### 合并多个可迭代对象的生成器函数

In [81]:
list(itertools.chain('ABC', range(2)))

['A', 'B', 'C', 0, 1]

In [82]:
list(itertools.chain(enumerate('ABC')))

[(0, 'A'), (1, 'B'), (2, 'C')]

In [83]:
list(itertools.chain.from_iterable(enumerate('ABC')))

[0, 'A', 1, 'B', 2, 'C']

In [84]:
list(zip('ABC', range(5)))

[('A', 0), ('B', 1), ('C', 2)]

In [85]:
list(zip('ABC', range(5), [10, 20, 30, 40]))

[('A', 0, 10), ('B', 1, 20), ('C', 2, 30)]

In [86]:
list(itertools.zip_longest('ABC', range(5)))

[('A', 0), ('B', 1), ('C', 2), (None, 3), (None, 4)]

In [87]:
list(itertools.zip_longest('ABC', range(5), fillvalue='?'))

[('A', 0), ('B', 1), ('C', 2), ('?', 3), ('?', 4)]

In [88]:
list(itertools.product('ABC', range(2)))

[('A', 0), ('A', 1), ('B', 0), ('B', 1), ('C', 0), ('C', 1)]

In [89]:
suits = 'spade hearts diamonds clubs'.split()
list(itertools.product('AK', suits))

[('A', 'spade'),
 ('A', 'hearts'),
 ('A', 'diamonds'),
 ('A', 'clubs'),
 ('K', 'spade'),
 ('K', 'hearts'),
 ('K', 'diamonds'),
 ('K', 'clubs')]

In [90]:
list(itertools.product('ABC'))

[('A',), ('B',), ('C',)]

In [91]:
list(itertools.product('ABC', repeat=2))

[('A', 'A'),
 ('A', 'B'),
 ('A', 'C'),
 ('B', 'A'),
 ('B', 'B'),
 ('B', 'C'),
 ('C', 'A'),
 ('C', 'B'),
 ('C', 'C')]

In [92]:
list(itertools.product(range(2), repeat=3))

[(0, 0, 0),
 (0, 0, 1),
 (0, 1, 0),
 (0, 1, 1),
 (1, 0, 0),
 (1, 0, 1),
 (1, 1, 0),
 (1, 1, 1)]

In [93]:
rows = itertools.product('AB', range(2), repeat=2)

for row in rows:
    print(row)

('A', 0, 'A', 0)
('A', 0, 'A', 1)
('A', 0, 'B', 0)
('A', 0, 'B', 1)
('A', 1, 'A', 0)
('A', 1, 'A', 1)
('A', 1, 'B', 0)
('A', 1, 'B', 1)
('B', 0, 'A', 0)
('B', 0, 'A', 1)
('B', 0, 'B', 0)
('B', 0, 'B', 1)
('B', 1, 'A', 0)
('B', 1, 'A', 1)
('B', 1, 'B', 0)
('B', 1, 'B', 1)


### 把输入的各个元素扩展成多个输出元素的生成器函数

In [94]:
ct = itertools.count()
next(ct)

0

In [95]:
next(ct), next(ct), next(ct)

(1, 2, 3)

In [101]:
list(itertools.islice(itertools.count(1, .3), 3))

[1, 1.3, 1.6]

In [102]:
cy = itertools.cycle('ABC')
next(cy)

'A'

In [103]:
list(itertools.islice(cy, 7))

['B', 'C', 'A', 'B', 'C', 'A', 'B']

In [104]:
rp = itertools.repeat(7)
next(rp), next(rp)

(7, 7)

In [105]:
list(itertools.repeat(8, 4))

[8, 8, 8, 8]

In [106]:
list(map(operator.mul, range(11), itertools.repeat(5)))

[0, 5, 10, 15, 20, 25, 30, 35, 40, 45, 50]

### 组合学生成器函数

In [107]:
list(itertools.combinations('ABC', 2))

[('A', 'B'), ('A', 'C'), ('B', 'C')]

In [108]:
list(itertools.combinations_with_replacement('ABC', 2))

[('A', 'A'), ('A', 'B'), ('A', 'C'), ('B', 'B'), ('B', 'C'), ('C', 'C')]

In [109]:
list(itertools.permutations('ABC', 2))

[('A', 'B'), ('A', 'C'), ('B', 'A'), ('B', 'C'), ('C', 'A'), ('C', 'B')]

In [110]:
list(itertools.product('ABC', repeat=2))

[('A', 'A'),
 ('A', 'B'),
 ('A', 'C'),
 ('B', 'A'),
 ('B', 'B'),
 ('B', 'C'),
 ('C', 'A'),
 ('C', 'B'),
 ('C', 'C')]

### 用于重新排列元素的生成器函数

In [111]:
list(itertools.groupby('LLLAAGGG'))

[('L', <itertools._grouper at 0x7f7f2ba6f5b0>),
 ('A', <itertools._grouper at 0x7f7f2ba6f8e0>),
 ('G', <itertools._grouper at 0x7f7f2ba6f340>)]

In [112]:
for char, group in itertools.groupby('LLLAAGGG'):
    print(char, '->', list(group))

L -> ['L', 'L', 'L']
A -> ['A', 'A']
G -> ['G', 'G', 'G']


In [113]:
animals = ['duck', 'eagle', 'rat', 'giraffe', 'bear', 'bat', 'dolphin', 'shark', 'lion']
animals.sort(key=len)
animals

['rat', 'bat', 'duck', 'bear', 'lion', 'eagle', 'shark', 'giraffe', 'dolphin']

In [115]:
for length, group in itertools.groupby(animals, key=len):
    print(length, '->', list(group))

3 -> ['rat', 'bat']
4 -> ['duck', 'bear', 'lion']
5 -> ['eagle', 'shark']
7 -> ['giraffe', 'dolphin']


In [116]:
for length, group in itertools.groupby(reversed(animals), key=len):
    print(length, '->', list(group))

7 -> ['dolphin', 'giraffe']
5 -> ['shark', 'eagle']
4 -> ['lion', 'bear', 'duck']
3 -> ['bat', 'rat']


In [117]:
list(itertools.tee('ABC'))

[<itertools._tee at 0x7f7f2b95c800>, <itertools._tee at 0x7f7f2bb8f300>]

In [118]:
g1, g2 = itertools.tee('ABC')

In [119]:
next(g1)

'A'

In [120]:
next(g2)

'A'

In [121]:
next(g2)

'B'

In [122]:
list(g1)

['B', 'C']

In [123]:
list(g2)

['C']

In [124]:
list(zip(*itertools.tee('ABC')))

[('A', 'A'), ('B', 'B'), ('C', 'C')]

## 把不同的生成器(函数)结合在一起使用

In [128]:
def chain(*iterables):
    """Yield every item of each iterable in turn, left to right.

    Written with an explicit nested loop: the outer loop walks the
    arguments, the inner loop walks the items of the current argument.
    """
    for source in iterables:
        for element in source:
            yield element

In [129]:
s = "ABC"
t = tuple(range(3))

In [130]:
list(chain(s, t))

['A', 'B', 'C', 0, 1, 2]

In [131]:
def chain(*iterables):
    """Yield every item of each iterable in turn, left to right.

    ``yield from`` delegates to each argument, replacing an inner loop.
    """
    for iterable in iterables:
        yield from iterable

In [132]:
list(chain(s, t))

['A', 'B', 'C', 0, 1, 2]

In [133]:
all([1, 2, 3])

True

In [134]:
all([1, 0, 3])

False

In [135]:
all([])

True

In [137]:
any([1, 2, 3])

True

In [138]:
any([1, 0, 3])

True

In [139]:
any([0, 0, 0])

False

In [140]:
any([])

False

In [141]:
g = (n for n in [0, 0.0, 7, 8])
any(g)

True

In [142]:
next(g)

8

In [143]:
from random import randint


def d6():
    """Roll a six-sided die: return a random integer from 1 to 6 inclusive."""
    roll = randint(1, 6)
    return roll

In [144]:
d6_iter = iter(d6, 1)
d6_iter

<callable_iterator at 0x7f7f2b7da5b0>

In [145]:
for roll in d6_iter:
    print(roll)

3


In [1]:
from collections import abc

e = enumerate('ABC')
isinstance(e, abc.Iterator)

True

In [2]:
import types

e = enumerate('ABC')
isinstance(e, types.GeneratorType)    # 生成器类型： 迭代器实例的类型，调用生成器函数时生成

False

In [3]:
def fibonacci():
    """Generate the Fibonacci numbers 0, 1, 1, 2, 3, 5, ... without end."""
    current, following = 0, 1
    while True:
        yield current
        # Slide the pair forward: the next number is the sum of the two.
        current, following = following, current + following