# Reviewing the Python Itertools Standard Lib
Because we perform a lot of iteration in coding

In [15]:
import operator
from itertools import *

## Accumulate
Make an iterator that returns accumulated sums, or accumulated results of other binary functions (specified via the optional func argument).
If func is supplied, it should be a function of two arguments.
There are a number of uses for the func argument. It can be set to `min` for a running minimum, `max` for a running maximum, or `operator.mul` for a running product.
Amortization tables can be built by accumulating interest and applying payments.

In [2]:
def func(a, b):
    """Return ``a - b``; passed to accumulate() below as a custom binary function."""
    difference = a - b
    return difference


# One shared input so every accumulate() variant runs over the same data.
numbers = [1, 2, 3, 4, 5, 6, 7]

print('Summation', list(accumulate(numbers)))  # no func given: running sum
print('Custom function', list(accumulate(numbers, func)))  # running difference
print('Running min', list(accumulate(numbers, min)))
print('Running max', list(accumulate(numbers, max)))
print('Running product', list(accumulate(numbers, operator.mul)))

# Amortize a 5% loan of 1000 with 4 annual payments of 90:
# each step grows the previous balance by 5% and then applies the (negative) payment.
cashflows = [1000, -90, -90, -90, -90]
print(list(accumulate(cashflows, lambda bal, pmt: bal * 1.05 + pmt)))

Summation [1, 3, 6, 10, 15, 21, 28]
Custom function [1, -1, -4, -8, -13, -19, -26]
Running min [1, 1, 1, 1, 1, 1, 1]
Running max [1, 2, 3, 4, 5, 6, 7]
Running product [1, 2, 6, 24, 120, 720, 5040]
[1000, 960.0, 918.0, 873.9000000000001, 827.5950000000001]


## Chain
Make an iterator that returns elements from the first iterable until it is exhausted, then proceeds to the next iterable, until all of the iterables are exhausted. Used for treating consecutive sequences as a single sequence.

In [16]:
# Two small sequences with different element types; later cells reuse them.
a = [1, 2, 3, 4, 5]
b = ['a', 'b', 'c', 'd']
# chain() is lazy: evaluating it on its own only shows the iterator object.
chain(a, b)

<itertools.chain at 0x7f8806113210>

In [17]:
# Wrap the lazy chain in list() to see its items: everything from a, then everything from b.
list(chain(a,b))

[1, 2, 3, 4, 5, 'a', 'b', 'c', 'd']

## Combinations
Return r length subsequences of elements from the input iterable

The combination tuples are emitted in lexicographic ordering according to the order of the input iterable.
So, if the input iterable is sorted, the combination tuples will be produced in sorted order

Elements are treated as unique based on their position, not their value. So if the input elements are unique, there will be no repeated values within each combination.

In [5]:
# Every 2-element subsequence of a; elements keep the order they have in a.
list(combinations(a,2))

[(1, 2),
 (1, 3),
 (1, 4),
 (1, 5),
 (2, 3),
 (2, 4),
 (2, 5),
 (3, 4),
 (3, 5),
 (4, 5)]

In [6]:
# Every 3-element subsequence of the 4-element list b: 4 tuples in total.
list(combinations(b,3))

[('a', 'b', 'c'), ('a', 'b', 'd'), ('a', 'c', 'd'), ('b', 'c', 'd')]

## combinations_with_replacement
Return r length subsequences of elements from the input iterable, allowing individual elements to be repeated more than once

In [7]:
# 3-element selections from b where an element may be picked more than once, e.g. ('a', 'a', 'a').
list(combinations_with_replacement(b,3))

[('a', 'a', 'a'),
 ('a', 'a', 'b'),
 ('a', 'a', 'c'),
 ('a', 'a', 'd'),
 ('a', 'b', 'b'),
 ('a', 'b', 'c'),
 ('a', 'b', 'd'),
 ('a', 'c', 'c'),
 ('a', 'c', 'd'),
 ('a', 'd', 'd'),
 ('b', 'b', 'b'),
 ('b', 'b', 'c'),
 ('b', 'b', 'd'),
 ('b', 'c', 'c'),
 ('b', 'c', 'd'),
 ('b', 'd', 'd'),
 ('c', 'c', 'c'),
 ('c', 'c', 'd'),
 ('c', 'd', 'd'),
 ('d', 'd', 'd')]

## compress
Make an iterator that filters elements from data returning only those that have a corresponding element in selectors that evaluates to True.
Stops when either the data or selectors iterables has been exhausted

In [8]:
data = 'abcdefgh'
# One selector per character of data: a truthy 1 keeps it, a falsy 0 drops it.
sel = [1, 0, 1, 0, 1, 0, 1, 0]
list(compress(data, sel))

['a', 'c', 'e', 'g']

# Infinite iterables
count, cycle

`count(start=0, step=1)`

Make an iterator that returns evenly spaced values starting with number start. Often used as an argument to map() to generate consecutive data points. Also used with zip() to add sequence numbers.

`cycle(iterable)`

Make an iterator returning elements from the iterable and saving a copy of each. When the iterable is exhausted, return elements from the saved copy. Repeats indefinitely.

In [9]:
# count(2.5, 0.5) never ends on its own; zip() stops as soon as data runs out,
# so each character of data is paired with the next value 2.5, 3.0, 3.5, ...
list(zip(count(2.5,0.5), data))

[(2.5, 'a'),
 (3.0, 'b'),
 (3.5, 'c'),
 (4.0, 'd'),
 (4.5, 'e'),
 (5.0, 'f'),
 (5.5, 'g'),
 (6.0, 'h')]

In [10]:
fruits = ('apple', 'banana', 'cherry')
# map() applies len to each fruit name; list() collects the results.
list(map(len, fruits))

[5, 6, 6]

In [11]:
# map() with two iterables calls the lambda with one item from each, here (fruit, fruit).
# Each pair is chained into a single character stream and filtered with the sel mask;
# compress() stops once the 8 selectors in sel are used up.
list(map(lambda x,y: list(compress(chain(x,y), sel)), fruits, fruits))

[['a', 'p', 'e', 'p'], ['b', 'n', 'n', 'b'], ['c', 'e', 'r', 'c']]

In [14]:
fruits = ('apple', 'banana', 'cherry')
pos = [0, 1, 2]
# Look up each position in fruits and join the names. A generator expression
# feeds str.join directly, so no lambda or intermediate list is needed.
', '.join(fruits[i] for i in pos)

'apple, banana, cherry'

# dropwhile
Make an iterator that drops elements from the iterable as long as the predicate is true; afterwards, returns every element. Note, the iterator does not produce any output until the predicate first becomes false, so it may have a lengthy start-up time.

In [19]:
# 1 and 4 are dropped while x < 5 holds; once 6 fails the test, everything after it
# (including the later 4 and 1) is returned without being tested again.
list(dropwhile(lambda x: x<5, [1,4,6,4,1]))

[6, 4, 1]

# filterfalse
Make an iterator that filters elements from iterable returning only those for which the predicate is `False`. If predicate is `None`, return the items that are false

In [20]:
# x % 2 is 0 (falsy) for even numbers, so filterfalse keeps exactly the evens.
list(filterfalse(lambda x: x%2, range(10)))

[0, 2, 4, 6, 8]

# groupby
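Make an iterator that returns consecutive keys and groups from the iterable. The key is a function computing a key value for each element. If not specified or is None, key defaults to an identity function and returns the element unchanged. Generally, the iterable needs to already be sorted on the same key function, because groupby() starts a new group every time the value of the key changes; unsorted input yields the same key more than once, as the first example below shows.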

In [21]:
# Keys only. 'A' and 'B' each show up twice because the input is not sorted:
# every consecutive run of equal characters becomes its own group.
[k for k, g in groupby('AAAABBBCCDAABBB')]

['A', 'B', 'C', 'D', 'A', 'B']

In [23]:
# Each g is an iterator over one run; list(g) materializes the run's members.
[list(g) for k, g in groupby('AAAABBBCCDAABBB')]

[['A', 'A', 'A', 'A'],
 ['B', 'B', 'B'],
 ['C', 'C'],
 ['D'],
 ['A', 'A'],
 ['B', 'B', 'B']]

In [25]:
# Building a dict works here because each letter forms a single run in this input;
# if a key came up again later, its group would overwrite the earlier entry.
{k: list(g) for k, g in groupby('AAAAAABBBBCCCD')}

{'A': ['A', 'A', 'A', 'A', 'A', 'A'],
 'B': ['B', 'B', 'B', 'B'],
 'C': ['C', 'C', 'C'],
 'D': ['D']}

# islice(iterable, start, stop[, step])
Make an iterator that returns selected elements from the iterable. If start is non-zero, then elements from the iterable are skipped until start is reached. Afterward, elements are returned consecutively unless step is set higher than one which results in items being skipped. If stop is None, then iteration continues until the iterator is exhausted, if at all; otherwise, it stops at the specified position. Unlike regular slicing, `islice()` does not support negative values for start, stop, or step. Can be used to extract related fields from data where the internal structure has been flattened (for example, a multi-line report may list a name field on every third line).

In [28]:
list(islice('ABCEDFGH',2)) # stop=2 only: items at indices 0 and 1 (stop is exclusive)

['A', 'B']

In [29]:
list(islice('ABCEDFGH',2, 4)) # start=2, stop=4: items at indices 2 and 3

['C', 'E']

In [30]:
list(islice('ABCEDFGH',2, None)) # start=2, stop=None: skip two items, then run to the end

['C', 'E', 'D', 'F', 'G', 'H']

In [31]:
list(islice('ABCEDFGH',0, None, 2)) # start=0, stop=None, step=2: every second item from the beginning

['A', 'C', 'D', 'G']

# permutations(iterable, r=None)

Return successive r length permutations of elements in the iterable.

If r is not specified or is None, then r defaults to the length of the iterable and all possible full-length permutations are generated.

In [32]:
# Ordered pairs: unlike combinations, both ('A', 'B') and ('B', 'A') appear.
list(permutations('ABCD', 2))

[('A', 'B'),
 ('A', 'C'),
 ('A', 'D'),
 ('B', 'A'),
 ('B', 'C'),
 ('B', 'D'),
 ('C', 'A'),
 ('C', 'B'),
 ('C', 'D'),
 ('D', 'A'),
 ('D', 'B'),
 ('D', 'C')]

In [33]:
# r omitted: full-length permutations of the 4 letters, 4! = 24 tuples.
list(permutations('ABCD'))

[('A', 'B', 'C', 'D'),
 ('A', 'B', 'D', 'C'),
 ('A', 'C', 'B', 'D'),
 ('A', 'C', 'D', 'B'),
 ('A', 'D', 'B', 'C'),
 ('A', 'D', 'C', 'B'),
 ('B', 'A', 'C', 'D'),
 ('B', 'A', 'D', 'C'),
 ('B', 'C', 'A', 'D'),
 ('B', 'C', 'D', 'A'),
 ('B', 'D', 'A', 'C'),
 ('B', 'D', 'C', 'A'),
 ('C', 'A', 'B', 'D'),
 ('C', 'A', 'D', 'B'),
 ('C', 'B', 'A', 'D'),
 ('C', 'B', 'D', 'A'),
 ('C', 'D', 'A', 'B'),
 ('C', 'D', 'B', 'A'),
 ('D', 'A', 'B', 'C'),
 ('D', 'A', 'C', 'B'),
 ('D', 'B', 'A', 'C'),
 ('D', 'B', 'C', 'A'),
 ('D', 'C', 'A', 'B'),
 ('D', 'C', 'B', 'A')]

# product(*iterables, repeat=1)
Cartesian product of input iterables.

Roughly equivalent to nested for-loops in a generator expression.

In [34]:
list1 = [1, 2, 3, 4, 5, 6]
list2 = ['a', 'b', 'c', 'd', 'e', 'f']
# Every (number, letter) pair: 6 * 6 = 36 tuples, with the rightmost iterable advancing fastest.
list(product(list1, list2))

[(1, 'a'),
 (1, 'b'),
 (1, 'c'),
 (1, 'd'),
 (1, 'e'),
 (1, 'f'),
 (2, 'a'),
 (2, 'b'),
 (2, 'c'),
 (2, 'd'),
 (2, 'e'),
 (2, 'f'),
 (3, 'a'),
 (3, 'b'),
 (3, 'c'),
 (3, 'd'),
 (3, 'e'),
 (3, 'f'),
 (4, 'a'),
 (4, 'b'),
 (4, 'c'),
 (4, 'd'),
 (4, 'e'),
 (4, 'f'),
 (5, 'a'),
 (5, 'b'),
 (5, 'c'),
 (5, 'd'),
 (5, 'e'),
 (5, 'f'),
 (6, 'a'),
 (6, 'b'),
 (6, 'c'),
 (6, 'd'),
 (6, 'e'),
 (6, 'f')]

In [36]:
# repeat=2 repeats the whole argument list, i.e. product(list1, list2, list1, list2).
# That yields 36 * 36 = 1296 four-element tuples, so the printed list is long.
list(product(list1, list2, repeat=2))

[(1, 'a', 1, 'a'),
 (1, 'a', 1, 'b'),
 (1, 'a', 1, 'c'),
 (1, 'a', 1, 'd'),
 (1, 'a', 1, 'e'),
 (1, 'a', 1, 'f'),
 (1, 'a', 2, 'a'),
 (1, 'a', 2, 'b'),
 (1, 'a', 2, 'c'),
 (1, 'a', 2, 'd'),
 (1, 'a', 2, 'e'),
 (1, 'a', 2, 'f'),
 (1, 'a', 3, 'a'),
 (1, 'a', 3, 'b'),
 (1, 'a', 3, 'c'),
 (1, 'a', 3, 'd'),
 (1, 'a', 3, 'e'),
 (1, 'a', 3, 'f'),
 (1, 'a', 4, 'a'),
 (1, 'a', 4, 'b'),
 (1, 'a', 4, 'c'),
 (1, 'a', 4, 'd'),
 (1, 'a', 4, 'e'),
 (1, 'a', 4, 'f'),
 (1, 'a', 5, 'a'),
 (1, 'a', 5, 'b'),
 (1, 'a', 5, 'c'),
 (1, 'a', 5, 'd'),
 (1, 'a', 5, 'e'),
 (1, 'a', 5, 'f'),
 (1, 'a', 6, 'a'),
 (1, 'a', 6, 'b'),
 (1, 'a', 6, 'c'),
 (1, 'a', 6, 'd'),
 (1, 'a', 6, 'e'),
 (1, 'a', 6, 'f'),
 (1, 'b', 1, 'a'),
 (1, 'b', 1, 'b'),
 (1, 'b', 1, 'c'),
 (1, 'b', 1, 'd'),
 (1, 'b', 1, 'e'),
 (1, 'b', 1, 'f'),
 (1, 'b', 2, 'a'),
 (1, 'b', 2, 'b'),
 (1, 'b', 2, 'c'),
 (1, 'b', 2, 'd'),
 (1, 'b', 2, 'e'),
 (1, 'b', 2, 'f'),
 (1, 'b', 3, 'a'),
 (1, 'b', 3, 'b'),
 (1, 'b', 3, 'c'),
 (1, 'b', 3, 'd'),
 (1, 'b', 3, 'e'),
 ...]

# repeat(object[, times])
Make an iterator that returns object over and over again.

In [37]:
# times=3 bounds the iterator; without it repeat() would never end and list() would not return.
list(repeat('a', 3))

['a', 'a', 'a']

A common use for repeat is to supply a stream of constant values to map or zip:

In [39]:
# repeat(2) is endless, but map() stops when range(10) is exhausted:
# this computes pow(x, 2) for x = 0..9.
list(map(pow, range(10), repeat(2)))

[0, 1, 4, 9, 16, 25, 36, 49, 64, 81]