# Lambda, map, filter, reduce

## Lambda

lambda params: func(params)

In [1]:
def square_fn(x):
    return x * x

square_ld = lambda x: x * x

for i in range(10):
    assert square_fn(i) == square_ld(i)

## Maps
`map(func, iterable)` which applies the func on each elements of iterable.

In [2]:
nums = [1/3, 333/7, 2323/2230, 40/34, 2/3]

In [3]:
nums_square = map(lambda x: x*x, nums)
print(list(nums_square))

[0.1111111111111111, 2263.0408163265306, 1.0851472983570953, 1.384083044982699, 0.4444444444444444]


You can also use map with more than one iterable. For example, if you want to calculate the mean squared error of a simple linear function f(x) = ax + b with the true label labels, these two methods are equivalent:

In [4]:
a, b = 3, -0.5
xs = [2, 3, 4, 5]
labels = [6.4, 8.9, 10.9, 15.3]

In [5]:
diff = map(lambda x,y: (a*x + b - y)**2, xs, labels)
res = sum(diff)**0.5/len(xs)
res

0.35089172119045514

## Filter

`filter(func, iterable)` which finds the elements in iterable match the func.

In [6]:
diff = map(lambda x,y: (a*x + b - y)**2, xs, labels)
bad_pred = filter(lambda x: x > 0.5, list(diff))
print(list(bad_pred))

[0.8100000000000006, 0.6400000000000011]


In [7]:
from collections import Iterator
isinstance(bad_pred, Iterator)

  """Entry point for launching an IPython kernel.


True

**Lambda functions are meant for one time use !**

In [8]:
list(diff)

[]

In [9]:
def _odd_iter():
    n = 1
    while True:
        n = n + 2
        yield n

def primes():
    yield 2
    it = _odd_iter() # 初始序列
    while True:
        n = next(it) # 返回序列的第一个数
        yield n
        it = filter(lambda x: x % n > 0, it) # 构造新序列

    
# 打印 50 以内的素数:
for n in primes():
    if n < 50:
        print(n)
    else:
        break

2
3
5
7
9
11
13
15
17
19
21
23
25
27
29
31
33
35
37
39
41
43
45
47
49


In [10]:
def is_palindrome(n):
    n_str = str(n)
    return n_str == n_str[::-1]

In [11]:
list(filter(is_palindrome, range(1, 200))) == [1, 2, 3, 4, 5, 6, 7, 8, 9, 11, 22, 33, 44, 55, 66, 77, 88, 99, 101, 111, 121, 131, 141, 151, 161, 171, 181, 191]

True

## Reduce
`reduce(fn, iterable, initializer)` is used when we want to iteratively apply an operator to all elements in a list

In [12]:
from functools import reduce
product = reduce(lambda x, y: x * y, nums)
print(product)

12.95564683272412


## Map/Reduce

In [13]:
CHAR_TO_INT = {
    '0': 0,
    '1': 1,
    '2': 2,
    '3': 3,
    '4': 4,
    '5': 5,
    '6': 6,
    '7': 7,
    '8': 8,
    '9': 9
}

def str2int(s):
    ints = map(lambda ch: CHAR_TO_INT[ch], s)
    return reduce(lambda x, y: x * 10 + y, ints)

print(str2int('0'))
print(str2int('12300'))
print(str2int('0012345'))

0
12300
12345


# List

## Unpacking

In [14]:
elems = [1, 2, 3, 4]
a, b, c, d = elems
print(a, b, c, d)

1 2 3 4


In [15]:
a, *new_elems, d = elems
print(a)
print(new_elems)
print(d)

1
[2, 3]
4


## Slicing

The syntax [x:y:z] means "take every zth element of a list from index x to index y".`[begin:end:steps]`

In [16]:
elems = list(range(10))

In [17]:
elems = list(range(10))
print(elems)
print(elems[::-1])

[0, 1, 2, 3, 4, 5, 6, 7, 8, 9]
[9, 8, 7, 6, 5, 4, 3, 2, 1, 0]


In [18]:
odds = elems[1::2]
evens = elems[::2]

reversed_evens = elems[-2::-2]
reversed_odds = elems[-1::-2]

print(odds)
print(reversed_odds)
print(evens)
print(reversed_evens)

[1, 3, 5, 7, 9]
[9, 7, 5, 3, 1]
[0, 2, 4, 6, 8]
[8, 6, 4, 2, 0]


## Insertion

In [19]:
# replace 1 by 10

elems[1] = 10
print(elems)

[0, 10, 2, 3, 4, 5, 6, 7, 8, 9]


In [20]:
# replace 10 by 20, 40

elems[1:2] = [20, 40]
elems

[0, 20, 40, 2, 3, 4, 5, 6, 7, 8, 9]

In [21]:
# insert 0,2 0,4
elems = list(range(10))
elems[1:1] = [0.2, 0.4]
elems

[0, 0.2, 0.4, 1, 2, 3, 4, 5, 6, 7, 8, 9]

## Flattening

In [22]:
list_of_lists = [[1], [2, 3], [4, 5, 6]]
sum(list_of_lists, [])

[1, 2, 3, 4, 5, 6]

In [23]:
nested_lists = [[1, 2], [[3, 4], [5, 6], [[7, 8], [9, 10], [[11, [12, 13]]]]]]
flatten = lambda x: [y for l in x for y in flatten(l)] if type(x) is list else [x]
flatten(nested_lists)

[1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13]

# List vs generator

Instead of using a list to store all n-grams(`list`), we can use a generator that generates the next n-gram when it's asked for(`generator`).

In [24]:
tokens = ['i', 'want', 'to', 'go', 'to', 'school']

## generator using yield

In [25]:
def ngrams(tokens, n):
    length = len(tokens)
    for i in range(length - n + 1):
        yield tokens[i:i+n]

ngrams_generator = ngrams(tokens, 3)
print(ngrams_generator)
for ngram in ngrams_generator:
    print(ngram)

<generator object ngrams at 0x1044f5b10>
['i', 'want', 'to']
['want', 'to', 'go']
['to', 'go', 'to']
['go', 'to', 'school']


## generator using ( )

In [26]:
def ngrams(tokens, n):
    length = len(tokens)
    slices = (tokens[i:length-n+i+1] for i in range(n)) #(.) returns a generator
    return zip(*slices)

ngrams_generator = ngrams(tokens, 3)
print(ngrams_generator) # zip objects are generators and Iterators
for ngram in ngrams_generator:
    print(ngram)

<zip object at 0x10450f288>
('i', 'want', 'to')
('want', 'to', 'go')
('to', 'go', 'to')
('go', 'to', 'school')


In [27]:
from collections import Iterator
isinstance(ngrams_generator, Iterator)

True

# Generator

## using ( )

In [47]:
L = [x * x for x in range(10)]
L

[0, 1, 4, 9, 16, 25, 36, 49, 64, 81]

In [48]:
g = (x * x for x in range(10))
g

<generator object <genexpr> at 0x104543de0>

In [30]:
for x in g:
    print(x)

0
1
4
9
16
25
36
49
64
81


## using yield

In [31]:
def fib(max):
    n, a, b = 0, 0, 1
    while n < max:
        yield b
        a, b = b, a + b # don't need tmp value
        n = n + 1
    return 'done'

In [32]:
for i in fib(4):
    print(i)

1
1
2
3


In [33]:
from collections import Iterable
isinstance(fib(4), Iterable)

  """Entry point for launching an IPython kernel.


True

# Iterable vs Iterator

1. All the Iterable can use `for`.

2. All the Iterator can apply `next()`, but not for all the Iterable.

In [34]:
from collections import Iterator
isinstance([], Iterator)

False

In [35]:
isinstance(iter([]), Iterator)

True

# Classes and magic methods

In [36]:
class Node:
    """ A struct to denote the node of a binary tree.
    It contains a value and pointers to left and right children.
    """
    def __init__(self, value, left=None, right=None):
        self.value = value
        self.left = left
        self.right = right

In [37]:
root = Node(5)
print(root)

<__main__.Node object at 0x10456d208>


we use the magic method `__repr__`, which must return a printable object, like string.

In [38]:
class Node:
    """ A struct to denote the node of a binary tree.
    It contains a value and pointers to left and right children.
    """
    def __init__(self, value, left=None, right=None):
        self.value = value
        self.left = left
        self.right = right
        
    def __repr__(self):    
        strings = [f'value: {self.value}'] # f-Strings for python 3.6 +
        strings.append(f'left: {self.left.value}' if self.left else 'left: None')
        strings.append(f'right: {self.right.value}' if self.right else 'right: None')
        return ', '.join(strings)

In [39]:
root = Node(5)
print(root)

value: 5, left: None, right: None


In [40]:
left = Node(4)
root = Node(5, left)
print(root)

value: 5, left: 4, right: None


In [41]:
class Node:
    """ A struct to denote the node of a binary tree.
    It contains a value and pointers to left and right children.
    """
    def __init__(self, value, left=None, right=None):
        self.value = value
        self.left = left
        self.right = right
    
    def __eq__(self, other):
        return self.value == other.value
    
    def __lt__(self, other):
        return self.value < other.value
    
    def __ge__(self, other):
        return self.value >= other.value


left = Node(4)
root = Node(5, left)
print(left == root)
print(left < root)
print(left >= root)

False
True
False


* `__len__`: to overload the len() function.
* `__str__`: to overload the str() function.
* `__iter__`: if you want to your objects to be iterators. This also allows you to call next() on your object.

> performance boost and memory saving `__slot__`

In [42]:
class Node:
    """ A struct to denote the node of a binary tree.
    It contains a value and pointers to left and right children.
    """
    __slots__ = ('value', 'left', 'right')
    def __init__(self, value, left=None, right=None):
        self.value = value
        self.left = left
        self.right = right

# local namespace, object's attributes

The `locals()` function returns a dictionary containing the variables defined in the local namespace

In [43]:
class Model1:
    def __init__(self, hidden_size=100, num_layers=3, learning_rate=3e-4):
        print(locals())
        self.hidden_size = hidden_size
        self.num_layers = num_layers
        self.learning_rate = learning_rate

model1 = Model1()

{'self': <__main__.Model1 object at 0x104568cf8>, 'hidden_size': 100, 'num_layers': 3, 'learning_rate': 0.0003}



All attributes of an object are stored in its `__dict__`

In [44]:
model1.__dict__

{'hidden_size': 100, 'num_layers': 3, 'learning_rate': 0.0003}

two very fast ways to initialize the attributs.

In [45]:
class Model2:
    def __init__(self, hidden_size=100, num_layers=3, learning_rate=3e-4):
        params = locals()
        del params['self']
        self.__dict__ = params

model2 = Model2()
model2.__dict__

{'hidden_size': 100, 'num_layers': 3, 'learning_rate': 0.0003}

In [46]:
class Model3:
    def __init__(self, **kwargs):
        self.__dict__ = kwargs

model3 = Model3(hidden_size=100, num_layers=3, learning_rate=3e-4)
model3.__dict__

{'hidden_size': 100, 'num_layers': 3, 'learning_rate': 0.0003}

# Wildcard import

In the source script, we add `__all__` to specify the functions that can be exported.

# Sort

## python `sorted()`

In [50]:
sorted([36, 5, -12, 9, -21], key=abs)

[5, 9, -12, -21, 36]

In [49]:
sorted(['bob', 'about', 'Zoo', 'Credit'], key=str.lower, reverse=True)

['Zoo', 'Credit', 'bob', 'about']