# 02_05: Advanced Containers

In [94]:
# note: this notebook requires Python 3.7 or higher;
# it will work with Python 3.6 if you run "!pip install dataclasses" in a cell

In [95]:
import math
import collections

import numpy as np
import pandas as pd
import matplotlib.pyplot as pp

%matplotlib inline

In [96]:
people = [("Michele", "Vallisneri", "July 15"),
          ("Albert", "Einstein", "March 14"),
          ("John", "Lennon", "October 9"),
          ("Jocelyn", "Bell Burnell", "July 15")]

In [97]:
people[0][0]

'Michele'

In [98]:
people[0][1]

'Vallisneri'

In [99]:
[person for person in people if person[2] == "July 15"]

[('Michele', 'Vallisneri', 'July 15'), ('Jocelyn', 'Bell Burnell', 'July 15')]

In [100]:
# defining the namedtuple "person"
persontype = collections.namedtuple('person', ['firstname', 'lastname', "birthday"])

In [101]:
michele = persontype("Michele", "Vallisneri", "July 15")

In [102]:
michele = persontype(lastname="Vallisneri", firstname="Michele", birthday="July 15")

In [103]:
michele

person(firstname='Michele', lastname='Vallisneri', birthday='July 15')

In [104]:
michele[0], michele[1], michele[2]

('Michele', 'Vallisneri', 'July 15')

In [105]:
michele.firstname, michele.lastname, michele.birthday

('Michele', 'Vallisneri', 'July 15')

In [107]:
persontype(people[0])

TypeError: person.__new__() missing 2 required positional arguments: 'lastname' and 'birthday'

In [108]:
# use tuple unpacking on people[0] to build a namedtuple
persontype(*people[0])

person(firstname='Michele', lastname='Vallisneri', birthday='July 15')

In [110]:
namedpeople = [persontype(*person) for person in people]

In [111]:
namedpeople

[person(firstname='Michele', lastname='Vallisneri', birthday='July 15'),
 person(firstname='Albert', lastname='Einstein', birthday='March 14'),
 person(firstname='John', lastname='Lennon', birthday='October 9'),
 person(firstname='Jocelyn', lastname='Bell Burnell', birthday='July 15')]

In [112]:
[person for person in namedpeople if person.birthday == "July 15"]

[person(firstname='Michele', lastname='Vallisneri', birthday='July 15'),
 person(firstname='Jocelyn', lastname='Bell Burnell', birthday='July 15')]

In [113]:
# !pip install dataclasses

In [114]:
from dataclasses import dataclass

In [115]:
# defining a data class with the same content as the "person" nametuple
# and with a default for "birthday"

@dataclass
class personclass:
    firstname: str
    lastname: str
    birthday: str = 'unknown'

In [116]:
michele = personclass('Michele', 'Vallisneri')

In [117]:
michele

personclass(firstname='Michele', lastname='Vallisneri', birthday='unknown')

In [118]:
michele = personclass(firstname='Michele', lastname='Vallisneri')

In [119]:
michele.firstname, michele.lastname, michele.birthday

('Michele', 'Vallisneri', 'unknown')

In [120]:
michele[0]

TypeError: 'personclass' object is not subscriptable

In [121]:
print(michele)

personclass(firstname='Michele', lastname='Vallisneri', birthday='unknown')


In [123]:
# updating the data class "personclass" so that it can compute a person's full name

@dataclass
class personclass2:
    firstname: str
    lastname: str
    birthday: str = 'unknown'

    # all methods in a class carry a conventional argument "self";
    # when the methods are called on an instance (here, a specific person),
    # "self" points the instance itself, so self.firstname and self.lastname
    # are the data fields in that instance
    def fullname(self):
        return self.firstname + ' ' + self.lastname

In [124]:
michele = personclass2('Michele', 'Vallisneri', 'July 15')

In [125]:
michele.fullname()

'Michele Vallisneri'

In [127]:
questions = collections.defaultdict(mydefault)

NameError: name 'mydefault' is not defined

In [128]:
questions['The meaning of life']

NameError: name 'questions' is not defined

In [129]:
questions

NameError: name 'questions' is not defined

In [130]:
# creating a dict where a key maps to a list requires awkward code
# to create the list when a key is first seen...

birthdays = {}

for person in namedpeople:
    if person.birthday in birthdays:
        birthdays[person.birthday].append(person.firstname)
    else:
        birthdays[person.birthday] = [person.firstname]

In [131]:
birthdays

{'July 15': ['Michele', 'Jocelyn'],
 'March 14': ['Albert'],
 'October 9': ['John']}

In [135]:
list()

[]

In [133]:
# ...but it happens elegantly with defaultdict

birthdays = collections.defaultdict(list)

for person in namedpeople:
    birthdays[person.birthday].append(person.firstname)

In [134]:
birthdays

defaultdict(list,
            {'July 15': ['Michele', 'Jocelyn'],
             'March 14': ['Albert'],
             'October 9': ['John']})