In [1]:
#hide

In [2]:
#hide
# `utils` is a project-local helper module (not shown in this notebook).
# NOTE(review): hero() presumably renders the notebook's title banner — confirm against utils.
import utils
utils.hero("How to deal with a collection of objects?")

In [3]:
#hide
# NOTE(review): h1() presumably renders a top-level section heading — confirm against utils.
utils.h1("Data Structures")

In most real-world scenarios, we interact with not just one data point but many, so we need some sort of optimised structure to hold multiple data points together. That is what we mean by a **data structure**. \
A **data structure** defines a particular way of **storing**, **organizing**, **manipulating** and **accessing** a collection of data efficiently. Examples include a list of friends or a dictionary of key-value pairs.

<table border="1" cellpadding="6" cellspacing="0">
  <thead>
    <tr>
      <th>Data Structure</th>
      <th>Type</th>
      <th>Mutable?</th>
      <th>Ordered?</th>
      <th>Allows Duplicates?</th>
      <th>Example</th>
    </tr>
  </thead>
  <tbody>
    <tr>
      <td>list</td>
      <td>Built-in</td>
      <td>Yes</td>
      <td>Yes</td>
      <td>Yes</td>
      <td>[1, 2, 3, 2]</td>
    </tr>
    <tr>
      <td>tuple</td>
      <td>Built-in</td>
      <td>No</td>
      <td>Yes</td>
      <td>Yes</td>
      <td>(1, 2, 3)</td>
    </tr>
    <tr>
      <td>set</td>
      <td>Built-in</td>
      <td>Yes</td>
      <td>No</td>
      <td>No</td>
      <td>{1, 2, 3}</td>
    </tr>
    <tr>
      <td>frozenset</td>
      <td>Built-in</td>
      <td>No</td>
      <td>No</td>
      <td>No</td>
      <td>frozenset({1, 2})</td>
    </tr>
    <tr>
      <td>dict</td>
      <td>Built-in</td>
      <td>Yes</td>
      <td>Yes</td>
      <td>Keys: No<br>Values: Yes</td>
      <td>{"a": 1, "b": 2}</td>
    </tr>
    <tr>
      <td>deque</td>
      <td>From <code>collections</code></td>
      <td>Yes</td>
      <td>Yes</td>
      <td>Yes</td>
      <td>deque([1, 2, 3])</td>
    </tr>
    <tr>
      <td>defaultdict</td>
      <td>From <code>collections</code></td>
      <td>Yes</td>
      <td>Yes</td>
      <td>Keys: No<br>Values: Yes</td>
      <td>defaultdict(int)</td>
    </tr>
    <tr>
      <td>OrderedDict</td>
      <td>From <code>collections</code></td>
      <td>Yes</td>
      <td>Yes</td>
      <td>Keys: No<br>Values: Yes</td>
      <td>OrderedDict()</td>
    </tr>
    <tr>
      <td>namedtuple</td>
      <td>From <code>collections</code></td>
      <td>No</td>
      <td>Yes</td>
      <td>Yes</td>
      <td>Point(x=1, y=2)</td>
    </tr>
  </tbody>
</table>


In [4]:
#hide
# NOTE(review): h1() presumably renders a top-level section heading — confirm against utils.
utils.h1("List Data Structure")

In [5]:
import random
# randint(0, 100) is inclusive at both ends. No seed is set here, so the values change on every run.
a = [random.randint(0, 100) for _  in range(20)] # Generate a collection of 20 random integers and store them in a list data structure

How is a `list` in Python different from an `array` in C?
1. A Python `list` is **dynamic** in nature (meaning its size is not fixed).
2. A Python `list` can store **multiple datatypes** together because it is a **referential array**: it stores references to objects rather than the objects themselves.

In [6]:
#hide
# NOTE(review): h2() presumably renders a second-level heading — confirm against utils.
utils.h2("Methods available for list")

In [7]:
# print => display every element of the list
print(a)

[9, 93, 47, 12, 17, 11, 53, 44, 17, 36, 76, 67, 42, 59, 48, 70, 32, 59, 44, 40]


In [8]:
# append => add a single element to the end of the list (modifies the list in place)
a.append(10)
print(a)

[9, 93, 47, 12, 17, 11, 53, 44, 17, 36, 76, 67, 42, 59, 48, 70, 32, 59, 44, 40, 10]


In [9]:
# pop => remove and return the last element (the return value is discarded here)
a.pop()
print(a)

[9, 93, 47, 12, 17, 11, 53, 44, 17, 36, 76, 67, 42, 59, 48, 70, 32, 59, 44, 40]


In [10]:
# pop(i) => remove and return the element at index i (here index 2)
a.pop(2)
print(a)

[9, 93, 12, 17, 11, 53, 44, 17, 36, 76, 67, 42, 59, 48, 70, 32, 59, 44, 40]


In [16]:
# remove => remove the first occurrence of a value (by value, not by index)
a.remove(12)
print(a)

[9, 93, 17, 11, 53, 44, 17, 36, 76, 67, 42, 59, 48, 70, 32, 59, 44, 40]


In [17]:
# remove => removing a value that is not in the list raises ValueError.
# The error is caught and printed so the demonstration is still visible
# without stopping a "Restart & Run All" of the notebook.
try:
    a.remove(50)
except ValueError as exc:
    print(f"ValueError: {exc}")
else:
    # Only reached if 50 happened to be in the list and was removed.
    print(a)

ValueError: list.remove(x): x not in list

In [18]:
# len => total number of elements in the list
len(a)

18

In [19]:
# count => number of occurrences of a value (0 when the value is absent)
a.count(16)

0

In [23]:
# index => position of the first occurrence of a value (17 appears twice; the lower index is returned)
a.index(17)

2

In [24]:
# reverse => reverse the list in place (no new list is created)
a.reverse()
print(a)

[40, 44, 59, 32, 70, 48, 59, 42, 67, 76, 36, 17, 44, 53, 11, 17, 93, 9]


In [25]:
# insert => insert(index, value): put 10 at index 2, shifting later elements to the right
a.insert(2, 10)
print(a)

[40, 44, 10, 59, 32, 70, 48, 59, 42, 67, 76, 36, 17, 44, 53, 11, 17, 93, 9]


In [26]:
# append => the argument is added as ONE element, so the list [1, 3, 4] ends up nested inside a
a.append([1, 3, 4])
print(a)

[40, 44, 10, 59, 32, 70, 48, 59, 42, 67, 76, 36, 17, 44, 53, 11, 17, 93, 9, [1, 3, 4]]


In [27]:
# extend => add each element of the iterable individually (compare with append above, which nests the list)
a.extend([1, 3, 4])
print(a)

[40, 44, 10, 59, 32, 70, 48, 59, 42, 67, 76, 36, 17, 44, 53, 11, 17, 93, 9, [1, 3, 4], 1, 3, 4]


In [28]:
# clear => remove all elements, leaving an empty list
a.clear()
print(a)

[]


In [29]:
# a was cleared above, so build a fresh list of 20 random integers for the slicing examples
import random
a = [random.randint(0, 100) for _  in range(20)] # Generate a collection of random integers and store them in a list data structure

In [30]:
# slicing => a[start:stop:step]; start is inclusive, stop is exclusive, step defaults to 1
print(a)
print(a[2:6]) # indices 2, 3, 4, 5
print(a[0:7]) # first seven elements
print(a[:7]) # omitted start defaults to the beginning
print(a[0:-4]) # negative stop counts from the end: everything except the last four
print(a[:-4]) # same as above with start omitted
print(a[:]) # both bounds omitted => a copy of the whole list
print(a[0:-1]) # everything except the last element
print(a[5:2]) # start is after stop with a positive step => empty list
print(a[2:8:2]) # indices 2, 4, 6
print(a[2:10:5]) # indices 2, 7
print(a[2:10:-1]) # negative step but start is before stop => empty list
print(a[10:2:-1]) # walk backwards from index 10 down to index 3
print(a[10:2:-2]) # indices 10, 8, 6, 4
print(a[19:0:-1]) # reversed from the last index; stop=0 is exclusive, so a[0] is left out
print(a[-1:0:-1]) # same as above: -1 => len(a) - 1
print(a[::-1]) # special case: both bounds omitted with step -1 => the whole list reversed

[45, 87, 84, 71, 34, 46, 19, 90, 73, 60, 23, 84, 57, 49, 22, 51, 35, 6, 30, 39]
[84, 71, 34, 46]
[45, 87, 84, 71, 34, 46, 19]
[45, 87, 84, 71, 34, 46, 19]
[45, 87, 84, 71, 34, 46, 19, 90, 73, 60, 23, 84, 57, 49, 22, 51]
[45, 87, 84, 71, 34, 46, 19, 90, 73, 60, 23, 84, 57, 49, 22, 51]
[45, 87, 84, 71, 34, 46, 19, 90, 73, 60, 23, 84, 57, 49, 22, 51, 35, 6, 30, 39]
[45, 87, 84, 71, 34, 46, 19, 90, 73, 60, 23, 84, 57, 49, 22, 51, 35, 6, 30]
[]
[84, 34, 19]
[84, 90]
[]
[23, 60, 73, 90, 19, 46, 34, 71]
[23, 73, 19, 34]
[39, 30, 6, 35, 51, 22, 49, 57, 84, 23, 60, 73, 90, 19, 46, 34, 71, 84, 87]
[39, 30, 6, 35, 51, 22, 49, 57, 84, 23, 60, 73, 90, 19, 46, 34, 71, 84, 87]
[39, 30, 6, 35, 51, 22, 49, 57, 84, 23, 60, 73, 90, 19, 46, 34, 71, 84, 87, 45]


In [31]:
#hide
# NOTE(review): h1() presumably renders a top-level section heading — confirm against utils.
utils.h1("dict")

In [80]:
# dict => a mapping of keys to values, written as {key: value, ...}
info = {
    "name": "Ankit",
    "location": "Mumbai"
}

In [47]:
# get => look up a key without raising KeyError; a missing key returns None, so the cell shows no output
info.get("fullname")

In [74]:
# keys() / values() / items() return view objects (dict_keys, dict_values, dict_items); wrap in list() for a plain list
info.keys(), info.values(), info.items(), list(info.keys())

(dict_keys(['name', 'location']),
 dict_values(['Ankit', 'Mumbai']),
 dict_items([('name', 'Ankit'), ('location', 'Mumbai')]),
 ['name', 'location'])

In [81]:
# pop => remove the key "name" from the dict and return its value
info.pop("name")

'Ankit'

In [88]:
# A dict is mutable: adding a key changes the object in place, so id(info) is the same before and after
print(id(info))
info["hometown"] = "Purnea"
print(id(info))

4559093056
4559093056


In [89]:
# Current contents: "name" was popped earlier and "hometown" was added
info

{'location': 'Mumbai', 'hometown': 'Purnea'}

In [90]:
#hide
# NOTE(review): h1() presumably renders a top-level section heading — confirm against utils.
utils.h1("Tuple")

In [111]:
# A tuple can hold mixed types, including a dict and another tuple
a = (1, "Ankit", 1.0, {"name": "Ankit"}, (4, 2, 3))
# count compares with ==, and 1 == 1.0 is True, so both the int 1 and the float 1.0 are counted
a.count(1)

2

In [114]:
# index => position of the first occurrence of the value in the tuple
a.index("Ankit")

1

In [118]:
# == compares values: the int 1 and the float 1.0 are equal, which is why a.count(1) returned 2
1 == 1.0

True

In [122]:
# `is` compares identity (same object), not value.
# CPython caches small integers (-5 to 256), so both names refer to the same object here.
# This is an implementation detail; do not rely on `is` to compare numbers.
a = 60
b = 60
a is b

True

In [123]:
# Identical ids confirm that a and b refer to the very same int object
id(a), id(b)

(4528260000, 4528260000)