# 第一章:   数据结构以及算法

## 1.1. Unpacking a Sequence into Separate Variables

Problem:
- You have an N-element tuple or sequence that you would like to unpack into a collection of N variables.

In [1]:
p = (4, 5)

In [2]:
x, y = p


In [3]:
x

4

In [4]:
y

5

In [5]:
data = ['ACME', 50, 91.1, (2012, 12, 21)]

In [6]:
name, shares, price, date = data

In [7]:
name

'ACME'

In [8]:
date

(2012, 12, 21)

In [9]:
name, shares, price, (year, month, day) = data


In [10]:
name

'ACME'

In [11]:
year

2012

In [12]:
month

12

In [13]:
day

21

In [14]:
s = "Hello"

In [15]:
a, b, c, d, e = s


In [16]:
a

'H'

In [17]:
b

'e'

- To discard certain values, unpack them into a throwaway variable name such as `_`.

In [18]:
data = ['ACME', 50, 91.1, (2012, 12, 21)]

In [19]:
_, shares, price, _ = data

In [20]:
shares

50

## 1.2. Unpacking Elements from Iterables of Arbitrary Length
 

Problem

- You need to unpack N elements from an iterable, but the iterable may be longer than N
elements, causing a “too many values to unpack” exception.

In [21]:
def drop_first_last(grades):
    """Return the average of *grades* with the first and last entries dropped.

    Args:
        grades: An iterable of numbers with at least three elements.

    Returns:
        The arithmetic mean of every element except the first and the last.

    Raises:
        ValueError: If *grades* has fewer than three elements, so that
            nothing is left to average once the two ends are removed.
    """
    # Imported locally: the mean is computed with the standard library
    # rather than an undefined ``avg`` helper, and without relying on the
    # name ``sum``, which a later cell in this file rebinds.
    from statistics import mean

    # The star expression soaks up everything between the two ends.
    _, *middle, _ = grades
    if not middle:
        raise ValueError("need at least three grades to drop the first and last")
    return mean(middle)

In [22]:
sale_record =  [10, 8, 7, 1, 9, 5, 10, 3]

In [23]:
*trailing_qtrs, current_qtr = sale_record

In [24]:
trailing_avg = sum(trailing_qtrs) / len(trailing_qtrs)

In [25]:
trailing_avg

7.142857142857143

In [26]:
trailing_qtrs

[10, 8, 7, 1, 9, 5, 10]

In [27]:
current_qtr

3

#### Discussion

In [28]:
records = [('foo', 1, 2),('bar', 'hello'), ('foo', 3, 4)]

In [29]:
def do_foo(x, y):
    """Print a fixed label followed by the two values *x* and *y*.

    NOTE(review): the label is 'for', not 'foo' -- possibly a typo. It is
    left as-is because the recorded output of the cell that calls this
    function shows the same text.
    """
    label = 'for'
    print(label, x, y)

In [30]:
def do_bar(s):
    """Print the label 'bar' followed by the single value *s*."""
    label = 'bar'
    print(label, s)

In [31]:
# Each record is a tag followed by a variable number of fields: the tag
# selects the handler and the remaining fields become its arguments.
for tag, *args in records:
    if tag == 'bar':
        do_bar(*args)
    elif tag == "foo":
        do_foo(*args)

for 1 2
bar hello
for 3 4


### `*` unpacking can also be useful when combined with certain kinds of string-processing operations

In [32]:
line = 'nobody:*:-2:-2:Unprivileded User:/var/empy:/user/bin/fals'

In [33]:
uname, *field, homedir, sh = line.split(':')

In [34]:
uname

'nobody'

In [35]:
field

['*', '-2', '-2', 'Unprivileded User']

In [36]:
homedir

'/var/empy'

In [37]:
sh

'/user/bin/fals'

In [38]:
record = ('ACME', 50, 123.45, (12, 18, 2012))

In [39]:
name, *_, (*_, year) = record

In [40]:
name

'ACME'

In [41]:
year

2012

In [42]:
items = [1, 10, 7, 4, 5, 9]

In [43]:
head, *tail = items

In [44]:
head

1

In [45]:
tail

[10, 7, 4, 5, 9]

In [46]:
def sum(items):
    """Add up the elements of *items*, left to right.

    NOTE: this deliberately keeps the name ``sum`` (shadowing the built-in)
    because later cells in this file call it under that name.

    Args:
        items: Any iterable whose elements support ``+`` with each other.

    Returns:
        The first element plus every following element in order, or ``0``
        when *items* is empty (matching the built-in ``sum``).
    """
    remaining = iter(items)
    try:
        # Seed the total with the first element instead of 0 so that
        # non-numeric addable values (e.g. strings) keep working.
        total = next(remaining)
    except StopIteration:
        # Empty input: return the additive identity instead of failing
        # on an impossible unpacking.
        return 0
    # A plain loop replaces the head/tail recursion: no recursion-depth
    # limit and no copy of the tail at every step.
    for value in remaining:
        total = total + value
    return total

In [47]:
sum(tail)

35

## 1.3. Keeping the Last N Items

#### Problem
You want to keep a limited history of the last few items seen during iteration or
during some other kind of processing.

In [48]:
from collections import deque

In [49]:
def searh(lines, pattern, hostroy=5):
    """Yield each line containing *pattern* together with its recent context.

    Args:
        lines: Iterable of lines to scan.
        pattern: Value tested with ``pattern in line`` against every line.
        hostroy: Maximum number of preceding lines kept as context.

    Yields:
        ``(line, context)`` pairs, where *context* is the deque of lines
        seen before the matching line. The same deque object is yielded
        every time and keeps being updated as the scan continues, so copy
        it if it must outlive the current iteration step.
    """
    # A bounded deque silently drops its oldest entry once it is full.
    recent = deque(maxlen=hostroy)
    for current in lines:
        matched = pattern in current
        if matched:
            yield current, recent
        # Recorded only after the check, so a matching line never appears
        # in its own context.
        recent.append(current)

In [50]:
# Scan the file for lines containing 'python'; for every match print the
# (at most five) lines that preceded it, the match itself, and a rule.
with open('sometxt.txt') as f:
    for line, prevlines in searh(f, 'python', 5):
        # Lines read from a file still carry their newline, so nothing
        # extra is inserted between or after them.
        print(*prevlines, sep='', end='')
        print(line, end='')
        print("-" * 30)

mined by context.
This icon signifies a tip, suggestion, or general note.
Online Code Examples
Almost all of the code examples in this book are available online at http://github.com/
dabeaz/python-cookbook. The authors welcome bug fixes, improvements, and com‐
------------------------------
Sebastopol, CA 95472
800-998-9938 (in the United States or Canada)
707-829-0515 (international or local)
707-829-0104 (fax)
We have a web page for this book, where we list errata, examples, and any additional
information. You can access this page at http://oreil.ly/python_cookbook_3e.
------------------------------
 yield line, previous_lines
 previous_lines.append(line)
# Example use on a file
if __name__ == '__main__':
 with open('somefile.txt') as f:
 for line, prevlines in search(f, 'python', 5):
------------------------------
Here are a few other examples:
# Determine if any .py files exist in a directory
import os
files = os.listdir('dirname')
if any(name.endswith('.py') for name in files):
 p

### Discussion

In [51]:
q = deque(maxlen=3)

In [52]:
q.append(1)

In [53]:
q.append(2)

In [54]:
q.append(3)

In [55]:
q

deque([1, 2, 3])

In [56]:
q.append(4)

In [57]:
q

deque([2, 3, 4])

In [58]:
q.append(5)

In [59]:
q

deque([3, 4, 5])

### 1.4. Finding the Largest or Smallest N Items

In [60]:
nums = [1, 8, 2 ,11, -21, 20, 50, -1]

In [61]:
import heapq

In [62]:
heapq.nlargest(3, nums)

[50, 20, 11]

In [63]:
heapq.nsmallest(3, nums)

[-21, -1, 1]

In [64]:
portfolio = [
 {'name': 'IBM', 'shares': 100, 'price': 91.1},
 {'name': 'AAPL', 'shares': 50, 'price': 543.22},
 {'name': 'FB', 'shares': 200, 'price': 21.09},
 {'name': 'HPQ', 'shares': 35, 'price': 31.75},
 {'name': 'YHOO', 'shares': 45, 'price': 16.35},
 {'name': 'ACME', 'shares': 75, 'price': 115.65}
]

In [65]:
cheap = heapq.nsmallest(3, portfolio, key=lambda s: s['price'])

In [66]:
cheap

[{'name': 'YHOO', 'shares': 45, 'price': 16.35},
 {'name': 'FB', 'shares': 200, 'price': 21.09},
 {'name': 'HPQ', 'shares': 35, 'price': 31.75}]

In [67]:
expensive = heapq.nsmallest(3, portfolio, key=lambda s: s['price'])

In [68]:
expensive


[{'name': 'YHOO', 'shares': 45, 'price': 16.35},
 {'name': 'FB', 'shares': 200, 'price': 21.09},
 {'name': 'HPQ', 'shares': 35, 'price': 31.75}]

In [69]:
heapq.heapify(nums)

In [70]:
nums

[-21, -1, 2, 1, 8, 20, 50, 11]

In [71]:
heapq.heappop(nums)

-21

In [72]:
nums

[-1, 1, 2, 11, 8, 20, 50]

### 1.5.  Implementing a Priority Queue

#### Problem
You want to implement a queue that sorts items by a given priority and always returns
the item with the highest priority on each pop operation.


In [73]:
import heapq

In [74]:
class PriorityQueue:
    """Queue whose ``pop`` returns the item pushed with the largest priority.

    Items pushed with equal priority are returned in the order they were
    pushed.
    """

    def __init__(self):
        self._index = 0   # running push counter, used as a tie-breaker
        self._queue = []  # heap of (-priority, index, item) entries

    def push(self, item, priority):
        """Add *item* to the queue with the given *priority*."""
        # heapq keeps the smallest entry first, so the priority is negated
        # to surface the largest one. The counter orders entries of equal
        # priority by insertion and, being unique, stops the tuple
        # comparison before it ever reaches the items themselves.
        entry = (-priority, self._index, item)
        heapq.heappush(self._queue, entry)
        self._index += 1

    def pop(self):
        """Remove and return the item with the highest priority."""
        _, _, item = heapq.heappop(self._queue)
        return item

In [75]:
class Item:
    """Minimal object carrying only a ``name`` attribute."""

    def __init__(self, name):
        self.name = name

    def __repr__(self):
        # !r embeds repr(name), so string names are shown quoted.
        return f'Item({self.name!r})'

In [76]:
q = PriorityQueue()

In [77]:
q.push(Item('foo'), 1)

In [78]:
q.push(Item('bar'), 5)

In [79]:
q.push(Item('spam'), 4)

In [80]:
q.push(Item('grok'), 1)

In [81]:
q.pop()

Item('bar')

In [82]:
q.pop()

Item('spam')

In [83]:
q.pop()

Item('foo')

In [84]:
q.pop()

Item('grok')

In [85]:
from collections import OrderedDict

In [86]:
d = OrderedDict()
d['foo'] = 1
d['bar'] = 2
d['spam'] = 3
d['grok'] = 4

In [87]:
d

OrderedDict([('foo', 1), ('bar', 2), ('spam', 3), ('grok', 4)])

In [88]:
for key in d:
    print(key, d[key])

foo 1
bar 2
spam 3
grok 4


In [89]:
import json
json.dumps(d)

'{"foo": 1, "bar": 2, "spam": 3, "grok": 4}'

In [90]:
prices = {
 'ACME': 45.23,
 'AAPL': 612.78,
 'IBM': 205.55,
 'HPQ': 37.20,
 'FB': 10.75
}

In [91]:
min_price = min(zip(prices.values(), prices.keys()))

In [92]:
min_price

(10.75, 'FB')

In [93]:
prices_sorted = sorted(zip(prices.values(), prices.keys()))

In [94]:
prices_sorted

[(10.75, 'FB'),
 (37.2, 'HPQ'),
 (45.23, 'ACME'),
 (205.55, 'IBM'),
 (612.78, 'AAPL')]

In [95]:
prices_and_names = zip(prices.values(), prices.keys())
print(min(prices_and_names))
# zip() returns an iterator that can be consumed only once: min() above has
# already exhausted it, so a following max(prices_and_names) would raise
# ValueError because nothing is left to compare.

(10.75, 'FB')


In [96]:
min(prices, key=lambda k: prices[k]) # Returns 'FB'
max(prices, key=lambda k: prices[k]) # Returns 'AAPL'

'AAPL'

In [97]:
a = {
 'x' : 1,
 'y' : 2,
 'z' : 3
}

In [98]:
b = {
 'w' : 10,
 'x' : 11,
 'y' : 2
}

In [99]:
a.keys() & b.keys()

{'x', 'y'}

In [100]:
a.keys() - b.keys()

{'z'}

In [101]:
a.items() & b.items()

{('y', 2)}

In [102]:
c = {key:a[key] for key in a.keys() - {'z', 'w'}}

In [103]:
c

{'x': 1, 'y': 2}

In [104]:
def dedupe(items):
    """Yield the elements of *items* in order, skipping repeated values.

    Elements must be hashable, since already-yielded values are tracked in
    a set.
    """
    seen = set()
    for item in items:
        if item in seen:
            continue
        yield item
        seen.add(item)

In [105]:
 a = [1, 5, 2, 1, 9, 1, 5, 10]

In [106]:
list(dedupe(a))

[1, 5, 2, 9, 10]

In [107]:
def dedupe(items, key=None):
    """Yield the elements of *items* in order, skipping duplicates.

    Args:
        items: Iterable to filter.
        key: Optional one-argument function mapping an element to the
            hashable value used to decide whether it has been seen. When
            omitted, the element itself is used and must be hashable.

    Yields:
        The first element encountered for each distinct key value.
    """
    seen = set()
    for item in items:
        if key is None:
            marker = item
        else:
            marker = key(item)
        if marker in seen:
            continue
        yield item
        seen.add(marker)

In [151]:
a = [ {'x':1, 'y':2}, {'x':1, 'y':3}, {'x':1, 'y':2}, {'x':2, 'y':4}]

In [152]:
list(dedupe(a, key=lambda d: (d['x'],d['y'])))

[{'x': 1, 'y': 2}, {'x': 1, 'y': 3}, {'x': 2, 'y': 4}]

In [153]:
record = '01234567890123456789012345678901234567890123456789012345678900123456789012345678901234567890123456789012345678901234567890'

In [154]:
cost = int(record[20:32]) * float(record[40:48])

In [155]:
cost

1.5241567763770868e+16

In [156]:
SHARES = slice(20, 32)

In [157]:
PRICE = slice(40,48)

In [158]:
cost = int(record[SHARES]) * float(record[PRICE])

In [159]:
cost

1.5241567763770868e+16

In [160]:
 a = slice(10, 50, 2)

In [161]:
a.start

10

In [162]:
a.step

2

In [163]:
a.stop

50

In [164]:
 s = 'Hello World'

In [165]:
 a.indices(len(s))

(10, 11, 2)

In [166]:
 for i in range(*a.indices(len(s))):
        print(s[i])

d


In [169]:
 s = 'Hello World'
 a.indices(len(s))

(10, 11, 2)

In [170]:
words = [
 'look', 'into', 'my', 'eyes', 'look', 'into', 'my', 'eyes',
 'the', 'eyes', 'the', 'eyes', 'the', 'eyes', 'not', 'around', 'the',
 'eyes', "don't", 'look', 'around', 'the', 'eyes', 'look', 'into',
 'my', 'eyes', "you're", 'under'
]

In [171]:
from collections import Counter

In [172]:
word_counts = Counter(words)

In [173]:
word_counts

Counter({'look': 4,
         'into': 3,
         'my': 3,
         'eyes': 8,
         'the': 5,
         'not': 1,
         'around': 2,
         "don't": 1,
         "you're": 1,
         'under': 1})

In [174]:
top_three = word_counts.most_common(3)

In [175]:
top_three

[('eyes', 8), ('the', 5), ('look', 4)]

In [177]:
word_counts['look']

4

In [178]:
 morewords = ['why','are','you','not','looking','in','my','eyes']

In [179]:
word_counts.update(morewords)

In [180]:
word_counts

Counter({'look': 4,
         'into': 3,
         'my': 4,
         'eyes': 9,
         'the': 5,
         'not': 2,
         'around': 2,
         "don't": 1,
         "you're": 1,
         'under': 1,
         'why': 1,
         'are': 1,
         'you': 1,
         'looking': 1,
         'in': 1})

In [181]:
a = Counter(words)

In [182]:
b = Counter(morewords)

In [183]:
a + b

Counter({'look': 4,
         'into': 3,
         'my': 4,
         'eyes': 9,
         'the': 5,
         'not': 2,
         'around': 2,
         "don't": 1,
         "you're": 1,
         'under': 1,
         'why': 1,
         'are': 1,
         'you': 1,
         'looking': 1,
         'in': 1})

In [184]:
a - b

Counter({'look': 4,
         'into': 3,
         'my': 2,
         'eyes': 7,
         'the': 5,
         'around': 2,
         "don't": 1,
         "you're": 1,
         'under': 1})