-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy path692 Top K Frequent Words.py
67 lines (54 loc) · 1.9 KB
/
692 Top K Frequent Words.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
#!/usr/bin/python3
"""
Given a non-empty list of words, return the k most frequent elements.
Your answer should be sorted by frequency from highest to lowest. If two words
have the same frequency, then the word with the lower alphabetical order comes
first.
Example 1:
Input: ["i", "love", "leetcode", "i", "love", "coding"], k = 2
Output: ["i", "love"]
Explanation: "i" and "love" are the two most frequent words.
Note that "i" comes before "love" due to a lower alphabetical order.
Example 2:
Input: ["the", "day", "is", "sunny", "the", "the", "the", "sunny", "is", "is"], k = 4
Output: ["the", "is", "sunny", "day"]
Explanation: "the", "is", "sunny" and "day" are the four most frequent words,
with the number of occurrence being 4, 3, 2 and 1 respectively.
Note:
You may assume k is always valid, 1 ≤ k ≤ number of unique elements.
Input words contain only lowercase letters.
Follow up:
Try to solve it in O(n log k) time and O(n) extra space.
"""
import heapq
from collections import defaultdict
from typing import List
class Word:
def __init__(self, content, count):
self.content = content
self.count = count
def __lt__(self, other):
if self.count == other.count:
return self.content > other.content
return self.count < other.count
class Solution:
def topKFrequent(self, words: List[str], k: int) -> List[str]:
"""
quick select log n
heap log k
"""
h = []
counter = defaultdict(int)
for w in words:
counter[w] += 1
for w, c in counter.items():
heapq.heappush(h, Word(w, c))
if len(h) > k:
heapq.heappop(h)
ret = []
while h:
w = heapq.heappop(h).content
ret.append(w)
return ret[::-1]
if __name__ == "__main__":
assert Solution().topKFrequent(["i", "love", "leetcode", "i", "love", "coding"], 2)