## Part 1: Probabilistic context-free grammars

In [516]:
#importing libraries
import steven_tree
from collections import defaultdict

In [529]:
#example tree provided
t = steven_tree.Tree.from_string('''(S
    (NP
        (DT the)
        (NN teacher)
    )
    (S|
        (VP
            (MD will)
            (VP
                (VB lecture)
                (VP|
                    (NP
                        (NN today)
                    )
                    (PP
                        (IN in)
                        (NP
                            (DT the)
                            (NP|
                                (NN lecture)
                                (NN hall)
                            )
                        )
                    )
                )
            )
        )
        (. .)
    )
)''')

In [518]:
for x in t.collapse_unary().chomsky_normal_form().terminals():
    print(x)

the
teacher
will
lecture
today
in
the
lecture
hall
.


In [519]:
for (mother, daughters) in t.productions():
    print mother
    print daughters

S
('NP', 'S|')
NP
('DT', 'NN')
DT
('the',)
NN
('teacher',)
S|
('VP', '.')
VP
('MD', 'VP')
MD
('will',)
VP
('VB', 'VP|')
VB
('lecture',)
VP|
('NP', 'PP')
NP
('NN',)
NN
('today',)
PP
('IN', 'NP')
IN
('in',)
NP
('DT', 'NP|')
DT
('the',)
NP|
('NN', 'NN')
NN
('lecture',)
NN
('hall',)
.
('.',)


In [13]:
#additional functions for creating the grammar
def prob_productions(dict_productions):
    new_dict = defaultdict(lambda: defaultdict(float))
    for key in dict_productions:
        denom = sum(dict_productions[key].values())
        for value in dict_productions[key]:
            new_dict[key][value] = dict_productions[key][value]/denom
    return new_dict

def combine_dict_productions(dict_productions1, dict_productions2):
    new_dictionary = defaultdict(lambda: defaultdict(float))
    for key in dict_productions1:
        for value in dict_productions1[key]:
            new_dictionary[key][value] += dict_productions1[key][value]
    for key in dict_productions2:
        for value in dict_productions2[key]:
            new_dictionary[key][value] += dict_productions2[key][value]
    return new_dictionary

def make_pretty_dict(grammar_dictionary):
    new_dictionary = defaultdict(lambda: defaultdict(float))
    for key in grammar_dictionary:
        new_item = ""
        for value in grammar_dictionary[key]:
            print(value)
            new_item = ""
            for item in value:
                #print(item)
                #new_item = ""
                new_item+=item
                new_item+= " "
            print(new_item)
            new_dictionary[key][new_item[:-1]] = grammar_dictionary[key][value]
    return new_dictionary


In [14]:
t.collapse_unary().chomsky_normal_form().dict_productions()

defaultdict(<function steven_tree.<lambda>>,
            {'.': defaultdict(float, {('.',): 1.0}),
             'DT': defaultdict(float, {('the',): 2.0}),
             'IN': defaultdict(float, {('in',): 1.0}),
             'MD': defaultdict(float, {('will',): 1.0}),
             'NN': defaultdict(float,
                         {('hall',): 1.0,
                          ('lecture',): 1.0,
                          ('teacher',): 1.0,
                          ('today',): 1.0}),
             'NP': defaultdict(float,
                         {('DT', 'NN'): 1.0,
                          ('DT', 'NP|'): 1.0,
                          ('NN',): 1.0}),
             'NP|': defaultdict(float, {('NN', 'NN'): 1.0}),
             'PP': defaultdict(float, {('IN', 'NP'): 1.0}),
             'S': defaultdict(float, {('NP', 'S|'): 1.0}),
             'S|': defaultdict(float, {('VP', '.'): 1.0}),
             'VB': defaultdict(float, {('lecture',): 1.0}),
             'VP': defaultdict(float, {('MD', 'VP

In [534]:
x = prob_productions(t.dict_productions())
x2 = make_pretty_dict(x)
for key in x2:
    for value in x2[key]:
        print(key + " -> " + str(value) + " " + str(x2[key][value]))

('will',)
will 
('lecture',)
lecture 
('teacher',)
teacher 
('today',)
today 
('lecture',)
lecture 
('hall',)
hall 
('VP', '.')
VP . 
('NP', 'PP')
NP PP 
('IN', 'NP')
IN NP 
('.',)
. 
('MD', 'VP')
MD VP 
('VB', 'VP|')
VB VP| 
('NN', 'NN')
NN NN 
('NP', 'S|')
NP S| 
('in',)
in 
('DT', 'NN')
DT NN 
('NN',)
NN 
('DT', 'NP|')
DT NP| 
('the',)
the 
MD -> will 1.0
VB -> lecture 1.0
NN -> lecture 0.25
NN -> teacher 0.25
NN -> today 0.25
NN -> hall 0.25
S| -> VP . 1.0
VP| -> NP PP 1.0
PP -> IN NP 1.0
. -> . 1.0
VP -> MD VP 0.5
VP -> VB VP| 0.5
NP| -> NN NN 1.0
S -> NP S| 1.0
IN -> in 1.0
NP -> DT NN 0.333333333333
NP -> DT NP| 0.333333333333
NP -> NN 0.333333333333
DT -> the 1.0


In [20]:
trees = []
f = open("wsj-normalized.psd", "r")
x = steven_tree.Tree.from_stream(f)
for item in x:
    trees.append(item)
f.close()

<open file 'wsj-normalized.psd', mode 'r' at 0x10b43fed0>


In [21]:
trees[0]

(TOP
    (NP-SBJ
        (NP
            (NNP <NNP>)
            (NNP <NNP>)
        )
        (, ,)
        (ADJP
            (NP
                (CD <CD>)
                (NNS years)
            )
            (JJ old)
        )
        (, ,)
    )
    (VP
        (MD will)
        (VP
            (VB join)
            (NP
                (DT the)
                (NN board)
            )
            (PP-CLR
                (IN as)
                (NP
                    (DT a)
                    (JJ nonexecutive)
                    (NN director)
                )
            )
            (NP-TMP
                (NNP <NNP>)
                (CD <CD>)
            )
        )
    )
    (. .)
)

In [22]:
trees[0].collapse_unary().chomsky_normal_form()

(TOP
    (NP-SBJ
        (NP
            (NNP <NNP>)
            (NNP <NNP>)
        )
        (NP-SBJ|<,&ADJP>
            (, ,)
            (NP-SBJ|<ADJP&,>
                (ADJP
                    (NP
                        (CD <CD>)
                        (NNS years)
                    )
                    (JJ old)
                )
                (, ,)
            )
        )
    )
    (TOP|<VP&.>
        (VP
            (MD will)
            (VP
                (VB join)
                (VP|<NP&PP-CLR>
                    (NP
                        (DT the)
                        (NN board)
                    )
                    (VP|<PP-CLR&NP-TMP>
                        (PP-CLR
                            (IN as)
                            (NP
                                (DT a)
                                (NP|<JJ&NN>
                                    (JJ nonexecutive)
                                    (NN director)
                                )
     

In [23]:
len(trees)

14898

In [24]:
chomsky_normed_trees = []
i = 0
for my_tree in trees:
    #print(my_tree)
    if i %100 == 0:
        print(i)
    i+=1
    new_tree = my_tree.collapse_unary().chomsky_normal_form()
    chomsky_normed_trees.append(new_tree)
    #print(new_tree)

0
100
200
300
400
500
600
700
800
900
1000
1100
1200
1300
1400
1500
1600
1700
1800
1900
2000
2100
2200
2300
2400
2500
2600
2700
2800
2900
3000
3100
3200
3300
3400
3500
3600
3700
3800
3900
4000
4100
4200
4300
4400
4500
4600
4700
4800
4900
5000
5100
5200
5300
5400
5500
5600
5700
5800
5900
6000
6100
6200
6300
6400
6500
6600
6700
6800
6900
7000
7100
7200
7300
7400
7500
7600
7700
7800
7900
8000
8100
8200
8300
8400
8500
8600
8700
8800
8900
9000
9100
9200
9300
9400
9500
9600
9700
9800
9900
10000
10100
10200
10300
10400
10500
10600
10700
10800
10900
11000
11100
11200
11300
11400
11500
11600
11700
11800
11900
12000
12100
12200
12300
12400
12500
12600
12700
12800
12900
13000
13100
13200
13300
13400
13500
13600
13700
13800
13900
14000
14100
14200
14300
14400
14500
14600
14700
14800


In [25]:
test = chomsky_normed_trees[0]
prev_dict = test.dict_productions()
print(prev_dict)
i = 1
for my_tree in chomsky_normed_trees[1:]:
    #print(my_tree.collapse_unary().chomsky_normal_form())
    if i%100 == 0:
        print(i)
    #print(next_tree)
    next_tree_dict = my_tree.dict_productions()
    prev_dict = combine_dict_productions(prev_dict, next_tree_dict)
    i+=1

defaultdict(<function <lambda> at 0x10beb7de8>, {'VP|<PP-CLR&NP-TMP>': defaultdict(<type 'float'>, {('PP-CLR', 'NP-TMP'): 1.0}), 'TOP|<VP&.>': defaultdict(<type 'float'>, {('VP', '.'): 1.0}), 'NP-SBJ|<ADJP&,>': defaultdict(<type 'float'>, {('ADJP', ','): 1.0}), 'ADJP': defaultdict(<type 'float'>, {('NP', 'JJ'): 1.0}), 'TOP': defaultdict(<type 'float'>, {('NP-SBJ', 'TOP|<VP&.>'): 1.0}), 'NP-TMP': defaultdict(<type 'float'>, {('NNP', 'CD'): 1.0}), 'JJ': defaultdict(<type 'float'>, {('nonexecutive',): 1.0, ('old',): 1.0}), 'DT': defaultdict(<type 'float'>, {('the',): 1.0, ('a',): 1.0}), 'NN': defaultdict(<type 'float'>, {('board',): 1.0, ('director',): 1.0}), ',': defaultdict(<type 'float'>, {(',',): 2.0}), '.': defaultdict(<type 'float'>, {('.',): 1.0}), 'NP': defaultdict(<type 'float'>, {('CD', 'NNS'): 1.0, ('DT', 'NN'): 1.0, ('NNP', 'NNP'): 1.0, ('DT', 'NP|<JJ&NN>'): 1.0}), 'NNS': defaultdict(<type 'float'>, {('years',): 1.0}), 'NNP': defaultdict(<type 'float'>, {('<NNP>',): 3.0}), 'VB

In [26]:
len(prev_dict.keys())

3960

In [533]:
rules = 0
for key in prev_dict:
    rules+= len(prev_dict[key].values())
rules

30364

In [532]:
print(prob_productions(prev_dict))



#### A paragraph talking about your approach, what worked, what didn't, etc.
I used Steven's code from tree.py, since I believe I have a small error in my version of tree.py. I made one edit to the file "steven_tree.py"--I added a function to the Tree class called `dict_productions()`. I then used this to create the grammar, by also using two more functions in this jupyter notebook: `prob_productions()` and `combine_dict_productions()`. `combine_dict_productions()` allowed me to join together the productions from two trees. `prob_productions()` changed the count structure of the dictionary of productions to a probability.



## Part 2: The CYK algorithm

In [485]:
sentence = ['her', 'dog', 'is', 'mean', '. .']

In [418]:
def print_table_nicely(table):
    s = ""
    for ls in table:
        #print("{:10d}".format(str(ls)))
        print(str(ls).ljust(40))
        print("")
        #s += "        "

In [251]:
example_grammar = defaultdict(lambda: defaultdict(float))
example_grammar['S']['NP VP'] = .8
example_grammar['NP']['Det N'] = .3
example_grammar['VP']['V NP'] = .2
example_grammar['V']['includes'] = .05
example_grammar['Det']['the'] = .4
example_grammar['Det']['a'] = .4
example_grammar['N']['meal'] = .01
example_grammar['N']['flight'] = .02 

In [252]:
example_grammar

defaultdict(<function __main__.<lambda>>,
            {'Det': defaultdict(float, {'a': 0.4, 'the': 0.4}),
             'N': defaultdict(float, {'flight': 0.02, 'meal': 0.01}),
             'NP': defaultdict(float, {'Det N': 0.3}),
             'S': defaultdict(float, {'NP VP': 0.8}),
             'V': defaultdict(float, {'includes': 0.05}),
             'VP': defaultdict(float, {'V NP': 0.2})})

In [461]:
example_sentence = ["the", "flight", "includes", "a", "meal"]

In [504]:
def prob_cyk(words_in_sentence, grammar):
    whole_table = list()
    x = 0
    #making the table format
    while x<len(words_in_sentence):
        table = list()
        for i in range(x, len(words_in_sentence)):
            #table.append(dict())
            table.append((str(x) + "," + str(i+1),dict()))
        whole_table.append(table)
        x+=1
    print(whole_table)
    #filling in the table    
    for j in range(0, len(words_in_sentence)):
        for key in grammar:
            if words_in_sentence[j] in grammar[key]: #(words_in_sentence[j],)
                whole_table[j][0][1][key] = grammar[key][words_in_sentence[j]]#[(words_in_sentence[j],)]
    for i in range(1, len(words_in_sentence)):
        print("----")
        y = 1
        for x in range(i-1, -1, -1):
            a = y
            b = 1
            while b<=y:
                #print("x: " + str(x))
                #print("y: " + str(y-a))
                #print(whole_table[x][y-a])
                #print("x: " + str(x+b))
                #print("y: " + str(y-b))
                #print(whole_table[x+b][y-b]) 
                for key in whole_table[x][y-a][1]:
                    print(key)
                    print(whole_table[x][y-a][1][key])
                    for other_key in whole_table[x+b][y-b][1]:
                        for grammar_key in grammar:
                            for value in grammar[grammar_key]:
                                if key + " " + other_key == value:
                                    #check if higher
                                    print("uh")
                                    print(not whole_table[x][y][1])
                                    if not whole_table[x][y][1]:
                                        whole_table[x][y][1][grammar_key] =  (whole_table[x][y-a][1][key] * whole_table[x+b][y-b][1][other_key] * grammar[grammar_key][value])
                                    else:
                                        for yet_another_key in whole_table[x][y][1]:
                                            print(whole_table[x][y][1][yet_another_key])
                                            if (whole_table[x][y-a][1][key] * whole_table[x+b][y-b][1][other_key] * grammar[grammar_key][value]) > whole_table[x][y][1][yet_another_key]:
                                                del whole_table[x][y][1][yet_another_key]
                                                whole_table[x][y][1][grammar_key] = (whole_table[x][y-a][1][key] * whole_table[x+b][y-b][1][other_key] * grammar[grammar_key][value])
                a = a-1
                b = b+1
               #now should be able to access the right things...
                
            y+= 1
    return(whole_table)
        

In [505]:
my_grammar = prob_productions(prev_dict)

In [506]:
my_grammar['S']

defaultdict(float,
            {(',', 'S|<ADVP-TMP&,>'): 0.00013185654008438817,
             (',', 'S|<S-ADV&,>'): 0.00013185654008438817,
             ('-LRB-', 'S|<NP-SBJ&-RRB->'): 0.00039556962025316455,
             ('ADJP-PRD', 'NP-SBJ'): 0.0005274261603375527,
             ('ADJP-PRD', 'SBAR-SBJ'): 0.00039556962025316455,
             ('ADVP', 'S|<,&ADVP>'): 0.00013185654008438817,
             ('ADVP', 'S|<,&NP-SBJ>'): 0.002109704641350211,
             ('ADVP', 'S|<NP-SBJ&,>'): 0.00013185654008438817,
             ('ADVP', 'S|<NP-SBJ&VP>'): 0.0023734177215189874,
             ('ADVP', 'S|<NP-TMP&NP-SBJ>'): 0.00026371308016877635,
             ('ADVP', 'S|<PRN&NP-SBJ>'): 0.00013185654008438817,
             ('ADVP-LOC', 'S|<,&NP-SBJ>'): 0.00013185654008438817,
             ('ADVP-LOC', 'S|<NP-SBJ&VP>'): 0.00013185654008438817,
             ('ADVP-LOC', 'S|<PP-LOC&,>'): 0.00013185654008438817,
             ('ADVP-MNR', 'S|<,&NP-SBJ>'): 0.00026371308016877635,
             ('ADVP

In [510]:
x = prob_cyk(another, uhg)

[[('0,1', {}), ('0,2', {}), ('0,3', {}), ('0,4', {}), ('0,5', {}), ('0,6', {}), ('0,7', {}), ('0,8', {}), ('0,9', {}), ('0,10', {}), ('0,11', {}), ('0,12', {}), ('0,13', {})], [('1,2', {}), ('1,3', {}), ('1,4', {}), ('1,5', {}), ('1,6', {}), ('1,7', {}), ('1,8', {}), ('1,9', {}), ('1,10', {}), ('1,11', {}), ('1,12', {}), ('1,13', {})], [('2,3', {}), ('2,4', {}), ('2,5', {}), ('2,6', {}), ('2,7', {}), ('2,8', {}), ('2,9', {}), ('2,10', {}), ('2,11', {}), ('2,12', {}), ('2,13', {})], [('3,4', {}), ('3,5', {}), ('3,6', {}), ('3,7', {}), ('3,8', {}), ('3,9', {}), ('3,10', {}), ('3,11', {}), ('3,12', {}), ('3,13', {})], [('4,5', {}), ('4,6', {}), ('4,7', {}), ('4,8', {}), ('4,9', {}), ('4,10', {}), ('4,11', {}), ('4,12', {}), ('4,13', {})], [('5,6', {}), ('5,7', {}), ('5,8', {}), ('5,9', {}), ('5,10', {}), ('5,11', {}), ('5,12', {}), ('5,13', {})], [('6,7', {}), ('6,8', {}), ('6,9', {}), ('6,10', {}), ('6,11', {}), ('6,12', {}), ('6,13', {})], [('7,8', {}), ('7,9', {}), ('7,10', {}), ('7,11

In [511]:
print_table_nicely(x)

[('0,1', {'NNP': 1.0}), ('0,2', {'NX-TTL|<NNP&NNP>': 1.0}), ('0,3', {'NP|<NNP&NNP>': 9.779569383194227e-05}), ('0,4', {}), ('0,5', {}), ('0,6', {}), ('0,7', {}), ('0,8', {}), ('0,9', {}), ('0,10', {}), ('0,11', {}), ('0,12', {}), ('0,13', {})]

[('1,2', {'NNP': 1.0}), ('1,3', {'NP|<NNP&VBZ>': 0.3250728862973761}), ('1,4', {}), ('1,5', {}), ('1,6', {}), ('1,7', {}), ('1,8', {}), ('1,9', {}), ('1,10', {}), ('1,11', {}), ('1,12', {}), ('1,13', {})]

[('2,3', {'VBZ': 0.3250728862973761}), ('2,4', {}), ('2,5', {}), ('2,6', {}), ('2,7', {}), ('2,8', {}), ('2,9', {}), ('2,10', {}), ('2,11', {}), ('2,12', {}), ('2,13', {})]

[('3,4', {'NN': 0.0033125537963953153}), ('3,5', {'NP|<NN&IN>': 0.0008176381741766889}), ('3,6', {}), ('3,7', {}), ('3,8', {}), ('3,9', {}), ('3,10', {}), ('3,11', {}), ('3,12', {}), ('3,13', {})]

[('4,5', {'RB': 0.0001063264221158958, 'IN': 0.24683015716346518}), ('4,6', {'NP-TTL|<IN&NNP>': 0.24683015716346518}), ('4,7', {}), ('4,8', {}), ('4,9', {}), ('4,10', {}), ('4,1

In [450]:
uhg = make_pretty_dict(my_grammar)

('JJR', 'CD')
JJR CD 
('JJR', 'NP|<CD&NNS>')
JJR NP|<CD&NNS> 
('CD', 'NP|<VBN&NN>')
CD NP|<VBN&NN> 
('CD', 'NP|<VBN&NNS>')
CD NP|<VBN&NNS> 
('my',)
my 
('its',)
its 
('his',)
his 
('her',)
her 
('their',)
their 
('your',)
your 
('our',)
our 
("''", 'ADJP')
'' ADJP 
('NP', 'PP')
NP PP 
('IN', 'NP')
IN NP 
('TO', 'NP')
TO NP 
('IN', 'NP')
IN NP 
('IN', 'NP+QP')
IN NP+QP 
('PP', 'TOP|<PP&.>')
PP TOP|<PP&.> 
('PP', 'TOP|<PP&,>')
PP TOP|<PP&,> 
('PP', 'TOP|<PP&:>')
PP TOP|<PP&:> 
('PP', 'TOP|<PP&PP-LOC>')
PP TOP|<PP&PP-LOC> 
('PP', 'TOP|<PP&PP>')
PP TOP|<PP&PP> 
(',', 'JJ')
, JJ 
(',', 'ADJP|<JJ&,>')
, ADJP|<JJ&,> 
(',', 'ADJP|<JJ&CC>')
, ADJP|<JJ&CC> 
('NNP', 'NP|<IN&NNP>')
NNP NP|<IN&NNP> 
('NNP', 'NP|<IN&DT>')
NNP NP|<IN&DT> 
('NNP', 'POS')
NNP POS 
(',', 'ADJP|<CC&ADJP>')
, ADJP|<CC&ADJP> 
(',', 'ADJP|<CC&NN>')
, ADJP|<CC&NN> 
(',', 'ADJP|<CC&JJ>')
, ADJP|<CC&JJ> 
('NP-PRD', 'VP|<ADVP-TMP&,>')
NP-PRD VP|<ADVP-TMP&,> 
('NP-PRD', 'ADVP-TMP')
NP-PRD ADVP-TMP 
('NP-PRD', 'VP|<ADVP-TMP&VP>')

('cushioning',)
cushioning 
('pitching',)
pitching 
('approving',)
approving 
('locking',)
locking 
('snoring',)
snoring 
('re-enacting',)
re-enacting 
('signing',)
signing 
('agreeing',)
agreeing 
('protesting',)
protesting 
('creating',)
creating 
('thriving',)
thriving 
('hiring',)
hiring 
('running',)
running 
('funneling',)
funneling 
('giving',)
giving 
('closing',)
closing 
('retiring',)
retiring 
('enjoying',)
enjoying 
('sliding',)
sliding 
('starving',)
starving 
('describing',)
describing 
('participating',)
participating 
('crushing',)
crushing 
('working',)
working 
('budding',)
budding 
('staying',)
staying 
('pillorying',)
pillorying 
('writhing',)
writhing 
('employing',)
employing 
('preferred',)
preferred 
('balking',)
balking 
('failing',)
failing 
('exceeding',)
exceeding 
('involving',)
involving 
('accelerating',)
accelerating 
('flocking',)
flocking 
('trading',)
trading 
('hearing',)
hearing 
('outlawing',)
outlawing 
('settling',)
settling 
('learning',)
learni

('succeeded',)
succeeded 
('had',)
had 
('dispatched',)
dispatched 
('expressed',)
expressed 
('arrived',)
arrived 
('denuclearized',)
denuclearized 
('specialized',)
specialized 
('cultivated',)
cultivated 
('confirmed',)
confirmed 
('stolen',)
stolen 
('based',)
based 
('interested',)
interested 
('contravened',)
contravened 
('affiliated',)
affiliated 
('grabbed',)
grabbed 
('gone',)
gone 
('underestimated',)
underestimated 
('blamed',)
blamed 
('declined',)
declined 
('withheld',)
withheld 
('prepaid',)
prepaid 
('broken',)
broken 
('negotiated',)
negotiated 
('punished',)
punished 
('dyed',)
dyed 
('found',)
found 
('entered',)
entered 
('begun',)
begun 
('dismayed',)
dismayed 
('called',)
called 
('appeared',)
appeared 
('surprised',)
surprised 
('extended',)
extended 
('pressed',)
pressed 
('swung',)
swung 
('enrolled',)
enrolled 
('come',)
come 
('lived',)
lived 
('soared',)
soared 
('borne',)
borne 
('overseen',)
overseen 
('served',)
served 
('boasted',)
boasted 
('reacted',)

pokes 
('evokes',)
evokes 
('starts',)
starts 
('says',)
says 
('liquefies',)
liquefies 
('indicates',)
indicates 
('mounts',)
mounts 
('manages',)
manages 
('stops',)
stops 
('loses',)
loses 
('pampers',)
pampers 
('denies',)
denies 
('foresees',)
foresees 
('quacks',)
quacks 
('prefers',)
prefers 
('tends',)
tends 
('compromises',)
compromises 
('changes',)
changes 
("'s",)
's 
('leaves',)
leaves 
('kills',)
kills 
('beats',)
beats 
('restructures',)
restructures 
('defies',)
defies 
('diminishes',)
diminishes 
('stays',)
stays 
('commits',)
commits 
('is',)
is 
('handles',)
handles 
('anticipates',)
anticipates 
('confronts',)
confronts 
('provides',)
provides 
('moves',)
moves 
('disagrees',)
disagrees 
('sets',)
sets 
('fields',)
fields 
('unfolds',)
unfolds 
('exists',)
exists 
('criticizes',)
criticizes 
('approaches',)
approaches 
('thinks',)
thinks 
('lives',)
lives 
('nods',)
nods 
('represents',)
represents 
('makes',)
makes 
('rules',)
rules 
('builds',)
builds 
('expects',

("''", 'PP-LOC')
'' PP-LOC 
(',', 'TOP|<VP&.>')
, TOP|<VP&.> 
(',', 'TOP|<VP&:>')
, TOP|<VP&:> 
('``', 'NP|<DT&NNP>')
`` NP|<DT&NNP> 
('NP', 'PP')
NP PP 
(',', 'PRN|<NP&-RRB->')
, PRN|<NP&-RRB-> 
(',', 'PRN|<NP&:>')
, PRN|<NP&:> 
(',', 'PRN|<NP&,>')
, PRN|<NP&,> 
(',', 'NP')
, NP 
('NN', 'PRT')
NN PRT 
('NN', 'NN')
NN NN 
('NNP', 'NNPS')
NNP NNPS 
('NNP', 'NP-PRD|<NNPS&NNP>')
NNP NP-PRD|<NNPS&NNP> 
(':', 'TOP|<NP-TTL&.>')
: TOP|<NP-TTL&.> 
('NP-SBJ-1', 'TOP|<VP&.>')
NP-SBJ-1 TOP|<VP&.> 
(':', 'PRN|<CC&ADVP>')
: PRN|<CC&ADVP> 
(',', 'PRN|<PP-LOC&,>')
, PRN|<PP-LOC&,> 
('-LRB-', 'PRN|<CC&,>')
-LRB- PRN|<CC&,> 
(',', 'PRN|<PP-PRP&,>')
, PRN|<PP-PRP&,> 
(',', "PRN|<''&SINV>")
, PRN|<''&SINV> 
('-LRB-', 'PRN|<NP-TMP&-RRB->')
-LRB- PRN|<NP-TMP&-RRB-> 
(',', 'PRN|<CC&NNP>')
, PRN|<CC&NNP> 
(',', 'PRN|<SBAR&,>')
, PRN|<SBAR&,> 
('-LRB-', 'PRN|<FW&,>')
-LRB- PRN|<FW&,> 
('-LRB-', 'PRN|<NP-LOC&-RRB->')
-LRB- PRN|<NP-LOC&-RRB-> 
('-LRB-', 'PRN|<CC&FRAG>')
-LRB- PRN|<CC&FRAG> 
('-LRB-', 'PRN|<PP-L

('ADVP-TMP', 'VP|<VBZ&NP-1>')
ADVP-TMP VP|<VBZ&NP-1> 
('VBD', 'PP-TMP')
VBD PP-TMP 
('VBP', 'VP|<:&NP-PRD>')
VBP VP|<:&NP-PRD> 
('VBD', 'VP|<ADVP-MNR&SBAR-TMP>')
VBD VP|<ADVP-MNR&SBAR-TMP> 
('VBD', 'VP|<,&PP-LOC>')
VBD VP|<,&PP-LOC> 
('CONJP', 'VP|<VP&,>')
CONJP VP|<VP&,> 
('VBD', 'VP|<NP&PP-MNR>')
VBD VP|<NP&PP-MNR> 
('ADVP', 'VP|<VBZ&SBAR>')
ADVP VP|<VBZ&SBAR> 
('VB', 'VP|<NP&PP-PRP>')
VB VP|<NP&PP-PRP> 
('VBN', 'PP-LOC-CLR')
VBN PP-LOC-CLR 
('VBN', 'VP|<ADVP-CLR&NP>')
VBN VP|<ADVP-CLR&NP> 
('VBZ', 'VP|<PP-DIR&PP-MNR>')
VBZ VP|<PP-DIR&PP-MNR> 
('``', "VP|<VB&''>")
`` VP|<VB&''> 
('VBP', 'VP|<``&S-PRD>')
VBP VP|<``&S-PRD> 
('VBN', 'VP|<ADVP-MNR&,>')
VBN VP|<ADVP-MNR&,> 
('VBZ', 'VP|<ADVP-MNR&VP>')
VBZ VP|<ADVP-MNR&VP> 
('NNS', 'PP-CLR')
NNS PP-CLR 
('VBP', 'VP|<NP&SBAR-TMP>')
VBP VP|<NP&SBAR-TMP> 
('NP=1', 'PP-LOC=2')
NP=1 PP-LOC=2 
('VBD', 'VP|<``&NP-TTL>')
VBD VP|<``&NP-TTL> 
('VB', 'VP|<PP-LOC-PRD&PP-LOC>')
VB VP|<PP-LOC-PRD&PP-LOC> 
('ADVP', 'VP|<VBD&PP-CLR>')
ADVP VP|<VBD&PP-CLR>

('VBD', 'VP|<X&NP>')
VBD VP|<X&NP> 
('VBN', 'VP|<``&ADJP-PRD>')
VBN VP|<``&ADJP-PRD> 
('VBD', 'ADVP-CLR')
VBD ADVP-CLR 
('VBZ', 'VP|<NP&PRN>')
VBZ VP|<NP&PRN> 
('VBP', 'VP|<ADVP-EXT&PP-CLR>')
VBP VP|<ADVP-EXT&PP-CLR> 
('VBD', 'ADJP-CLR')
VBD ADJP-CLR 
('ADVP-TMP', 'VB')
ADVP-TMP VB 
('VBZ', 'VP|<S&PP-MNR>')
VBZ VP|<S&PP-MNR> 
('VBZ', 'VP|<NP&PP-MNR>')
VBZ VP|<NP&PP-MNR> 
('VBZ', 'VP|<NP&.>')
VBZ VP|<NP&.> 
('VB', 'VP|<NP&NP-MNR>')
VB VP|<NP&NP-MNR> 
('ADVP-MNR', 'VP|<VBZ&:>')
ADVP-MNR VP|<VBZ&:> 
('ADVP-TMP', 'VP|<VBP&NP>')
ADVP-TMP VP|<VBP&NP> 
('VBP', 'ADJP-PRD')
VBP ADJP-PRD 
('VBD', 'VP|<PP-EXT&PP-TMP>')
VBD VP|<PP-EXT&PP-TMP> 
('VB', 'VP|<ADJP-PRD&PP-TMP>')
VB VP|<ADJP-PRD&PP-TMP> 
('VB', 'VP|<PP-DIR&ADVP-TMP>')
VB VP|<PP-DIR&ADVP-TMP> 
('ADVP', 'VP|<VBN&PP-LOC>')
ADVP VP|<VBN&PP-LOC> 
('VB', 'VP|<PRT&,>')
VB VP|<PRT&,> 
('VBN', 'VP|<,&PP>')
VBN VP|<,&PP> 
('VBD', 'VP|<NP+QP&PP-DIR>')
VBD VP|<NP+QP&PP-DIR> 
('VBZ', 'PP-CLR-LOC')
VBZ PP-CLR-LOC 
('VBG', 'VP|<IN&PP-LOC>')
VBG VP|<IN

VBZ VP|<ADVP&NP-TMP-PRD> 
('VB', 'VP|<PP-CLR&NP-TMP>')
VB VP|<PP-CLR&NP-TMP> 
('VBN', 'PP-EXT')
VBN PP-EXT 
('VBP', 'VP|<ADJP-PRD&PP-LOC>')
VBP VP|<ADJP-PRD&PP-LOC> 
('VBN', 'VP|<PP-CLR&PP-TMP>')
VBN VP|<PP-CLR&PP-TMP> 
('VBG', 'VP|<ADVP-MNR&PP-CLR>')
VBG VP|<ADVP-MNR&PP-CLR> 
('VB', 'PP-PRD')
VB PP-PRD 
('VBG', 'VP|<ADVP-MNR&PP-LOC>')
VBG VP|<ADVP-MNR&PP-LOC> 
('VB', 'VP|<PP-CLR&PP-LOC>')
VB VP|<PP-CLR&PP-LOC> 
('VBG', 'VP|<PP-CLR&PP-CLR>')
VBG VP|<PP-CLR&PP-CLR> 
('VBD', 'VP|<PRT&NP-EXT>')
VBD VP|<PRT&NP-EXT> 
('VBN', 'VP|<PP-CLR-2&,>')
VBN VP|<PP-CLR-2&,> 
('VB', 'NP-CLR')
VB NP-CLR 
('VBZ', 'VP|<ADVP-MNR&PP-LOC>')
VBZ VP|<ADVP-MNR&PP-LOC> 
('VBP', 'VP|<NP&PP-LOC>')
VBP VP|<NP&PP-LOC> 
('VBP', 'ADVP-PRD')
VBP ADVP-PRD 
('VB', 'VP|<NP-CLR&PP>')
VB VP|<NP-CLR&PP> 
('VBD', 'VP|<PP-LOC&PP>')
VBD VP|<PP-LOC&PP> 
('VBZ', 'ADVP-LOC')
VBZ ADVP-LOC 
('VB', 'VP|<ADJP-PRD&PP-LOC-CLR>')
VB VP|<ADJP-PRD&PP-LOC-CLR> 
('VB', 'VP|<S&ADVP>')
VB VP|<S&ADVP> 
('VB', 'SBAR')
VB SBAR 
('VBZ', 'VP|<NP-1&

('VBN', 'VP|<PP&NP>')
VBN VP|<PP&NP> 
('VBN', 'VP|<NP-EXT+QP&PP-DIR>')
VBN VP|<NP-EXT+QP&PP-DIR> 
('JJ', 'VP|<NP&PP-MNR>')
JJ VP|<NP&PP-MNR> 
('VBD', 'VP|<``&PP-LOC-PRD>')
VBD VP|<``&PP-LOC-PRD> 
('VBG', 'VP|<SBAR&SBAR-ADV>')
VBG VP|<SBAR&SBAR-ADV> 
('ADVP-MNR', 'VP|<VBG&CC>')
ADVP-MNR VP|<VBG&CC> 
('ADVP-MNR', 'VP|<VBD&NP-TMP>')
ADVP-MNR VP|<VBD&NP-TMP> 
('VBG', 'VP|<ADVP-DIR&PP-TMP>')
VBG VP|<ADVP-DIR&PP-TMP> 
('ADVP-MNR', 'VP|<VBD&PP-CLR>')
ADVP-MNR VP|<VBD&PP-CLR> 
('VP', 'VP|<CC&``>')
VP VP|<CC&``> 
('NN', 'VP|<NP&PP-TMP>')
NN VP|<NP&PP-TMP> 
('ADVP-MNR', 'VP|<VB&SBAR>')
ADVP-MNR VP|<VB&SBAR> 
('VB', 'PP-MNR')
VB PP-MNR 
('ADVP-TMP', 'VP|<VBG&PP-CLR>')
ADVP-TMP VP|<VBG&PP-CLR> 
('VBD', 'VP|<``&PP-PRD>')
VBD VP|<``&PP-PRD> 
('VBD', 'VP|<ADVP-LOC&PP-LOC>')
VBD VP|<ADVP-LOC&PP-LOC> 
('VBP', 'VP|<NP&NP-ADV>')
VBP VP|<NP&NP-ADV> 
('MD', 'VP')
MD VP 
('VBP', 'ADVP-LOC-CLR')
VBP ADVP-LOC-CLR 
('VBG', 'VP|<ADVP-MNR-CLR&ADVP-LOC>')
VBG VP|<ADVP-MNR-CLR&ADVP-LOC> 
('VB', 'NP-PRD')
VB NP-PRD

, FRAG 
('NP-LOC-PRD', 'VP|<,&PP-LOC>')
NP-LOC-PRD VP|<,&PP-LOC> 
('CD', 'QP|<CD&NNS>')
CD QP|<CD&NNS> 
('CD', 'CD')
CD CD 
("'",)
' 
("'s",)
's 
('VB', 'NNS')
VB NNS 
('VBP', 'VP|<PP-DIR&,>')
VBP VP|<PP-DIR&,> 
('VBP', 'PP-DIR')
VBP PP-DIR 
('NNPS', 'TOP|<:&.>')
NNPS TOP|<:&.> 
('NNPS', ':')
NNPS : 
('NP', 'TOP|<PRN&.>')
NP TOP|<PRN&.> 
('NP', 'TOP|<PRN&,>')
NP TOP|<PRN&,> 
('PP', "''")
PP '' 
('SINV', ',')
SINV , 
('VBD', 'TOP|<NP-SBJ&NP-PRD>')
VBD TOP|<NP-SBJ&NP-PRD> 
('VBD', 'TOP|<NP-SBJ&SBAR-PRP-PRD>')
VBD TOP|<NP-SBJ&SBAR-PRP-PRD> 
('VBD', 'TOP|<NP-SBJ&VP>')
VBD TOP|<NP-SBJ&VP> 
('VBD', 'TOP|<NP-SBJ&ADJP-PRD>')
VBD TOP|<NP-SBJ&ADJP-PRD> 
(',', 'NX|<PP&,>')
, NX|<PP&,> 
('PP-DIR-2', 'PP-DIR-3')
PP-DIR-2 PP-DIR-3 
('quite',)
quite 
('both',)
both 
('half',)
half 
('all',)
all 
('nary',)
nary 
('such',)
such 
('PP-CLR', 'VP|<``&PP-TMP>')
PP-CLR VP|<``&PP-TMP> 
('RB', 'ADJP-PRD')
RB ADJP-PRD 
('PRN', 'NP')
PRN NP 
('ADVP-TMP', 'VP|<ADVP&VP>')
ADVP-TMP VP|<ADVP&VP> 
('ADVP-TMP', 'ADVP

('ingest',)
ingest 
('crimp',)
crimp 
('fly',)
fly 
('demand',)
demand 
('discourage',)
discourage 
('agonize',)
agonize 
('accomplish',)
accomplish 
('revise',)
revise 
('raise',)
raise 
('note',)
note 
('mop',)
mop 
('license',)
license 
('matter',)
matter 
('prefer',)
prefer 
('contact',)
contact 
('unravel',)
unravel 
('refund',)
refund 
('act',)
act 
('provide',)
provide 
('recall',)
recall 
('refocus',)
refocus 
('adopt',)
adopt 
('figure',)
figure 
('bring',)
bring 
('relax',)
relax 
('drag',)
drag 
('erase',)
erase 
('concede',)
concede 
('destroy',)
destroy 
('extinguish',)
extinguish 
('pull',)
pull 
('arrange',)
arrange 
('sprout',)
sprout 
('hide',)
hide 
('chop',)
chop 
('service',)
service 
('stop',)
stop 
('launch',)
launch 
('remain',)
remain 
('compensate',)
compensate 
('repeal',)
repeal 
('represent',)
represent 
('suffice',)
suffice 
('begin',)
begin 
('oversee',)
oversee 
('market',)
market 
('deserve',)
deserve 
('return',)
return 
('wait',)
wait 
('consume',)
con

careen 
('succeed',)
succeed 
('exist',)
exist 
('gain',)
gain 
('audit',)
audit 
('earn',)
earn 
('think',)
think 
('build',)
build 
('boil',)
boil 
('prolong',)
prolong 
('err',)
err 
('continue',)
continue 
('call',)
call 
('stay',)
stay 
('trust',)
trust 
('come',)
come 
('check',)
check 
('scrap',)
scrap 
('collapse',)
collapse 
('reflect',)
reflect 
('fold',)
fold 
('question',)
question 
('announce',)
announce 
('streamline',)
streamline 
('prod',)
prod 
('cinch',)
cinch 
('participate',)
participate 
('tell',)
tell 
('sponsor',)
sponsor 
('spring',)
spring 
('soar',)
soar 
('rebound',)
rebound 
('reverse',)
reverse 
('bolster',)
bolster 
('manage',)
manage 
('modify',)
modify 
('demilitarize',)
demilitarize 
('touch',)
touch 
('gasp',)
gasp 
('trade',)
trade 
('blast',)
blast 
('conform',)
conform 
('open',)
open 
('reject',)
reject 
('generate',)
generate 
('pursue',)
pursue 
('own',)
own 
('disappear',)
disappear 
('run',)
run 
('clear',)
clear 
('waive',)
waive 
('surrender'

('VBD', 'ADJP-PRD')
VBD ADJP-PRD 
('NNP', 'NP-TMP-1|<CD&,>')
NNP NP-TMP-1|<CD&,> 
('NN',)
NN 
('IN', 'NP')
IN NP 
('DT', 'NN')
DT NN 
('NN',)
NN 
('DT', 'NN')
DT NN 
('NP', 'PP')
NP PP 
('NNP', 'NP-TMP-2|<CD&,>')
NNP NP-TMP-2|<CD&,> 
(':', 'PP-TMP')
: PP-TMP 
('NP-CLR', 'PP-DIR')
NP-CLR PP-DIR 
('NNS', 'PRN')
NNS PRN 
('JJ', 'JJS')
JJ JJS 
('JJ', 'NP|<JJS&NN>')
JJ NP|<JJS&NN> 
('NP', 'VP|<PRT&PP-CLR>')
NP VP|<PRT&PP-CLR> 
('NP', 'PRT')
NP PRT 
('NP', "VP|<PRT&''>")
NP VP|<PRT&''> 
('NP', 'VP|<PRT&PP-LOC>')
NP VP|<PRT&PP-LOC> 
('NP', 'VP|<PRT&NP-ADV>')
NP VP|<PRT&NP-ADV> 
('NP', 'VP|<PRT&PP-MNR>')
NP VP|<PRT&PP-MNR> 
('NP', 'VP|<PRT&PP-TMP>')
NP VP|<PRT&PP-TMP> 
('NP', 'VP|<PRT&NP>')
NP VP|<PRT&NP> 
('NN', '.')
NN . 
(',', 'TOP|<ADVP-TMP&.>')
, TOP|<ADVP-TMP&.> 
(',', 'TOP|<ADVP-TMP&PP-TMP>')
, TOP|<ADVP-TMP&PP-TMP> 
(',', 'TOP|<ADVP-TMP&VP>')
, TOP|<ADVP-TMP&VP> 
(',', 'TOP|<ADVP-TMP&,>')
, TOP|<ADVP-TMP&,> 
(',', 'TOP|<ADVP-TMP&NP-SBJ>')
, TOP|<ADVP-TMP&NP-SBJ> 
('VBN', 'VP|<ADVP-LOC-

likewise 
('wickedly',)
wickedly 
('center',)
center 
('generally',)
generally 
('seemingly',)
seemingly 
('awfully',)
awfully 
('hugely',)
hugely 
('systematically',)
systematically 
('often',)
often 
('devastatingly',)
devastatingly 
('casually',)
casually 
('statewide',)
statewide 
('as',)
as 
('properly',)
properly 
('allegedly',)
allegedly 
('continually',)
continually 
('promptly',)
promptly 
('about',)
about 
('once',)
once 
('heavily',)
heavily 
('conditionally',)
conditionally 
('cheap',)
cheap 
('not',)
not 
('dead',)
dead 
('moreover',)
moreover 
('characteristically',)
characteristically 
('flat',)
flat 
('delectably',)
delectably 
('yet',)
yet 
('morever',)
morever 
('strictly',)
strictly 
('horticulturally',)
horticulturally 
('meanwhile',)
meanwhile 
('completely',)
completely 
('factually',)
factually 
('awake',)
awake 
('voluntarily',)
voluntarily 
('additionally',)
additionally 
('easily',)
easily 
('instantly',)
instantly 
('many',)
many 
('picturesquely',)
picturesq

NP VP|<:&ADVP-MNR> 
('NP', 'VP|<:&ADVP>')
NP VP|<:&ADVP> 
('ADJP-PRD', 'VP|<,&S-ADV>')
ADJP-PRD VP|<,&S-ADV> 
('ADJP-PRD', 'VP|<,&PP-PRP>')
ADJP-PRD VP|<,&PP-PRP> 
('ADJP-PRD', "VP|<,&''>")
ADJP-PRD VP|<,&''> 
('ADJP-PRD', 'VP|<,&ADVP>')
ADJP-PRD VP|<,&ADVP> 
('ADJP-PRD', 'VP|<,&``>')
ADJP-PRD VP|<,&``> 
('ADJP-PRD', 'VP|<,&NP-VOC>')
ADJP-PRD VP|<,&NP-VOC> 
('ADJP-PRD', 'VP|<,&SBAR-ADV>')
ADJP-PRD VP|<,&SBAR-ADV> 
('ADJP-PRD', 'VP|<,&INTJ>')
ADJP-PRD VP|<,&INTJ> 
('ADJP-PRD', 'VP|<,&PP-TMP>')
ADJP-PRD VP|<,&PP-TMP> 
('ADJP-PRD', 'VP|<,&PP-LOC>')
ADJP-PRD VP|<,&PP-LOC> 
('ADJP-PRD', 'VP|<,&PP>')
ADJP-PRD VP|<,&PP> 
('ADJP-PRD', 'VP|<,&SBAR-TMP>')
ADJP-PRD VP|<,&SBAR-TMP> 
('ADJP-PRD', 'VP|<,&SBAR-PRP>')
ADJP-PRD VP|<,&SBAR-PRP> 
('JJ', 'VBG')
JJ VBG 
('JJ', 'NP|<VBG&JJ>')
JJ NP|<VBG&JJ> 
('JJ', 'NP|<VBG&NN>')
JJ NP|<VBG&NN> 
('JJ', 'NP|<VBG&NNS>')
JJ NP|<VBG&NNS> 
('ADVP-LOC', 'PP-TMP')
ADVP-LOC PP-TMP 
('CC', 'PP')
CC PP 
('ADVP', 'TOP|<NP-SBJ&VP>')
ADVP TOP|<NP-SBJ&VP> 
('PP', 'ADVP')

('DT', 'JJ')
DT JJ 
('ADJP-PRD', 'SBAR-ADV')
ADJP-PRD SBAR-ADV 
('ADJP-PRD', 'VP|<SBAR-ADV&,>')
ADJP-PRD VP|<SBAR-ADV&,> 
(',', 'NAC-TMP|<CD&,>')
, NAC-TMP|<CD&,> 
('VBP', 'ADVP-TMP')
VBP ADVP-TMP 
('VBP', 'VP|<ADVP-TMP&VP>')
VBP VP|<ADVP-TMP&VP> 
('PP-EXT', 'VP|<PP-DIR&PP-TMP>')
PP-EXT VP|<PP-DIR&PP-TMP> 
('PP-EXT', 'VP|<PP-DIR&PP-DIR>')
PP-EXT VP|<PP-DIR&PP-DIR> 
('PP-EXT', 'VP|<PP-DIR&PP>')
PP-EXT VP|<PP-DIR&PP> 
('PP-EXT', 'PP-DIR')
PP-EXT PP-DIR 
('ADVP-TMP-1', 'PP-DIR-2')
ADVP-TMP-1 PP-DIR-2 
('NNP', 'NP|<-LRB-&NNP>')
NNP NP|<-LRB-&NNP> 
('VP', "TOP|<:&''>")
VP TOP|<:&''> 
('VP', ':')
VP : 
('VP', 'TOP|<:&S>')
VP TOP|<:&S> 
('VP', 'TOP|<:&.>')
VP TOP|<:&.> 
('RB', 'CD')
RB CD 
('JJ', '.')
JJ . 
('JJS', 'CD')
JJS CD 
(',', 'NP|<VP&,>')
, NP|<VP&,> 
(',', 'VP')
, VP 
('PP-TMP', ':')
PP-TMP : 
('NP', 'JJR')
NP JJR 
('PP-DIR', 'UCP')
PP-DIR UCP 
('NP-1', 'VP|<PP-DIR-2&PP-DIR-3>')
NP-1 VP|<PP-DIR-2&PP-DIR-3> 
('PP-LOC', 'VP|<NP-TMP&SBAR-TMP>')
PP-LOC VP|<NP-TMP&SBAR-TMP> 
('PP-LOC', '

congressman 
('college',)
college 
('euphoria',)
euphoria 
('mutual-fund',)
mutual-fund 
('occupant',)
occupant 
('revolutionary',)
revolutionary 
('shipbuilding',)
shipbuilding 
('cut',)
cut 
('filing',)
filing 
('hemoglobin',)
hemoglobin 
('trade-off',)
trade-off 
('red',)
red 
('fighter',)
fighter 
('handicap',)
handicap 
('dissolution',)
dissolution 
('newscast',)
newscast 
('host',)
host 
('awarding',)
awarding 
('natural',)
natural 
('seizure',)
seizure 
('57-year-old',)
57-year-old 
('adoption',)
adoption 
('mailbox',)
mailbox 
('view',)
view 
('cholesterol',)
cholesterol 
('fifth-grade',)
fifth-grade 
('introduction',)
introduction 
('designer',)
designer 
('gem',)
gem 
('politicking',)
politicking 
('utility',)
utility 
('string',)
string 
('subcommitee',)
subcommitee 
('affidavit',)
affidavit 
('disregard',)
disregard 
('cornfield',)
cornfield 
('helicopter',)
helicopter 
('real-estate',)
real-estate 
('passing',)
passing 
('everybody',)
everybody 
('trash',)
trash 
('suitor'

('revolt',)
revolt 
('fortune',)
fortune 
('con',)
con 
('globe',)
globe 
('purhasing',)
purhasing 
('killer',)
killer 
('break-up',)
break-up 
('dancing',)
dancing 
('cue',)
cue 
('dome',)
dome 
('wardrobe',)
wardrobe 
('slowing',)
slowing 
('hell',)
hell 
('cabinet',)
cabinet 
('catheter',)
catheter 
('a.m.',)
a.m. 
('modernist',)
modernist 
('gaming',)
gaming 
('homelessness',)
homelessness 
('resilience',)
resilience 
('rivalry',)
rivalry 
('hormone',)
hormone 
('gimmickry',)
gimmickry 
('merchandising',)
merchandising 
('spokeswoman',)
spokeswoman 
('upset',)
upset 
('courtesy',)
courtesy 
('telemarketing',)
telemarketing 
('tie',)
tie 
('fiction',)
fiction 
('key',)
key 
('king',)
king 
('formulation',)
formulation 
('ex-dividend',)
ex-dividend 
('marketer',)
marketer 
('lobbyist',)
lobbyist 
('task',)
task 
('bonfire',)
bonfire 
('money',)
money 
('capacity',)
capacity 
('advice',)
advice 
('motion',)
motion 
('propensity',)
propensity 
('portico',)
portico 
('primary',)
primary

('continuity',)
continuity 
('monastery',)
monastery 
('ore',)
ore 
('outpatient',)
outpatient 
('fertilizer',)
fertilizer 
('peasant',)
peasant 
('sharpness',)
sharpness 
('den',)
den 
('conservative',)
conservative 
('bit',)
bit 
('disappointment',)
disappointment 
('expectancy',)
expectancy 
('branch',)
branch 
('rapier',)
rapier 
('fish',)
fish 
('reformer',)
reformer 
('liberal',)
liberal 
('bunch',)
bunch 
('section',)
section 
('allocation',)
allocation 
('consciousness',)
consciousness 
('edition',)
edition 
('marketability',)
marketability 
('days',)
days 
('weather',)
weather 
('former',)
former 
('idealist',)
idealist 
('survivor',)
survivor 
('air',)
air 
('bay',)
bay 
('imitation',)
imitation 
('completion',)
completion 
('objectivity',)
objectivity 
('windfall',)
windfall 
('outcry',)
outcry 
('fairness',)
fairness 
('direct-seller',)
direct-seller 
('enhancement',)
enhancement 
('house',)
house 
('preoccupation',)
preoccupation 
('plaster',)
plaster 
('excitement',)
exci

('warehousing',)
warehousing 
('sweep',)
sweep 
('anger',)
anger 
('sulfur-dioxide',)
sulfur-dioxide 
('constituent',)
constituent 
('responsibility',)
responsibility 
('hog',)
hog 
('cold',)
cold 
('vote',)
vote 
('physicist',)
physicist 
('coup',)
coup 
('fix',)
fix 
('administrator',)
administrator 
('hire',)
hire 
('revolution',)
revolution 
('hiding',)
hiding 
('enrollment',)
enrollment 
('delivery',)
delivery 
('acne',)
acne 
('excuse',)
excuse 
('protest',)
protest 
('securities-law',)
securities-law 
('graduate-student',)
graduate-student 
('trading',)
trading 
('guideline',)
guideline 
('box',)
box 
('life-insurance',)
life-insurance 
('applicability',)
applicability 
('instrumentation',)
instrumentation 
('protein',)
protein 
('television',)
television 
('order',)
order 
('familiarity',)
familiarity 
('contrast',)
contrast 
('poster',)
poster 
('theater',)
theater 
('whirlwind',)
whirlwind 
('laptop',)
laptop 
('backhoe',)
backhoe 
('aluminum',)
aluminum 
('wrestling',)
wrest

('match',)
match 
('iceberg',)
iceberg 
('wine',)
wine 
('seasonality',)
seasonality 
('exclusion',)
exclusion 
('crush',)
crush 
('tally',)
tally 
('reform',)
reform 
('regulation',)
regulation 
('academy',)
academy 
('contest',)
contest 
('choice',)
choice 
('loser',)
loser 
('dashboard',)
dashboard 
('embryo',)
embryo 
('shortening',)
shortening 
('maneuver',)
maneuver 
('tariff',)
tariff 
('time',)
time 
('layer',)
layer 
('reasoning',)
reasoning 
('defamation',)
defamation 
('parting',)
parting 
('birth',)
birth 
('shuttle',)
shuttle 
('pimp',)
pimp 
('break',)
break 
('casino',)
casino 
('presenter',)
presenter 
('megabillion',)
megabillion 
('campus',)
campus 
('new',)
new 
('district',)
district 
('personal',)
personal 
('conservatory',)
conservatory 
('clump',)
clump 
('justification',)
justification 
('stop',)
stop 
('loop',)
loop 
('clause',)
clause 
('end',)
end 
('personality',)
personality 
("lion's-head",)
lion's-head 
('war',)
war 
('impatient',)
impatient 
('health-car

('contempt',)
contempt 
('danger',)
danger 
('grandmother',)
grandmother 
('nobody',)
nobody 
('investment-house',)
investment-house 
('new-business',)
new-business 
('midnight',)
midnight 
('effect',)
effect 
('humor',)
humor 
('ounce',)
ounce 
('sightseeing',)
sightseeing 
('attendant',)
attendant 
('can',)
can 
('seattle',)
seattle 
('rupture',)
rupture 
('vodka',)
vodka 
('availability',)
availability 
('timing',)
timing 
('diamond',)
diamond 
('structure',)
structure 
('delisting',)
delisting 
('criminology',)
criminology 
('ballpark',)
ballpark 
('offensive',)
offensive 
('fluke',)
fluke 
('centerfielder',)
centerfielder 
('securities-firm',)
securities-firm 
('stowaway',)
stowaway 
('weeklong',)
weeklong 
('capitalism',)
capitalism 
('department',)
department 
('somebody',)
somebody 
('conscience',)
conscience 
('advertisement',)
advertisement 
('violet',)
violet 
('story',)
story 
('dominance',)
dominance 
('dining',)
dining 
('adventure',)
adventure 
dog
d o g 
('twin-deficit'

courtesan 
('suppressor',)
suppressor 
('excess',)
excess 
('patriot',)
patriot 
('influence-peddling',)
influence-peddling 
('runner',)
runner 
('forfeiture',)
forfeiture 
('bicycle',)
bicycle 
('sauerkraut',)
sauerkraut 
('cigar',)
cigar 
('assistant',)
assistant 
('firefighting',)
firefighting 
('donation',)
donation 
('privacy',)
privacy 
('plateau',)
plateau 
('repurchase',)
repurchase 
('litmus',)
litmus 
('partner',)
partner 
('bravura',)
bravura 
('masonry',)
masonry 
('principle',)
principle 
('control',)
control 
('shipment',)
shipment 
('dismay',)
dismay 
('fitness',)
fitness 
('monthly',)
monthly 
('printer',)
printer 
('specialization',)
specialization 
('fault',)
fault 
('halt',)
halt 
('conglomerate',)
conglomerate 
('thumb',)
thumb 
('juice',)
juice 
('cemetery',)
cemetery 
('betwen',)
betwen 
('subindustry',)
subindustry 
('robot',)
robot 
('cachet',)
cachet 
('scientist',)
scientist 
('havoc',)
havoc 
('g-2',)
g-2 
('tomb',)
tomb 
('national-service',)
national-servic

level 
('1\\/10th',)
1\/10th 
('owner',)
owner 
('rollover',)
rollover 
('government-bond',)
government-bond 
('son',)
son 
('lyricism',)
lyricism 
('wedge',)
wedge 
('economist',)
economist 
('member',)
member 
('entrance',)
entrance 
('antibody',)
antibody 
('co-author',)
co-author 
('transport',)
transport 
('pain',)
pain 
('furniture',)
furniture 
('peace',)
peace 
('lifetime',)
lifetime 
('bellwether',)
bellwether 
('police',)
police 
('nature',)
nature 
('toy',)
toy 
('tightening',)
tightening 
('graveyard',)
graveyard 
('wire',)
wire 
('understanding',)
understanding 
('boiler',)
boiler 
('fondness',)
fondness 
('sea',)
sea 
('city',)
city 
('resignation',)
resignation 
('wedding',)
wedding 
('marble',)
marble 
('copying',)
copying 
('brawl',)
brawl 
('laser',)
laser 
('wording',)
wording 
('chip',)
chip 
('hardware-maintenance',)
hardware-maintenance 
('content',)
content 
('home-shopping',)
home-shopping 
('waterworks',)
waterworks 
('rod',)
rod 
('beer',)
beer 
('zinc',)
zinc

RB NP|<DT&JJS> 
('NP', 'NP|<``&NX-TTL>')
NP NP|<``&NX-TTL> 
('CD', 'NP|<NNP&JJ>')
CD NP|<NNP&JJ> 
('DT', 'NP|<VBG&NNP>')
DT NP|<VBG&NNP> 
('VBG', 'NNS')
VBG NNS 
('CD', 'NP|<NN&NNP>')
CD NP|<NN&NNP> 
('IN', 'NP|<DT&NN>')
IN NP|<DT&NN> 
('NP', 'NP|<PP&NP-TMP>')
NP NP|<PP&NP-TMP> 
('PRP$', 'NP|<NN&PRN>')
PRP$ NP|<NN&PRN> 
('NP', 'NP|<ADVP&PP-LOC>')
NP NP|<ADVP&PP-LOC> 
('PRP$', 'NP|<JJS&NNS>')
PRP$ NP|<JJS&NNS> 
('RB', 'NP|<DT&NN>')
RB NP|<DT&NN> 
('NP', 'NP|<,&NP-LOC>')
NP NP|<,&NP-LOC> 
('NP', 'NP|<,&ADVP>')
NP NP|<,&ADVP> 
('NN', 'NP|<NX&NX>')
NN NP|<NX&NX> 
('DT', 'NP|<CD&NN>')
DT NP|<CD&NN> 
('DT', 'NP|<``&NN>')
DT NP|<``&NN> 
('NN', 'NP|<NNP&JJ>')
NN NP|<NNP&JJ> 
('VBG', 'NP|<NNS&PP-LOC>')
VBG NP|<NNS&PP-LOC> 
('IN', 'CD')
IN CD 
('NP', 'NP|<,&NP>')
NP NP|<,&NP> 
('JJR', 'NP|<NN&NNS>')
JJR NP|<NN&NNS> 
('JJ', 'DT')
JJ DT 
('RB', 'NP|<QP&NNS>')
RB NP|<QP&NNS> 
('DT', 'NP|<CD&JJ>')
DT NP|<CD&JJ> 
('DT', 'NP|<CD&VBN>')
DT NP|<CD&VBN> 
('JJS', 'NP|<NNP&NNS>')
JJS NP|<NNP&NNS> 
('NP', '

CD NP|<ADJP&JJ> 
('DT', 'NP|<NAC-LOC&NNP>')
DT NP|<NAC-LOC&NNP> 
('NNP', 'NP|<NNP&ADJP>')
NNP NP|<NNP&ADJP> 
('IN', 'NP|<JJ&NN>')
IN NP|<JJ&NN> 
('``', 'NP|<DT&NN>')
`` NP|<DT&NN> 
('VBG', 'NP|<NN&NNS>')
VBG NP|<NN&NNS> 
('NP', 'NP|<PP&UCP-LOC>')
NP NP|<PP&UCP-LOC> 
('DT', 'NP|<NNP&NNS>')
DT NP|<NNP&NNS> 
('DT', 'NP|<RB&VBN>')
DT NP|<RB&VBN> 
('ADJP', 'NP')
ADJP NP 
('NP', 'NP|<ADVP&NNP>')
NP NP|<ADVP&NNP> 
('DT', 'NP|<QP&JJ>')
DT NP|<QP&JJ> 
('PRP$', 'NP|<NNS&POS>')
PRP$ NP|<NNS&POS> 
('NP', 'NNP')
NP NNP 
('PRP$', 'NP|<ADJP&NP>')
PRP$ NP|<ADJP&NP> 
('CD', 'NP|<NN&POS>')
CD NP|<NN&POS> 
('NP', 'NP|<NN&RP>')
NP NP|<NN&RP> 
('PRP$', 'NP|<CD&CC>')
PRP$ NP|<CD&CC> 
('PRP$', 'NP|<VBN&NN>')
PRP$ NP|<VBN&NN> 
('CD', 'NP|<JJS&NNS>')
CD NP|<JJS&NNS> 
('DT', 'NP|<VBN&ADJP>')
DT NP|<VBN&ADJP> 
('RBR', 'NP|<VBG&CC>')
RBR NP|<VBG&CC> 
('NP', 'NP|<CC&ADVP-TMP>')
NP NP|<CC&ADVP-TMP> 
('NNP', 'NP|<CD&NN>')
NNP NP|<CD&NN> 
('DT', 'NP|<NNS&CC>')
DT NP|<NNS&CC> 
('DT', 'NP|<VBN&NNS>')
DT NP|<VBN&NNS> 
(

('VBN', 'PRT')
VBN PRT 
('PP-LOC', 'NP-SBJ|<PP-LOC&NP-TMP>')
PP-LOC NP-SBJ|<PP-LOC&NP-TMP> 
('PP-LOC', 'SBAR-PRP')
PP-LOC SBAR-PRP 
(',', 'PP')
, PP 
(',', 'UCP|<CC&ADVP-TMP>')
, UCP|<CC&ADVP-TMP> 
(',', 'UCP|<CC&ADVP-MNR>')
, UCP|<CC&ADVP-MNR> 
(',', 'UCP|<CC&NN>')
, UCP|<CC&NN> 
('``', 'NX-TTL')
`` NX-TTL 
('RB', 'PP')
RB PP 
('NNS', 'NNS')
NNS NNS 
('VBN', 'SBAR-TMP')
VBN SBAR-TMP 
('0',)
0 
('ADVP', 'UCP-MNR|<,&PP>')
ADVP UCP-MNR|<,&PP> 
('PP', 'UCP-MNR|<,&CC>')
PP UCP-MNR|<,&CC> 
('ADVP', 'UCP-MNR|<CC&PP>')
ADVP UCP-MNR|<CC&PP> 
(',', 'S|<INTJ&,>')
, S|<INTJ&,> 
('ADJP-PRD', 'UCP-ADV')
ADJP-PRD UCP-ADV 
('VBD', 'VP|<NP&PP-DIR>')
VBD VP|<NP&PP-DIR> 
('VBD', 'VP|<NP&ADVP-DIR>')
VBD VP|<NP&ADVP-DIR> 
('VBD', 'VP|<NP&NP-TMP>')
VBD VP|<NP&NP-TMP> 
('VBD', 'VP|<NP&PP-CLR>')
VBD VP|<NP&PP-CLR> 
('VBD', 'VP|<NP&SBAR-PRP>')
VBD VP|<NP&SBAR-PRP> 
('VBD', 'NP')
VBD NP 
('VBD', 'VP|<NP&PP-DTV>')
VBD VP|<NP&PP-DTV> 
('VBD', "VP|<NP&''>")
VBD VP|<NP&''> 
('VBD', 'VP|<NP&PP-TMP>')
VBD VP|<NP&PP-

('VP', 'NP-SBJ')
VP NP-SBJ 
('CC', 'SINV|<VBP&NP-SBJ>')
CC SINV|<VBP&NP-SBJ> 
('CONJP', 'SINV|<VBZ&NP-SBJ>')
CONJP SINV|<VBZ&NP-SBJ> 
('MD', 'SINV|<NP-SBJ&VP>')
MD SINV|<NP-SBJ&VP> 
('ADVP', 'SINV|<VP&NP-SBJ>')
ADVP SINV|<VP&NP-SBJ> 
('PP-TMP', 'SINV|<VP&NP-SBJ>')
PP-TMP SINV|<VP&NP-SBJ> 
('VBZ', 'SINV|<NP-SBJ&VP>')
VBZ SINV|<NP-SBJ&VP> 
('VBD', 'NP-SBJ')
VBD NP-SBJ 
('ADVP-TMP', 'SINV|<PP-TMP&VBD>')
ADVP-TMP SINV|<PP-TMP&VBD> 
(':', 'NP-PRD=2')
: NP-PRD=2 
('JJ', 'VBG')
JJ VBG 
('PP', 'SBAR-PRP')
PP SBAR-PRP 
('CC', 'PP')
CC PP 
(':', 'SBAR|<CC&SBAR>')
: SBAR|<CC&SBAR> 
('VB', "VP|<''&NP>")
VB VP|<''&NP> 
('JJ', 'NP|<NNPS&CC>')
JJ NP|<NNPS&CC> 
('JJ', 'NNPS')
JJ NNPS 
('JJ', 'NP|<NNPS&NN>')
JJ NP|<NNPS&NN> 
('JJ', 'NP-SBJ|<NNS&NN>')
JJ NP-SBJ|<NNS&NN> 
('JJ', 'NP-SBJ|<NNS&-RRB->')
JJ NP-SBJ|<NNS&-RRB-> 
('JJ', 'NP-SBJ|<NNS&CC>')
JJ NP-SBJ|<NNS&CC> 
('JJ', 'NP-SBJ|<NNS&NNS>')
JJ NP-SBJ|<NNS&NNS> 
('JJ', "NP-SBJ|<NNS&''>")
JJ NP-SBJ|<NNS&''> 
('JJ', 'NNS')
JJ NNS 
('JJ', 'NP-SBJ|<NNS&,>

('frequent',)
frequent 
('network-buying',)
network-buying 
('ethiopian',)
ethiopian 
('newborn',)
newborn 
('discouraging',)
discouraging 
('polish',)
polish 
('arcane',)
arcane 
('non-religious',)
non-religious 
('common',)
common 
('sterile',)
sterile 
('conflicting',)
conflicting 
('important',)
important 
('photographic',)
photographic 
('chicago-based',)
chicago-based 
('lavish',)
lavish 
('fertile',)
fertile 
('concerned',)
concerned 
('inaccurate',)
inaccurate 
('later',)
later 
('indicated',)
indicated 
('soluble',)
soluble 
('short-wave',)
short-wave 
('populous',)
populous 
('image-building',)
image-building 
('short-lived',)
short-lived 
('analytic',)
analytic 
('corporate',)
corporate 
('generous',)
generous 
('all-too-sincere',)
all-too-sincere 
('imported',)
imported 
('audio-visual',)
audio-visual 
('hurricane-stricken',)
hurricane-stricken 
('sizzling',)
sizzling 
('immune',)
immune 
('do-everything',)
do-everything 
('functional',)
functional 
('ready',)
ready 
('unpl

('non-interstate',)
non-interstate 
('60.25-point',)
60.25-point 
('old-fashioned',)
old-fashioned 
('bottled',)
bottled 
('bioequivalence-therapeutic-equivalence',)
bioequivalence-therapeutic-equivalence 
('intraday',)
intraday 
('sore',)
sore 
('mild',)
mild 
('expected',)
expected 
('stuttgart-based',)
stuttgart-based 
('horrific',)
horrific 
('autographed',)
autographed 
('placid',)
placid 
('held',)
held 
('forced',)
forced 
('kind',)
kind 
('then-president',)
then-president 
('highway-relief',)
highway-relief 
('instruction-set',)
instruction-set 
('transitional',)
transitional 
('unpaid',)
unpaid 
('carefree',)
carefree 
('above-average',)
above-average 
('procedural',)
procedural 
('pessimistic',)
pessimistic 
('bustling',)
bustling 
('well-intentioned',)
well-intentioned 
('distinct',)
distinct 
('spanish-language',)
spanish-language 
('subordinated',)
subordinated 
('old',)
old 
('speculative',)
speculative 
('less-educated',)
less-educated 
('haunted',)
haunted 
('underlying

('prosperous',)
prosperous 
('1-for-10',)
1-for-10 
('appreciable',)
appreciable 
('three-day',)
three-day 
('tweety-bird',)
tweety-bird 
('nontraditional',)
nontraditional 
('industrywide',)
industrywide 
('magical',)
magical 
('witty',)
witty 
('civil',)
civil 
('test-coaching',)
test-coaching 
('capital-markets',)
capital-markets 
('unfinished',)
unfinished 
('apparent',)
apparent 
('seesaw',)
seesaw 
('secret',)
secret 
('index-linked',)
index-linked 
('electrical',)
electrical 
('top-tier',)
top-tier 
('classy',)
classy 
('irish',)
irish 
('self-regulatory',)
self-regulatory 
('excessive',)
excessive 
('non-nms',)
non-nms 
('barren',)
barren 
('shocking',)
shocking 
('defense-related',)
defense-related 
('booming',)
booming 
('lovely',)
lovely 
('whole',)
whole 
('power-transmission',)
power-transmission 
('futures-related',)
futures-related 
('genuine',)
genuine 
('business-class',)
business-class 
('inauspicious',)
inauspicious 
('corrupt',)
corrupt 
('three-digit',)
three-digit

('uninterruptable',)
uninterruptable 
('creative',)
creative 
('60-second',)
60-second 
('home-produced',)
home-produced 
('seven-year',)
seven-year 
('strapped',)
strapped 
('compound',)
compound 
('day-today',)
day-today 
('afraid',)
afraid 
('relaxing',)
relaxing 
('unsteady',)
unsteady 
('refined',)
refined 
('inept',)
inept 
('sleepy',)
sleepy 
('unobtrusive',)
unobtrusive 
('soft-sell',)
soft-sell 
('choice',)
choice 
('coming-out',)
coming-out 
('disliked',)
disliked 
('snobbish',)
snobbish 
('chi-chi',)
chi-chi 
('85-title',)
85-title 
('sobering',)
sobering 
('swift',)
swift 
('incoherent',)
incoherent 
('angry',)
angry 
('computer-generated',)
computer-generated 
('unclassified',)
unclassified 
('classical',)
classical 
('infectious',)
infectious 
('earnings-growth',)
earnings-growth 
('diverse',)
diverse 
('new',)
new 
('understandable',)
understandable 
('unforeseen',)
unforeseen 
('gray',)
gray 
('non-patent',)
non-patent 
('end',)
end 
('health-care',)
health-care 
('thir

('lower-volume',)
lower-volume 
('rigorous',)
rigorous 
('clinical',)
clinical 
('market-share',)
market-share 
('unanticipated',)
unanticipated 
('comic',)
comic 
('first-half',)
first-half 
('stable',)
stable 
('across-the-board',)
across-the-board 
('second-quarter',)
second-quarter 
('touchy',)
touchy 
('nonessential',)
nonessential 
('definitive',)
definitive 
('three-party',)
three-party 
('foreign-exchange',)
foreign-exchange 
('quantitative',)
quantitative 
('capacity-expansion',)
capacity-expansion 
('divisive',)
divisive 
('thick',)
thick 
('recipient',)
recipient 
('joint-venture',)
joint-venture 
('assistant',)
assistant 
('before-and-after',)
before-and-after 
('stereotyped',)
stereotyped 
('program-bashing',)
program-bashing 
('contained',)
contained 
('phony',)
phony 
('rolling',)
rolling 
('ever-narrowing',)
ever-narrowing 
('curious',)
curious 
('usual',)
usual 
('heavy',)
heavy 
('then',)
then 
('keynesian',)
keynesian 
('blood-and-guts',)
blood-and-guts 
('constant',

center-stage 
('aids-research',)
aids-research 
('chest-swelling',)
chest-swelling 
('44-year-old',)
44-year-old 
('bureacratic',)
bureacratic 
('authorized',)
authorized 
('garish',)
garish 
('manageable',)
manageable 
('latvian',)
latvian 
('electronic',)
electronic 
('winning',)
winning 
('dubious',)
dubious 
('average',)
average 
('unmarked',)
unmarked 
('plausible',)
plausible 
('unencumbered',)
unencumbered 
('onerous',)
onerous 
('straight',)
straight 
('dazzling',)
dazzling 
('ancillary',)
ancillary 
('urban',)
urban 
('boxy',)
boxy 
('have',)
have 
('numerous',)
numerous 
('n.c.-based',)
n.c.-based 
('institutional',)
institutional 
('tigrean',)
tigrean 
('zealand-based',)
zealand-based 
('national',)
national 
('guest',)
guest 
('chemical',)
chemical 
('recessionary',)
recessionary 
('184-day',)
184-day 
('would-be',)
would-be 
('non-socialist',)
non-socialist 
('imperative',)
imperative 
('aware',)
aware 
('medium-grade',)
medium-grade 
('burnt',)
burnt 
('tactical',)
tactic

('DT', 'NP-SBJ|<-LRB-&JJ>')
DT NP-SBJ|<-LRB-&JJ> 
('DT', 'NP-SBJ|<NN&RB>')
DT NP-SBJ|<NN&RB> 
('RB', 'NP-SBJ|<JJ&JJ>')
RB NP-SBJ|<JJ&JJ> 
('NP', 'NP-TMP')
NP NP-TMP 
('DT', 'NP-SBJ|<-LRB-&NN>')
DT NP-SBJ|<-LRB-&NN> 
('JJS', 'NNPS')
JJS NNPS 
('JJ', 'NP-SBJ|<CD&NN>')
JJ NP-SBJ|<CD&NN> 
('DT', 'NP-SBJ|<NAC&NN>')
DT NP-SBJ|<NAC&NN> 
('DT', 'NP-SBJ|<JJS&NN>')
DT NP-SBJ|<JJS&NN> 
('DT', 'NP-SBJ|<CD&VBN>')
DT NP-SBJ|<CD&VBN> 
('RB', 'NP-SBJ|<RB&DT>')
RB NP-SBJ|<RB&DT> 
('NNP', 'NP-SBJ|<NNP&CD>')
NNP NP-SBJ|<NNP&CD> 
('NAC', 'NP-SBJ|<VBD&NNS>')
NAC NP-SBJ|<VBD&NNS> 
('UCP', 'NNS')
UCP NNS 
('VBG', 'NP-SBJ|<NN&NNS>')
VBG NP-SBJ|<NN&NNS> 
('PRP$', 'NP-SBJ|<``&JJ>')
PRP$ NP-SBJ|<``&JJ> 
('DT', 'NP-SBJ|<NN&NNP>')
DT NP-SBJ|<NN&NNP> 
('NNP', 'NP-SBJ|<,&NNP>')
NNP NP-SBJ|<,&NNP> 
('NN', 'NP-SBJ|<NNP&NNP>')
NN NP-SBJ|<NNP&NNP> 
('NP', 'NP-SBJ|<,&NP-LOC>')
NP NP-SBJ|<,&NP-LOC> 
('NP', 'NP-SBJ|<JJS&NNS>')
NP NP-SBJ|<JJS&NNS> 
('JJ', 'NP-SBJ|<UCP&NNS>')
JJ NP-SBJ|<UCP&NNS> 
('JJS', 'NNS')
JJS NNS 
('PR

hats 
('measures',)
measures 
('stockbrokers',)
stockbrokers 
('resins',)
resins 
('mountains',)
mountains 
('blends',)
blends 
('starts',)
starts 
('syms',)
syms 
('prostitutes',)
prostitutes 
('pools',)
pools 
('coups',)
coups 
('flavors',)
flavors 
('minutes',)
minutes 
('upgrades',)
upgrades 
('speakers',)
speakers 
('hearings',)
hearings 
('police',)
police 
('counters',)
counters 
('settlements',)
settlements 
('belts',)
belts 
('forklifts',)
forklifts 
('miners',)
miners 
('achievements',)
achievements 
('factories',)
factories 
('chauffeurs',)
chauffeurs 
('tabacs',)
tabacs 
('kinds',)
kinds 
('instructions',)
instructions 
('apologists',)
apologists 
('offerings',)
offerings 
('provisions',)
provisions 
('automakers',)
automakers 
('certificates',)
certificates 
('forest-products',)
forest-products 
('rebates',)
rebates 
('lbos',)
lbos 
('columns',)
columns 
('cars',)
cars 
('songs',)
songs 
('scammers',)
scammers 
('linkages',)
linkages 
('neighborhoods',)
neighborhoods 
('po

('accusers',)
accusers 
('reruns',)
reruns 
('gloaters',)
gloaters 
('aircraft',)
aircraft 
('grounds',)
grounds 
('troops',)
troops 
('fighters',)
fighters 
('metals',)
metals 
('lesbians',)
lesbians 
('blossoms',)
blossoms 
('chips',)
chips 
('babelists',)
babelists 
('counties',)
counties 
('delays',)
delays 
('vehicles',)
vehicles 
('conferences',)
conferences 
('facilities',)
facilities 
('dwellers',)
dwellers 
('rackets',)
rackets 
('necessities',)
necessities 
('memorandums',)
memorandums 
('professionals',)
professionals 
('athletes',)
athletes 
('claimants',)
claimants 
('frailties',)
frailties 
('guns',)
guns 
('nests',)
nests 
('gods',)
gods 
('pence',)
pence 
('stations',)
stations 
('cows',)
cows 
('rubles',)
rubles 
('facsimiles',)
facsimiles 
('expressions',)
expressions 
('revels',)
revels 
('wills',)
wills 
('criteria',)
criteria 
('aspects',)
aspects 
('ious',)
ious 
('representatives',)
representatives 
('pigs',)
pigs 
('taxes',)
taxes 
('wiretaps',)
wiretaps 
('woes

('enterprises',)
enterprises 
('payments',)
payments 
('stones',)
stones 
('filings',)
filings 
('administrators',)
administrators 
('investors',)
investors 
('rings',)
rings 
('tries',)
tries 
('routes',)
routes 
('surfers',)
surfers 
('shops',)
shops 
('members',)
members 
('organizations',)
organizations 
('transports',)
transports 
('kilograms',)
kilograms 
('smokescreens',)
smokescreens 
('trillions',)
trillions 
('polyps',)
polyps 
('aggregates',)
aggregates 
('museums',)
museums 
('fliers',)
fliers 
('proposals',)
proposals 
('statements',)
statements 
('movements',)
movements 
('boxes',)
boxes 
('shots',)
shots 
('segments',)
segments 
('buy-outs',)
buy-outs 
('attacks',)
attacks 
('earthworms',)
earthworms 
('observers',)
observers 
('underwriters',)
underwriters 
('neanderthals',)
neanderthals 
('gunmen',)
gunmen 
('nationalists',)
nationalists 
('others',)
others 
('tuitions',)
tuitions 
('restaurants',)
restaurants 
('preferences',)
preferences 
('responsibilities',)
respon

('types',)
types 
('fields',)
fields 
('creatures',)
creatures 
('centuries',)
centuries 
('months',)
months 
('instances',)
instances 
('appointments',)
appointments 
('articles',)
articles 
('arts',)
arts 
('beasts',)
beasts 
('pressures',)
pressures 
('bastions',)
bastions 
('extensions',)
extensions 
('photographs',)
photographs 
('rises',)
rises 
('yearbooks',)
yearbooks 
('matters',)
matters 
('gimmicks',)
gimmicks 
('founders',)
founders 
('claims',)
claims 
("'70s",)
'70s 
('sections',)
sections 
('ships',)
ships 
('t-shirts',)
t-shirts 
('containers',)
containers 
('warrants',)
warrants 
('plainclothes',)
plainclothes 
('suggestions',)
suggestions 
('wars',)
wars 
('authorities',)
authorities 
('sexes',)
sexes 
('barrels',)
barrels 
('boomers',)
boomers 
('proprietors',)
proprietors 
('readers',)
readers 
('judgments',)
judgments 
('girls',)
girls 
('sharks',)
sharks 
('aides',)
aides 
('programmers',)
programmers 
('recessions',)
recessions 
('demographics',)
demographics 
('

('PP-LOC', 'NP')
PP-LOC NP 
('``', 'ADJP')
`` ADJP 
(',', 'VP|<CC&SBAR-PRP>')
, VP|<CC&SBAR-PRP> 
(',', 'VP|<CC&VP+VP>')
, VP|<CC&VP+VP> 
(',', 'VP|<CC&``>')
, VP|<CC&``> 
(',', 'VP|<CC&VBD>')
, VP|<CC&VBD> 
(',', 'VP|<CC&RB>')
, VP|<CC&RB> 
(',', 'VP|<CC&ADVP>')
, VP|<CC&ADVP> 
(',', 'VP|<CC&VP+PP-TMP=1>')
, VP|<CC&VP+PP-TMP=1> 
(',', 'VP|<CC&VP>')
, VP|<CC&VP> 
('ADJP', 'NN')
ADJP NN 
('NP', 'NP-SBJ|<,&NP>')
NP NP-SBJ|<,&NP> 
('NP', 'NP-SBJ|<,&CC>')
NP NP-SBJ|<,&CC> 
('NP', ',')
NP , 
('NP', "NP-SBJ|<,&''>")
NP NP-SBJ|<,&''> 
('NP', 'NP-SBJ|<,&ADVP>')
NP NP-SBJ|<,&ADVP> 
('NP', 'NP-SBJ|<,&PP>')
NP NP-SBJ|<,&PP> 
('ADVP-MNR', 'SBAR-PRP')
ADVP-MNR SBAR-PRP 
('PRT', 'VP|<NP-PRD&,>')
PRT VP|<NP-PRD&,> 
('PRT', 'NP-PRD')
PRT NP-PRD 
('RBR', 'NP|<ADJP&NN>')
RBR NP|<ADJP&NN> 
('PP-LOC', 'SBAR')
PP-LOC SBAR 
('PP-DIR', 'VP|<PP-LOC&PP-TMP>')
PP-DIR VP|<PP-LOC&PP-TMP> 
('PP-DIR', 'VP|<PP-LOC&PP-LOC>')
PP-DIR VP|<PP-LOC&PP-LOC> 
('PP-DIR', 'PP-LOC')
PP-DIR PP-LOC 
('PP-DIR', 'VP|<PP-LOC&PP-DIR>

UH TOP|<.&UH> 
('SBAR-SBJ', 'TOP|<VP&.>')
SBAR-SBJ TOP|<VP&.> 
('NP-SBJ', 'TOP|<PP&VP>')
NP-SBJ TOP|<PP&VP> 
('CC', 'TOP|<PP-LOC&NP-TMP>')
CC TOP|<PP-LOC&NP-TMP> 
('NP-SBJ', 'TOP|<ADVP-LOC&VP>')
NP-SBJ TOP|<ADVP-LOC&VP> 
('S', 'TOP|<:&``>')
S TOP|<:&``> 
('PP-LOC', 'TOP|<:&:>')
PP-LOC TOP|<:&:> 
('PP', 'TOP|<PRN&NP-SBJ>')
PP TOP|<PRN&NP-SBJ> 
('DT', 'TOP|<NNP&NNP>')
DT TOP|<NNP&NNP> 
('CC', 'TOP|<NP-SBJ&ADVP-TMP>')
CC TOP|<NP-SBJ&ADVP-TMP> 
('PP', 'TOP|<,&``>')
PP TOP|<,&``> 
('NP', 'TOP|<PRN&.>')
NP TOP|<PRN&.> 
('NP', 'TOP|<PP-LOC&PP>')
NP TOP|<PP-LOC&PP> 
('NP-ADV', 'TOP|<NP-SBJ&VP>')
NP-ADV TOP|<NP-SBJ&VP> 
('RB', 'TOP|<RB&DT>')
RB TOP|<RB&DT> 
('``', 'TOP|<WHADVP&MD>')
`` TOP|<WHADVP&MD> 
('NNP', 'TOP|<NNP&NN>')
NNP TOP|<NNP&NN> 
('ADVP', 'TOP|<,&NP-TMP>')
ADVP TOP|<,&NP-TMP> 
('NP-VOC', 'TOP|<,&NP-SBJ>')
NP-VOC TOP|<,&NP-SBJ> 
('NP-SBJ', 'TOP|<PP-TMP&VP>')
NP-SBJ TOP|<PP-TMP&VP> 
('NNPS', 'NNP')
NNPS NNP 
('NP', 'TOP|<:&S>')
NP TOP|<:&S> 
('NP-TMP', 'TOP|<S&CC>')
NP-TMP TOP|<S&CC

RB VP 
('RB', 'TOP|<DT&NN>')
RB TOP|<DT&NN> 
('ADVP-TMP', '.')
ADVP-TMP . 
(',', 'PP-CLR')
, PP-CLR 
('IN', 'NP')
IN NP 
('RB', 'ADVP-PRD')
RB ADVP-PRD 
(',', 'PRN')
, PRN 
('NNS', 'NP|<NP&NNS>')
NNS NP|<NP&NNS> 
('NNP', 'NP|<CD&ADJP>')
NNP NP|<CD&ADJP> 
('NNP', 'NP|<CD&,>')
NNP NP|<CD&,> 
('NNP', 'CD')
NNP CD 
('NNP', 'NP|<CD&NN>')
NNP NP|<CD&NN> 
('NNP', 'NP|<CD&NNS>')
NNP NP|<CD&NNS> 
('NNP', 'NP|<CD&JJ>')
NNP NP|<CD&JJ> 
('NNP', 'NP|<CD&NNP>')
NNP NP|<CD&NNP> 
('NP-LOC', '.')
NP-LOC . 
('JJ', 'NP+QP|<IN&CD>')
JJ NP+QP|<IN&CD> 
('NP', 'NN')
NP NN 
('NP', 'NP|<NN&NNS>')
NP NP|<NN&NNS> 
('NP', 'NP|<NN&NN>')
NP NP|<NN&NN> 
('NP-PRD', "VP|<''&PP-LOC>")
NP-PRD VP|<''&PP-LOC> 
('IN', 'QP|<CD&IN>')
IN QP|<CD&IN> 
('IN', 'QP|<CD&NNS>')
IN QP|<CD&NNS> 
('IN', 'CD')
IN CD 
('IN', 'QP|<CD&CC>')
IN QP|<CD&CC> 
('IN', 'QP|<CD&CD>')
IN QP|<CD&CD> 
('CD', 'NP|<VBG&NNS>')
CD NP|<VBG&NNS> 
("''", 'VP|<ADVP&,>')
'' VP|<ADVP&,> 
('VBG', 'VP|<CC&VBG>')
VBG VP|<CC&VBG> 
('CC', 'PRN|<NNP&,>')
CC PRN|<NNP

(',', 'SBAR')
, SBAR 
(',', 'VP|<SBAR&SBAR-PRP>')
, VP|<SBAR&SBAR-PRP> 
("''", 'VP|<PP-TMP&,>')
'' VP|<PP-TMP&,> 
("''", 'PP-TMP')
'' PP-TMP 
('NP-SBJ', 'TOP|<ADVP-LOC&VP>')
NP-SBJ TOP|<ADVP-LOC&VP> 
('PP-LOC', 'NP-TMP')
PP-LOC NP-TMP 
("''", 'SBAR')
'' SBAR 
('``', "NX|<NX-TTL&''>")
`` NX|<NX-TTL&''> 
('``', 'NX-TTL')
`` NX-TTL 
('ADJP', 'TOP|<,&PP>')
ADJP TOP|<,&PP> 
('ADJP', 'TOP|<,&VP>')
ADJP TOP|<,&VP> 
('ADJP', 'TOP|<,&NP-SBJ>')
ADJP TOP|<,&NP-SBJ> 
('NNP', 'CD')
NNP CD 
('NP-TMP', 'VP|<:&PP-LOC>')
NP-TMP VP|<:&PP-LOC> 
('ADJP', 'PP-TMP')
ADJP PP-TMP 
('PP', '-RRB-')
PP -RRB- 
('JJ', 'TOP|<JJ&NN>')
JJ TOP|<JJ&NN> 
('VBG', 'VP')
VBG VP 
('PP-LOC-PRD', 'ADVP-TMP')
PP-LOC-PRD ADVP-TMP 
('NP-2', 'PP-TMP')
NP-2 PP-TMP 
('CC', 'SBAR')
CC SBAR 
('NP+NP', '-RRB-')
NP+NP -RRB- 
('NNPS', 'NP|<CC&NNP>')
NNPS NP|<CC&NNP> 
('NNPS', 'NP|<CC&NNPS>')
NNPS NP|<CC&NNPS> 
('PP', ':')
PP : 
('PRT', 'ADJP-PRD')
PRT ADJP-PRD 
('JJR', 'NP|<,&ADJP>')
JJR NP|<,&ADJP> 
('JJR', 'NP|<,&JJ>')
JJR NP|<,&JJ> 


('missed',)
missed 
('trekked',)
trekked 
('divided',)
divided 
('averaged',)
averaged 
('lied',)
lied 
('canceled',)
canceled 
('batted',)
batted 
('relented',)
relented 
('finished',)
finished 
('jolted',)
jolted 
('invested',)
invested 
('swamped',)
swamped 
('swelled',)
swelled 
('received',)
received 
('ousted',)
ousted 
('conspired',)
conspired 
('made',)
made 
('dipped',)
dipped 
('bought',)
bought 
('reversed',)
reversed 
('stuck',)
stuck 
('presented',)
presented 
('preferred',)
preferred 
('spooked',)
spooked 
('voted',)
voted 
('protected',)
protected 
('restrained',)
restrained 
('trailed',)
trailed 
('marked',)
marked 
('ruled',)
ruled 
('invited',)
invited 
('prompted',)
prompted 
('brought',)
brought 
('tucked',)
tucked 
('met',)
met 
('attached',)
attached 
('headed',)
headed 
('fared',)
fared 
('marketed',)
marketed 
('arose',)
arose 
('introduced',)
introduced 
('surrendered',)
surrendered 
('backed',)
backed 
('bottomed',)
bottomed 
('reappraised',)
reappraised 
('so

('NP', 'NP-PRD|<:&CC>')
NP NP-PRD|<:&CC> 
('NP', 'NP-PRD|<PP-TMP&PP-LOC>')
NP NP-PRD|<PP-TMP&PP-LOC> 
('NNP', 'NP-PRD|<NNP&NN>')
NNP NP-PRD|<NNP&NN> 
('DT', 'NP-PRD|<``&NX-TTL>')
DT NP-PRD|<``&NX-TTL> 
('NP', 'NP-PRD|<JJ&JJ>')
NP NP-PRD|<JJ&JJ> 
('NP', 'JJ')
NP JJ 
('``', 'NP-PRD|<NP-TTL&,>')
`` NP-PRD|<NP-TTL&,> 
('NP', 'NP-PRD|<,&ADVP-TMP>')
NP NP-PRD|<,&ADVP-TMP> 
('NNP', 'NNP')
NNP NNP 
('RB', 'NP-PRD|<DT&NN>')
RB NP-PRD|<DT&NN> 
('JJ', 'NP-PRD|<NNP&NN>')
JJ NP-PRD|<NNP&NN> 
('QP', 'NP-PRD|<DT&NN>')
QP NP-PRD|<DT&NN> 
('DT', 'NP-PRD|<NNP&NNPS>')
DT NP-PRD|<NNP&NNPS> 
('JJ', 'NNP')
JJ NNP 
('RB', 'NP-PRD|<DT&JJ>')
RB NP-PRD|<DT&JJ> 
('PRP$', 'NP-PRD|<ADJP&NN>')
PRP$ NP-PRD|<ADJP&NN> 
('NP', 'NP-PRD|<ADVP&:>')
NP NP-PRD|<ADVP&:> 
('NP', 'NP-PRD|<PP&PP-TMP>')
NP NP-PRD|<PP&PP-TMP> 
('DT', 'NP-PRD|<JJ&,>')
DT NP-PRD|<JJ&,> 
('NP', 'NP-PRD|<PP&,>')
NP NP-PRD|<PP&,> 
('NP', 'NP-PRD|<JJS&NN>')
NP NP-PRD|<JJS&NN> 
('NP', 'NP-PRD|<PP&.>')
NP NP-PRD|<PP&.> 
('``', "NP-PRD|<NP&''>")
`` NP-PRD

NP-ADV JJR 
('NP-ADV', 'ADJP-PRD|<JJR&PP>')
NP-ADV ADJP-PRD|<JJR&PP> 
('VBN', 'PP')
VBN PP 
('RB',)
RB 
('RB', 'RB')
RB RB 
('``', "ADJP-PRD|<JJ&''>")
`` ADJP-PRD|<JJ&''> 
('ADJP', 'ADJP-PRD|<PRN&SBAR>')
ADJP ADJP-PRD|<PRN&SBAR> 
('JJ', 'SBAR-ADV')
JJ SBAR-ADV 
('RB', 'ADJP-PRD|<JJR&PP>')
RB ADJP-PRD|<JJR&PP> 
('JJR',)
JJR 
('RB', 'ADJP-PRD|<VBN&PP-LOC>')
RB ADJP-PRD|<VBN&PP-LOC> 
('JJ', 'RB')
JJ RB 
('ADJP', 'PP')
ADJP PP 
('CC', 'ADJP-PRD|<JJ&CC>')
CC ADJP-PRD|<JJ&CC> 
('DT', 'ADJP-PRD|<JJ&CC>')
DT ADJP-PRD|<JJ&CC> 
('NNP',)
NNP 
('``', 'ADJP-PRD|<RB&JJ>')
`` ADJP-PRD|<RB&JJ> 
('JJ', 'ADJP-PRD|<CC&JJR>')
JJ ADJP-PRD|<CC&JJR> 
('ADJP', 'ADJP-PRD|<,&CC>')
ADJP ADJP-PRD|<,&CC> 
('NN', 'VBN')
NN VBN 
('RB', 'ADJP-PRD|<RBR&JJ>')
RB ADJP-PRD|<RBR&JJ> 
('ADVP', 'ADJP-PRD|<JJ&PP>')
ADVP ADJP-PRD|<JJ&PP> 
('RB', 'NP')
RB NP 
('RB', 'PP')
RB PP 
('RB', 'ADJP-PRD|<JJ&CC>')
RB ADJP-PRD|<JJ&CC> 
('NP-ADV', 'ADJP-PRD|<JJ&PP>')
NP-ADV ADJP-PRD|<JJ&PP> 
('NN', 'ADJP-PRD|<JJ&PP>')
NN ADJP-PRD|<JJ&PP>

In [453]:
print(uhg)



In [515]:
uhg["TOP"]

defaultdict(float,
            {"'' TOP|<ADVP&,>": 6.712310377231843e-05,
             "'' TOP|<NP&PP>": 6.712310377231843e-05,
             "'' TOP|<NP-SBJ&ADVP>": 6.712310377231843e-05,
             "'' TOP|<PP-LOC&,>": 6.712310377231843e-05,
             "'' TOP|<S&:>": 6.712310377231843e-05,
             '-LRB- TOP|<ADVP&,>': 6.712310377231843e-05,
             '-LRB- TOP|<ADVP&-RRB->': 6.712310377231843e-05,
             '-LRB- TOP|<FRAG&-RRB->': 6.712310377231843e-05,
             '-LRB- TOP|<NP&,>': 6.712310377231843e-05,
             '-LRB- TOP|<NP&:>': 0.0002013693113169553,
             '-LRB- TOP|<NP&PP>': 0.0002013693113169553,
             '-LRB- TOP|<NP-SBJ&,>': 6.712310377231843e-05,
             '-LRB- TOP|<NP-SBJ&ADVP-TMP>': 0.00013424620754463686,
             '-LRB- TOP|<NP-SBJ&VP>': 0.0022150624244865083,
             '-LRB- TOP|<PP&,>': 0.00013424620754463686,
             '-LRB- TOP|<PP-LOC&,>': 0.00013424620754463686,
             '-LRB- TOP|<PP-TMP&,>': 0.000134

In [488]:
another_sentence = ["the", "<CD>", "additional", "defendants", "were", "n't", "parties", "to", "the", "settlement", "."]


In [491]:
ugh_sentence = ["the", "company", "and", "its", "executives", "deny", "the", "charges", "."]

In [499]:
bigger_trees = []
f = open("bigger_treebank_2.psd", "r")
print(f)
x = steven_tree.Tree.from_stream(f)
for item in x:
    bigger_trees.append(item)
f.close()

<open file 'bigger_treebank_2.psd', mode 'r' at 0x10b43fc90>


In [500]:
len(bigger_trees)

1187

In [501]:
bigger_trees[0]

(TOP
    (NP-SBJ
        (NP
            (NNP <NNP>)
            (NNP <NNP>)
        )
        (, ,)
        (ADJP
            (NP
                (CD <CD>)
                (NNS years)
            )
            (JJ old)
        )
        (, ,)
    )
    (VP
        (MD will)
        (VP
            (VB join)
            (NP
                (DT the)
                (NN board)
            )
            (PP-CLR
                (IN as)
                (NP
                    (DT a)
                    (JJ nonexecutive)
                    (NN director)
                )
            )
            (NP-TMP
                (NNP <NNP>)
                (CD <CD>)
            )
        )
    )
    (. .)
)

In [509]:
another = ["<NNP>", "<NNP>", "is", "chairman", "of", "<NNP>", "<NNP>", ",", "the", "<NNP>", "publishing", "group", "."]