In [None]:
## Natural Language Understanding

In [None]:
## Querying a Database using sql

In [1]:
import nltk

In [2]:
nltk.data.show_cfg('grammars/book_grammars/sql0.fcfg')

% start S
S[SEM=(?np + WHERE + ?vp)] -> NP[SEM=?np] VP[SEM=?vp]
VP[SEM=(?v + ?pp)] -> IV[SEM=?v] PP[SEM=?pp]
VP[SEM=(?v + ?ap)] -> IV[SEM=?v] AP[SEM=?ap]
NP[SEM=(?det + ?n)] -> Det[SEM=?det] N[SEM=?n]
PP[SEM=(?p + ?np)] -> P[SEM=?p] NP[SEM=?np]
AP[SEM=?pp] -> A[SEM=?a] PP[SEM=?pp]
NP[SEM='Country="greece"'] -> 'Greece'
NP[SEM='Country="china"'] -> 'China'
Det[SEM='SELECT'] -> 'Which' | 'What'
N[SEM='City FROM city_table'] -> 'cities'
IV[SEM=''] -> 'are'
A[SEM=''] -> 'located'
P[SEM=''] -> 'in'


In [18]:
nltk.data.show_cfg('grammars/book_grammars/sql1.fcfg')

% start S
S[SEM=(?np + WHERE + ?vp)] -> NP[SEM=?np] VP[SEM=?vp]
VP[SEM=(?v + ?pp)] -> IV[SEM=?v] PP[SEM=?pp]
VP[SEM=(?v + ?ap)] -> IV[SEM=?v] AP[SEM=?ap]
VP[SEM=(?v + ?np)] -> TV[SEM=?v] NP[SEM=?np]
VP[SEM=(?vp1 + ?c + ?vp2)] -> VP[SEM=?vp1] Conj[SEM=?c] VP[SEM=?vp2]
NP[SEM=(?det + ?n)] -> Det[SEM=?det] N[SEM=?n]
NP[SEM=(?n + ?pp)]  -> N[SEM=?n] PP[SEM=?pp]
NP[SEM=?n]  -> N[SEM=?n]  | CardN[SEM=?n] 
CardN[SEM='1000'] -> '1,000,000' 
PP[SEM=(?p + ?np)] -> P[SEM=?p] NP[SEM=?np]
AP[SEM=?pp] -> A[SEM=?a] PP[SEM=?pp]
NP[SEM='Country="greece"'] -> 'Greece'
NP[SEM='Country="china"'] -> 'China'
Det[SEM='SELECT'] -> 'Which' | 'What'
Conj[SEM='AND'] -> 'and'
N[SEM='City FROM city_table'] -> 'cities'
N[SEM='Population'] -> 'populations'
IV[SEM=''] -> 'are'
TV[SEM=''] -> 'have'
A -> 'located'
P[SEM=''] -> 'in'
P[SEM='>'] -> 'above'


In [None]:
nltk.

In [None]:
## This allows us to parse a query into SQL

In [3]:
from nltk import load_parser

In [5]:
cp = load_parser('grammars/book_grammars/sql0.fcfg')

In [6]:
query = 'What cities are located in China'

In [20]:
query1 = 'What cities are in China and have populations above 1,000,000'

In [21]:
tree1 = list(cp.parse(query1.split()))

ValueError: Grammar does not cover some of the input words: "'and', 'have', 'populations', 'above', '1,000,000'".

In [7]:
trees = list(cp.parse(query.split()))

In [None]:
tree = list(cp.parse(query1.split()))

In [8]:
answer = trees[0].label()['SEM']

In [None]:
ans1 = tree[0].label()['SEM'] 

In [9]:
ans = [s for s in answer if s]

In [None]:
ans1 = [s for s in ans1 if s]

In [None]:
q1 = ' '.join(ans1)
print(q1)

In [10]:
q = ' '.join(answer)
print(q)

SELECT City FROM city_table WHERE   Country="china"


In [11]:
cp = load_parser('grammars/book_grammars/sql0.fcfg', trace=3)

In [12]:
cp

<nltk.parse.featurechart.FeatureChartParser at 0x1c65bd5be88>

In [13]:
from nltk.sem import chat80

In [14]:
rows = chat80.sql_query('corpora/city_database/city.db', q)

In [15]:
for r in rows: print(r[0], end=" ")

canton chungking dairen harbin kowloon mukden peking shanghai sian tientsin 

## Propositional Logic

In [22]:
nltk.boolean_ops()

negation       	-
conjunction    	&
disjunction    	|
implication    	->
equivalence    	<->


In [24]:
read_exp = nltk.sem.Expression.fromstring

In [25]:
read_exp('-(P & Q)')

<NegatedExpression -(P & Q)>

In [26]:
read_exp('P & Q')

<AndExpression (P & Q)>

In [27]:
read_exp('P | (R -> Q)')

<OrExpression (P | (R -> Q))>

In [28]:
read_exp('P <-> -- p')

<IffExpression (P <-> --p)>

In [32]:
lp = nltk.sem.Expression.fromstring
SnF = read_exp('SnF')
NotFnS = read_exp('-FnS')
R = read_exp('SnF -> -FnS')
prover = nltk.Prover9()
prover.prove(NotFnS, [SnF, R])

LookupError: 

===========================================================================
NLTK was unable to find the prover9 file!
Use software specific configuration paramaters or set the PROVER9 environment variable.

  Searched in:
    - /usr/local/bin/prover9
    - /usr/local/bin/prover9/bin
    - /usr/local/bin
    - /usr/bin
    - /usr/local/prover9
    - /usr/local/share/prover9

  For more information on prover9, see:
    <http://www.cs.unm.edu/~mccune/prover9/>
===========================================================================

In [33]:
val = nltk.Valuation([('P', True), ('Q', True), ('R', False)])

In [34]:
val['P']

True

In [35]:
dom = set()

In [36]:
g = nltk.Assignment(dom)

In [37]:
m = nltk.Model(dom, val)

In [39]:
print(m.evaluate('(P & Q)', g))

True


In [40]:
print(m.evaluate('-(P & Q)', g))

False


In [43]:
print(m.evaluate('(P & R)', g))

False


In [44]:
print(m.evaluate('(P | R)', g))

True


## First Order Logic

#### Syntax

In [49]:
read_exp = nltk.sem.Expression.fromstring

In [50]:
exp = read_exp('walk(angus)', type_check=True)

In [51]:
exp.argument

<ConstantExpression angus>

In [52]:
exp.function

<ConstantExpression walk>

In [53]:
exp.function.type

<e,?>

In [54]:
sig = {'walk': '<e, t>'}
exp = read_exp('walk(angus)', signature=sig)
exp.function.type

e

In [55]:
read_expr = nltk.sem.Expression.fromstring
read_expr('dog(cyril)').free()

set()

In [56]:
read_expr('dog(x)').free()

{Variable('x')}

In [57]:
read_expr('own(angus, cyril)').free()

set()

In [58]:
read_expr('exists x.dog(x)').free()

set()

In [59]:
read_expr('((some x.walk(x)) -> sing(x))').free()

{Variable('x')}

In [60]:
read_expr('exists x.own(y, x)').free()

{Variable('y')}

In [61]:
dom = {'b', 'o', 'c'}

In [62]:
v = """
    bertie => b
    olive => o
    cyril => c
    boy => {b}
    girl => {o}
    dog => {c}
    walk => {o, c}
    see => {(b, o), (c, b), (o, c)}
"""
val = nltk.Valuation.fromstring(v)
print(val)

{'bertie': 'b',
 'boy': {('b',)},
 'cyril': 'c',
 'dog': {('c',)},
 'girl': {('o',)},
 'olive': 'o',
 'see': {('b', 'o'), ('o', 'c'), ('c', 'b')},
 'walk': {('o',), ('c',)}}


In [63]:
('o', 'c') in val['see']

True

In [72]:
('o',), ('c') in val['walk']

(('o',), False)

In [69]:
('o',) in val['girl']

True

## Individual Variables and Assignments

In [73]:
g = nltk.Assignment(dom, [('x', 'o'), ('y', 'c')])

In [74]:
g

{'x': 'o', 'y': 'c'}

In [75]:
print(g)

g[c/y][o/x]


In [76]:
m = nltk.Model(dom, val)
m.evaluate('see(olive, y)', g)

True

In [77]:
g['y']

'c'

In [78]:
m.evaluate('see(y, x)', g)

False

In [79]:
g.purge()
g

{}

In [80]:
m.evaluate('see(olive, y)', g)

'Undefined'

In [81]:
m.evaluate('see(bertie, olive) & boy(bertie) & -walk(bertie)', g)

True

## Quantification

In [82]:
m.evaluate('exists x.(girl(x) & walk(x))', g)

True

In [83]:
m.evaluate('girl(x) & walk(x)', g.add('x', 'o'))

True

In [84]:
fmla1 = read_expr('girl(x) | boy(x)')
m.satisfiers(fmla1, 'x', g)

{'b', 'o'}

In [85]:
fmla2 = read_expr('girl(x) -> walk(x)')
m.satisfiers(fmla2, 'x', g)

{'b', 'c', 'o'}

In [86]:
fmla3 = read_expr('walk(x) -> girl(x)')
m.satisfiers(fmla3, 'x', g)

{'b', 'o'}

In [87]:
m.evaluate('all x.(girl(x) -> walk(x))', g)

True

## Quantifier Scope Ambiguity

In [88]:
v2 = """
    bruce => b
    elspeth => e
    julia => j
    matthew => m
    person => {b, e, j, m}
    admire => {(j, b), (b, b), (m, e), (e, m)}
"""
val2 = nltk.Valuation.fromstring(v2)

In [89]:
dom2 = val2.domain
m2 = nltk.Model(dom2, val2)
g2 = nltk.Assignment(dom2)
fmla4 = read_expr('(person(x) -> exists y.(person(y) & admire(x, y)))')
m2.satisfiers(fmla4, 'x', g2)

{'b', 'e', 'j', 'm'}

In [90]:
fmla5 = read_exp('(person(y) & all x.(person(x) -> admire(x, y)))')
m2.satisfiers(fmla5, 'y', g2)

set()

In [91]:
fmla6 = read_expr('(person(y) & all x.((x = bruce | x = julia) -> admire(x, y)))')
m2.satisfiers(fmla6, 'y', g2)

{'b'}

## Model Building

In [92]:
a3 = read_exp('exists x.(man(x) & walks(x))')

In [93]:
c1 = read_exp('mortal(socrate)')

In [94]:
c2 = read_exp('-mortal(socrates)')

In [95]:
mb = nltk.Mace(5)

# The Semantics of English Sentences

### Compositional Semantice in Feature Based Grammar

In [99]:
read_expr = nltk.sem.Expression.fromstring
expr = read_expr(r'\x.(walk(x) & chew_gum(x))')
expr

<LambdaExpression \x.(walk(x) & chew_gum(x))>

In [100]:
expr.free()

set()

In [101]:
print(read_expr(r'\x.(walk(x) & chew_gum(y))'))

\x.(walk(x) & chew_gum(y))


In [102]:
expr = read_expr(r'\x.(walk(x) & chew_gum(x))(gerald)')
print(expr)

\x.(walk(x) & chew_gum(x))(gerald)


In [103]:
print(expr.simplify())

(walk(gerald) & chew_gum(gerald))


In [104]:
print(read_expr(r'\x.\y.(dog(x) & own(y, x))(cyril)').simplify())

\y.(dog(cyril) & own(y,cyril))


In [105]:
 print(read_expr(r'\x.\y.(dog(x) & own(y, x))(cyril, angus)').simplify())

(dog(cyril) & own(angus,cyril))


In [106]:
expr1 = read_expr('exists x.P(x)')
print(expr1)

exists x.P(x)


In [107]:
expr2 = expr1.alpha_convert(nltk.sem.Variable('z'))
print(expr2)

exists z.P(z)


In [108]:
expr1 == expr2

True

In [109]:
expr3 = read_expr('\P.(exists x.P(x))(\y.see(y, x))')
print(expr3)

(\P.exists x.P(x))(\y.see(y,x))


In [110]:
print(expr3.simplify())

exists z1.see(z1,x)


In [111]:
read_expr = nltk.sem.Expression.fromstring
tvp = read_expr(r'\X x.X(\y.chase(x,y))')
np = read_expr(r'(\P.exists x.(dog(x) & P(x)))')
vp = nltk.sem.ApplicationExpression(tvp, np)
print(vp)

(\X x.X(\y.chase(x,y)))(\P.exists x.(dog(x) & P(x)))


In [112]:
print(vp.simplify())

\x.exists z2.(dog(z2) & chase(x,z2))


In [113]:
from nltk import load_parser
parser = load_parser('grammars/book_grammars/simple-sem.fcfg', trace=0)
sentence = 'Angus gives a bone to every dog'
tokens = sentence.split()
for tree in parser.parse(tokens):
    print(tree.label()['SEM'])

all z4.(dog(z4) -> exists z3.(bone(z3) & give(angus,z3,z4)))


In [114]:
sents = ['Irene walks', 'Cyril bites an ankle']
grammar_file = 'grammars/book_grammars/simple-sem.fcfg'
for results in nltk.interpret_sents(sents, grammar_file):
    for (synrep, semrep) in results:
         print(synrep)

(S[SEM=<walk(irene)>]
  (NP[-LOC, NUM='sg', SEM=<\P.P(irene)>]
    (PropN[-LOC, NUM='sg', SEM=<\P.P(irene)>] Irene))
  (VP[NUM='sg', SEM=<\x.walk(x)>]
    (IV[NUM='sg', SEM=<\x.walk(x)>, TNS='pres'] walks)))
(S[SEM=<exists z5.(ankle(z5) & bite(cyril,z5))>]
  (NP[-LOC, NUM='sg', SEM=<\P.P(cyril)>]
    (PropN[-LOC, NUM='sg', SEM=<\P.P(cyril)>] Cyril))
  (VP[NUM='sg', SEM=<\x.exists z5.(ankle(z5) & bite(x,z5))>]
    (TV[NUM='sg', SEM=<\X x.X(\y.bite(x,y))>, TNS='pres'] bites)
    (NP[NUM='sg', SEM=<\Q.exists x.(ankle(x) & Q(x))>]
      (Det[NUM='sg', SEM=<\P Q.exists x.(P(x) & Q(x))>] an)
      (Nom[NUM='sg', SEM=<\x.ankle(x)>]
        (N[NUM='sg', SEM=<\x.ankle(x)>] ankle)))))


In [115]:
v = """
    bertie => b
    olive => o
    cyril => c
    boy => {b}
    girl => {o}
    dog => {c}
    walk => {o, c}
    see => {(b, o), (c, b), (o, c)}
"""
val = nltk.Valuation.fromstring(v)
g = nltk.Assignment(val.domain)
m = nltk.Model(val.domain, val)
sent = 'Cyril sees every boy'
grammar_file = 'grammars/book_grammars/simple-sem.fcfg'
results = nltk.evaluate_sents([sent], grammar_file, m, g)[0]
for (syntree, semrep, value) in results:
    print(semrep)
    print(value)

all z6.(boy(z6) -> see(cyril,z6))
True


## Quantifier Ambiguity Revisited

In [116]:
from nltk.sem import cooper_storage as cs
sentence = 'every girl chases a dog'
trees = cs.parse_with_bindops(sentence, grammar='grammars/book_grammars/storage.fcfg')
semrep = trees[0].label()['SEM']
cs_semrep = cs.CooperStore(semrep)
print(cs_semrep.core)

chase(z2,z3)


In [117]:
for bo in cs_semrep.store:
    print(bo)

bo(\P.all x.(girl(x) -> P(x)),z2)
bo(\P.exists x.(dog(x) & P(x)),z3)


In [119]:
cs_semrep.s_retrieve(trace=True)

Permutation 1
   (\P.all x.(girl(x) -> P(x)))(\z2.chase(z2,z3))
   (\P.exists x.(dog(x) & P(x)))(\z3.all x.(girl(x) -> chase(x,z3)))
Permutation 2
   (\P.exists x.(dog(x) & P(x)))(\z3.chase(z2,z3))
   (\P.all x.(girl(x) -> P(x)))(\z2.exists x.(dog(x) & chase(z2,x)))


In [120]:
for reading in cs_semrep.readings:
    print(reading)

exists x.(dog(x) & all z9.(girl(z9) -> chase(z9,x)))
all x.(girl(x) -> exists z10.(dog(z10) & chase(x,z10)))


## Discourse Semantics

In [None]:
drs1.draw()

In [None]:
print(drs1.fol())

In [None]:
drs2 = read_dexpr('([x], [walk(x)]) + ([y], [run(y)])')
print(drs2)

#>>> print(drs2.simplify())

In [122]:
from nltk import load_parser
parser = load_parser('grammars/book_grammars/drt.fcfg', logic_parser=nltk.sem.drt.DrtParser())
trees = list(parser.parse('Angus owns a dog'.split()))
print(trees[0].label()['SEM'].simplify())

([x,z12],[Angus(x), dog(z12), own(x,z12)])


In [123]:
drs3 = read_dexpr('([], [(([x], [dog(x)]) -> ([y],[ankle(y), bite(x, y)]))])')
print(drs3.fol())

all x.(dog(x) -> exists y.(ankle(y) & bite(x,y)))


In [None]:
>>> drs4 = read_dexpr('([x, y], [angus(x), dog(y), own(x, y)])')
>>> drs5 = read_dexpr('([u, z], [PRO(u), irene(z), bite(u, z)])')
>>> drs6 = drs4 + drs5
>>> print(drs6.simplify())
([u,x,y,z],[angus(x), dog(y), own(x,y), PRO(u), irene(z), bite(u,z)])
>>> print(drs6.simplify().resolve_anaphora())

## Discourse Processing

In [2]:
dt = nltk.DiscourseTester(['A student dances', 'Every student is a person'])

NameError: name 'nltk' is not defined

In [3]:
dt.readings()

NameError: name 'dt' is not defined

In [4]:
dt.add_sentence('No person dances', consistchk=True)

NameError: name 'dt' is not defined

In [None]:
dt.retract_sentence('No person dances', verbose=True)

In [None]:
dt.add_sentence('A person dances', informchk=True)

In [None]:
from nltk.tag import RegexpTagger
tagger = RegexpTagger(
    [('^(chases|runs)$', 'VB'),
     ('^(a)$', 'ex_quant'),
     ('^(every)$', 'univ_quant'),
     ('^(dog|boy)$', 'NN'),
     ('^(He)$', 'PRP') 
])

In [None]:
rc = nltk.DrtGlueReadingCommand(depparser=nltk.MaltParser(tagger=tagger))
dt = nltk.DiscourseTester(['Every dog chases a boy', 'He runs'], rc)
dt.readings()

In [None]:
dt.readings(show_thread_readings=True)

In [None]:
dt.readings(show_thread_readings=True, filter=True)

## Summary