stanfordnlp
diff --git a/‎README.md‎
Lines changed: 3 additions & 0 deletions b/‎README.md‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎build.gradle‎
Lines changed: 3 additions & 0 deletions b/‎build.gradle‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎build.xml‎
Lines changed: 42 additions & 53 deletions b/‎build.xml‎
Lines changed: 42 additions & 53 deletions
diff --git a/‎data/edu/stanford/nlp/process/ptblexer.gold‎
Lines changed: 1 addition & 1 deletion b/‎data/edu/stanford/nlp/process/ptblexer.gold‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎data/edu/stanford/nlp/upos/ENUniversalPOS.tsurgeon‎
Lines changed: 39 additions & 12 deletions b/‎data/edu/stanford/nlp/upos/ENUniversalPOS.tsurgeon‎
Lines changed: 39 additions & 12 deletions
diff --git a/‎doc/classify/README.txt‎
Lines changed: 4 additions & 2 deletions b/‎doc/classify/README.txt‎
Lines changed: 4 additions & 2 deletions
diff --git a/‎doc/corenlp/CoreNLP-to-HTML.xsl‎
Lines changed: 8 additions & 11 deletions b/‎doc/corenlp/CoreNLP-to-HTML.xsl‎
Lines changed: 8 additions & 11 deletions
diff --git a/‎doc/corenlp/README.txt‎
Lines changed: 5 additions & 2 deletions b/‎doc/corenlp/README.txt‎
Lines changed: 5 additions & 2 deletions
diff --git a/‎doc/corenlp/corenlp.sh‎
Lines changed: 4 additions & 2 deletions b/‎doc/corenlp/corenlp.sh‎
Lines changed: 4 additions & 2 deletions
diff --git a/‎doc/corenlp/pom-full.xml‎
Lines changed: 4 additions & 4 deletions b/‎doc/corenlp/pom-full.xml‎
Lines changed: 4 additions & 4 deletions
@@ -12,3 +12,6 @@ You can find more explanation and documentation on [the Stanford CoreNLP homepag
 The most recent models associated with the code in the HEAD of this repository can be found [here](http://nlp.stanford.edu/software/stanford-corenlp-models-current.jar).
 
 For information about making contributions to Stanford CoreNLP, see the file `CONTRIBUTING.md`.
+
+Questions about CoreNLP can be posted either on StackOverflow with the tag [stanford-nlp](http://stackoverflow.com/questions/tagged/stanford-nlp)
+or on the [mailing lists](http://nlp.stanford.edu/software/corenlp.shtml#Mail).
@@ -6,8 +6,11 @@ apply plugin: 'java'
 apply plugin: 'eclipse'
 apply plugin: 'application'
 
+// Gradle java plugin
 sourceCompatibility = 1.8
 targetCompatibility = 1.8
+compileJava.options.encoding = 'UTF-8'
+
 version = '3.4.1'
 
 // Gradle application plugin
 
@@ -316,6 +316,48 @@
       <zipfileset file="${source.path}/edu/stanford/nlp/time/suservlet/prototype.js"/>
     </war>
   </target>
+  
+  <!--
+    Builds openie.war, the OpenIE demo webapp described by
+    edu/stanford/nlp/naturalli/demo/web.xml. javanlp-core.jar is bundled as a
+    library and every model/resource listed below is copied to WEB-INF/data.
+    The naturalli resources are read from ${naturalli.etc.dir}; pass
+    -Dnaturalli.etc.dir=/some/dir to build outside the original workspace.
+  -->
+  <target name="openie.war" depends="compile,jar"
+          description="build the openie webapp">
+    <!-- Default only: Ant properties are immutable, so a value supplied on the
+         command line (or set earlier in the build) takes precedence. -->
+    <property name="naturalli.etc.dir" value="/home/gabor/workspace/naturalli/etc"/>
+    <war destfile="openie.war"
+         webxml="${source.path}/edu/stanford/nlp/naturalli/demo/web.xml">
+      <lib dir=".">
+        <include name="javanlp-core.jar"/>
+      </lib>
+      <!-- POS tagger model -->
+      <zipfileset prefix="WEB-INF/data"
+                  file="/u/nlp/data/pos-tagger/distrib/english-left3words-distsim.tagger"/>
+      <!-- Rule and holiday files from the time package -->
+      <zipfileset prefix="WEB-INF/data"
+                  file="${source.path}/edu/stanford/nlp/time/rules/*"/>
+      <zipfileset prefix="WEB-INF/data"
+                  file="${source.path}/edu/stanford/nlp/time/holidays/*"/>
+      <!-- NER classifiers -->
+      <zipfileset prefix="WEB-INF/data"
+                  file="/u/nlp/data/ner/goodClassifiers/english.all.3class.distsim.crf.ser.gz"/>
+      <zipfileset prefix="WEB-INF/data"
+                  file="/u/nlp/data/ner/goodClassifiers/english.conll.4class.distsim.crf.ser.gz"/>
+      <zipfileset prefix="WEB-INF/data"
+                  file="/u/nlp/data/ner/goodClassifiers/english.muc.7class.distsim.crf.ser.gz"/>
+      <!-- Dependency parser and constituency parser models -->
+      <zipfileset prefix="WEB-INF/data"
+                  file="/u/nlp/data/depparser/nn/distrib/english_SD.gz"/>
+      <zipfileset prefix="WEB-INF/data"
+                  file="/u/nlp/data/lexparser/englishPCFG.ser.gz"/>
+      <!-- naturalli resources, located via ${naturalli.etc.dir} -->
+      <zipfileset prefix="WEB-INF/data"
+                  file="${naturalli.etc.dir}/clauseSplitterModel.ser.gz"/>
+      <zipfileset prefix="WEB-INF/data"
+                  file="${naturalli.etc.dir}/pp.tab.gz"/>
+      <zipfileset prefix="WEB-INF/data"
+                  file="${naturalli.etc.dir}/obj.tab.gz"/>
+      <zipfileset prefix="WEB-INF/data"
+                  file="${naturalli.etc.dir}/privative.tab.gz"/>
+      <zipfileset prefix="WEB-INF/data"
+                  file="${naturalli.etc.dir}/subj_obj_pp.tab.gz"/>
+      <zipfileset prefix="WEB-INF/data"
+                  file="${naturalli.etc.dir}/subj_pp_obj.tab.gz"/>
+      <zipfileset prefix="WEB-INF/data"
+                  file="${naturalli.etc.dir}/subj_pp_pp.tab.gz"/>
+      <zipfileset prefix="WEB-INF/data"
+                  file="${naturalli.etc.dir}/subj_pp.tab.gz"/>
+    </war>
+  </target>
 
   <target name="parser.war" depends="compile,jar"
           description="build the parser webapp">
@@ -409,59 +451,6 @@
     </war>
   </target>
 
-  <target name="spied.war" depends="compile,jar"
-            description="build the spied webapp">
-        <war destfile="spied.war"
-             webxml="${source.path}/edu/stanford/nlp/patterns/demo/web.xml">
-            <lib dir=".">
-                <include name="javanlp-core.jar"/>
-            </lib>
-            <lib dir="${basedir}/lib">
-                <include name="commons-lang3-3.1.jar"/>
-                <include name="xom-1.2.10.jar"/>
-                <include name="xml-apis.jar"/>
-                <include name="joda-time.jar"/>
-		<include name="jollyday-0.4.7.jar"/>
-		<include name="javax.json.jar"/>
-            </lib>
-            <lib dir="/u/nlp/data/StanfordCoreNLPModels">
-                <include name="stanford-corenlp-models-current.jar"/>
-            </lib>
-            <zipfileset file="${source.path}/edu/stanford/nlp/patterns/demo/frontend/*"/>
-            <zipfileset file="${source.path}/edu/stanford/nlp/patterns/*.properties"/>
-            <!--<zipfileset prefix="WEB-INF/data"-->
-                        <!--file="/u/nlp/data/pos-tagger/distrib/english-left3words-distsim.tagger"/>-->
-            <!--<zipfileset prefix="WEB-INF/data"-->
-                        <!--file="${source.path}/edu/stanford/nlp/time/rules/*"/>-->
-            <!--<zipfileset prefix="WEB-INF/data"-->
-                        <!--file="${source.path}/edu/stanford/nlp/time/holidays/*"/>-->
-            <!--<zipfileset prefix="WEB-INF/data"-->
-                        <!--file="/u/nlp/data/ner/goodClassifiers/english.all.3class.distsim.crf.ser.gz"/>-->
-            <!--<zipfileset prefix="WEB-INF/data"-->
-                        <!--file="/u/nlp/data/ner/goodClassifiers/english.conll.4class.distsim.crf.ser.gz"/>-->
-            <!--<zipfileset prefix="WEB-INF/data"-->
-                        <!--file="/u/nlp/data/ner/goodClassifiers/english.muc.7class.distsim.crf.ser.gz"/>-->
-            <!--<zipfileset prefix="WEB-INF/data"-->
-                        <!--file="/u/nlp/data/depparser/nn/distrib/english_SD.gz"/>-->
-            <!--<zipfileset prefix="WEB-INF/data"-->
-                        <!--file="/u/nlp/data/lexparser/englishPCFG.ser.gz"/>-->
-            <!--<zipfileset prefix="WEB-INF/data"-->
-                        <!--file="/home/gabor/workspace/naturalli/etc/clauseSplitterModel.ser.gz"/>-->
-            <!--<zipfileset prefix="WEB-INF/data"-->
-                        <!--file="/home/gabor/workspace/naturalli/etc/pp.tab.gz"/>-->
-            <!--<zipfileset prefix="WEB-INF/data"-->
-                        <!--file="/home/gabor/workspace/naturalli/etc/obj.tab.gz"/>-->
-            <!--<zipfileset prefix="WEB-INF/data"-->
-                        <!--file="/home/gabor/workspace/naturalli/etc/privative.tab.gz"/>-->
-            <!--<zipfileset prefix="WEB-INF/data"-->
-                        <!--file="/home/gabor/workspace/naturalli/etc/subj_obj_pp.tab.gz"/>-->
-            <!--<zipfileset prefix="WEB-INF/data"-->
-                        <!--file="/home/gabor/workspace/naturalli/etc/subj_pp_obj.tab.gz"/>-->
-            <!--<zipfileset prefix="WEB-INF/data"-->
-                        <!--file="/home/gabor/workspace/naturalli/etc/subj_pp_pp.tab.gz"/>-->
-            <!--<zipfileset prefix="WEB-INF/data"-->
-	   </war>
-         </target>
   <property environment="env" />
 
   <condition property="version1.7">
 
@@ -885,7 +885,7 @@ origins
 ''
 Libyan
 ruler
-Mu‘ammar
+Mu`ammar
 al-Qaddafi
 referred
 to
 
@@ -5,17 +5,35 @@
 % Author: Sebastian Schuster
 % Author: Christopher Manning
 %
+% The original Penn Treebank WSJ contains 45 POS tags (but almost certainly # for British pound currency is a bad idea!)
+% {#=173, $=9,039, ''=8,658, ,=60,489, -LRB-=1,672, -RRB-=1,689, .=48,733, :=6,087, CC=29,462, CD=44,937, DT=101,190,
+%  EX=1,077, FW=268, IN=121,903, JJ=75,266, JJR=4,042, JJS=2,396, LS=64, MD=11,997, NN=163,935, NNP=114,053,
+%  NNPS=3,087, NNS=73,964, PDT=441, POS=10,801, PRP=21,357, PRP$=10,241, RB=38,197, RBR=2,175, RBS=555, RP=3,275,
+%  SYM=70, TO=27,449, UH=117, VB=32,565, VBD=37,493, VBG=18,239, VBN=24,865, VBP=15,377, VBZ=26,436, WDT=5,323,
+%  WP=2,887, WP$=219, WRB=2,625, ``=8,878}
 %
-% Context-sensitive mappings
+% The Web Treebank corpus adds 6 tags, but doesn't have #, yielding 50 POS tags:
+% ADD, AFX, GW, HYPH, NFP, XX
+%
+% OntoNotes 4.0 has 53 tags. It doesn't have # but adds: -LSB-, -RSB- [both mistakes!], ADD, AFX, CODE, HYPH, NFP,
+% X [mistake!], XX.
 %
 %
+% ------------------------------
+% Context-sensitive mappings
+%
 % TO -> PART (in CONJP phrases)
-CONJP < TO=target < VB
+@CONJP < TO=target < VB
 
 relabel target PART
 
 % TO -> PART
-VP < VP < (/^TO$/=target <... {/.*/})
+@VP < @VP < (/^TO$/=target <... {/.*/})
+
+relabel target PART
+
+% TO -> PART (TO is the only child of a VP)
+@VP <: (/^TO$/=target <... {/.*/})
 
 relabel target PART
 
@@ -24,13 +42,22 @@ TO=target <... {/.*/}
 
 relabel target ADP
 
-% delete the next two rules, third one should also cover them
-%
-% VB -> AUX (passive, case 1)
-%VP < (/^VB/=target < /^(?i:am|is|are|r|be|being|'s|'re|'m|was|were|been|s|ai|m|art|ar|wase|get|got|getting|gets|gotten)$/ ) < (VP|ADJP [ < VBN|VBD | < (VP|ADJP < VBN|VBD) < CC ] )
+% Don't do this, we are now treating these as copular constructions
+% VB.* -> AUX (for passives where main verb is part of an ADJP)
+%@VP < (/^VB/=target < /^(?i:am|is|are|r|be|being|'s|'re|'m|was|were|been|s|ai|m|art|ar|wase|get|got|getting|gets|gotten)$/ ) < (@ADJP [ < VBN|VBD | < (@VP|ADJP < VBN|VBD) < CC ] )
 %
 %relabel target AUX
 %
+% VB.* -> AUX (for cases with fronted main VPs)
+@SINV < (@VP < (/^VB/=target <  /^(?i:am|is|are|r|be|being|'s|'re|'m|was|were|been|s|ai|m|art|ar|wase)$/ ) $-- (@VP < VBD|VBN))
+
+relabel target AUX
+
+% VB.* -> AUX (another, rarer case of fronted VPs)
+@SINV < (@VP < (@VP < (/^VB/=target <  /^(?i:am|is|are|r|be|being|'s|'re|'m|was|were|been|s|ai|m|art|ar|wase)$/ )) $-- (@VP < VBD|VBN))
+
+relabel target AUX
+
 % VB.* -> AUX (passive, case 2)
 %SQ|SINV < (/^VB/=target < /^(?i:am|is|are|r|be|being|'s|'re|'m|was|were|been|s|ai|m|art|ar|wase)$/ $++ (VP < VBD|VBN))
 %
@@ -42,7 +69,7 @@ VP < VP < (/^VB.*$/=target <... {/.*/})
 relabel target AUX
 
 % VB -> AUX (active, case 2)
-SQ|SINV < (/^VB/=target $++ /^(?:VP|ADJP)/ <... {/.*/})
+@SQ|SINV < (/^VB/=target $++ /^(?:VP)/ <... {/.*/})
 
 relabel target AUX
 
@@ -91,7 +118,7 @@ RB=target <... {/.*/}
 
 relabel target ADV
 
-%
+% ------------------------------
 % 1 to 1 mappings
 %
 %
@@ -110,10 +137,10 @@ DT=target <... {/.*/}
 
 relabel target DET
 
-% EX -> DET
+% EX -> PRON
 EX=target <... {/.*/}
 
-relabel target DET
+relabel target PRON
 
 % FW -> X
 FW=target <... {/.*/}
@@ -280,7 +307,7 @@ AFX=target <... {/.*/}
 
 relabel target X
 
- %GW -> X
+% GW -> X
 GW=target <... {/.*/}
 
 relabel target X
 
@@ -1,4 +1,4 @@
-Stanford Classifier v3.5.1 - 2015-01-29
+Stanford Classifier v3.5.2 - 2015-04-20
 -------------------------------------------------
 
 Copyright (c) 2003-2012 The Board of Trustees of 
@@ -15,7 +15,7 @@ This package contains a maximum entropy classifier.
 
 For more information about the classifier, point a web browser at the included javadoc directory, starting at the Package page for the edu.stanford.nlp.classify package, and looking also at the ColumnDataClassifier class documentation therein.
 
-This software requires Java 5 (JDK 1.6.0+).  (You must have installed it
+This software requires Java 8 (JDK 1.8.0+).  (You must have installed it
 separately. Check the command "java -version".)
 
 
@@ -76,6 +76,8 @@ LICENSE
 CHANGES
 -------------------------
 
+2015-04-20    3.5.2     Update for compatibility 
+
 2015-01-29    3.5.1     New input/output options, support for GloVe 
                         word vectors 
 
 
@@ -66,7 +66,11 @@ xmlns:d="http://nlp.stanford.edu/CoreNLP/v1">
 
 <xsl:template match="root/document/sentences/sentence">
   <xsl:param name="position" select="'0'"/>
-  <i><b>Sentence #<xsl:value-of select="$position"/></b></i>
+  <p><i><b>Sentence #<xsl:value-of select="$position"/></b></i>
+  <xsl:if test="@sentiment">
+        <xsl:text> Sentiment: </xsl:text><xsl:value-of select="@sentiment"/>
+  </xsl:if>
+  </p>
 
   <p>
   <i>Tokens</i><br/>
@@ -88,16 +92,7 @@ xmlns:d="http://nlp.stanford.edu/CoreNLP/v1">
   </p>
 
   <p>
-  <i>Collapsed dependencies</i>
-  <ul>
-  <xsl:for-each select="dependencies[@type='collapsed-dependencies']">
-    <xsl:apply-templates select="dep"/>
-  </xsl:for-each>
-  </ul>
-  </p>
-
-  <p>
-  <i>Collapsed dependencies with CC processed</i>
+  <i>Enhanced dependencies</i>
   <ul>
   <xsl:for-each select="dependencies[@type='collapsed-ccprocessed-dependencies']">
     <xsl:apply-templates select="dep"/>
@@ -118,6 +113,7 @@ xmlns:d="http://nlp.stanford.edu/CoreNLP/v1">
     <th>NER</th>
     <th>Normalized NER</th>
     <th>Speaker</th>
+    <th>Sentiment</th>
   </tr>
   <xsl:for-each select="token">
     <tr>
@@ -130,6 +126,7 @@ xmlns:d="http://nlp.stanford.edu/CoreNLP/v1">
       <td><xsl:value-of select="NER"/></td>
       <td><xsl:value-of select="NormalizedNER"/></td>
       <td><xsl:value-of select="Speaker"/></td>
+      <td><xsl:value-of select="sentiment"/></td>
     </tr>
   </xsl:for-each>
   </table>
 
@@ -1,7 +1,7 @@
 Stanford CoreNLP - Stanford's Suite of NLP Tools
 ------------------------------------------------
 
-Copyright © 2009-2014 The Board of Trustees of
+Copyright © 2009-2015 The Board of Trustees of
 The Leland Stanford Junior University. All Rights Reserved.
 
 DOCUMENTATION
@@ -14,7 +14,7 @@ LICENSE
 
 //
 // StanfordCoreNLP -- a suite of NLP tools
-// Copyright © 2009-2014 The Board of Trustees of
+// Copyright © 2009-2015 The Board of Trustees of
 // The Leland Stanford Junior University. All Rights Reserved.
 //
 // This program is free software; you can redistribute it and/or
@@ -42,6 +42,9 @@ LICENSE
 CHANGES
 ---------------------------------
 
+2015-04-20    3.5.2     Switch to Universal dependencies, add Chinese
+                        coreference system to CoreNLP
+
 2015-01-29    3.5.1     NER, dependency parser, SPIED improvements; 
                         general bugfixes 
 
 
@@ -4,12 +4,14 @@
 # Simple uses for xml and plain text output to files are:
 #    ./corenlp.sh -file filename
 #    ./corenlp.sh -file filename -outputFormat text 
+# Split into sentences, run POS tagger and NER, write CoNLL-style TSV file:
+#    ./corenlp.sh -annotators tokenize,ssplit,pos,lemma,ner -outputFormat conll -file input.txt
 # You can also start a simple shell where you can enter sentences to be processed:
 #    ./corenlp.sh
 
 OS=`uname`
-# Macs (BSD) don't support readlink -e
-if [ "$OS" == "Darwin" ]; then
+# Some machines (older OS X, BSD, Windows environments) don't support readlink -e
+if hash readlink 2>/dev/null; then
   scriptdir=`dirname $0`
 else
   scriptpath=$(readlink -e "$0") || scriptpath=$0
 
@@ -2,7 +2,7 @@
   <modelVersion>4.0.0</modelVersion>
   <groupId>edu.stanford.nlp</groupId>
   <artifactId>stanford-corenlp</artifactId>
-  <version>3.5.1</version>
+  <version>3.5.2</version>
   <packaging>jar</packaging>
   <name>Stanford CoreNLP</name>
   <description>Stanford CoreNLP provides a set of natural language analysis tools which can take raw English language text input and give the base forms of words, their parts of speech, whether they are names of companies, people, etc., normalize dates, times, and numeric quantities, mark up the structure of sentences in terms of phrases and word dependencies, and indicate which noun phrases refer to the same entities. It provides the foundational building blocks for higher level text understanding applications.</description>
@@ -14,8 +14,8 @@
     </license>
   </licenses>
   <scm>
-    <url>http://nlp.stanford.edu/software/stanford-corenlp-2015-01-29.zip</url>
-    <connection>http://nlp.stanford.edu/software/stanford-corenlp-2015-01-29.zip</connection>
+    <url>http://nlp.stanford.edu/software/stanford-corenlp-2015-04-21.zip</url>
+    <connection>http://nlp.stanford.edu/software/stanford-corenlp-2015-04-21.zip</connection>
   </scm>
   <developers>
     <developer>
@@ -78,7 +78,7 @@
             <configuration>
               <artifacts>
                 <artifact>
-                  <file>${project.basedir}/stanford-corenlp-3.5.1-models.jar</file>
+                  <file>${project.basedir}/stanford-corenlp-3.5.2-models.jar</file>
                   <type>jar</type>
                   <classifier>models</classifier>
                 </artifact>