Revision: 7191
http://languagetool.svn.sourceforge.net/languagetool/?rev=7191&view=rev
Author: milek_pl
Date: 2012-06-02 21:18:14 +0000 (Sat, 02 Jun 2012)
Log Message:
-----------
[en] fix most outstanding false alarms for CD_NN
Modified Paths:
--------------
trunk/JLanguageTool/src/resource/en/disambiguation.xml
trunk/JLanguageTool/src/rules/en/grammar.xml
Modified: trunk/JLanguageTool/src/resource/en/disambiguation.xml
===================================================================
--- trunk/JLanguageTool/src/resource/en/disambiguation.xml 2012-06-02 21:12:08 UTC (rev 7190)
+++ trunk/JLanguageTool/src/resource/en/disambiguation.xml 2012-06-02 21:18:14 UTC (rev 7191)
@@ -111,7 +111,7 @@
<marker>
<token>are</token>
</marker>
- <token postag="JJ.*|VBG|IN|DT" postag_regexp="yes"></token>
+ <token postag="JJ.*|VBG|IN|DT|RB" postag_regexp="yes"></token>
</pattern>
<disambig><match no="1" postag="VBP"
postag_regexp="yes"></match></disambig>
<example type="ambiguous" inputform="are[are/NN,be/VBP]"
outputform="are[be/VBP]">What follows <marker>are</marker> the terms used by
the Aikikai Foundation</example>
@@ -1389,7 +1389,7 @@
<disambig postag="VBZ"/>
<example type="untouched">He comes from another city.</example>
<example type="ambiguous" inputform="comes[come/VBZ,comes/NN]"
outputform="comes[come/VBZ]">What we know <marker>comes</marker> from a
book.</example>
- </rule>
+ </rule>
<!-- This is a special cascade, do not change the order of these rules!
-->
<rulegroup id="POS" name="Else's -> POS">
@@ -1462,5 +1462,22 @@
<disambig postag="NNP"/>
<example type="untouched">1 ad for you</example>
<example type="ambiguous" inputform="AD[AD/NNP,ad/NN]"
outputform="AD[AD/NNP]">24 <marker>AD</marker> is a memorable date.</example>
- </rule>
+ </rule>
+
+ <rule id="CAME_FROM" name="came -> vbd">
+ <pattern>
+ <marker><token>came</token></marker>
+ <token>from</token>
+ </pattern>
+ <disambig postag="VBD" />
+ </rule>
+
+ <rule id="SAW_PRP" name='saw him'>
+ <pattern>
+ <marker><token>saw</token></marker>
+ <token postag="PRP"/>
+ </pattern>
+ <disambig postag="VBD"/>
+ <example type="ambiguous"
inputform="saw[saw/NN,saw/VB,saw/VBP,see/VBD]" outputform="saw[see/VBD]">The
years 1812 and 1813 <marker>saw</marker> him in Germany and France
again</example>
+ </rule>
</rules>
Modified: trunk/JLanguageTool/src/rules/en/grammar.xml
===================================================================
--- trunk/JLanguageTool/src/rules/en/grammar.xml 2012-06-02 21:12:08 UTC (rev 7190)
+++ trunk/JLanguageTool/src/rules/en/grammar.xml 2012-06-02 21:18:14 UTC (rev 7191)
@@ -7790,10 +7790,11 @@
<rule id="CD_NN" name="Possible agreement error: numeral + singular
countable noun">
<pattern>
<marker>
- <token postag="CD"><exception
regexp="yes">one|thou|zero|1</exception><exception scope="previous"
postag="DT|PRP\$" postag_regexp="yes"/></token>
- <token postag="NN:UN|NN" postag_regexp="yes"><exception
postag="NN:U|NNS|NNPS|JJ.*|IN"
postag_regexp="yes"></exception><exception>will</exception></token>
- </marker>
- <token><exception postag="NN.*"
postag_regexp="yes"></exception><exception>'</exception></token>
+ <token spacebefore="yes" postag="CD"><exception
regexp="yes">one|thou|zero|1</exception><exception scope="previous"
postag="DT|PRP\$|POS" postag_regexp="yes"/><exception regexp="yes"
scope="previous">January|February|March|April|May|June|July|August|September|October|November|December|size|\$\d+</exception><exception
spacebefore="no" scope="previous">.</exception></token>
+ <token postag="NN:UN|NN" postag_regexp="yes"><exception
postag="NN:U|NNS|NNPS|JJ.*|IN"
postag_regexp="yes"></exception><exception>will</exception>
+ <exception
regexp="yes">mm|lb|yd|ft|Msec|km|cm|mg|kg|gm|cc|stat|kc|hr</exception></token>
+ </marker>
+ <token><exception postag="NN.*"
postag_regexp="yes"></exception><exception>'</exception></token>
</pattern>
<message>Possible agreement error. The noun <match no="2"></match>
seems to be countable, so probably you should use: <suggestion><match
no="1"></match> <match no="2" postag="NNS|NNPS"
postag_regexp="yes"></match></suggestion>.</message>
<short>Grammatical problem</short>
@@ -7804,6 +7805,11 @@
<example type="correct">I have two book readers in my
palmtop.</example>
<example type="correct">At its 1864 convention, the Republican
Party selected Andrew Johnson.</example>
<example type="correct">The 2007 ceremony was watched by more than
40 million Americans.</example>
+ <example type="correct">The $6,100,000,000 measure, which was
passed last Monday by the Senate...</example>
+ <example type="correct">Friday's letters asked for a Nov. 15
meeting.</example>
+ <example type="correct">It takes about 16 Msec. to traverse 25 mm.
of tissue.</example>
+ <example type="correct">$800 billion economy was envisioned for
the 1970s</example>
+ <example type="correct">Middle East peace after Israel's 1956
invasion of Egypt</example>
</rule>
<rule id="MANY_NN" name="Possible agreement error: 'many/several/few'
+ singular countable noun">
<pattern>
This was sent by the SourceForge.net collaborative development platform, the
world's largest Open Source development site.
------------------------------------------------------------------------------
Live Security Virtual Conference
Exclusive live event will cover all the ways today's security and
threat landscape has changed and how IT managers can respond. Discussions
will include endpoint security, mobile security and the latest in malware
threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/
_______________________________________________
Languagetool-cvs mailing list
[email protected]
https://lists.sourceforge.net/lists/listinfo/languagetool-cvs