Revision: 7273
http://languagetool.svn.sourceforge.net/languagetool/?rev=7273&view=rev
Author: milek_pl
Date: 2012-06-06 22:22:25 +0000 (Wed, 06 Jun 2012)
Log Message:
-----------
Really fix the bugs in AnalyzedTokenReadings that occurred when the last remaining reading (tag) was removed.
Modified Paths:
--------------
trunk/JLanguageTool/src/java/org/languagetool/AnalyzedTokenReadings.java
trunk/JLanguageTool/src/resource/pl/disambiguation.xml
trunk/JLanguageTool/src/test/org/languagetool/AnalyzedTokenReadingsTest.java
Modified:
trunk/JLanguageTool/src/java/org/languagetool/AnalyzedTokenReadings.java
===================================================================
--- trunk/JLanguageTool/src/java/org/languagetool/AnalyzedTokenReadings.java 2012-06-06 21:31:22 UTC (rev 7272)
+++ trunk/JLanguageTool/src/java/org/languagetool/AnalyzedTokenReadings.java 2012-06-06 22:22:25 UTC (rev 7273)
@@ -176,7 +176,7 @@
}
}
if (l.isEmpty()) {
- l.add(new AnalyzedToken(token.getToken(), null, null));
+ l.add(new AnalyzedToken(anTokReadings[0].getToken(), null, null));
}
anTokReadings = l.toArray(new AnalyzedToken[l.size()]);
setNoRealPOStag();
@@ -198,7 +198,7 @@
}
}
if (l.isEmpty()) {
- l.add(new AnalyzedToken(token.getToken(), null, null));
+ l.add(new AnalyzedToken(anTokReadings[0].getToken(), null, null));
}
anTokReadings = l.toArray(new AnalyzedToken[l.size()]);
setNoRealPOStag();
Modified: trunk/JLanguageTool/src/resource/pl/disambiguation.xml
===================================================================
--- trunk/JLanguageTool/src/resource/pl/disambiguation.xml 2012-06-06 21:31:22 UTC (rev 7272)
+++ trunk/JLanguageTool/src/resource/pl/disambiguation.xml 2012-06-06 22:22:25 UTC (rev 7273)
@@ -94,7 +94,7 @@
</pattern>
<disambig action="remove"><wd lemma="przejść"></wd></disambig>
<example type="untouched">Przeszło trzydziestu panów pije
wódkę.</example>
- <example type="ambiguous"
inputform="Przeszło[przejść/verb:praet:sg:ter:n:perf]"
outputform="Przeszło[]"><marker>Przeszło</marker> 30 panów pije wódkę.</example>
+ <example type="ambiguous"
inputform="Przeszło[przejść/verb:praet:sg:ter:n:perf]"
outputform="Przeszło[Przeszło]"><marker>Przeszło</marker> 30 panów pije
wódkę.</example>
</rule>
<rule name="prawie/subst -> kublik" id="prawie">
<pattern>
@@ -785,5 +785,43 @@
<disambig action="replace"><match no="1" postag_regexp="yes"
postag="brev:npun" postag_replace="brev:pun"/></disambig>
<example type="ambiguous" inputform="m[metr/brev:npun]"
outputform="m[metr/brev:pun]">Jest to <marker>m</marker>.in. kretyn.</example>
</rule>
-
+
+ <rule name=".pl" id="PL_DOMAIN_NAME">
+ <pattern>
+ <token>.</token>
+ <marker>
+ <token spacebefore="no">pl</token>
+ </marker>
+ </pattern>
+ <disambig action="remove"><wd lemma="plac"/></disambig>
+ <example type="ambiguous" inputform="pl[plac/brev:pun]"
outputform="pl[pl]">Alergie.mp.<marker>pl</marker> - serwis</example>
+ <example type="untouched">Adres: pl. Zbawiciela 122</example>
+ </rule>
+ <rule name=".jp" id="JP_DOMAIN_NAME">
+ <pattern>
+ <token>.</token>
+ <marker>
+ <token spacebefore="no">jp</token>
+ </marker>
+ </pattern>
+ <disambig action="remove"><wd lemma="jak poprzednio"/></disambig>
+ <example type="ambiguous" inputform="jp[jak poprzednio/brev:pun]"
outputform="jp[jp]">Alergie.mp.<marker>jp</marker> - serwis</example>
+ <example type="untouched">Skrót - jp.</example>
+ </rule>
+ <rule name="KC" id="KC">
+ <pattern case_sensitive="yes">
+ <marker><token>KC</token></marker>
+ <token regexp="yes">KPZR|PZPR</token>
+ </pattern>
+ <disambig action="remove"><wd lemma="kodeks cywilny"/></disambig>
+ <example type="ambiguous" inputform="KC[kodeks cywilny/brev:pun]"
outputform="KC[KC]"><marker>KC</marker> KPZR</example>
+ </rule>
+ <rule name="R - nie rok" id="NON_START_POS_R">
+ <pattern case_sensitive="yes">
+ <marker><token>R<exception scope="previous"
postag="SENT_START"></exception></token></marker>
+ </pattern>
+ <disambig action="remove"><wd lemma="rok"/></disambig>
+ <example type="untouched">R. 2012</example>
+ <example type="ambiguous" inputform="R[rok/brev:pun]"
outputform="R[R]">Enancjomer <marker>R</marker> jest ważny.</example>
+ </rule>
</rules>
\ No newline at end of file
Modified: trunk/JLanguageTool/src/test/org/languagetool/AnalyzedTokenReadingsTest.java
===================================================================
--- trunk/JLanguageTool/src/test/org/languagetool/AnalyzedTokenReadingsTest.java 2012-06-06 21:31:22 UTC (rev 7272)
+++ trunk/JLanguageTool/src/test/org/languagetool/AnalyzedTokenReadingsTest.java 2012-06-06 22:22:25 UTC (rev 7273)
@@ -63,6 +63,11 @@
testReadings.leaveReading(aTok2);
assertEquals(testReadings.getToken(), "word");
assertTrue(!testReadings.hasPosTag("POS"));
+
+ testReadings.removeReading(aTok2);
+ assertEquals(testReadings.getToken(), "word");
+ assertTrue(!testReadings.hasPosTag("POS"));
+
}
public void testHasPosTag() {
This was sent by the SourceForge.net collaborative development platform, the
world's largest Open Source development site.
------------------------------------------------------------------------------
Live Security Virtual Conference
Exclusive live event will cover all the ways today's security and
threat landscape has changed and how IT managers can respond. Discussions
will include endpoint security, mobile security and the latest in malware
threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/
_______________________________________________
Languagetool-cvs mailing list
[email protected]
https://lists.sourceforge.net/lists/listinfo/languagetool-cvs