burton 2005/01/18 22:01:41 Modified: feedparser/src/java/org/apache/commons/feedparser/locate AnchorParser.java feedparser/src/java/org/apache/commons/feedparser/test TestAtom.java TestFeedFilter.java TestFeedLocator.java TestFeedParser.java TestFeedParserUTF8.java Log: updated anchor parser to support rel... updated tests to remove lucene build dependency (extra imports removed) Revision Changes Path 1.7 +5 -5 jakarta-commons-sandbox/feedparser/src/java/org/apache/commons/feedparser/locate/AnchorParser.java Index: AnchorParser.java =================================================================== RCS file: /home/cvs/jakarta-commons-sandbox/feedparser/src/java/org/apache/commons/feedparser/locate/AnchorParser.java,v retrieving revision 1.6 retrieving revision 1.7 diff -u -r1.6 -r1.7 --- AnchorParser.java 18 Jan 2005 19:39:36 -0000 1.6 +++ AnchorParser.java 19 Jan 2005 06:01:41 -0000 1.7 @@ -52,6 +52,9 @@ int index = 0; + //FIXME: what if there are HTML comments here? We would parse links + //within comments which isn't what we want. + //FIXME: what if href isn't the first attribute? Will it fail here??? 
//FIXME: how do we pass back the content of the href: <a href=''> this @@ -68,13 +71,11 @@ String title = (String)map.get( "title" ); - if ( title != null ) { - title = title.trim(); + if ( title != null ) title = EntityDecoder.decode( title ); - } String rel = (String)map.get( "rel" ); - + if ( resource == null || resource.equals( "" ) ) continue; @@ -112,7 +113,6 @@ //parse( "<a title=\"linux\" rel=\"linux\" href=\"http://peerfear.org\" >adf</a>", listener ); parse( "<a href='http://peerfear.org' rel='linux' title='linux' >adf</a>", listener ); - } 1.6 +1 -8 jakarta-commons-sandbox/feedparser/src/java/org/apache/commons/feedparser/test/TestAtom.java Index: TestAtom.java =================================================================== RCS file: /home/cvs/jakarta-commons-sandbox/feedparser/src/java/org/apache/commons/feedparser/test/TestAtom.java,v retrieving revision 1.5 retrieving revision 1.6 diff -u -r1.5 -r1.6 --- TestAtom.java 31 Aug 2004 21:00:32 -0000 1.5 +++ TestAtom.java 19 Jan 2005 06:01:41 -0000 1.6 @@ -22,13 +22,6 @@ import java.net.*; import java.security.*; -import org.apache.lucene.index.*; -import org.apache.lucene.search.*; -import org.apache.lucene.queryParser.*; -import org.apache.lucene.analysis.*; -import org.apache.lucene.analysis.standard.*; -import org.apache.lucene.document.*; - import org.peerfear.newsmonster.tools.*; import org.peerfear.newsmonster.network.*; 1.6 +1 -8 jakarta-commons-sandbox/feedparser/src/java/org/apache/commons/feedparser/test/TestFeedFilter.java Index: TestFeedFilter.java =================================================================== RCS file: /home/cvs/jakarta-commons-sandbox/feedparser/src/java/org/apache/commons/feedparser/test/TestFeedFilter.java,v retrieving revision 1.5 retrieving revision 1.6 diff -u -r1.5 -r1.6 --- TestFeedFilter.java 22 Oct 2004 00:37:08 -0000 1.5 +++ TestFeedFilter.java 19 Jan 2005 06:01:41 -0000 1.6 @@ -22,13 +22,6 @@ import java.net.*; import java.security.*; -import 
org.apache.lucene.index.*; -import org.apache.lucene.search.*; -import org.apache.lucene.queryParser.*; -import org.apache.lucene.analysis.*; -import org.apache.lucene.analysis.standard.*; -import org.apache.lucene.document.*; - import org.peerfear.newsmonster.tools.*; import org.peerfear.newsmonster.network.*; 1.7 +1 -8 jakarta-commons-sandbox/feedparser/src/java/org/apache/commons/feedparser/test/TestFeedLocator.java Index: TestFeedLocator.java =================================================================== RCS file: /home/cvs/jakarta-commons-sandbox/feedparser/src/java/org/apache/commons/feedparser/test/TestFeedLocator.java,v retrieving revision 1.6 retrieving revision 1.7 diff -u -r1.6 -r1.7 --- TestFeedLocator.java 22 Oct 2004 00:37:08 -0000 1.6 +++ TestFeedLocator.java 19 Jan 2005 06:01:41 -0000 1.7 @@ -22,13 +22,6 @@ import java.net.*; import java.security.*; -import org.apache.lucene.index.*; -import org.apache.lucene.search.*; -import org.apache.lucene.queryParser.*; -import org.apache.lucene.analysis.*; -import org.apache.lucene.analysis.standard.*; -import org.apache.lucene.document.*; - import org.peerfear.newsmonster.tools.*; import org.peerfear.newsmonster.network.*; 1.4 +1 -8 jakarta-commons-sandbox/feedparser/src/java/org/apache/commons/feedparser/test/TestFeedParser.java Index: TestFeedParser.java =================================================================== RCS file: /home/cvs/jakarta-commons-sandbox/feedparser/src/java/org/apache/commons/feedparser/test/TestFeedParser.java,v retrieving revision 1.3 retrieving revision 1.4 diff -u -r1.3 -r1.4 --- TestFeedParser.java 3 Sep 2004 19:46:47 -0000 1.3 +++ TestFeedParser.java 19 Jan 2005 06:01:41 -0000 1.4 @@ -22,13 +22,6 @@ import java.net.*; import java.security.*; -import org.apache.lucene.index.*; -import org.apache.lucene.search.*; -import org.apache.lucene.queryParser.*; -import org.apache.lucene.analysis.*; -import org.apache.lucene.analysis.standard.*; -import 
org.apache.lucene.document.*; - import org.peerfear.newsmonster.tools.*; import org.peerfear.newsmonster.network.*; 1.5 +1 -8 jakarta-commons-sandbox/feedparser/src/java/org/apache/commons/feedparser/test/TestFeedParserUTF8.java Index: TestFeedParserUTF8.java =================================================================== RCS file: /home/cvs/jakarta-commons-sandbox/feedparser/src/java/org/apache/commons/feedparser/test/TestFeedParserUTF8.java,v retrieving revision 1.4 retrieving revision 1.5 diff -u -r1.4 -r1.5 --- TestFeedParserUTF8.java 28 Feb 2004 03:35:22 -0000 1.4 +++ TestFeedParserUTF8.java 19 Jan 2005 06:01:41 -0000 1.5 @@ -22,13 +22,6 @@ import java.net.*; import java.security.*; -import org.apache.lucene.index.*; -import org.apache.lucene.search.*; -import org.apache.lucene.queryParser.*; -import org.apache.lucene.analysis.*; -import org.apache.lucene.analysis.standard.*; -import org.apache.lucene.document.*; - import org.peerfear.newsmonster.tools.*; import junit.framework.*;
---------------------------------------------------------------------
To unsubscribe, e-mail: [EMAIL PROTECTED]
For additional commands, e-mail: [EMAIL PROTECTED]