vgritsenko    02/02/28 06:11:42

  Modified:    src/java/org/apache/cocoon/components/crawler
                        SimpleCocoonCrawlerImpl.java
               src/java/org/apache/cocoon/components/search
                        SimpleLuceneXMLIndexerImpl.java
  Log:
  Don't use jdk1.3 methods, use jdk1.2
  
  Revision  Changes    Path
  1.9       +15 -19    
xml-cocoon2/src/java/org/apache/cocoon/components/crawler/SimpleCocoonCrawlerImpl.java
  
  Index: SimpleCocoonCrawlerImpl.java
  ===================================================================
  RCS file: 
/home/cvs/xml-cocoon2/src/java/org/apache/cocoon/components/crawler/SimpleCocoonCrawlerImpl.java,v
  retrieving revision 1.8
  retrieving revision 1.9
  diff -u -r1.8 -r1.9
  --- SimpleCocoonCrawlerImpl.java      27 Feb 2002 05:28:38 -0000      1.8
  +++ SimpleCocoonCrawlerImpl.java      28 Feb 2002 14:11:42 -0000      1.9
  @@ -82,7 +82,7 @@
    * A simple cocoon crawler.
    *
    * @author     <a href="mailto:[EMAIL PROTECTED]";>Bernhard Huber</a>
  - * @version CVS $Id: SimpleCocoonCrawlerImpl.java,v 1.8 2002/02/27 05:28:38 
vgritsenko Exp $
  + * @version CVS $Id: SimpleCocoonCrawlerImpl.java,v 1.9 2002/02/28 14:11:42 
vgritsenko Exp $
    */
   public class SimpleCocoonCrawlerImpl extends AbstractLoggable
       implements CocoonCrawler, Configurable, Disposable, Recyclable
  @@ -118,6 +118,7 @@
        * @since
        */
       public final static String LINK_VIEW_QUERY_CONFIG = "link-view-query";
  +
       /**
        * Default value of <code>link-view-query</code> configuration value.
        * <p>
  @@ -157,6 +158,7 @@
        * @since
        */
       public final static String USER_AGENT_CONFIG = "user-agent";
  +
       /**
        * Default value of <code>user-agent</code> configuration value.
        * <p>
  @@ -176,6 +178,7 @@
        * @since
        */
       public final static String ACCEPT_CONFIG = "accept";
  +
       /**
        * Default value of <code>accept</code> configuration value.
        * <p>
  @@ -445,37 +448,30 @@
        */
       private List getLinks(URL url) {
           ArrayList url_links = null;
  +        String sURL = url.toString();
   
  -        if (getLogger().isDebugEnabled()) {
  -            getLogger().debug("getLinks URL " + url);
  -        }
  -
  -        if (!isIncludedURL(url.toString())) {
  -            return null;
  -        }
  -        // don't try to get links for url which is excluded
  -        if (isExcludedURL(url.toString())) {
  +        if (!isIncludedURL(sURL) || isExcludedURL(sURL)) {
               return null;
           }
   
           // don't try to get links for url which has been crawled already
  -        if (crawled.contains(url.toString())) {
  +        if (crawled.contains(sURL)) {
               return null;
           }
   
           // mark it as crawled
  -        crawled.add(url.toString());
  +        crawled.add(sURL);
   
  +        // get links of url
           if (getLogger().isDebugEnabled()) {
  -            getLogger().debug("Get links of URL: " + url.toString());
  +            getLogger().debug("Getting links of URL " + sURL);
           }
  -
  -        // get links of url
           try {
  -            URL links_url = new URL(url, url.getPath()
  -                + ((url.getPath().indexOf("?") == -1) ? "?" : "&")
  +            sURL = url.getFile();
  +            URL links = new URL(url, sURL
  +                + ((sURL.indexOf("?") == -1) ? "?" : "&")
                   + linkViewQuery);
  -            URLConnection links_url_connection = links_url.openConnection();
  +            URLConnection links_url_connection = links.openConnection();
               InputStream is = links_url_connection.getInputStream();
               BufferedReader br = new BufferedReader(new InputStreamReader(is));
   
  @@ -602,7 +598,7 @@
        * </p>
        *
        * @author     <a href="mailto:[EMAIL PROTECTED]>Bernhard Huber</a>
  -     * @version    $Id: SimpleCocoonCrawlerImpl.java,v 1.8 2002/02/27 05:28:38 
vgritsenko Exp $
  +     * @version    $Id: SimpleCocoonCrawlerImpl.java,v 1.9 2002/02/28 14:11:42 
vgritsenko Exp $
        */
       public static class CocoonCrawlerIterator implements Iterator
       {
  
  
  
  1.9       +3 -3      
xml-cocoon2/src/java/org/apache/cocoon/components/search/SimpleLuceneXMLIndexerImpl.java
  
  Index: SimpleLuceneXMLIndexerImpl.java
  ===================================================================
  RCS file: 
/home/cvs/xml-cocoon2/src/java/org/apache/cocoon/components/search/SimpleLuceneXMLIndexerImpl.java,v
  retrieving revision 1.8
  retrieving revision 1.9
  diff -u -r1.8 -r1.9
  --- SimpleLuceneXMLIndexerImpl.java   27 Feb 2002 05:28:38 -0000      1.8
  +++ SimpleLuceneXMLIndexerImpl.java   28 Feb 2002 14:11:42 -0000      1.9
  @@ -97,7 +97,7 @@
    * A simple class building lucene documents from xml content.
    *
    * @author     <a href="mailto:[EMAIL PROTECTED]";>Bernhard Huber</a>
  - * @version CVS $Id: SimpleLuceneXMLIndexerImpl.java,v 1.8 2002/02/27 05:28:38 
vgritsenko Exp $
  + * @version CVS $Id: SimpleLuceneXMLIndexerImpl.java,v 1.9 2002/02/28 14:11:42 
vgritsenko Exp $
    */
   public class SimpleLuceneXMLIndexerImpl extends AbstractLoggable
            implements LuceneXMLIndexer, Configurable, Composable, ThreadSafe
  @@ -170,8 +170,8 @@
                throws ProcessingException {
   
           try {
  -            URL contentURL = new URL(url, url.getPath()
  -                + ((url.getPath().indexOf("?") == -1) ? "?" : "&")
  +            URL contentURL = new URL(url, url.getFile()
  +                + ((url.getFile().indexOf("?") == -1) ? "?" : "&")
                   + CONTENT_QUERY);
               URLConnection contentURLConnection = contentURL.openConnection();
               String contentType = contentURLConnection.getContentType();
  
  
  

----------------------------------------------------------------------
In case of troubles, e-mail:     [EMAIL PROTECTED]
To unsubscribe, e-mail:          [EMAIL PROTECTED]
For additional commands, e-mail: [EMAIL PROTECTED]

Reply via email to