Page: http://wiki.cocoondev.org/Wiki.jsp?page=Con , version: 2 on Sun Jun 22 
03:59:42 2003 by Con

- [Conal Tuohy|mailto:[EMAIL PROTECTED]]
+ My name is [Conal Tuohy|mailto:[EMAIL PROTECTED]]
? +++++++++++                                           +

+ I work part time at the [New Zealand Electronic Text Centre|http://www.nzetc.org/] which has a Cocoon-based website.
+ I also teach web publishing and do some other consultancy work.
+ Recently I've been working with the [LuceneIndexTransformer], indexing the 
nzetc site. This is a far better way to index a website than with a crawler. 


Page: http://wiki.cocoondev.org/Wiki.jsp?page=LuceneIndexTransformer , version: 
12 on Sun Jun 22 03:55:10 2003 by Con

-       <map:components>
? ^

+    <map:components>
? ^^^

-               ...
+       ...
-               <map:transformers default="xslt">
? ^^

+       <map:transformers default="xslt">
? ^^^^^^

-                       <map:transformer name="index" 
? ^^^

+          <map:transformer name="index" 
? ^^^^^^^^^

-                               logger="sitemap.transformer.luceneindextransformer" 
? ^^^^

+             logger="sitemap.transformer.luceneindextransformer" 
? ^^^^^^^^^^^^

-                               src="org.apache.cocoon.transformation.LuceneIndexTransformer"/>
? ^^^^

+             src="org.apache.cocoon.transformation.LuceneIndexTransformer"/>
? ^^^^^^^^^^^^

-               </map:transformers>
? ^^

+       </map:transformers>
? ^^^^^^

-               ...
+       ...
-       </map:components>
? ^

+    </map:components>
? ^^^

-       ...
+    ...
-       analyzer="org.apache.lucene.analysis.standard.StandardAnalyzer" 
? ^

+    analyzer="org.apache.lucene.analysis.standard.StandardAnalyzer" 
? ^^^

-       directory="index" 
? ^

+    directory="index" 
? ^^^

-       create="false" 
? ^

+    create="false" 
? ^^^

-       merge-factor="20">
? ^

+    merge-factor="20">
? ^^^

-       <lucene:document url="http://localhost/sample.html">
? ^

+    <lucene:document url="http://localhost/sample.html">
? ^^^

-               <!-- here is some sample content -->
? ^^

+       <!-- here is some sample content -->
? ^^^^^^

-               <html>
-                       <head>
-                               <title>Sample</title>
-                       </head>
-                       <body>
-                               <h1>Blah</h1>
+       <html>
+          <head>
+             <title>Sample</title>
+          </head>
+          <body>
+             <h1>Blah</h1>
-                               <a href="blah.jpg" title="download blah image"
? ^^^^

+             <a href="blah.jpg" title="download blah image"
? ^^^^^^^^^^^^

-                                       lucene:text-attr="title">
+                lucene:text-attr="title">
-                                       <img src="blah-small.jpg" alt="Blah"
? ^^^^^

+                <img src="blah-small.jpg" alt="Blah"
? ^^^^^^^^^^^^^^^

-                                               lucene:text-attr="alt"/>
-                               </a>
-                       </body>
-               </html>
+                   lucene:text-attr="alt"/>
+             </a>
+          </body>
+       </html>
-       </lucene:document>
? ^

+    </lucene:document>
? ^^^

-       <lucene:document url="http://localhost/sample-2.html">
? ^

+    <lucene:document url="http://localhost/sample-2.html">
? ^^^

-               <!-- Another sample doc -->
? ^^

+       <!-- Another sample doc -->
? ^^^^^^

-               <html>
-                       <head>
+       <html>
+          <head>
-                               <title>Second Sample</title>
? ^^^^

+             <title>Second Sample</title>
? ^^^^^^^^^^^^

-                       </head>
-                       <body>
-                               <h1>Foo</h1>
+          </head>
+          <body>
+             <h1>Foo</h1>
-                               <p>Lorem ipsum dolor sit amet, 
? ^^^^

+             <p>Lorem ipsum dolor sit amet, 
? ^^^^^^^^^^^^

-                               consectetuer adipiscing elit. </p>
? ^^^^

+             consectetuer adipiscing elit. </p>
? ^^^^^^^^^^^^

-                       </body>
-               </html>
+          </body>
+       </html>
-       </lucene:document>
? ^

+    </lucene:document>
? ^^^



Reply via email to