Update of /cvsroot/monetdb/pathfinder/modules/pftijah
In directory 23jxhf1.ch3.sourceforge.com:/tmp/cvs-serv25493
Modified Files:
pftijah_stem.mx
Log Message:
Add the possibility to use stop-word removal without stemming.
U pftijah_stem.mx
Index: pftijah_stem.mx
===================================================================
RCS file: /cvsroot/monetdb/pathfinder/modules/pftijah/pftijah_stem.mx,v
retrieving revision 1.14
retrieving revision 1.15
diff -u -d -r1.14 -r1.15
--- pftijah_stem.mx 19 Feb 2009 11:54:36 -0000 1.14
+++ pftijah_stem.mx 20 Apr 2009 23:30:46 -0000 1.15
@@ -507,6 +507,13 @@
static tjStemCtx debug = { "debug", NULL, debugStem, NULL, NULL,
NULL_STOPWORDS };
+
+/*
+ * no stemming with english stopwords
+ */
+
+static tjStemCtx stopwords_english = { "stopwords-english", NULL, NULL, NULL, NULL, ENGLISH_STOPWORDS };
+
/*
*
* Definition of the pftijah interface to the "porter" Snowball stemmer
@@ -761,12 +768,14 @@
static tjStemCtx porter_dutch = { "porter-dutch", porter_dutch_init,
porter_dutch_stem, porter_dutch_clear, NULL , NULL_STOPWORDS };
+
/*
*
* end of fast porter stemmer experiment
*
*/
+
/*
* The getStemmingContext() function is the extern function called to get
* the stemming context.
@@ -782,6 +791,8 @@
res = & nostemming;
else if ( strcmp(name,"debug")==0 )
res = & debug;
+ else if ( strcmp(name,"stopwords-english")==0 )
+ res = & stopwords_english;
else if ( strcmp(name,"snowball-porter")==0 )
res = & snb_porter;
else if ( strcmp(name,"snowball-english")==0 )
------------------------------------------------------------------------------
Stay on top of everything new and different, both inside and
around Java (TM) technology - register by April 22, and save
$200 on the JavaOne (SM) conference, June 2-5, 2009, San Francisco.
300 plus technical and hands-on sessions. Register today.
Use priority code J9JMT32. http://p.sf.net/sfu/p
_______________________________________________
Monetdb-pf-checkins mailing list
[email protected]
https://lists.sourceforge.net/lists/listinfo/monetdb-pf-checkins