Author: srowen
Date: Mon Apr 25 11:36:59 2011
New Revision: 1096459

URL: http://svn.apache.org/viewvc?rev=1096459&view=rev
Log:
MAHOUT-681 remove deprecated models/distributions

Removed:
    
mahout/trunk/core/src/main/java/org/apache/mahout/clustering/dirichlet/models/AsymmetricSampledNormalDistribution.java
    
mahout/trunk/core/src/main/java/org/apache/mahout/clustering/dirichlet/models/AsymmetricSampledNormalModel.java
    
mahout/trunk/core/src/main/java/org/apache/mahout/clustering/dirichlet/models/L1Model.java
    
mahout/trunk/core/src/main/java/org/apache/mahout/clustering/dirichlet/models/L1ModelDistribution.java
    
mahout/trunk/core/src/main/java/org/apache/mahout/clustering/dirichlet/models/NormalModel.java
    
mahout/trunk/core/src/main/java/org/apache/mahout/clustering/dirichlet/models/NormalModelDistribution.java
    
mahout/trunk/core/src/main/java/org/apache/mahout/clustering/dirichlet/models/SampledNormalDistribution.java
    
mahout/trunk/core/src/main/java/org/apache/mahout/clustering/dirichlet/models/SampledNormalModel.java
Modified:
    
mahout/trunk/core/src/main/java/org/apache/mahout/clustering/dirichlet/DirichletDriver.java
    
mahout/trunk/core/src/test/java/org/apache/mahout/clustering/TestClusterInterface.java
    
mahout/trunk/core/src/test/java/org/apache/mahout/clustering/TestVectorModelClassifier.java
    
mahout/trunk/core/src/test/java/org/apache/mahout/clustering/dirichlet/TestDirichletClustering.java
    
mahout/trunk/core/src/test/java/org/apache/mahout/clustering/dirichlet/TestMapReduce.java
    
mahout/trunk/examples/src/main/java/org/apache/mahout/clustering/syntheticcontrol/dirichlet/Job.java
    
mahout/trunk/utils/src/test/java/org/apache/mahout/clustering/TestClusterDumper.java
    
mahout/trunk/utils/src/test/java/org/apache/mahout/clustering/dirichlet/TestL1ModelClustering.java

Modified: 
mahout/trunk/core/src/main/java/org/apache/mahout/clustering/dirichlet/DirichletDriver.java
URL: 
http://svn.apache.org/viewvc/mahout/trunk/core/src/main/java/org/apache/mahout/clustering/dirichlet/DirichletDriver.java?rev=1096459&r1=1096458&r2=1096459&view=diff
==============================================================================
--- 
mahout/trunk/core/src/main/java/org/apache/mahout/clustering/dirichlet/DirichletDriver.java
 (original)
+++ 
mahout/trunk/core/src/main/java/org/apache/mahout/clustering/dirichlet/DirichletDriver.java
 Mon Apr 25 11:36:59 2011
@@ -36,7 +36,7 @@ import org.apache.hadoop.util.ToolRunner
 import org.apache.mahout.clustering.Cluster;
 import org.apache.mahout.clustering.WeightedVectorWritable;
 import org.apache.mahout.clustering.dirichlet.models.DistributionDescription;
-import org.apache.mahout.clustering.dirichlet.models.NormalModelDistribution;
+import 
org.apache.mahout.clustering.dirichlet.models.GaussianClusterDistribution;
 import org.apache.mahout.common.AbstractJob;
 import org.apache.mahout.common.HadoopUtil;
 import org.apache.mahout.common.commandline.DefaultOptionCreator;
@@ -78,8 +78,8 @@ public class DirichletDriver extends Abs
     addOption(ALPHA_OPTION, "a0", "The alpha0 value for the 
DirichletDistribution. Defaults to 1.0", "1.0");
     addOption(MODEL_DISTRIBUTION_CLASS_OPTION,
               "md",
-              "The ModelDistribution class name. Defaults to 
NormalModelDistribution",
-              NormalModelDistribution.class.getName());
+              "The ModelDistribution class name. Defaults to 
GaussianClusterDistribution",
+              GaussianClusterDistribution.class.getName());
     addOption(MODEL_PROTOTYPE_CLASS_OPTION,
               "mp",
               "The ModelDistribution prototype Vector class name. Defaults to 
RandomAccessSparseVector",

Modified: 
mahout/trunk/core/src/test/java/org/apache/mahout/clustering/TestClusterInterface.java
URL: 
http://svn.apache.org/viewvc/mahout/trunk/core/src/test/java/org/apache/mahout/clustering/TestClusterInterface.java?rev=1096459&r1=1096458&r2=1096459&view=diff
==============================================================================
--- 
mahout/trunk/core/src/test/java/org/apache/mahout/clustering/TestClusterInterface.java
 (original)
+++ 
mahout/trunk/core/src/test/java/org/apache/mahout/clustering/TestClusterInterface.java
 Mon Apr 25 11:36:59 2011
@@ -19,10 +19,6 @@ package org.apache.mahout.clustering;
 
 import org.apache.mahout.clustering.canopy.Canopy;
 import org.apache.mahout.clustering.dirichlet.DirichletCluster;
-import 
org.apache.mahout.clustering.dirichlet.models.AsymmetricSampledNormalModel;
-import org.apache.mahout.clustering.dirichlet.models.L1Model;
-import org.apache.mahout.clustering.dirichlet.models.NormalModel;
-import org.apache.mahout.clustering.dirichlet.models.SampledNormalModel;
 import org.apache.mahout.clustering.meanshift.MeanShiftCanopy;
 import org.apache.mahout.common.MahoutTestCase;
 import org.apache.mahout.common.distance.DistanceMeasure;
@@ -38,72 +34,6 @@ public final class TestClusterInterface 
   private static final DistanceMeasure measure = new 
ManhattanDistanceMeasure();
 
   @Test
-  public void testDirichletNormalModel() {
-    double[] d = { 1.1, 2.2, 3.3 };
-    Vector m = new DenseVector(d);
-    Cluster model = new NormalModel(5, m, 0.75);
-    String format = model.asFormatString(null);
-    assertEquals("nm{n=0 m=[1.100, 2.200, 3.300] sd=0.75}", format);
-  }
-
-  @Test
-  public void testDirichletSampledNormalModel() {
-    double[] d = { 1.1, 2.2, 3.3 };
-    Vector m = new DenseVector(d);
-    Cluster model = new SampledNormalModel(5, m, 0.75);
-    String format = model.asFormatString(null);
-    assertEquals("snm{n=0 m=[1.100, 2.200, 3.300] sd=0.75}", format);
-  }
-
-  @Test
-  public void testDirichletASNormalModel() {
-    double[] d = { 1.1, 2.2, 3.3 };
-    Vector m = new DenseVector(d);
-    Cluster model = new AsymmetricSampledNormalModel(5, m, m);
-    String format = model.asFormatString(null);
-    assertEquals("asnm{n=0 m=[1.100, 2.200, 3.300] sd=[1.100, 2.200, 3.300]}", 
format);
-  }
-
-  @Test
-  public void testDirichletL1Model() {
-    double[] d = { 1.1, 2.2, 3.3 };
-    Vector m = new DenseVector(d);
-    Cluster model = new L1Model(5, m);
-    String format = model.asFormatString(null);
-    assertEquals("l1m{n=0 c=[1.100, 2.200, 3.300]}", format);
-  }
-
-  @Test
-  public void testDirichletNormalModelClusterAsFormatString() {
-    double[] d = { 1.1, 2.2, 3.3 };
-    Vector m = new DenseVector(d);
-    NormalModel model = new NormalModel(5, m, 0.75);
-    Cluster cluster = new DirichletCluster(model, 35.0);
-    String format = cluster.asFormatString(null);
-    assertEquals("C-5: nm{n=0 m=[1.100, 2.200, 3.300] sd=0.75}", format);
-  }
-
-  @Test
-  public void testDirichletAsymmetricSampledNormalModelClusterAsFormatString() 
{
-    double[] d = { 1.1, 2.2, 3.3 };
-    Vector m = new DenseVector(d);
-    AsymmetricSampledNormalModel model = new AsymmetricSampledNormalModel(5, 
m, m);
-    Cluster cluster = new DirichletCluster(model, 35.0);
-    String format = cluster.asFormatString(null);
-    assertEquals("C-5: asnm{n=0 m=[1.100, 2.200, 3.300] sd=[1.100, 2.200, 
3.300]}", format);
-  }
-
-  @Test
-  public void testDirichletL1ModelClusterAsFormatString() {
-    double[] d = { 1.1, 2.2, 3.3 };
-    Vector m = new DenseVector(d);
-    L1Model model = new L1Model(5, m);
-    Cluster cluster = new DirichletCluster(model, 35.0);
-    String format = cluster.asFormatString(null);
-    assertEquals("C-5: l1m{n=0 c=[1.100, 2.200, 3.300]}", format);
-  }
-
-  @Test
   public void testCanopyAsFormatString() {
     double[] d = { 1.1, 2.2, 3.3 };
     Vector m = new DenseVector(d);

Modified: 
mahout/trunk/core/src/test/java/org/apache/mahout/clustering/TestVectorModelClassifier.java
URL: 
http://svn.apache.org/viewvc/mahout/trunk/core/src/test/java/org/apache/mahout/clustering/TestVectorModelClassifier.java?rev=1096459&r1=1096458&r2=1096459&view=diff
==============================================================================
--- 
mahout/trunk/core/src/test/java/org/apache/mahout/clustering/TestVectorModelClassifier.java
 (original)
+++ 
mahout/trunk/core/src/test/java/org/apache/mahout/clustering/TestVectorModelClassifier.java
 Mon Apr 25 11:36:59 2011
@@ -23,7 +23,6 @@ import java.util.List;
 import org.apache.commons.lang.NotImplementedException;
 import org.apache.mahout.classifier.AbstractVectorClassifier;
 import org.apache.mahout.clustering.canopy.Canopy;
-import 
org.apache.mahout.clustering.dirichlet.models.AsymmetricSampledNormalModel;
 import org.apache.mahout.clustering.dirichlet.models.GaussianCluster;
 import org.apache.mahout.clustering.fuzzykmeans.SoftCluster;
 import org.apache.mahout.clustering.kmeans.Cluster;
@@ -136,22 +135,4 @@ public final class TestVectorModelClassi
         AbstractCluster.formatVector(pdf, null));
   }
   
-  @Test
-  public void testASNClusterClassification() {
-    List<Model<VectorWritable>> models = new 
ArrayList<Model<VectorWritable>>();
-    models.add(new AsymmetricSampledNormalModel(0,
-        new DenseVector(2).assign(1), new DenseVector(2).assign(1)));
-    models.add(new AsymmetricSampledNormalModel(1, new DenseVector(2),
-        new DenseVector(2).assign(1)));
-    models.add(new AsymmetricSampledNormalModel(2, new DenseVector(2)
-        .assign(-1), new DenseVector(2).assign(1)));
-    AbstractVectorClassifier classifier = new VectorModelClassifier(models);
-    Vector pdf = classifier.classify(new DenseVector(2));
-    assertEquals("[0,0]", "[0.212, 0.576, 0.212]",
-        AbstractCluster.formatVector(pdf, null));
-    pdf = classifier.classify(new DenseVector(2).assign(2));
-    assertEquals("[2,2]", "[0.952, 0.047, 0.000]",
-        AbstractCluster.formatVector(pdf, null));
-  }
-  
 }

Modified: 
mahout/trunk/core/src/test/java/org/apache/mahout/clustering/dirichlet/TestDirichletClustering.java
URL: 
http://svn.apache.org/viewvc/mahout/trunk/core/src/test/java/org/apache/mahout/clustering/dirichlet/TestDirichletClustering.java?rev=1096459&r1=1096458&r2=1096459&view=diff
==============================================================================
--- 
mahout/trunk/core/src/test/java/org/apache/mahout/clustering/dirichlet/TestDirichletClustering.java
 (original)
+++ 
mahout/trunk/core/src/test/java/org/apache/mahout/clustering/dirichlet/TestDirichletClustering.java
 Mon Apr 25 11:36:59 2011
@@ -21,11 +21,8 @@ import java.util.ArrayList;
 import java.util.List;
 
 import org.apache.mahout.clustering.Cluster;
-import 
org.apache.mahout.clustering.dirichlet.models.AsymmetricSampledNormalDistribution;
 import 
org.apache.mahout.clustering.dirichlet.models.DistanceMeasureClusterDistribution;
 import 
org.apache.mahout.clustering.dirichlet.models.GaussianClusterDistribution;
-import org.apache.mahout.clustering.dirichlet.models.NormalModelDistribution;
-import org.apache.mahout.clustering.dirichlet.models.SampledNormalDistribution;
 import org.apache.mahout.common.MahoutTestCase;
 import org.apache.mahout.math.DenseVector;
 import org.apache.mahout.math.VectorWritable;
@@ -96,97 +93,7 @@ public final class TestDirichletClusteri
     generateSamples(30, 0, 1, 0.1);
 
     DirichletClusterer dc = new DirichletClusterer(sampleData,
-                                                   new 
NormalModelDistribution(new VectorWritable(new DenseVector(2))),
-                                                   1.0,
-                                                   10,
-                                                   1,
-                                                   0);
-    List<Cluster[]> result = dc.cluster(30);
-    printResults(result, 2);
-    assertNotNull(result);
-  }
-
-  @Test
-  public void testDirichletCluster100s() {
-    System.out.println("testDirichletCluster100s");
-    generateSamples(40, 1, 1, 3);
-    generateSamples(30, 1, 0, 0.1);
-    generateSamples(30, 0, 1, 0.1);
-
-    DirichletClusterer dc = new DirichletClusterer(sampleData,
-                                                   new 
SampledNormalDistribution(new VectorWritable(new DenseVector(2))),
-                                                   1.0,
-                                                   10,
-                                                   1,
-                                                   0);
-    List<Cluster[]> result = dc.cluster(30);
-    printResults(result, 2);
-    assertNotNull(result);
-  }
-
-  @Test
-  public void testDirichletCluster100as() {
-    System.out.println("testDirichletCluster100as");
-    generateSamples(40, 1, 1, 3);
-    generateSamples(30, 1, 0, 0.1);
-    generateSamples(30, 0, 1, 0.1);
-
-    DirichletClusterer dc = new DirichletClusterer(sampleData,
-                                                   new 
AsymmetricSampledNormalDistribution(new VectorWritable(new DenseVector(2))),
-                                                   1.0,
-                                                   10,
-                                                   1,
-                                                   0);
-    List<Cluster[]> result = dc.cluster(30);
-    printResults(result, 2);
-    assertNotNull(result);
-  }
-
-  @Test
-  public void testDirichletCluster100C3() {
-    System.out.println("testDirichletCluster100");
-    generateSamples(40, 1, 1, 3, 3);
-    generateSamples(30, 1, 0, 0.1, 3);
-    generateSamples(30, 0, 1, 0.1, 3);
-
-    DirichletClusterer dc = new DirichletClusterer(sampleData,
-                                                   new 
NormalModelDistribution(new VectorWritable(new DenseVector(3))),
-                                                   1.0,
-                                                   10,
-                                                   1,
-                                                   0);
-    List<Cluster[]> result = dc.cluster(30);
-    printResults(result, 2);
-    assertNotNull(result);
-  }
-
-  @Test
-  public void testDirichletCluster100sC3() {
-    System.out.println("testDirichletCluster100s");
-    generateSamples(40, 1, 1, 3, 3);
-    generateSamples(30, 1, 0, 0.1, 3);
-    generateSamples(30, 0, 1, 0.1, 3);
-
-    DirichletClusterer dc = new DirichletClusterer(sampleData,
-                                                   new 
SampledNormalDistribution(new VectorWritable(new DenseVector(3))),
-                                                   1.0,
-                                                   10,
-                                                   1,
-                                                   0);
-    List<Cluster[]> result = dc.cluster(30);
-    printResults(result, 2);
-    assertNotNull(result);
-  }
-
-  @Test
-  public void testDirichletCluster100asC3() {
-    System.out.println("testDirichletCluster100as");
-    generateSamples(40, 1, 1, 3, 3);
-    generateSamples(30, 1, 0, 0.1, 3);
-    generateSamples(30, 0, 1, 0.1, 3);
-
-    DirichletClusterer dc = new DirichletClusterer(sampleData,
-                                                   new 
AsymmetricSampledNormalDistribution(new VectorWritable(new DenseVector(3))),
+                                                   new 
GaussianClusterDistribution(new VectorWritable(new DenseVector(2))),
                                                    1.0,
                                                    10,
                                                    1,

Modified: 
mahout/trunk/core/src/test/java/org/apache/mahout/clustering/dirichlet/TestMapReduce.java
URL: 
http://svn.apache.org/viewvc/mahout/trunk/core/src/test/java/org/apache/mahout/clustering/dirichlet/TestMapReduce.java?rev=1096459&r1=1096458&r2=1096459&view=diff
==============================================================================
--- 
mahout/trunk/core/src/test/java/org/apache/mahout/clustering/dirichlet/TestMapReduce.java
 (original)
+++ 
mahout/trunk/core/src/test/java/org/apache/mahout/clustering/dirichlet/TestMapReduce.java
 Mon Apr 25 11:36:59 2011
@@ -38,13 +38,10 @@ import org.apache.hadoop.util.ToolRunner
 import org.apache.mahout.clustering.Cluster;
 import org.apache.mahout.clustering.ClusteringTestUtils;
 import org.apache.mahout.clustering.Model;
-import 
org.apache.mahout.clustering.dirichlet.models.AsymmetricSampledNormalModel;
 import 
org.apache.mahout.clustering.dirichlet.models.DistanceMeasureClusterDistribution;
 import org.apache.mahout.clustering.dirichlet.models.DistributionDescription;
-import org.apache.mahout.clustering.dirichlet.models.NormalModel;
-import org.apache.mahout.clustering.dirichlet.models.NormalModelDistribution;
-import org.apache.mahout.clustering.dirichlet.models.SampledNormalDistribution;
-import org.apache.mahout.clustering.dirichlet.models.SampledNormalModel;
+import org.apache.mahout.clustering.dirichlet.models.GaussianCluster;
+import 
org.apache.mahout.clustering.dirichlet.models.GaussianClusterDistribution;
 import org.apache.mahout.common.DummyRecordWriter;
 import org.apache.mahout.common.MahoutTestCase;
 import org.apache.mahout.common.commandline.DefaultOptionCreator;
@@ -127,7 +124,7 @@ public final class TestMapReduce extends
   public void testMapper() throws Exception {
     generateSamples(10, 0, 0, 1);
     DirichletState state =
-        new DirichletState(new NormalModelDistribution(new VectorWritable(new 
DenseVector(2))), 5, 1);
+        new DirichletState(new GaussianClusterDistribution(new 
VectorWritable(new DenseVector(2))), 5, 1);
     DirichletMapper mapper = new DirichletMapper();
     mapper.setup(state);
 
@@ -150,7 +147,7 @@ public final class TestMapReduce extends
     generateSamples(100, 0, 2, 1);
     generateSamples(100, 2, 2, 1);
     DirichletState state =
-        new DirichletState(new SampledNormalDistribution(new 
VectorWritable(new DenseVector(2))), 20, 1);
+        new DirichletState(new GaussianClusterDistribution(new 
VectorWritable(new DenseVector(2))), 20, 1);
     DirichletMapper mapper = new DirichletMapper();
     mapper.setup(state);
 
@@ -182,7 +179,7 @@ public final class TestMapReduce extends
     generateSamples(100, 0, 2, 1);
     generateSamples(100, 2, 2, 1);
     DirichletState state =
-        new DirichletState(new SampledNormalDistribution(new 
VectorWritable(new DenseVector(2))), 20, 1.0);
+        new DirichletState(new GaussianClusterDistribution(new 
VectorWritable(new DenseVector(2))), 20, 1.0);
 
     Collection<Model<VectorWritable>[]> models = new 
ArrayList<Model<VectorWritable>[]>();
 
@@ -254,7 +251,7 @@ public final class TestMapReduce extends
     // Now run the driver using the run() method. Others can use runJob() as 
before
     Integer maxIterations = 5;
     DistributionDescription description =
-        new DistributionDescription(SampledNormalDistribution.class.getName(),
+        new 
DistributionDescription(GaussianClusterDistribution.class.getName(),
                                     DenseVector.class.getName(),
                                     null,
                                     2);
@@ -294,7 +291,7 @@ public final class TestMapReduce extends
     // Now run the driver using the run() method. Others can use runJob() as 
before
     Integer maxIterations = 5;
     DistributionDescription description =
-        new DistributionDescription(SampledNormalDistribution.class.getName(),
+        new 
DistributionDescription(GaussianClusterDistribution.class.getName(),
                                     DenseVector.class.getName(),
                                     null,
                                     2);
@@ -327,7 +324,7 @@ public final class TestMapReduce extends
     // Now run the driver
     int maxIterations = 3;
     DistributionDescription description =
-        new DistributionDescription(SampledNormalDistribution.class.getName(),
+        new 
DistributionDescription(GaussianClusterDistribution.class.getName(),
                                     DenseVector.class.getName(),
                                     null,
                                     2);
@@ -513,59 +510,4 @@ public final class TestMapReduce extends
     ClusteringTestUtils.writePointsToFile(sampleData, 
getTestTempFilePath("input/data4.txt"), fs, conf);
   }
 
-  @Test
-  public void testNormalModelWritableSerialization() throws Exception {
-    double[] m = { 1.1, 2.2, 3.3 };
-    Writable model = new NormalModel(5, new DenseVector(m), 3.3);
-    DataOutputBuffer out = new DataOutputBuffer();
-    model.write(out);
-    Writable model2 = new NormalModel();
-    DataInputBuffer in = new DataInputBuffer();
-    in.reset(out.getData(), out.getLength());
-    model2.readFields(in);
-    assertEquals("models", model.toString(), model2.toString());
-  }
-
-  @Test
-  public void testSampledNormalModelWritableSerialization() throws Exception {
-    double[] m = { 1.1, 2.2, 3.3 };
-    Writable model = new SampledNormalModel(5, new DenseVector(m), 3.3);
-    DataOutputBuffer out = new DataOutputBuffer();
-    model.write(out);
-    Writable model2 = new SampledNormalModel();
-    DataInputBuffer in = new DataInputBuffer();
-    in.reset(out.getData(), out.getLength());
-    model2.readFields(in);
-    assertEquals("models", model.toString(), model2.toString());
-  }
-
-  @Test
-  public void testAsymmetricSampledNormalModelWritableSerialization() throws 
Exception {
-    double[] m = { 1.1, 2.2, 3.3 };
-    double[] s = { 3.3, 4.4, 5.5 };
-    Writable model = new AsymmetricSampledNormalModel(5, new DenseVector(m), 
new DenseVector(s));
-    DataOutputBuffer out = new DataOutputBuffer();
-    model.write(out);
-    Writable model2 = new AsymmetricSampledNormalModel();
-    DataInputBuffer in = new DataInputBuffer();
-    in.reset(out.getData(), out.getLength());
-    model2.readFields(in);
-    assertEquals("models", model.toString(), model2.toString());
-  }
-
-  @Test
-  public void testClusterWritableSerialization() throws Exception {
-    double[] m = { 1.1, 2.2, 3.3 };
-    DirichletCluster cluster = new DirichletCluster(new NormalModel(5, new 
DenseVector(m), 4), 10);
-    DataOutputBuffer out = new DataOutputBuffer();
-    cluster.write(out);
-    DirichletCluster cluster2 = new DirichletCluster();
-    DataInputBuffer in = new DataInputBuffer();
-    in.reset(out.getData(), out.getLength());
-    cluster2.readFields(in);
-    assertEquals("count", cluster.getTotalCount(), cluster2.getTotalCount(), 
EPSILON);
-    assertNotNull("model null", cluster2.getModel());
-    assertEquals("model", cluster.getModel().toString(), 
cluster2.getModel().toString());
-  }
-
 }

Modified: 
mahout/trunk/examples/src/main/java/org/apache/mahout/clustering/syntheticcontrol/dirichlet/Job.java
URL: 
http://svn.apache.org/viewvc/mahout/trunk/examples/src/main/java/org/apache/mahout/clustering/syntheticcontrol/dirichlet/Job.java?rev=1096459&r1=1096458&r2=1096459&view=diff
==============================================================================
--- 
mahout/trunk/examples/src/main/java/org/apache/mahout/clustering/syntheticcontrol/dirichlet/Job.java
 (original)
+++ 
mahout/trunk/examples/src/main/java/org/apache/mahout/clustering/syntheticcontrol/dirichlet/Job.java
 Mon Apr 25 11:36:59 2011
@@ -29,7 +29,6 @@ import org.apache.mahout.clustering.conv
 import org.apache.mahout.clustering.dirichlet.DirichletDriver;
 import org.apache.mahout.clustering.dirichlet.models.DistributionDescription;
 import 
org.apache.mahout.clustering.dirichlet.models.GaussianClusterDistribution;
-import org.apache.mahout.clustering.dirichlet.models.NormalModelDistribution;
 import org.apache.mahout.common.AbstractJob;
 import org.apache.mahout.common.HadoopUtil;
 import org.apache.mahout.common.commandline.DefaultOptionCreator;
@@ -78,8 +77,8 @@ public final class Job extends AbstractJ
     addOption(new 
DefaultOptionBuilder().withLongName(DirichletDriver.MODEL_DISTRIBUTION_CLASS_OPTION)
         .withRequired(false).withShortName("md").withArgument(new 
ArgumentBuilder()
             .withName(DirichletDriver.MODEL_DISTRIBUTION_CLASS_OPTION)
-            
.withDefault(NormalModelDistribution.class.getName()).withMinimum(1).withMaximum(1).create())
-        .withDescription("The ModelDistribution class name. " + "Defaults to 
NormalModelDistribution").create());
+            
.withDefault(GaussianClusterDistribution.class.getName()).withMinimum(1).withMaximum(1).create())
+        .withDescription("The ModelDistribution class name. Defaults to 
GaussianClusterDistribution").create());
     addOption(new 
DefaultOptionBuilder().withLongName(DirichletDriver.MODEL_PROTOTYPE_CLASS_OPTION).withRequired(false)
         .withShortName("mp").withArgument(new 
ArgumentBuilder().withName("prototypeClass")
             
.withDefault(RandomAccessSparseVector.class.getName()).withMinimum(1).withMaximum(1).create())

Modified: 
mahout/trunk/utils/src/test/java/org/apache/mahout/clustering/TestClusterDumper.java
URL: 
http://svn.apache.org/viewvc/mahout/trunk/utils/src/test/java/org/apache/mahout/clustering/TestClusterDumper.java?rev=1096459&r1=1096458&r2=1096459&view=diff
==============================================================================
--- 
mahout/trunk/utils/src/test/java/org/apache/mahout/clustering/TestClusterDumper.java
 (original)
+++ 
mahout/trunk/utils/src/test/java/org/apache/mahout/clustering/TestClusterDumper.java
 Mon Apr 25 11:36:59 2011
@@ -35,7 +35,6 @@ import org.apache.mahout.clustering.diri
 import 
org.apache.mahout.clustering.dirichlet.models.DistanceMeasureClusterDistribution;
 import org.apache.mahout.clustering.dirichlet.models.DistributionDescription;
 import 
org.apache.mahout.clustering.dirichlet.models.GaussianClusterDistribution;
-import org.apache.mahout.clustering.dirichlet.models.SampledNormalDistribution;
 import org.apache.mahout.clustering.fuzzykmeans.FuzzyKMeansDriver;
 import org.apache.mahout.clustering.kmeans.KMeansDriver;
 import org.apache.mahout.clustering.meanshift.MeanShiftCanopyDriver;
@@ -237,23 +236,6 @@ public final class TestClusterDumper ext
   }
 
   @Test
-  public void testDirichlet() throws Exception {
-    Path output = getTestTempDirPath("output");
-    NamedVector prototype = (NamedVector) sampleData.get(0).get();
-    DistributionDescription description =
-        new DistributionDescription(SampledNormalDistribution.class.getName(),
-                                    RandomAccessSparseVector.class.getName(),
-                                    null,
-                                    prototype.getDelegate().size());
-    Configuration conf = new Configuration();
-    DirichletDriver.run(conf, getTestTempDirPath("testdata"), output, 
description, 15, 10, 1.0, true, true, 0, true);
-    // run ClusterDumper
-    ClusterDumper clusterDumper =
-        new ClusterDumper(finalClusterPath(conf, output, 10), new Path(output, 
"clusteredPoints"));
-    clusterDumper.printClusters(termDictionary);
-  }
-
-  @Test
   public void testDirichlet2() throws Exception {
     Path output = getTestTempDirPath("output");
     NamedVector prototype = (NamedVector) sampleData.get(0).get();

Modified: 
mahout/trunk/utils/src/test/java/org/apache/mahout/clustering/dirichlet/TestL1ModelClustering.java
URL: 
http://svn.apache.org/viewvc/mahout/trunk/utils/src/test/java/org/apache/mahout/clustering/dirichlet/TestL1ModelClustering.java?rev=1096459&r1=1096458&r2=1096459&view=diff
==============================================================================
--- 
mahout/trunk/utils/src/test/java/org/apache/mahout/clustering/dirichlet/TestL1ModelClustering.java
 (original)
+++ 
mahout/trunk/utils/src/test/java/org/apache/mahout/clustering/dirichlet/TestL1ModelClustering.java
 Mon Apr 25 11:36:59 2011
@@ -35,7 +35,7 @@ import org.apache.lucene.util.Version;
 import org.apache.mahout.clustering.Cluster;
 import org.apache.mahout.clustering.Model;
 import 
org.apache.mahout.clustering.dirichlet.models.DistanceMeasureClusterDistribution;
-import org.apache.mahout.clustering.dirichlet.models.L1ModelDistribution;
+import 
org.apache.mahout.clustering.dirichlet.models.GaussianClusterDistribution;
 import org.apache.mahout.math.Vector;
 import org.apache.mahout.math.VectorWritable;
 import org.apache.mahout.utils.MahoutTestCase;
@@ -206,7 +206,8 @@ public final class TestL1ModelClustering
   @Test
   public void testDocs() throws Exception {
     getSampleData(DOCS);
-    DirichletClusterer dc = new DirichletClusterer(sampleData, new 
L1ModelDistribution(sampleData.get(0)), 1.0, 15, 1, 0);
+    DirichletClusterer dc =
+        new DirichletClusterer(sampleData, new 
GaussianClusterDistribution(sampleData.get(0)), 1.0, 15, 1, 0);
     List<Cluster[]> result = dc.cluster(10);
     assertNotNull(result);
     printSamples(result, 0);
@@ -231,7 +232,8 @@ public final class TestL1ModelClustering
   @Test
   public void testDocs2() throws Exception {
     getSampleData(DOCS2);
-    DirichletClusterer dc = new DirichletClusterer(sampleData, new 
L1ModelDistribution(sampleData.get(0)), 1.0, 15, 1, 0);
+    DirichletClusterer dc =
+        new DirichletClusterer(sampleData, new 
GaussianClusterDistribution(sampleData.get(0)), 1.0, 15, 1, 0);
     List<Cluster[]> result = dc.cluster(10);
     assertNotNull(result);
     printSamples(result, 0);


Reply via email to