Repository: bigtop
Updated Branches:
  refs/heads/master aaffc1e2c -> 4cee56bdc


http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/linkanalysis/PageRankTests.java
----------------------------------------------------------------------
diff --git a/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/linkanalysis/PageRankTests.java b/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/linkanalysis/PageRankTests.java
deleted file mode 100644
index 11d31bd..0000000
--- a/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/linkanalysis/PageRankTests.java
+++ /dev/null
@@ -1,120 +0,0 @@
-/**
- * Licensed to the Apache Software Foundation (ASF) under one
- * or more contributor license agreements.  See the NOTICE file
- * distributed with this work for additional information
- * regarding copyright ownership.  The ASF licenses this file
- * to you under the Apache License, Version 2.0 (the
- * "License"); you may not use this file except in compliance
- * with the License.  You may obtain a copy of the License at
- * <p/>
- * http://www.apache.org/licenses/LICENSE-2.0
- * <p/>
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package org.apache.bigtop.itest.datafu.linkanalysis;
-
-
-import static org.junit.Assert.*;
-
-import java.io.BufferedWriter;
-import java.io.File;
-import java.io.FileWriter;
-import java.util.HashMap;
-import java.util.Iterator;
-import java.util.Map;
-
-import org.apache.pig.data.Tuple;
-import org.apache.pig.pigunit.PigTest;
-import org.junit.Test;
-
-
-import org.apache.bigtop.itest.datafu.linkanalysis.PageRankTest;
-import org.apache.bigtop.itest.datafu.PigTests;
-
-public class PageRankTests extends PigTests
-{
-  @Test
-  public void pigPageRankTest() throws Exception
-  {
-    PigTest test = createPigTest("datafu/linkanalysis/pageRankTest.pig");
-
-    String[] edges = PageRankTest.getWikiExampleEdges();
-
-    Map<String,Integer> nodeIds = new HashMap<String,Integer>();
-    Map<Integer,String> nodeIdsReversed = new HashMap<Integer,String>();
-    Map<String,Float> expectedRanks = PageRankTest.parseExpectedRanks(PageRankTest.getWikiExampleExpectedRanks());
-
-    File f = new File(System.getProperty("user.dir"), "input").getAbsoluteFile();
-    if (f.exists())
-    {
-      f.delete();
-    }
-
-    FileWriter writer = new FileWriter(f);
-    BufferedWriter bufferedWriter = new BufferedWriter(writer);
-
-    for (String edge : edges)
-    {
-      String[] edgeParts = edge.split(" ");
-      String source = edgeParts[0];
-      String dest = edgeParts[1];
-      if (!nodeIds.containsKey(source))
-      {
-        int id = nodeIds.size();
-        nodeIds.put(source,id);
-        nodeIdsReversed.put(id, source);
-      }
-      if (!nodeIds.containsKey(dest))
-      {
-        int id = nodeIds.size();
-        nodeIds.put(dest,id);
-        nodeIdsReversed.put(id, dest);
-      }
-      Integer sourceId = nodeIds.get(source);
-      Integer destId = nodeIds.get(dest);
-
-      StringBuffer sb = new StringBuffer();
-
-      sb.append("1\t"); // topic
-      sb.append(sourceId.toString() + "\t");
-      sb.append(destId.toString() + "\t");
-      sb.append("1.0\n"); // weight
-
-      bufferedWriter.write(sb.toString());
-    }
-
-    bufferedWriter.close();
-
-    test.runScript();
-    Iterator<Tuple> tuples = test.getAlias("data_grouped3");
-
-    System.out.println("Final node ranks:");
-    int nodeCount = 0;
-    while (tuples.hasNext())
-    {
-      Tuple nodeTuple = tuples.next();
-
-      Integer topic = (Integer)nodeTuple.get(0);
-      Integer nodeId = (Integer)nodeTuple.get(1);
-      Float nodeRank = (Float)nodeTuple.get(2);
-
-      assertEquals(1, topic.intValue());
-
-      System.out.println(String.format("%d => %f", nodeId, nodeRank));
-
-      Float expectedNodeRank = expectedRanks.get(nodeIdsReversed.get(nodeId));
-
-      assertTrue(String.format("expected: %f, actual: %f", expectedNodeRank, nodeRank),
-                 Math.abs(expectedNodeRank - nodeRank * 100.0f) < 0.1);
-
-      nodeCount++;
-    }
-
-    assertEquals(nodeIds.size(),nodeCount);
-  }
-}

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/numbers/NumberTests.java
----------------------------------------------------------------------
diff --git a/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/numbers/NumberTests.java b/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/numbers/NumberTests.java
deleted file mode 100644
index 4408a55..0000000
--- a/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/numbers/NumberTests.java
+++ /dev/null
@@ -1,65 +0,0 @@
-/**
- * Licensed to the Apache Software Foundation (ASF) under one
- * or more contributor license agreements.  See the NOTICE file
- * distributed with this work for additional information
- * regarding copyright ownership.  The ASF licenses this file
- * to you under the Apache License, Version 2.0 (the
- * "License"); you may not use this file except in compliance
- * with the License.  You may obtain a copy of the License at
- * <p/>
- * http://www.apache.org/licenses/LICENSE-2.0
- * <p/>
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package org.apache.bigtop.itest.datafu.numbers;
-
-import static org.junit.Assert.*;
-
-import java.util.ArrayList;
-import java.util.List;
-
-import org.apache.pig.data.Tuple;
-import org.apache.pig.pigunit.PigTest;
-import org.junit.Test;
-
-import org.apache.bigtop.itest.datafu.PigTests;
-
-public class NumberTests extends PigTests
-{
-  /**
-   * Test the RandomIntRange UDF.  The main purpose is to make sure it can be used in a Pig script.
-   * Also the range of output values is tested.
-   * 
-   * @throws Exception
-   */
-  @Test
-  public void randomIntRangeTest() throws Exception
-  {
-    PigTest test = createPigTest("datafu/numbers/randomIntRangeTest.pig",
-                                 "MIN=1", "MAX=10");
-        
-    List<String> input = new ArrayList<String>();
-    for (int i=0; i<100; i++)
-    {
-      input.add(String.format("(%d)", i));
-    }
-    
-    writeLinesToFile("input", 
-                     input.toArray(new String[0]));
-            
-    test.runScript();
-        
-    List<Tuple> tuples = getLinesForAlias(test, "data2", false);
-    for (Tuple tuple : tuples)
-    {
-      Integer randValue = (Integer)tuple.get(1);
-      assertTrue(randValue >= 1);
-      assertTrue(randValue <= 10);
-    }
-  }
-}

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/sessions/SessionTests.java
----------------------------------------------------------------------
diff --git a/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/sessions/SessionTests.java b/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/sessions/SessionTests.java
deleted file mode 100644
index d13f1c3..0000000
--- a/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/sessions/SessionTests.java
+++ /dev/null
@@ -1,92 +0,0 @@
-/**
- * Licensed to the Apache Software Foundation (ASF) under one
- * or more contributor license agreements.  See the NOTICE file
- * distributed with this work for additional information
- * regarding copyright ownership.  The ASF licenses this file
- * to you under the Apache License, Version 2.0 (the
- * "License"); you may not use this file except in compliance
- * with the License.  You may obtain a copy of the License at
- * <p/>
- * http://www.apache.org/licenses/LICENSE-2.0
- * <p/>
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package org.apache.bigtop.itest.datafu.sessions;
-
-import static org.junit.Assert.*;
-
-import java.util.HashMap;
-
-import org.apache.pig.data.Tuple;
-import org.apache.pig.pigunit.PigTest;
-import org.junit.Test;
-
-import org.apache.bigtop.itest.datafu.PigTests;
-
-public class SessionTests extends PigTests
-{
-  @Test
-  public void sessionizeTest() throws Exception
-  {
-    PigTest test = createPigTest("datafu/sessions/sessionizeTest.pig",
-                                 "TIME_WINDOW=30m",
-                                 "JAR_PATH=" + getJarPath());
-
-    this.writeLinesToFile("input", 
-                          "2010-01-01T01:00:00Z\t1\t10",
-                          "2010-01-01T01:15:00Z\t1\t20",
-                          "2010-01-01T01:31:00Z\t1\t10",
-                          "2010-01-01T01:35:00Z\t1\t20",
-                          "2010-01-01T02:30:00Z\t1\t30",
-
-                          "2010-01-01T01:00:00Z\t2\t10",
-                          "2010-01-01T01:31:00Z\t2\t20",
-                          "2010-01-01T02:10:00Z\t2\t30",
-                          "2010-01-01T02:40:30Z\t2\t40",
-                          "2010-01-01T03:30:00Z\t2\t50",
-
-                          "2010-01-01T01:00:00Z\t3\t10",
-                          "2010-01-01T01:01:00Z\t3\t20",
-                          "2010-01-01T01:02:00Z\t3\t5",
-                          "2010-01-01T01:10:00Z\t3\t25",
-                          "2010-01-01T01:15:00Z\t3\t50",
-                          "2010-01-01T01:25:00Z\t3\t30",
-                          "2010-01-01T01:30:00Z\t3\t15");
-    
-    test.runScript();
-    
-    HashMap<Integer,HashMap<Integer,Boolean>> userValues = new HashMap<Integer,HashMap<Integer,Boolean>>();
-    
-    for (Tuple t : this.getLinesForAlias(test, "max_value"))
-    {
-      Integer userId = (Integer)t.get(0);
-      Integer max = (Integer)t.get(1);
-      if (!userValues.containsKey(userId))
-      {
-        userValues.put(userId, new HashMap<Integer,Boolean>());
-      }
-      userValues.get(userId).put(max, true);
-    }
-    
-    assertEquals(2, userValues.get(1).size());
-    assertEquals(5, userValues.get(2).size());
-    assertEquals(1, userValues.get(3).size());
-    
-    assertTrue(userValues.get(1).containsKey(20));
-    assertTrue(userValues.get(1).containsKey(30));
-    
-    assertTrue(userValues.get(2).containsKey(10));
-    assertTrue(userValues.get(2).containsKey(20));
-    assertTrue(userValues.get(2).containsKey(30));
-    assertTrue(userValues.get(2).containsKey(40));
-    assertTrue(userValues.get(2).containsKey(50));    
-
-    assertTrue(userValues.get(3).containsKey(50));
-  }
-}
-

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/stats/MarkovPairTests.java
----------------------------------------------------------------------
diff --git a/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/stats/MarkovPairTests.java b/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/stats/MarkovPairTests.java
deleted file mode 100644
index f1f1c2f..0000000
--- a/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/stats/MarkovPairTests.java
+++ /dev/null
@@ -1,105 +0,0 @@
-/**
- * Licensed to the Apache Software Foundation (ASF) under one
- * or more contributor license agreements.  See the NOTICE file
- * distributed with this work for additional information
- * regarding copyright ownership.  The ASF licenses this file
- * to you under the Apache License, Version 2.0 (the
- * "License"); you may not use this file except in compliance
- * with the License.  You may obtain a copy of the License at
- * <p/>
- * http://www.apache.org/licenses/LICENSE-2.0
- * <p/>
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package org.apache.bigtop.itest.datafu.stats;
-
-import static org.junit.Assert.*;
-
-import java.util.Iterator;
-
-import org.apache.pig.data.Tuple;
-import org.apache.pig.pigunit.PigTest;
-import org.junit.Test;
-
-import org.apache.bigtop.itest.datafu.PigTests;
-
-public class MarkovPairTests extends PigTests
-{
-  @Test
-  public void markovPairDefaultTest() throws Exception
-  {
-    PigTest test = createPigTest("datafu/stats/markovPairDefault.pig",
-                                 "schema=(data: bag {t: tuple(val:int)})");
-    
-    writeLinesToFile("input", "{(10),(20),(30),(40),(50),(60)}");
-    
-    String[] expectedOutput = {
-        "({((10),(20)),((20),(30)),((30),(40)),((40),(50)),((50),(60))})"
-      };
-    
-    test.runScript();
-    
-    Iterator<Tuple> actualOutput = test.getAlias("data_out");
-    
-    assertTuplesMatch(expectedOutput, actualOutput);
-  }
-  
-  @Test
-  public void markovPairMultipleInput() throws Exception
-  {    
-    PigTest test = createPigTest("datafu/stats/markovPairDefault.pig",
-                                 "schema=(data: bag {t: tuple(val1:int,val2:int)})");
-    
-    writeLinesToFile("input", "{(10,100),(20,200),(30,300),(40,400),(50,500),(60,600)}");
-    
-    String[] expectedOutput = {
-        "({((10,100),(20,200)),((20,200),(30,300)),((30,300),(40,400)),((40,400),(50,500)),((50,500),(60,600))})"
-      };    
-    
-    
-    test.runScript();
-    
-    Iterator<Tuple> actualOutput = test.getAlias("data_out");
-    
-    assertTuplesMatch(expectedOutput, actualOutput);
-  }
-  
-  @Test
-  public void markovPairLookaheadTest() throws Exception
-  {
-    PigTest test = createPigTest("datafu/stats/markovPairLookahead.pig", 
-                                 "schema=(data: bag {t: tuple(val:int)})",
-                                 "lookahead=3");
-    
-    writeLinesToFile("input", "{(10),(20),(30),(40),(50)}");
-    
-    String[] expectedOutput = {
-        "({((10),(20)),((10),(30)),((10),(40)),((20),(30)),((20),(40)),((20),(50)),((30),(40)),((30),(50)),((40),(50))})"
-      };
-    
-    test.runScript();
-    
-    Iterator<Tuple> actualOutput = test.getAlias("data_out");
-    
-    assertTuplesMatch(expectedOutput, actualOutput);
-  }
-  
-  private void assertTuplesMatch(String[] expectedOutput, Iterator<Tuple> actualOutput)
-  {
-    Iterator<Tuple> tuples = actualOutput;
-    
-    for (String outputLine : expectedOutput)
-    {
-      assertTrue(tuples.hasNext());
-      Tuple outputTuple = tuples.next();
-      System.out.println(String.format("expected: %s", outputLine));
-      System.out.println(String.format("actual: %s", outputTuple.toString()));
-      assertEquals(outputLine,outputTuple.toString());
-    }
-  }
-}

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/stats/QuantileTests.java
----------------------------------------------------------------------
diff --git a/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/stats/QuantileTests.java b/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/stats/QuantileTests.java
deleted file mode 100644
index e9ef05d..0000000
--- a/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/stats/QuantileTests.java
+++ /dev/null
@@ -1,196 +0,0 @@
-/**
- * Licensed to the Apache Software Foundation (ASF) under one
- * or more contributor license agreements.  See the NOTICE file
- * distributed with this work for additional information
- * regarding copyright ownership.  The ASF licenses this file
- * to you under the Apache License, Version 2.0 (the
- * "License"); you may not use this file except in compliance
- * with the License.  You may obtain a copy of the License at
- * <p/>
- * http://www.apache.org/licenses/LICENSE-2.0
- * <p/>
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package org.apache.bigtop.itest.datafu.stats;
-
-import static org.junit.Assert.*;
-
-import java.util.ArrayList;
-import java.util.List;
-
-import org.apache.pig.data.Tuple;
-import org.apache.pig.pigunit.PigTest;
-import org.junit.Test;
-
-import org.apache.bigtop.itest.datafu.PigTests;
-
-public class QuantileTests  extends PigTests
-{
-  @Test
-  public void quantileTest() throws Exception
-  {
-    PigTest test = createPigTest("datafu/stats/quantileTest.pig",
-                                 "QUANTILES='0.0','0.25','0.5','0.75','1.0'");
-
-    String[] input = {"1","2","3","4","10","5","6","7","8","9"};
-    writeLinesToFile("input", input);
-        
-    test.runScript();
-    
-    List<Tuple> output = getLinesForAlias(test, "data_out", true);
-    
-    assertEquals(1,output.size());
-    assertEquals("(1.0,3.0,5.5,8.0,10.0)", output.get(0).toString());
-  }
-  
-  @Test
-  public void quantile2Test() throws Exception
-  {
-    PigTest test = createPigTest("datafu/stats/quantileTest.pig",
-                                 "QUANTILES='5'");
-
-    String[] input = {"1","2","3","4","10","5","6","7","8","9"};
-    writeLinesToFile("input", input);
-        
-    test.runScript();
-    
-    List<Tuple> output = getLinesForAlias(test, "data_out", true);
-    
-    assertEquals(1,output.size());
-    assertEquals("(1.0,3.0,5.5,8.0,10.0)", output.get(0).toString());
-  }
-  
-  @Test
-  public void medianTest() throws Exception
-  {
-    PigTest test = createPigTest("datafu/stats/medianTest.pig");
-
-    String[] input = {"4","5","6","9","10","7","8","2","3","1"};
-    writeLinesToFile("input", input);
-        
-    test.runScript();
-    
-    List<Tuple> output = getLinesForAlias(test, "data_out", true);
-    
-    assertEquals(1,output.size());
-    assertEquals("(5.5)", output.get(0).toString());
-  }
-  
-  @Test
-  public void streamingMedianTest() throws Exception
-  {
-    PigTest test = createPigTest("datafu/stats/streamingMedianTest.pig");
-
-    String[] input = {"0","4","5","6","9","10","7","8","2","3","1"};
-    writeLinesToFile("input", input);
-        
-    test.runScript();
-    
-    List<Tuple> output = getLinesForAlias(test, "data_out", true);
-    
-    assertEquals(1,output.size());
-    assertEquals("(5.0)", output.get(0).toString());
-  }
-
-  @Test
-  public void streamingQuantileTest() throws Exception {
-    PigTest test = createPigTest("datafu/stats/streamingQuantileTest.pig",
-                                 "QUANTILES='5'");
-
-    String[] input = {"1","2","3","4","10","5","6","7","8","9"};
-    writeLinesToFile("input", input);
-        
-    test.runScript();
-    
-    List<Tuple> output = getLinesForAlias(test, "data_out", true);
-    
-    assertEquals(1,output.size());
-    assertEquals("(1.0,3.0,5.0,8.0,10.0)", output.get(0).toString());
-  }
-  
-  @Test
-  public void streamingQuantile2Test() throws Exception {
-    PigTest test = createPigTest("datafu/stats/streamingQuantileTest.pig",
-                                 "QUANTILES='0.5','0.75','1.0'");
-
-    String[] input = {"1","2","3","4","10","5","6","7","8","9"};
-    writeLinesToFile("input", input);
-        
-    test.runScript();
-    
-    List<Tuple> output = getLinesForAlias(test, "data_out", true);
-    
-    assertEquals(1,output.size());
-    assertEquals("(5.0,8.0,10.0)", output.get(0).toString());
-  }
-  
-  @Test
-  public void streamingQuantile3Test() throws Exception {
-    PigTest test = createPigTest("datafu/stats/streamingQuantileTest.pig",
-                                 "QUANTILES='0.07','0.03','0.37','1.0','0.0'");
-
-    List<String> input = new ArrayList<String>();
-    for (int i=1000; i>=1; i--)
-    {
-      input.add(Integer.toString(i));
-    }
-    
-    writeLinesToFile("input", input.toArray(new String[0]));
-        
-    test.runScript();
-    
-    List<Tuple> output = getLinesForAlias(test, "data_out", true);
-    
-    assertEquals(1,output.size());
-    assertEquals("(70.0,30.0,370.0,1000.0,1.0)", output.get(0).toString());
-  }
-  
-  @Test
-  public void streamingQuantile4Test() throws Exception {
-    PigTest test = createPigTest("datafu/stats/streamingQuantileTest.pig",
-                                 "QUANTILES='0.0013','0.0228','0.1587','0.5','0.8413','0.9772','0.9987'");
-
-    List<String> input = new ArrayList<String>();
-    for (int i=100000; i>=0; i--)
-    {
-      input.add(Integer.toString(i));
-    }
-    
-    writeLinesToFile("input", input.toArray(new String[0]));
-        
-    test.runScript();
-    
-    List<Tuple> output = getLinesForAlias(test, "data_out", true);
-    
-    assertEquals(1,output.size());
-    assertEquals("(130.0,2280.0,15870.0,50000.0,84130.0,97720.0,99870.0)", output.get(0).toString());
-  }
-  
-
-  
-  @Test
-  public void quantile3Test() throws Exception {
-    PigTest test = createPigTest("datafu/stats/quantileTest.pig",
-                                 "QUANTILES='0.0013','0.0228','0.1587','0.5','0.8413','0.9772','0.9987'");
-
-    List<String> input = new ArrayList<String>();
-    for (int i=100000; i>=0; i--)
-    {
-      input.add(Integer.toString(i));
-    }
-    
-    writeLinesToFile("input", input.toArray(new String[0]));
-        
-    test.runScript();
-    
-    List<Tuple> output = getLinesForAlias(test, "data_out", true);
-    
-    assertEquals(1,output.size());
-    assertEquals("(130.0,2280.0,15870.0,50000.0,84130.0,97720.0,99870.0)", output.get(0).toString());
-  }
-}

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/stats/WilsonBinConfTests.java
----------------------------------------------------------------------
diff --git a/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/stats/WilsonBinConfTests.java b/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/stats/WilsonBinConfTests.java
deleted file mode 100644
index cb43ce1..0000000
--- a/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/stats/WilsonBinConfTests.java
+++ /dev/null
@@ -1,81 +0,0 @@
-/**
- * Licensed to the Apache Software Foundation (ASF) under one
- * or more contributor license agreements.  See the NOTICE file
- * distributed with this work for additional information
- * regarding copyright ownership.  The ASF licenses this file
- * to you under the Apache License, Version 2.0 (the
- * "License"); you may not use this file except in compliance
- * with the License.  You may obtain a copy of the License at
- * <p/>
- * http://www.apache.org/licenses/LICENSE-2.0
- * <p/>
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package org.apache.bigtop.itest.datafu.stats;
-
-import static org.junit.Assert.*;
-
-import java.util.ArrayList;
-import java.util.Iterator;
-import java.util.List;
-
-import org.apache.pig.data.Tuple;
-import org.apache.pig.pigunit.PigTest;
-import org.junit.Test;
-
-import org.apache.bigtop.itest.datafu.PigTests;
-
-public class WilsonBinConfTests extends PigTests
-{
-  @Test
-  public void wilsonTest() throws Exception
-  {
-    PigTest test = createPigTest("datafu/stats/wilsonBinConfTests.pig",
-                                 "alpha=0.05"); // alpha is 0.05 for 95% confidence
-    
-    writeLinesToFile("input",
-                     "1\t1",
-                     "1\t2",
-                     "50\t100",
-                     "500\t1000",
-                     "999\t1000",
-                     "1000\t1000",
-                     "998\t1000");
-        
-    test.runScript();
-    
-    /* Add expected values, computed using R:
-     * 
-     * e.g.
-     * 
-     * library(Hmisc)
-     * 
-     * binconf(50,100)
-     * binconf(500,1000)
-     * 
-     */
-    List<String> expectedOutput = new ArrayList<String>();
-    expectedOutput.add("0.05129,1.00000");
-    expectedOutput.add("0.02565,0.97435");
-    expectedOutput.add("0.40383,0.59617");
-    expectedOutput.add("0.46907,0.53093");
-    expectedOutput.add("0.99436,0.99995");
-    expectedOutput.add("0.99617,1.00000");
-    expectedOutput.add("0.99274,0.99945");
-    
-    List<Tuple> output = this.getLinesForAlias(test, "data_out");
-    Iterator<String> expectationIterator = expectedOutput.iterator();
-    for (Tuple t : output)
-    {
-      assertTrue(expectationIterator.hasNext());
-      Double lower = (Double)t.get(0);
-      Double upper = (Double)t.get(1);
-      assertEquals(expectationIterator.next(),String.format("%.5f,%.5f",lower,upper));
-    }
-  }
-}

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/urls/UserAgentTest.java
----------------------------------------------------------------------
diff --git a/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/urls/UserAgentTest.java b/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/urls/UserAgentTest.java
deleted file mode 100644
index e742c0d..0000000
--- a/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/urls/UserAgentTest.java
+++ /dev/null
@@ -1,57 +0,0 @@
-/**
- * Licensed to the Apache Software Foundation (ASF) under one
- * or more contributor license agreements.  See the NOTICE file
- * distributed with this work for additional information
- * regarding copyright ownership.  The ASF licenses this file
- * to you under the Apache License, Version 2.0 (the
- * "License"); you may not use this file except in compliance
- * with the License.  You may obtain a copy of the License at
- * <p/>
- * http://www.apache.org/licenses/LICENSE-2.0
- * <p/>
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package org.apache.bigtop.itest.datafu.urls;
-
-import org.apache.pig.pigunit.PigTest;
-import org.junit.Test;
-
-import org.apache.bigtop.itest.datafu.PigTests;
-
-public class UserAgentTest extends PigTests
-{
-  
-  @Test
-  public void userAgentTest() throws Exception
-  {
-    PigTest test = createPigTest("datafu/urls/userAgentTest.pig");
-  
-    String[] input = {
-        "Mozilla/5.0 (iPhone; U; CPU iPhone OS 4_3_3 like Mac OS X; en-us) AppleWebKit/533.17.9 (KHTML, like Gecko) Version/5.0.2 Mobile/8J2 Safari/6533.18.5",
-        "Mozilla/5.0 (compatible; Konqueror/3.5; Linux; X11; de) KHTML/3.5.2 (like Gecko) Kubuntu 6.06 Dapper",
-        "Mozilla/5.0 (Windows NT 6.1; WOW64; rv:2.2a1pre) Gecko/20110331 Firefox/4.2a1pre Fennec/4.1a1pre",
-        "Opera/9.00 (X11; Linux i686; U; en)",
-        "Wget/1.10.2",
-        "Opera/9.80 (Android; Linux; Opera Mobi/ADR-1012221546; U; pl) Presto/2.7.60 Version/10.5",
-        "Mozilla/5.0 (Linux; U; Android 2.2; en-us; DROID2 Build/VZW) AppleWebKit/533.1 (KHTML, like Gecko) Version/4.0 Mobile Safari/533.1"
-    };
-    
-    String[] output = {
-        "(mobile)",
-        "(desktop)",
-        "(mobile)",
-        "(desktop)",
-        "(desktop)",
-        "(mobile)",
-        "(mobile)",
-      };
-    
-    test.assertOutput("data",input,"data_out",output);
-  }
-
-}

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/util/AssertTests.java
----------------------------------------------------------------------
diff --git a/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/util/AssertTests.java b/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/util/AssertTests.java
deleted file mode 100644
index 0379ae7..0000000
--- a/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/util/AssertTests.java
+++ /dev/null
@@ -1,93 +0,0 @@
-/**
- * Licensed to the Apache Software Foundation (ASF) under one
- * or more contributor license agreements.  See the NOTICE file
- * distributed with this work for additional information
- * regarding copyright ownership.  The ASF licenses this file
- * to you under the Apache License, Version 2.0 (the
- * "License"); you may not use this file except in compliance
- * with the License.  You may obtain a copy of the License at
- * <p/>
- * http://www.apache.org/licenses/LICENSE-2.0
- * <p/>
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package org.apache.bigtop.itest.datafu.util;
-
-import static org.junit.Assert.*;
-
-import org.apache.pig.pigunit.PigTest;
-import org.junit.Test;
-
-import org.apache.bigtop.itest.datafu.PigTests;
-
-public class AssertTests extends PigTests
-{
-  @Test
-  public void shouldAssertWithMessageOnZero() throws Exception
-  {
-    try
-    {
-      PigTest test = createPigTest("datafu/util/assertWithMessageTest.pig");
-      
-      this.writeLinesToFile("input", "0");
-      
-      test.runScript();
-      
-      this.getLinesForAlias(test, "data2");
-      
-      fail("test should have failed, but it didn't");
-    }
-    catch (Exception e)
-    {
-    }
-  }
-  
-  @Test
-  public void shouldNotAssertWithMessageOnOne() throws Exception
-  {
-    PigTest test = createPigTest("datafu/util/assertWithMessageTest.pig");
-    
-    this.writeLinesToFile("input", "1");
-    
-    test.runScript();
-    
-    this.getLinesForAlias(test, "data2");
-  }
-  
-  @Test
-  public void shouldAssertWithoutMessageOnZero() throws Exception
-  {
-    try
-    {
-      PigTest test = createPigTest("datafu/util/assertWithoutMessageTest.pig");
-      
-      this.writeLinesToFile("input", "0");
-      
-      test.runScript();
-      
-      this.getLinesForAlias(test, "data2");
-      
-      fail("test should have failed, but it didn't");
-    }
-    catch (Exception e)
-    {
-    }
-  }
-  
-  @Test
-  public void shouldNotAssertWithoutMessageOnOne() throws Exception
-  {
-    PigTest test = createPigTest("datafu/util/assertWithoutMessageTest.pig");
-    
-    this.writeLinesToFile("input", "1");
-    
-    test.runScript();
-    
-    this.getLinesForAlias(test, "data2");
-  }
-}

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/util/IntBoolConversionPigTests.java
----------------------------------------------------------------------
diff --git a/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/util/IntBoolConversionPigTests.java b/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/util/IntBoolConversionPigTests.java
deleted file mode 100644
index 2653060..0000000
--- a/bigtop-tests/test-artifacts/datafu/src/main/groovy/org/apache/bigtop/itest/datafu/util/IntBoolConversionPigTests.java
+++ /dev/null
@@ -1,77 +0,0 @@
-/**
- * Licensed to the Apache Software Foundation (ASF) under one
- * or more contributor license agreements.  See the NOTICE file
- * distributed with this work for additional information
- * regarding copyright ownership.  The ASF licenses this file
- * to you under the Apache License, Version 2.0 (the
- * "License"); you may not use this file except in compliance
- * with the License.  You may obtain a copy of the License at
- * <p/>
- * http://www.apache.org/licenses/LICENSE-2.0
- * <p/>
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package org.apache.bigtop.itest.datafu.util;
-
-import org.apache.pig.pigunit.PigTest;
-import org.junit.Test;
-
-import org.apache.bigtop.itest.datafu.PigTests;
-/** PigUnit checks for the intToBoolTest.pig and intToBoolToIntTest.pig scripts: fixed input rows go in and the expected output rows are compared via assertOutput. */
-public class IntBoolConversionPigTests extends PigTests
-{
-  @Test
-  public void intToBoolTest() throws Exception
-  {
-    PigTest test = createPigTest("datafu/util/intToBoolTest.pig");
-    // Expectation encoded below: the empty row (marked null) and 0 give false, 1 gives true.
-    String[] input = {
-      "", // null
-      "0",
-      "1"
-    };
-    
-    String[] output = {
-        "(false)",
-        "(false)",
-        "(true)"
-      };
-    // Input rows are bound to alias data; alias data2 is compared against the expected rows.
-    test.assertOutput("data",input,"data2",output);
-  }
-  
-  @Test
-  public void intToBoolToIntTest() throws Exception
-  {
-    PigTest test = createPigTest("datafu/util/intToBoolToIntTest.pig");
-    // Expectation encoded below: empty rows and 0 map to 0; every other value (1, 2, -1, -2) maps to 1.
-    String[] input = {
-      "", // null
-      "0",
-      "1",
-      "2",
-      "-1",
-      "-2",
-      "0",
-      ""
-    };
-    
-    String[] output = {
-        "(0)",
-        "(0)",
-        "(1)",
-        "(1)",
-        "(1)",
-        "(1)",
-        "(0)",
-        "(0)"
-      };
-    // Input rows are bound to alias data; alias data3 is compared against the expected rows.
-    test.assertOutput("data",input,"data3",output);
-  }
-}

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/aliasBagFieldsTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/aliasBagFieldsTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/aliasBagFieldsTest.pig
deleted file mode 100644
index 247c832..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/aliasBagFieldsTest.pig
+++ /dev/null
@@ -1,20 +0,0 @@
-register $JAR_PATH
-
-define AliasBagFields datafu.pig.bags.AliasBagFields('[a#alpha,b#numeric]');
-/* Exercises AliasBagFields: the constructor map pairs a with alpha and b with numeric; data4 below reads the bag fields under those new names. */
-data = LOAD 'input' AS (data: bag {T: tuple(a:CHARARRAY, b:INT, c:INT)});
-
-data2 = FOREACH data GENERATE AliasBagFields(data) as data;
-
-describe data2;
-/* Flatten the bag returned by the UDF. */
-data3 = FOREACH data2 GENERATE FLATTEN(data);
-
-describe data3;
-/* Project through the aliased names only; field c is not selected. */
-data4 = FOREACH data3 GENERATE data::alpha, data::numeric;
-
-describe data4;
-
-STORE data4 INTO 'output';
-

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/appendToBagTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/appendToBagTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/appendToBagTest.pig
deleted file mode 100644
index d906bc4..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/appendToBagTest.pig
+++ /dev/null
@@ -1,9 +0,0 @@
-register $JAR_PATH
-
-define AppendToBag datafu.pig.bags.AppendToBag();
-/* Exercises AppendToBag: each row supplies a key, a bag B of single-int tuples and a tuple T of the same shape. */
-data = LOAD 'input' AS (key:INT, B: bag{T: tuple(v:INT)}, T: tuple(v:INT));
-/* The UDF result is stored under the name B, next to the untouched key. */
-data2 = FOREACH data GENERATE key, AppendToBag(B,T) as B;
-
-STORE data2 INTO 'output';

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/bagConcatTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/bagConcatTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/bagConcatTest.pig
deleted file mode 100644
index 30d46a0..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/bagConcatTest.pig
+++ /dev/null
@@ -1,11 +0,0 @@
-register $JAR_PATH
-
-define BagConcat datafu.pig.bags.BagConcat();
-/* Exercises BagConcat on three bags of single-int tuples taken from the same input row. */
-data = LOAD 'input' AS (A: bag{T: tuple(v:INT)}, B: bag{T: tuple(v:INT)}, C: bag{T: tuple(v:INT)});
-
-data2 = FOREACH data GENERATE BagConcat(A,B,C);
-
-describe data2
-
-STORE data2 INTO 'output';
\ No newline at end of file

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/bagSplitTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/bagSplitTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/bagSplitTest.pig
deleted file mode 100644
index ee4f538..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/bagSplitTest.pig
+++ /dev/null
@@ -1,14 +0,0 @@
-register $JAR_PATH
-
-define BagSplit datafu.pig.bags.BagSplit();
-/* Exercises BagSplit; the first UDF argument comes from the MAX script parameter supplied by the caller. */
-data = LOAD 'input' AS (B:bag{T:tuple(val1:INT,val2:INT)});
-
-data2 = FOREACH data GENERATE BagSplit($MAX,B);
-describe data2;
-/* Flatten the UDF result (position 0). */
-data3 = FOREACH data2 GENERATE FLATTEN($0);
-
-describe data3
-
-STORE data3 INTO 'output';

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/bagSplitWithBagNumTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/bagSplitWithBagNumTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/bagSplitWithBagNumTest.pig
deleted file mode 100644
index 833e912..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/bagSplitWithBagNumTest.pig
+++ /dev/null
@@ -1,11 +0,0 @@
-register $JAR_PATH
-
-define BagSplit datafu.pig.bags.BagSplit('true');
-/* Exercises BagSplit constructed with the argument 'true'. NOTE(review): presumably this makes each output bag carry its bag number, as the file name suggests - confirm against the DataFu docs. */
-data = LOAD 'input' AS (B:bag{T:tuple(val1:INT,val2:INT)});
-/* The first UDF argument comes from the MAX script parameter. */
-data2 = FOREACH data GENERATE BagSplit($MAX,B);
-
-data3 = FOREACH data2 GENERATE FLATTEN($0);
-
-STORE data3 INTO 'output';
\ No newline at end of file

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/comprehensiveBagSplitAndEnumerate.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/comprehensiveBagSplitAndEnumerate.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/comprehensiveBagSplitAndEnumerate.pig
deleted file mode 100644
index 88d7392..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/comprehensiveBagSplitAndEnumerate.pig
+++ /dev/null
@@ -1,26 +0,0 @@
-register $JAR_PATH
-
-define BagSplit datafu.pig.bags.BagSplit();
-define Enumerate datafu.pig.bags.Enumerate('1');
-/* Chains BagSplit and Enumerate on a bag of (name, score) tuples. The script has no STORE statement; it ends with a describe of data_out. */
-data = LOAD 'input' AS (data: bag {T: tuple(name:CHARARRAY, score:double)});
-/* Split with a literal first argument of 3. */
-data2 = FOREACH data GENERATE BagSplit(3,data) as the_bags;
-
-describe data2
-
-data3 = FOREACH data2 GENERATE Enumerate(the_bags) as enumerated_bags;
-
-describe data3
-
-data4 = FOREACH data3 GENERATE FLATTEN(enumerated_bags) as (data,i);
-
-describe data4
-
-data5 = FOREACH data4 GENERATE data as the_data, i as the_key;
-
-describe data5
-
-data_out = FOREACH data5 GENERATE FLATTEN(the_data), the_key;
-
-describe data_out
\ No newline at end of file

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/distinctByTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/distinctByTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/distinctByTest.pig
deleted file mode 100644
index 9532d07..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/distinctByTest.pig
+++ /dev/null
@@ -1,12 +0,0 @@
-register $JAR_PATH
-
-define DistinctBy datafu.pig.bags.DistinctBy('0');
-/* Exercises DistinctBy constructed with '0'. NOTE(review): presumably '0' selects the first tuple field (a) as the distinct key - confirm. */
-data = LOAD 'input' AS (data: bag {T: tuple(a:CHARARRAY, b:INT, c:INT)});
-
-data2 = FOREACH data GENERATE DistinctBy(data);
-
-describe data2;
-
-STORE data2 INTO 'output';
-

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/enumerateTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/enumerateTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/enumerateTest.pig
deleted file mode 100644
index 1647485..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/enumerateTest.pig
+++ /dev/null
@@ -1,16 +0,0 @@
-register $JAR_PATH
-
-define Enumerate datafu.pig.bags.Enumerate();
-/* Exercises Enumerate with its no-argument constructor on a bag whose tuples hold an int and a nested bag. */
-data = LOAD 'input' AS (data: bag {T: tuple(v1:INT,B: bag{T: tuple(v2:INT)})});
-
-data2 = FOREACH data GENERATE Enumerate(data);
-describe data2;
-/* Flatten the UDF result (position 0). */
-data3 = FOREACH data2 GENERATE FLATTEN($0);
-describe data3;
-/* Name the three flattened positions: v1, B and a third field i. */
-data4 = FOREACH data3 GENERATE $0 as v1, $1 as B, $2 as i;
-describe data4;
-
-STORE data4 INTO 'output';

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/enumerateWithReverseTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/enumerateWithReverseTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/enumerateWithReverseTest.pig
deleted file mode 100644
index 1f04b04..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/enumerateWithReverseTest.pig
+++ /dev/null
@@ -1,16 +0,0 @@
-register $JAR_PATH
-
-define Enumerate datafu.pig.bags.Enumerate('1', 'true');
-/* Exercises Enumerate constructed with ('1', 'true'). NOTE(review): presumably a start index of 1 plus reversed numbering, going by the file name - confirm. */
-data = LOAD 'input' AS (data: bag {T: tuple(v1:INT,B: bag{T: tuple(v2:INT)})});
-
-data2 = FOREACH data GENERATE Enumerate(data);
-describe data2;
-/* Flatten the UDF result (position 0). */
-data3 = FOREACH data2 GENERATE FLATTEN($0);
-describe data3;
-/* Name the three flattened positions: v1, B and a third field i. */
-data4 = FOREACH data3 GENERATE $0 as v1, $1 as B, $2 as i;
-describe data4;
-
-STORE data4 INTO 'output';

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/enumerateWithStartTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/enumerateWithStartTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/enumerateWithStartTest.pig
deleted file mode 100644
index d288a6e..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/enumerateWithStartTest.pig
+++ /dev/null
@@ -1,16 +0,0 @@
-register $JAR_PATH
-
-define Enumerate datafu.pig.bags.Enumerate('1');
-/* Exercises Enumerate constructed with '1'. NOTE(review): presumably the start index, going by the file name - confirm. */
-data = LOAD 'input' AS (data: bag {T: tuple(v1:INT,B: bag{T: tuple(v2:INT)})});
-
-data2 = FOREACH data GENERATE Enumerate(data);
-describe data2;
-/* Flatten the UDF result (position 0). */
-data3 = FOREACH data2 GENERATE FLATTEN($0);
-describe data3;
-/* Name the three flattened positions: v1, B and a third field i. */
-data4 = FOREACH data3 GENERATE $0 as v1, $1 as B, $2 as i;
-describe data4;
-
-STORE data4 INTO 'output';

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/firstTupleFromBagTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/firstTupleFromBagTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/firstTupleFromBagTest.pig
deleted file mode 100644
index 921787e..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/firstTupleFromBagTest.pig
+++ /dev/null
@@ -1,9 +0,0 @@
-register $JAR_PATH
-
-define FirstTupleFromBag datafu.pig.bags.FirstTupleFromBag();
-/* Exercises FirstTupleFromBag on a keyed bag of single-int tuples. */
-data = LOAD 'input' AS (key:INT, B: bag{T: tuple(v:INT)});
-/* The second UDF argument is a literal null; the result is stored under the name B. */
-data2 = FOREACH data GENERATE key, FirstTupleFromBag(B, null) as B;
-
-STORE data2 INTO 'output';

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/nullToEmptyBagTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/nullToEmptyBagTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/nullToEmptyBagTest.pig
deleted file mode 100644
index 3e809b3..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/nullToEmptyBagTest.pig
+++ /dev/null
@@ -1,14 +0,0 @@
-register $JAR_PATH
-
-define NullToEmptyBag datafu.pig.bags.NullToEmptyBag();
-/* Exercises NullToEmptyBag on a single bag column; both the input and the result are dumped before the store. */
-data = LOAD 'input' AS (B: bag {T: tuple(v:INT)});
-
-dump data;
-/* The UDF result is exposed as P. */
-data2 = FOREACH data GENERATE NullToEmptyBag(B) as P;
-
-dump data2;
-
-STORE data2 INTO 'output';
-

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/prependToBagTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/prependToBagTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/prependToBagTest.pig
deleted file mode 100644
index c852346..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/prependToBagTest.pig
+++ /dev/null
@@ -1,9 +0,0 @@
-register $JAR_PATH
-
-define PrependToBag datafu.pig.bags.PrependToBag();
-/* Exercises PrependToBag: each row supplies a key, a bag B of single-int tuples and a tuple T of the same shape. */
-data = LOAD 'input' AS (key:INT, B: bag{T: tuple(v:INT)}, T: tuple(v:INT));
-/* The UDF result is stored under the name B, next to the untouched key. */
-data2 = FOREACH data GENERATE key, PrependToBag(B,T) as B;
-
-STORE data2 INTO 'output';

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/sets/setIntersectTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/sets/setIntersectTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/sets/setIntersectTest.pig
deleted file mode 100644
index 6f590e8..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/sets/setIntersectTest.pig
+++ /dev/null
@@ -1,9 +0,0 @@
-register $JAR_PATH
-
-define SetIntersect datafu.pig.bags.sets.SetIntersect();
-/* Exercises SetIntersect on two bags of (val1, val2) int tuples taken from the same input row. */
-data = LOAD 'input' AS (B1:bag{T:tuple(val1:int,val2:int)},B2:bag{T:tuple(val1:int,val2:int)});
-
-data2 = FOREACH data GENERATE SetIntersect(B1,B2);
-
-STORE data2 INTO 'output';

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/sets/setUnionTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/sets/setUnionTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/sets/setUnionTest.pig
deleted file mode 100644
index a5e1c4d..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/sets/setUnionTest.pig
+++ /dev/null
@@ -1,13 +0,0 @@
-register $JAR_PATH
-
-define SetUnion datafu.pig.bags.sets.SetUnion();
-/* Exercises SetUnion on two bags of (val1, val2) int tuples taken from the same input row; input and result are both dumped. */
-data = LOAD 'input' AS (B1:bag{T:tuple(val1:int,val2:int)},B2:bag{T:tuple(val1:int,val2:int)});
-
-dump data
-
-data2 = FOREACH data GENERATE SetUnion(B1,B2);
-
-dump data2
-
-STORE data2 INTO 'output';

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/unorderedPairsTests.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/unorderedPairsTests.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/unorderedPairsTests.pig
deleted file mode 100644
index 1bf68bd..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/unorderedPairsTests.pig
+++ /dev/null
@@ -1,16 +0,0 @@
-register $JAR_PATH
-
-define UnorderedPairs datafu.pig.bags.UnorderedPairs();
-/* Exercises UnorderedPairs on a bag of single-int tuples and stores the pairs as sorted rows. */
-data = LOAD 'input' AS (B: bag {T: tuple(v:INT)});
-
-data2 = FOREACH data GENERATE UnorderedPairs(B) as P;
-/* Flatten the bag of pairs, then flatten the two members elem1 and elem2 of each pair. */
-data3 = FOREACH data2 GENERATE FLATTEN(P);
-
-data4 = FOREACH data3 GENERATE FLATTEN(elem1), FLATTEN(elem2);
-/* Order by both columns so the stored output has a fixed row order. */
-data5 = ORDER data4 BY $0, $1;
-
-STORE data5 INTO 'output';
-

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/unorderedPairsTests2.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/unorderedPairsTests2.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/unorderedPairsTests2.pig
deleted file mode 100644
index aada011..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/bags/unorderedPairsTests2.pig
+++ /dev/null
@@ -1,12 +0,0 @@
-register $JAR_PATH
-
-define UnorderedPairs datafu.pig.bags.UnorderedPairs();
-/* Exercises UnorderedPairs while carrying an extra int column A alongside the bag. */
-data = LOAD 'input' AS (A:int, B: bag {T: tuple(v:INT)});
-
-data2 = FOREACH data GENERATE A, UnorderedPairs(B) as P;
-/* Flatten the bag of pairs; A is kept on every resulting row. No ORDER is applied before the store. */
-data3 = FOREACH data2 GENERATE A, FLATTEN(P);
-
-STORE data3 INTO 'output';
-

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/date/timeCountPageViewsTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/date/timeCountPageViewsTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/date/timeCountPageViewsTest.pig
deleted file mode 100644
index 1e23a41..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/date/timeCountPageViewsTest.pig
+++ /dev/null
@@ -1,13 +0,0 @@
-register $JAR_PATH
-
-define TimeCount datafu.pig.date.TimeCount('$TIME_WINDOW');
-/* Exercises TimeCount, constructed from the TIME_WINDOW script parameter, on page views grouped per (user_id, page_id). */
-views = LOAD 'input' AS (user_id:int, page_id:int, time:chararray);
-
-views_grouped = GROUP views BY (user_id, page_id);
-view_counts = foreach views_grouped {
-  views = order views by time;
-  generate group.user_id as user_id, group.page_id as page_id, TimeCount(views.(time)) as count;
-}
-
-STORE view_counts INTO 'output';

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/geo/haversineTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/geo/haversineTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/geo/haversineTest.pig
deleted file mode 100644
index e52cc1f..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/geo/haversineTest.pig
+++ /dev/null
@@ -1,9 +0,0 @@
-register $JAR_PATH
-
-define HaversineDistInMiles datafu.pig.geo.HaversineDistInMiles();
-/* Exercises HaversineDistInMiles: every input row holds two (lat, lng) pairs as doubles. */
-data = LOAD 'input' AS (lat1:double,lng1:double,lat2:double,lng2:double);
-/* Only the UDF result is stored. */
-data2 = FOREACH data GENERATE HaversineDistInMiles(lat1,lng1,lat2,lng2);
-
-STORE data2 INTO 'output';

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/hash/md5Base64Test.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/hash/md5Base64Test.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/hash/md5Base64Test.pig
deleted file mode 100644
index 5a12c2e..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/hash/md5Base64Test.pig
+++ /dev/null
@@ -1,9 +0,0 @@
-register $JAR_PATH
-
-define MD5 datafu.pig.hash.MD5Base64();
-/* Exercises the MD5Base64 UDF, bound here to the short name MD5, on a single chararray column. */
-data_in = LOAD 'input' as (val:chararray);
-/* The UDF result replaces val in the stored rows. */
-data_out = FOREACH data_in GENERATE MD5(val) as val;
-
-STORE data_out INTO 'output';
\ No newline at end of file

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/hash/md5Test.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/hash/md5Test.pig 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/hash/md5Test.pig
deleted file mode 100644
index 3fc6aaa..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/hash/md5Test.pig
+++ /dev/null
@@ -1,9 +0,0 @@
-register $JAR_PATH
-
-define MD5 datafu.pig.hash.MD5();
-/* Exercises the MD5 UDF on a single chararray column. */
-data_in = LOAD 'input' as (val:chararray);
-/* The UDF result replaces val in the stored rows. */
-data_out = FOREACH data_in GENERATE MD5(val) as val;
-
-STORE data_out INTO 'output';
\ No newline at end of file

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/linkanalysis/pageRankTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/linkanalysis/pageRankTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/linkanalysis/pageRankTest.pig
deleted file mode 100644
index a0e439c..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/linkanalysis/pageRankTest.pig
+++ /dev/null
@@ -1,25 +0,0 @@
-register $JAR_PATH
-
-/* Need to enable dangling node handling since the Wikipedia example has them,
-   otherwise the ranks won't be right. */
-define PageRank datafu.pig.linkanalysis.PageRank('dangling_nodes','true');
-/* Input is an edge list: one (topic, source, dest, weight) row per edge. */
-data = LOAD 'input' AS (topic:INT,source:INT,dest:INT,weight:DOUBLE);
-/* First grouping: collect the outgoing (dest, weight) edges of every (topic, source) pair. */
-data_grouped = GROUP data by (topic,source);
-
-data_grouped = foreach data_grouped {
-  generate group.topic as topic, group.source as source, data.(dest,weight) as edges;
-};
-/* Second grouping: hand all (source, edges) entries of one topic to PageRank and flatten the result to (source, rank). */
-data_grouped2 = GROUP data_grouped by topic;
-data_grouped2 = foreach data_grouped2 {
-  generate group as topic, FLATTEN(PageRank(data_grouped.(source,edges))) as (source,rank);
-};
-
-data_grouped3 = FOREACH data_grouped2 GENERATE
-  topic,
-  source,
-  rank;
-  
-STORE data_grouped3 INTO 'output';

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/numbers/randomIntRangeTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/numbers/randomIntRangeTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/numbers/randomIntRangeTest.pig
deleted file mode 100644
index 3ca45c7..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/numbers/randomIntRangeTest.pig
+++ /dev/null
@@ -1,8 +0,0 @@
-register $JAR_PATH
-
-define RandInt datafu.pig.numbers.RandInt();
-/* Exercises RandInt; its two arguments come from the MIN and MAX script parameters. */
-data = LOAD 'input' AS (key:INT);
-data2 = FOREACH data GENERATE key, RandInt($MIN,$MAX) as val;
-
-STORE data2 INTO 'output';

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/sessions/sessionizeTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/sessions/sessionizeTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/sessions/sessionizeTest.pig
deleted file mode 100644
index 6a4939e..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/sessions/sessionizeTest.pig
+++ /dev/null
@@ -1,17 +0,0 @@
-register $JAR_PATH
-
-define Sessionize datafu.pig.sessions.Sessionize('$TIME_WINDOW');
-/* Exercises Sessionize, constructed from the TIME_WINDOW script parameter, on views grouped per user and ordered by time. */
-views = LOAD 'input' AS (time:chararray, user_id:int, value:int);
-
-views_grouped = GROUP views BY user_id;
-view_counts = FOREACH views_grouped {
-  views = ORDER views BY time;
-  GENERATE flatten(Sessionize(views)) as (time,user_id,value,session_id);
-}
-/* Regroup by user and session, then keep the largest value seen in each session. */
-max_value = GROUP view_counts BY (user_id, session_id);
-
-max_value = FOREACH max_value GENERATE group.user_id, MAX(view_counts.value) AS val;
-
-STORE max_value INTO 'output';

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/markovPairDefault.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/markovPairDefault.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/markovPairDefault.pig
deleted file mode 100644
index a121cb1..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/markovPairDefault.pig
+++ /dev/null
@@ -1,14 +0,0 @@
-register $JAR_PATH
-
-define markovPairs datafu.pig.stats.MarkovPairs();
-/* Exercises MarkovPairs with its no-argument constructor; the load schema is supplied through the schema script parameter. */
-data = load 'input' as $schema;
-describe data;
-/* Re-expose the field named data as orig_bag before applying the UDF. */
-data_out1 = foreach data generate data as orig_bag;
-describe data_out1;
-
-data_out = foreach data_out1 generate markovPairs(orig_bag) as markov_bag;
-describe data_out;
-
-store data_out into 'output';
\ No newline at end of file

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/markovPairLookahead.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/markovPairLookahead.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/markovPairLookahead.pig
deleted file mode 100644
index 269a1bc..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/markovPairLookahead.pig
+++ /dev/null
@@ -1,14 +0,0 @@
-register $JAR_PATH
-
-define markovPairs datafu.pig.stats.MarkovPairs('$lookahead');
-/* Exercises MarkovPairs constructed from the lookahead script parameter; the load schema is supplied through the schema script parameter. */
-data = load 'input' as $schema;
-describe data;
-/* Re-expose the field named data as orig_bag before applying the UDF. */
-data_out1 = foreach data generate data as orig_bag;
-describe data_out1;
-
-data_out = foreach data_out1 generate markovPairs(orig_bag) as markov_bag;
-describe data_out;
-
-store data_out into 'output';
\ No newline at end of file

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/medianTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/medianTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/medianTest.pig
deleted file mode 100644
index 0a439ce..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/medianTest.pig
+++ /dev/null
@@ -1,21 +0,0 @@
-register $JAR_PATH
-
-define Median datafu.pig.stats.Median();
-/* Exercises the Median UDF on a single int column. */
-data_in = LOAD 'input' as (val:int);
-
-/*describe data_in;*/
-/* GROUP ... ALL puts every row into one group, so the UDF sees the whole column. */
-data_out = GROUP data_in ALL;
-
-/*describe data_out;*/
-/* The bag is ordered by val inside the nested block before it is passed to the UDF. */
-data_out = FOREACH data_out {
-  sorted = ORDER data_in BY val;
-  GENERATE Median(sorted) as medians;
-}
-data_out = FOREACH data_out GENERATE FLATTEN(medians);
-
-/*describe data_out;*/
-
-STORE data_out into 'output';
\ No newline at end of file

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/quantileTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/quantileTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/quantileTest.pig
deleted file mode 100644
index 604d179..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/quantileTest.pig
+++ /dev/null
@@ -1,21 +0,0 @@
-register $JAR_PATH
-
-define Quantile datafu.pig.stats.Quantile($QUANTILES);
-/* Exercises the Quantile UDF on a single int column; its constructor arguments come from the QUANTILES script parameter. */
-data_in = LOAD 'input' as (val:int);
-
-/*describe data_in;*/
-/* GROUP ... ALL puts every row into one group, so the UDF sees the whole column. */
-data_out = GROUP data_in ALL;
-
-/*describe data_out;*/
-/* The bag is ordered by val inside the nested block before it is passed to the UDF. */
-data_out = FOREACH data_out {
-  sorted = ORDER data_in BY val;
-  GENERATE Quantile(sorted) as quantiles;
-}
-data_out = FOREACH data_out GENERATE FLATTEN(quantiles);
-
-/*describe data_out;*/
-
-STORE data_out into 'output';
\ No newline at end of file

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/streamingMedianTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/streamingMedianTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/streamingMedianTest.pig
deleted file mode 100644
index 27d64f3..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/streamingMedianTest.pig
+++ /dev/null
@@ -1,21 +0,0 @@
-register $JAR_PATH
-
-define Median datafu.pig.stats.StreamingMedian();
-/* Exercises the StreamingMedian UDF, bound here to the short name Median, on a single int column. */
-data_in = LOAD 'input' as (val:int);
-
-/*describe data_in;*/
-/* GROUP ... ALL puts every row into one group, so the UDF sees the whole column. */
-data_out = GROUP data_in ALL;
-
-/*describe data_out;*/
-/* The bag is ordered by val inside the nested block before it is passed to the UDF. */
-data_out = FOREACH data_out {
-  sorted = ORDER data_in BY val;
-  GENERATE Median(sorted) as medians;
-}
-data_out = FOREACH data_out GENERATE FLATTEN(medians);
-
-/*describe data_out;*/
-
-STORE data_out into 'output';
\ No newline at end of file

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/streamingQuantileTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/streamingQuantileTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/streamingQuantileTest.pig
deleted file mode 100644
index 51c3bc5..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/streamingQuantileTest.pig
+++ /dev/null
@@ -1,18 +0,0 @@
-register $JAR_PATH
-
-define Quantile datafu.pig.stats.StreamingQuantile($QUANTILES);
-/* Exercises the StreamingQuantile UDF, bound here to the short name Quantile; its constructor arguments come from the QUANTILES script parameter. */
-data_in = LOAD 'input' as (val:int);
-
-/*describe data_in;*/
-/* GROUP ... ALL puts every row into one group, so the UDF sees the whole column. */
-data_out = GROUP data_in ALL;
-
-/*describe data_out;*/
-/* The values are passed as data_in.val directly; this script has no ORDER step. */
-data_out = FOREACH data_out GENERATE Quantile(data_in.val) as quantiles;
-data_out = FOREACH data_out GENERATE FLATTEN(quantiles);
-
-/*describe data_out;*/
-
-STORE data_out into 'output';

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/wilsonBinConfTests.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/wilsonBinConfTests.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/wilsonBinConfTests.pig
deleted file mode 100644
index 19fa466..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/stats/wilsonBinConfTests.pig
+++ /dev/null
@@ -1,11 +0,0 @@
-register $JAR_PATH
-
-define WilsonBinConf datafu.pig.stats.WilsonBinConf('$alpha');
-/* Exercises WilsonBinConf, constructed from the alpha script parameter, on rows of (successes, totals) longs. */
-data = load 'input' as (successes:long, totals:long);
-describe data;
-/* The UDF result is named interval and then flattened into separate columns. */
-data_out = FOREACH data GENERATE WilsonBinConf(successes, totals) as interval;
-data_out = FOREACH data_out GENERATE FLATTEN(interval);
-
-store data_out into 'output';
\ No newline at end of file

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/urls/userAgentTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/urls/userAgentTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/urls/userAgentTest.pig
deleted file mode 100644
index 4548755..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/urls/userAgentTest.pig
+++ /dev/null
@@ -1,8 +0,0 @@
-register $JAR_PATH
-
-define UserAgentClassify datafu.pig.urls.UserAgentClassify();
-
-data = load 'input' as (usr_agent:chararray);
-data_out = foreach data generate UserAgentClassify(usr_agent) as class;
-describe data_out;
-store data_out into 'output';
\ No newline at end of file

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/util/assertWithMessageTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/util/assertWithMessageTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/util/assertWithMessageTest.pig
deleted file mode 100644
index f240987..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/util/assertWithMessageTest.pig
+++ /dev/null
@@ -1,10 +0,0 @@
-register $JAR_PATH
-
-define ASSERT datafu.pig.util.ASSERT();
-
-data = LOAD 'input' AS (val:INT);
-
-data2 = FILTER data BY ASSERT(val,'assertion appears to have failed, doh!');
-
-STORE data2 INTO 'output';
-

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/util/assertWithoutMessageTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/util/assertWithoutMessageTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/util/assertWithoutMessageTest.pig
deleted file mode 100644
index c6368e7..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/util/assertWithoutMessageTest.pig
+++ /dev/null
@@ -1,10 +0,0 @@
-register $JAR_PATH
-
-define ASSERT datafu.pig.util.ASSERT();
-
-data = LOAD 'input' AS (val:INT);
-
-data2 = FILTER data BY ASSERT(val);
-
-STORE data2 INTO 'output';
-

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/util/intToBoolTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/util/intToBoolTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/util/intToBoolTest.pig
deleted file mode 100644
index 18cda42..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/util/intToBoolTest.pig
+++ /dev/null
@@ -1,10 +0,0 @@
-register $JAR_PATH
-
-define IntToBool datafu.pig.util.IntToBool();
-
-data = LOAD 'input' AS (val:INT);
-
-data2 = FOREACH data GENERATE IntToBool(val);
-
-STORE data2 INTO 'output';
-

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/util/intToBoolToIntTest.pig
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/util/intToBoolToIntTest.pig
 
b/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/util/intToBoolToIntTest.pig
deleted file mode 100644
index 82d3ee0..0000000
--- 
a/bigtop-tests/test-artifacts/datafu/src/main/resources/datafu/util/intToBoolToIntTest.pig
+++ /dev/null
@@ -1,12 +0,0 @@
-register $JAR_PATH
-
-define IntToBool datafu.pig.util.IntToBool();
-define BoolToInt datafu.pig.util.BoolToInt();
-
-data = LOAD 'input' AS (val:INT);
-
-data2 = FOREACH data GENERATE IntToBool(val) as val;
-data3 = FOREACH data2 GENERATE BoolToInt(val) as val;
-
-STORE data3 INTO 'output';
-

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/package/src/main/resources/package_data.xml
----------------------------------------------------------------------
diff --git 
a/bigtop-tests/test-artifacts/package/src/main/resources/package_data.xml 
b/bigtop-tests/test-artifacts/package/src/main/resources/package_data.xml
index 19365e8..d9afcb3 100644
--- a/bigtop-tests/test-artifacts/package/src/main/resources/package_data.xml
+++ b/bigtop-tests/test-artifacts/package/src/main/resources/package_data.xml
@@ -446,25 +446,6 @@ easy to test, and efficient to run.</description>
       <hive-hcatalog>/self</hive-hcatalog>
     </deps>
   </hive-hcatalog-server>
-  <pig-udf-datafu>
-    <metadata>
-      <summary>A collection of user-defined functions for Hadoop and 
Pig.</summary>
-      <description> DataFu is a collection of user-defined functions for 
working with large-scale
- data in Hadoop and Pig. This library was born out of the need for a stable,
- well-tested library of UDFs for data mining and statistics. It is used
- at LinkedIn in many of our off-line workflows for data derived products like
- "People You May Know" and "Skills".
-
- It contains functions for: PageRank, Quantiles (median), variance, 
Sessionization,
- Convenience bag functions (e.g., set operations, enumerating bags, etc),
- Convenience utility functions (e.g., assertions, easier writing of EvalFuncs)
- and more...</description>
-      <url>https://github.com/linkedin/datafu</url>
-    </metadata>
-    <deps>
-      <pig/>
-    </deps>
-  </pig-udf-datafu>
   <hive-jdbc>
     <metadata>
       <summary>Provides libraries necessary to connect to Apache Hive via 
JDBC</summary>

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-artifacts/pom.xml
----------------------------------------------------------------------
diff --git a/bigtop-tests/test-artifacts/pom.xml 
b/bigtop-tests/test-artifacts/pom.xml
index f8dea78..b0af51e 100644
--- a/bigtop-tests/test-artifacts/pom.xml
+++ b/bigtop-tests/test-artifacts/pom.xml
@@ -45,7 +45,6 @@
     <module>hue</module>
     <module>solr</module>
     <module>crunch</module>
-    <module>datafu</module>
     <module>longevity</module>
     <module>hcatalog</module>
     <module>spark</module>

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop-tests/test-execution/smokes/datafu/pom.xml
----------------------------------------------------------------------
diff --git a/bigtop-tests/test-execution/smokes/datafu/pom.xml 
b/bigtop-tests/test-execution/smokes/datafu/pom.xml
deleted file mode 100644
index 45b007f..0000000
--- a/bigtop-tests/test-execution/smokes/datafu/pom.xml
+++ /dev/null
@@ -1,140 +0,0 @@
-<?xml version="1.0" encoding="UTF-8"?>
-<!--
-   Licensed to the Apache Software Foundation (ASF) under one or more
-   contributor license agreements.  See the NOTICE file distributed with
-   this work for additional information regarding copyright ownership.
-   The ASF licenses this file to You under the Apache License, Version 2.0
-   (the "License"); you may not use this file except in compliance with
-   the License.  You may obtain a copy of the License at
-
-       http://www.apache.org/licenses/LICENSE-2.0
-
-   Unless required by applicable law or agreed to in writing, software
-   distributed under the License is distributed on an "AS IS" BASIS,
-   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-   See the License for the specific language governing permissions and
-   limitations under the License.
--->
-<project xmlns="http://maven.apache.org/POM/4.0.0"
-         xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
-         xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 
http://maven.apache.org/maven-v4_0_0.xsd">
-  <modelVersion>4.0.0</modelVersion>
-
-  <parent>
-    <groupId>org.apache.bigtop.itest</groupId>
-    <artifactId>smoke-tests</artifactId>
-    <version>1.3.1-SNAPSHOT</version>
-    <relativePath>../pom.xml</relativePath>
-  </parent>
-
-  <groupId>org.apache.bigtop.itest</groupId>
-  <artifactId>datafu-smoke-execution</artifactId>
-  <version>1.3.1-SNAPSHOT</version>
-  <name>datafu smoke test execution</name>
-
-  <properties>
-    
<org.apache.maven-dependency-plugin.groupId>org.apache.bigtop.itest</org.apache.maven-dependency-plugin.groupId>
-    
<org.apache.maven-dependency-plugin.artifactId>datafu-smoke</org.apache.maven-dependency-plugin.artifactId>
-    
<org.apache.maven-dependency-plugin.version>${project.version}</org.apache.maven-dependency-plugin.version>
-    
<org.apache.maven-dependency-plugin.output>${project.build.directory}</org.apache.maven-dependency-plugin.output>
-    
<org.apache.maven-dependency-plugin.type>jar</org.apache.maven-dependency-plugin.type>
-    
<org.apache.maven-failsafe-plugin.testInclude>**/*Tests*</org.apache.maven-failsafe-plugin.testInclude>
-
-    <HADOOP_MAPRED_HOME>${env.HADOOP_MAPRED_HOME}</HADOOP_MAPRED_HOME>
-    <HADOOP_CONF_DIR>${env.HADOOP_CONF_DIR}</HADOOP_CONF_DIR>
-    <PIG_HOME>${env.PIG_HOME}</PIG_HOME>
-  </properties>
-
-  <dependencies>
-    <dependency>
-      <groupId>${org.apache.maven-dependency-plugin.groupId}</groupId>
-      <artifactId>${org.apache.maven-dependency-plugin.artifactId}</artifactId>
-      <version>${project.version}</version>
-    </dependency>
-  </dependencies>
-
-  <build>
-    <plugins>
-      <plugin>
-        <groupId>org.apache.maven.plugins</groupId>
-        <artifactId>maven-install-plugin</artifactId>
-        <executions>
-        <execution>
-          <phase>initialize</phase>
-          <goals>
-            <goal>install-file</goal>
-          </goals>
-        </execution>
-        </executions>
-        <configuration>
-          <file>${PIG_HOME}/pig.jar</file>
-          <groupId>org.apache.pig</groupId>
-          <artifactId>pig</artifactId>
-          <version>${pig.version}</version>
-          <packaging>jar</packaging>
-        </configuration>
-      </plugin>
-
-
-      <plugin>
-        <groupId>org.apache.maven.plugins</groupId>
-        <artifactId>maven-dependency-plugin</artifactId>
-      </plugin>
-
-      <plugin>
-        <groupId>org.apache.maven.plugins</groupId>
-        <artifactId>maven-enforcer-plugin</artifactId>
-        <version>1.0</version>
-        <executions>
-          <execution>
-            <id>enforce-property</id>
-            <goals>
-              <goal>enforce</goal>
-            </goals>
-            <configuration>
-              <rules>
-                <requireProperty>
-                  <property>HADOOP_MAPRED_HOME</property>
-                  <message>HADOOP_MAPRED_HOME env. variable has to be 
set</message>
-                </requireProperty>
-                <requireProperty>
-                  <property>HADOOP_CONF_DIR</property>
-                  <message>HADOOP_CONF_DIR env. variable has to be 
set</message>
-                </requireProperty>
-                <requireProperty>
-                  <property>PIG_HOME</property>
-                  <message>PIG_HOME env. variable has to be set</message>
-                </requireProperty>
-              </rules>
-              <fail>true</fail>
-            </configuration>
-          </execution>
-        </executions>
-      </plugin>
-
-      <plugin>
-        <groupId>org.apache.maven.plugins</groupId>
-        <artifactId>maven-failsafe-plugin</artifactId>
-        <version>2.11</version>
-        <configuration>
-          <forkMode>always</forkMode>
-          <argLine>-Dpigunit.exectype.cluster=true</argLine>
-          <additionalClasspathElements>
-            
<additionalClasspathElement>${HADOOP_CONF_DIR}</additionalClasspathElement>
-          </additionalClasspathElements>
-          <systemPropertyVariables>
-            <datafu.jar.dir>${PIG_HOME}</datafu.jar.dir>
-          </systemPropertyVariables>
-        </configuration>
-
-        <!-- Disabling for now: configuration>
-          <testSourceDirectory>src</testSourceDirectory>
-          <testClassesDirectory>target/classes</testClassesDirectory>
-          <skipTests>false</skipTests>
-          <testFailureIgnore>false</testFailureIgnore>
-          <argLine>-Dsun.lang.ClassLoader.allowArraySyntax=true 
-Djava.endorsed.dirs=${project.build.testOutputDirectory}/endorsed</argLine>
-        </configuration -->
-      </plugin>
-    </plugins>
-  </build>
-</project>

http://git-wip-us.apache.org/repos/asf/bigtop/blob/4cee56bd/bigtop.bom
----------------------------------------------------------------------
diff --git a/bigtop.bom b/bigtop.bom
index 02e5b96..3664f7f 100644
--- a/bigtop.bom
+++ b/bigtop.bom
@@ -252,17 +252,6 @@ bigtop {
                 site = "${apache.APACHE_MIRROR}/${download_path}"
                 archive = "${apache.APACHE_ARCHIVE}/${download_path}" }
     }
-    'datafu' {
-      name    = 'datafu'
-      pkg     = 'pig-udf-datafu'
-      relNotes = 'Pig UDF Datafu'
-      version { base = '1.3.0'; pkg = base; release = 1 }
-      tarball { destination = "$name-${version.base}.tar.gz"
-                source      = 
"apache-$name-incubating-sources-${version.base}.tgz" }
-      url     { download_path = 
"incubator/$name/apache-$name-incubating-${version.base}"
-                site = "${apache.APACHE_MIRROR}/${download_path}"
-                archive = "${apache.APACHE_ARCHIVE}/${download_path}" }
-    }
     'solr' {
       name    = 'solr'
       relNotes = 'Apache Solr'

Reply via email to