svn commit: r955682 - in /hadoop/pig/trunk: ./ src/org/apache/pig/backend/hadoop/executionengine/mapReduceLayer/ src/org/apache/pig/backend/hadoop/executionengine/physicalLayer/ src/org/apache/pig/dat

2010-06-17 Thread dvryaboy
Author: dvryaboy
Date: Thu Jun 17 17:24:00 2010
New Revision: 955682

URL: http://svn.apache.org/viewvc?rev=955682&view=rev
Log:
PIG-1428: Make a StatusReporter singleton available for incrementing counters 
(dvryaboy)

Modified:
hadoop/pig/trunk/CHANGES.txt

hadoop/pig/trunk/src/org/apache/pig/backend/hadoop/executionengine/mapReduceLayer/MapReducePOStoreImpl.java

hadoop/pig/trunk/src/org/apache/pig/backend/hadoop/executionengine/mapReduceLayer/PigCombiner.java

hadoop/pig/trunk/src/org/apache/pig/backend/hadoop/executionengine/mapReduceLayer/PigHadoopLogger.java

hadoop/pig/trunk/src/org/apache/pig/backend/hadoop/executionengine/mapReduceLayer/PigMapBase.java

hadoop/pig/trunk/src/org/apache/pig/backend/hadoop/executionengine/mapReduceLayer/PigMapReduce.java

hadoop/pig/trunk/src/org/apache/pig/backend/hadoop/executionengine/physicalLayer/PigLogger.java
hadoop/pig/trunk/src/org/apache/pig/data/DefaultAbstractBag.java
hadoop/pig/trunk/src/org/apache/pig/tools/pigstats/PigStatusReporter.java

Modified: hadoop/pig/trunk/CHANGES.txt
URL: 
http://svn.apache.org/viewvc/hadoop/pig/trunk/CHANGES.txt?rev=955682&r1=955681&r2=955682&view=diff
==
--- hadoop/pig/trunk/CHANGES.txt (original)
+++ hadoop/pig/trunk/CHANGES.txt Thu Jun 17 17:24:00 2010
@@ -24,6 +24,8 @@ INCOMPATIBLE CHANGES
 
 IMPROVEMENTS
 
+PIG-1428: Make a StatusReporter singleton available for incrementing counters (dvryaboy)
+
 PIG-972: Make describe work with nested foreach (aniket486 via daijy)
 
 PIG-1438: [Performance] MultiQueryOptimizer should also merge DISTINCT jobs

Modified: 
hadoop/pig/trunk/src/org/apache/pig/backend/hadoop/executionengine/mapReduceLayer/MapReducePOStoreImpl.java
URL: 
http://svn.apache.org/viewvc/hadoop/pig/trunk/src/org/apache/pig/backend/hadoop/executionengine/mapReduceLayer/MapReducePOStoreImpl.java?rev=955682&r1=955681&r2=955682&view=diff
==
--- 
hadoop/pig/trunk/src/org/apache/pig/backend/hadoop/executionengine/mapReduceLayer/MapReducePOStoreImpl.java
 (original)
+++ 
hadoop/pig/trunk/src/org/apache/pig/backend/hadoop/executionengine/mapReduceLayer/MapReducePOStoreImpl.java
 Thu Jun 17 17:24:00 2010
@@ -51,8 +51,8 @@ public class MapReducePOStoreImpl extend
 // configuration below (like setting the output location) do
 // not affect the caller's copy
 Configuration outputConf = new Configuration(context.getConfiguration());
-
-reporter = new PigStatusReporter(context);
+PigStatusReporter.setContext(context);
+reporter = PigStatusReporter.getInstance();

 // make a copy of the Context to use here - since in the same
 // task (map or reduce) we could have multiple stores, we should

Modified: 
hadoop/pig/trunk/src/org/apache/pig/backend/hadoop/executionengine/mapReduceLayer/PigCombiner.java
URL: 
http://svn.apache.org/viewvc/hadoop/pig/trunk/src/org/apache/pig/backend/hadoop/executionengine/mapReduceLayer/PigCombiner.java?rev=955682&r1=955681&r2=955682&view=diff
==
--- 
hadoop/pig/trunk/src/org/apache/pig/backend/hadoop/executionengine/mapReduceLayer/PigCombiner.java
 (original)
+++ 
hadoop/pig/trunk/src/org/apache/pig/backend/hadoop/executionengine/mapReduceLayer/PigCombiner.java
 Thu Jun 17 17:24:00 2010
@@ -135,7 +135,8 @@ public class PigCombiner {
 
 PigHadoopLogger pigHadoopLogger = PigHadoopLogger.getInstance();
 pigHadoopLogger.setAggregate(aggregateWarning);
-pigHadoopLogger.setReporter(new PigStatusReporter(context));
+PigStatusReporter.setContext(context);
+pigHadoopLogger.setReporter(PigStatusReporter.getInstance());
 
 PhysicalOperator.setPigLogger(pigHadoopLogger);
 }

Modified: 
hadoop/pig/trunk/src/org/apache/pig/backend/hadoop/executionengine/mapReduceLayer/PigHadoopLogger.java
URL: 
http://svn.apache.org/viewvc/hadoop/pig/trunk/src/org/apache/pig/backend/hadoop/executionengine/mapReduceLayer/PigHadoopLogger.java?rev=955682&r1=955681&r2=955682&view=diff
==
--- 
hadoop/pig/trunk/src/org/apache/pig/backend/hadoop/executionengine/mapReduceLayer/PigHadoopLogger.java
 (original)
+++ 
hadoop/pig/trunk/src/org/apache/pig/backend/hadoop/executionengine/mapReduceLayer/PigHadoopLogger.java
 Thu Jun 17 17:24:00 2010
@@ -19,8 +19,6 @@ package org.apache.pig.backend.hadoop.ex
 
 import org.apache.commons.logging.Log;
 import org.apache.commons.logging.LogFactory;
-import org.apache.hadoop.mapreduce.Counter;
-import org.apache.hadoop.mapreduce.TaskInputOutputContext;
 import org.apache.pig.backend.hadoop.executionengine.physicalLayer.PigLogger;
 import org.apache.pig.tools.pigstats.Pig

svn commit: r955696 - in /hadoop/pig/trunk: CHANGES.txt build.xml

2010-06-17 Thread daijy
Author: daijy
Date: Thu Jun 17 18:21:28 2010
New Revision: 955696

URL: http://svn.apache.org/viewvc?rev=955696&view=rev
Log:
PIG-1450: TestAlgebraicEvalLocal failures due to OOM

Modified:
hadoop/pig/trunk/CHANGES.txt
hadoop/pig/trunk/build.xml

Modified: hadoop/pig/trunk/CHANGES.txt
URL: 
http://svn.apache.org/viewvc/hadoop/pig/trunk/CHANGES.txt?rev=955696&r1=955695&r2=955696&view=diff
==
--- hadoop/pig/trunk/CHANGES.txt (original)
+++ hadoop/pig/trunk/CHANGES.txt Thu Jun 17 18:21:28 2010
@@ -86,6 +86,8 @@ PIG-1309: Map-side Cogroup (ashutoshc)
 
 BUG FIXES
 
+PIG-1450: TestAlgebraicEvalLocal failures due to OOM (daijy)
+
 PIG-1433: pig should create success file if
 mapreduce.fileoutputcommitter.marksuccessfuljobs is true (pradeepkth)
 

Modified: hadoop/pig/trunk/build.xml
URL: 
http://svn.apache.org/viewvc/hadoop/pig/trunk/build.xml?rev=955696&r1=955695&r2=955696&view=diff
==
--- hadoop/pig/trunk/build.xml (original)
+++ hadoop/pig/trunk/build.xml Thu Jun 17 18:21:28 2010
@@ -553,7 +553,7 @@
 
 
 
-
+
 
 
 




svn commit: r955701 - in /hadoop/pig/trunk/contrib/zebra: CHANGES.txt build.xml

2010-06-17 Thread yanz
Author: yanz
Date: Thu Jun 17 18:44:31 2010
New Revision: 955701

URL: http://svn.apache.org/viewvc?rev=955701&view=rev
Log:
PIG-1455 Addition of test-unit as an ant target (yanz)

Modified:
hadoop/pig/trunk/contrib/zebra/CHANGES.txt
hadoop/pig/trunk/contrib/zebra/build.xml

Modified: hadoop/pig/trunk/contrib/zebra/CHANGES.txt
URL: 
http://svn.apache.org/viewvc/hadoop/pig/trunk/contrib/zebra/CHANGES.txt?rev=955701&r1=955700&r2=955701&view=diff
==
--- hadoop/pig/trunk/contrib/zebra/CHANGES.txt (original)
+++ hadoop/pig/trunk/contrib/zebra/CHANGES.txt Thu Jun 17 18:44:31 2010
@@ -4,6 +4,8 @@ Trunk (unreleased changes)
 
   INCOMPATIBLE CHANGES
 
+PIG-1455 Addition of test-unit as an ant target (yanz)
+
 PIG-1451 Change the build.test property in build to test.build.dir to be 
consistent with PIG (yanz)
 
 PIG-1444 Addition of test-smoke ant target (gauravj via yanz)

Modified: hadoop/pig/trunk/contrib/zebra/build.xml
URL: 
http://svn.apache.org/viewvc/hadoop/pig/trunk/contrib/zebra/build.xml?rev=955701&r1=955700&r2=955701&view=diff
==
--- hadoop/pig/trunk/contrib/zebra/build.xml (original)
+++ hadoop/pig/trunk/contrib/zebra/build.xml Thu Jun 17 18:44:31 2010
@@ -176,6 +176,49 @@ to call at top-level: ant deploy-contrib
 Tests failed!
   
 
+  
+
+
+
+
+
+
+  
+  
+  
+  
+  
+   
+ 
+  
+  
+  
+  
+  
+   
+  
+  
+
+  
+
+  
+  
+
+  
+
+
+
+Tests failed!
+  
   
   
   




svn commit: r955702 - in /hadoop/pig/branches/branch-0.7/contrib/zebra: CHANGES.txt build.xml

2010-06-17 Thread yanz
Author: yanz
Date: Thu Jun 17 18:45:27 2010
New Revision: 955702

URL: http://svn.apache.org/viewvc?rev=955702&view=rev
Log:
PIG-1455 Addition of test-unit as an ant target (yanz)

Modified:
hadoop/pig/branches/branch-0.7/contrib/zebra/CHANGES.txt
hadoop/pig/branches/branch-0.7/contrib/zebra/build.xml

Modified: hadoop/pig/branches/branch-0.7/contrib/zebra/CHANGES.txt
URL: 
http://svn.apache.org/viewvc/hadoop/pig/branches/branch-0.7/contrib/zebra/CHANGES.txt?rev=955702&r1=955701&r2=955702&view=diff
==
--- hadoop/pig/branches/branch-0.7/contrib/zebra/CHANGES.txt (original)
+++ hadoop/pig/branches/branch-0.7/contrib/zebra/CHANGES.txt Thu Jun 17 
18:45:27 2010
@@ -4,6 +4,8 @@ Trunk (unreleased changes)
 
   INCOMPATIBLE CHANGES
 
+PIG-1455 Addition of test-unit as an ant target (yanz)
+
 PIG-1451 Change the build.test property in build to test.build.dir to be 
consistent with PIG (yanz)
 
 PIG-1444 Addition of test-smoke ant target (gauravj via yanz)

Modified: hadoop/pig/branches/branch-0.7/contrib/zebra/build.xml
URL: 
http://svn.apache.org/viewvc/hadoop/pig/branches/branch-0.7/contrib/zebra/build.xml?rev=955702&r1=955701&r2=955702&view=diff
==
--- hadoop/pig/branches/branch-0.7/contrib/zebra/build.xml (original)
+++ hadoop/pig/branches/branch-0.7/contrib/zebra/build.xml Thu Jun 17 18:45:27 
2010
@@ -176,6 +176,49 @@ to call at top-level: ant deploy-contrib
 Tests failed!
   
 
+  
+
+
+
+
+
+
+  
+  
+  
+  
+  
+   
+ 
+  
+  
+  
+  
+  
+   
+  
+  
+
+  
+
+  
+  
+
+  
+
+
+
+Tests failed!
+  
   
   
   




svn commit: r955703 - in /hadoop/pig/branches/branch-0.6/contrib/zebra: CHANGES.txt build.xml

2010-06-17 Thread yanz
Author: yanz
Date: Thu Jun 17 18:46:24 2010
New Revision: 955703

URL: http://svn.apache.org/viewvc?rev=955703&view=rev
Log:
PIG-1455 Addition of test-unit as an ant target (yanz)

Modified:
hadoop/pig/branches/branch-0.6/contrib/zebra/CHANGES.txt
hadoop/pig/branches/branch-0.6/contrib/zebra/build.xml

Modified: hadoop/pig/branches/branch-0.6/contrib/zebra/CHANGES.txt
URL: 
http://svn.apache.org/viewvc/hadoop/pig/branches/branch-0.6/contrib/zebra/CHANGES.txt?rev=955703&r1=955702&r2=955703&view=diff
==
--- hadoop/pig/branches/branch-0.6/contrib/zebra/CHANGES.txt (original)
+++ hadoop/pig/branches/branch-0.6/contrib/zebra/CHANGES.txt Thu Jun 17 
18:46:24 2010
@@ -4,6 +4,8 @@ Trunk (unreleased changes)
 
   INCOMPATIBLE CHANGES
 
+PIG-1455 Addition of test-unit as an ant target (yanz)
+
 PIG-1451 Change the build.test property in build to test.build.dir to be 
consistent with PIG (yanz)
 
 PIG-1444 Addition of test-smoke ant target (gauravj via yanz)

Modified: hadoop/pig/branches/branch-0.6/contrib/zebra/build.xml
URL: 
http://svn.apache.org/viewvc/hadoop/pig/branches/branch-0.6/contrib/zebra/build.xml?rev=955703&r1=955702&r2=955703&view=diff
==
--- hadoop/pig/branches/branch-0.6/contrib/zebra/build.xml (original)
+++ hadoop/pig/branches/branch-0.6/contrib/zebra/build.xml Thu Jun 17 18:46:24 
2010
@@ -144,6 +144,49 @@ to call at top-level: ant deploy-contrib
 Tests failed!
   
 
+  
+
+
+
+
+
+
+  
+  
+  
+  
+  
+   
+ 
+  
+  
+  
+  
+  
+   
+  
+  
+
+  
+
+  
+  
+
+  
+
+
+
+Tests failed!
+  
   
   
   




svn commit: r955733 - in /hadoop/pig/trunk: CHANGES.txt build.xml

2010-06-17 Thread daijy
Author: daijy
Date: Thu Jun 17 20:43:41 2010
New Revision: 955733

URL: http://svn.apache.org/viewvc?rev=955733&view=rev
Log:
PIG-1457: Pig will run complete zebra test even we give -Dtestcase=xxx

Modified:
hadoop/pig/trunk/CHANGES.txt
hadoop/pig/trunk/build.xml

Modified: hadoop/pig/trunk/CHANGES.txt
URL: 
http://svn.apache.org/viewvc/hadoop/pig/trunk/CHANGES.txt?rev=955733&r1=955732&r2=955733&view=diff
==
--- hadoop/pig/trunk/CHANGES.txt (original)
+++ hadoop/pig/trunk/CHANGES.txt Thu Jun 17 20:43:41 2010
@@ -86,6 +86,8 @@ PIG-1309: Map-side Cogroup (ashutoshc)
 
 BUG FIXES
 
+PIG-1457: Pig will run complete zebra test even we give -Dtestcase=xxx (daijy)
+
 PIG-1450: TestAlgebraicEvalLocal failures due to OOM (daijy)
 
 PIG-1433: pig should create success file if

Modified: hadoop/pig/trunk/build.xml
URL: 
http://svn.apache.org/viewvc/hadoop/pig/trunk/build.xml?rev=955733&r1=955732&r2=955733&view=diff
==
--- hadoop/pig/trunk/build.xml (original)
+++ hadoop/pig/trunk/build.xml Thu Jun 17 20:43:41 2010
@@ -612,9 +612,13 @@
 
 

-   
+   
 
 
+
+
+
+
 
 
   




svn commit: r955753 - /hadoop/pig/trunk/src/org/apache/pig/data/DefaultAbstractBag.java

2010-06-17 Thread daijy
Author: daijy
Date: Thu Jun 17 21:34:40 2010
New Revision: 955753

URL: http://svn.apache.org/viewvc?rev=955753&view=rev
Log:
Fix TestDataBag failure for PIG-1428

Modified:
hadoop/pig/trunk/src/org/apache/pig/data/DefaultAbstractBag.java

Modified: hadoop/pig/trunk/src/org/apache/pig/data/DefaultAbstractBag.java
URL: 
http://svn.apache.org/viewvc/hadoop/pig/trunk/src/org/apache/pig/data/DefaultAbstractBag.java?rev=955753&r1=955752&r2=955753&view=diff
==
--- hadoop/pig/trunk/src/org/apache/pig/data/DefaultAbstractBag.java (original)
+++ hadoop/pig/trunk/src/org/apache/pig/data/DefaultAbstractBag.java Thu Jun 17 
21:34:40 2010
@@ -375,7 +375,7 @@ public abstract class DefaultAbstractBag
 
 protected void incSpillCount(Enum counter) {
 PigStatusReporter reporter = PigStatusReporter.getInstance();
-if (reporter != null) {
+if (reporter != null && reporter.getCounter(counter)!=null) {
 reporter.getCounter(counter).increment(1);
 } else {
 PigHadoopLogger.getInstance().warn(this, "Spill counter incremented", counter);




svn commit: r955763 [1/4] - in /hadoop/pig/trunk: CHANGES.txt test/org/apache/pig/test/TestMultiQuery.java test/org/apache/pig/test/TestMultiQueryBasic.java test/org/apache/pig/test/TestMultiQueryComp

2010-06-17 Thread rding
Author: rding
Date: Thu Jun 17 22:05:21 2010
New Revision: 955763

URL: http://svn.apache.org/viewvc?rev=955763&view=rev
Log:
PIG-1456: TestMultiQuery takes a long time to run

Added:
hadoop/pig/trunk/test/org/apache/pig/test/TestMultiQueryBasic.java
hadoop/pig/trunk/test/org/apache/pig/test/TestMultiQueryCompiler.java
Modified:
hadoop/pig/trunk/CHANGES.txt
hadoop/pig/trunk/test/org/apache/pig/test/TestMultiQuery.java

Modified: hadoop/pig/trunk/CHANGES.txt
URL: 
http://svn.apache.org/viewvc/hadoop/pig/trunk/CHANGES.txt?rev=955763&r1=955762&r2=955763&view=diff
==
--- hadoop/pig/trunk/CHANGES.txt (original)
+++ hadoop/pig/trunk/CHANGES.txt Thu Jun 17 22:05:21 2010
@@ -86,6 +86,8 @@ PIG-1309: Map-side Cogroup (ashutoshc)
 
 BUG FIXES
 
+PIG-1456: TestMultiQuery takes a long time to run (rding)
+
 PIG-1457: Pig will run complete zebra test even we give -Dtestcase=xxx (daijy)
 
 PIG-1450: TestAlgebraicEvalLocal failures due to OOM (daijy)




svn commit: r955763 [3/4] - in /hadoop/pig/trunk: CHANGES.txt test/org/apache/pig/test/TestMultiQuery.java test/org/apache/pig/test/TestMultiQueryBasic.java test/org/apache/pig/test/TestMultiQueryComp

2010-06-17 Thread rding
Added: hadoop/pig/trunk/test/org/apache/pig/test/TestMultiQueryBasic.java
URL: 
http://svn.apache.org/viewvc/hadoop/pig/trunk/test/org/apache/pig/test/TestMultiQueryBasic.java?rev=955763&view=auto
==
--- hadoop/pig/trunk/test/org/apache/pig/test/TestMultiQueryBasic.java (added)
+++ hadoop/pig/trunk/test/org/apache/pig/test/TestMultiQueryBasic.java Thu Jun 
17 22:05:21 2010
@@ -0,0 +1,764 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+package org.apache.pig.test;
+
+import static org.junit.Assert.assertEquals;
+import static org.junit.Assert.assertFalse;
+import static org.junit.Assert.assertTrue;
+
+import java.io.File;
+import java.io.FileWriter;
+import java.io.IOException;
+import java.io.PrintWriter;
+import java.io.StringReader;
+import java.util.HashMap;
+import java.util.Iterator;
+import java.util.List;
+import java.util.Map;
+
+import junit.framework.Assert;
+
+import org.apache.hadoop.conf.Configuration;
+import org.apache.hadoop.fs.FileSystem;
+import org.apache.hadoop.fs.Path;
+import org.apache.hadoop.io.WritableComparable;
+import org.apache.hadoop.mapreduce.Job;
+import org.apache.hadoop.mapreduce.JobContext;
+import org.apache.hadoop.mapreduce.OutputCommitter;
+import org.apache.hadoop.mapreduce.OutputFormat;
+import org.apache.hadoop.mapreduce.TaskAttemptContext;
+import org.apache.pig.ExecType;
+import org.apache.pig.LoadFunc;
+import org.apache.pig.PigServer;
+import org.apache.pig.ResourceSchema;
+import org.apache.pig.StoreFunc;
+import org.apache.pig.backend.executionengine.ExecJob;
+import org.apache.pig.data.DataBag;
+import org.apache.pig.data.Tuple;
+import org.apache.pig.impl.io.FileLocalizer;
+import org.apache.pig.tools.grunt.GruntParser;
+import org.junit.After;
+import org.junit.AfterClass;
+import org.junit.Before;
+import org.junit.BeforeClass;
+import org.junit.Test;
+import org.junit.runner.RunWith;
+import org.junit.runners.JUnit4;
+@RunWith(JUnit4.class)
+public class TestMultiQueryBasic {
+
+private static final MiniCluster cluster = MiniCluster.buildCluster();
+
+private PigServer myPig;
+
+@BeforeClass
+public static void setUpBeforeClass() throws IOException {
+Util.copyFromLocalToCluster(cluster,
+"test/org/apache/pig/test/data/passwd", "passwd");
+Util.copyFromLocalToCluster(cluster,
+"test/org/apache/pig/test/data/passwd2", "passwd2");
+}
+
+@AfterClass
+public static void tearDownAfterClass() throws IOException {
+Util.deleteFile(cluster, "passwd");
+Util.deleteFile(cluster, "passwd2");
+cluster.shutDown();
+}
+
+@Before
+public void setUp() throws Exception {
+cluster.setProperty("opt.multiquery", ""+true);
+myPig = new PigServer(ExecType.MAPREDUCE, cluster.getProperties());
+deleteOutputFiles();
+}
+
+@After
+public void tearDown() throws Exception {
+myPig = null;
+}
+
+ 
+@Test
+public void testMultiQueryWithTwoStores2() {
+
+System.out.println("= multi-query with 2 stores (2) =");
+
+try {
+myPig.setBatchOn();
+
+myPig.registerQuery("a = load 'passwd' " +
+"using PigStorage(':') as (uname:chararray, passwd:chararray, uid:int,gid:int);");
+myPig.registerQuery("b = filter a by uid > 5;");
+myPig.registerQuery("store b into '/tmp/output1';");
+myPig.registerQuery("c = group b by gid;");
+myPig.registerQuery("store c into '/tmp/output2';");
+
+List<ExecJob> jobs = myPig.executeBatch();
+assertTrue(jobs.size() == 2);
+
+for (ExecJob job : jobs) {
+assertTrue(job.getStatus() == ExecJob.JOB_STATUS.COMPLETED);
+}
+
+} catch (Exception e) {
+e.printStackTrace();
+Assert.fail();
+} 
+}
+
+@Test
+public void testMultiQueryWithTwoLoads2() {
+
+System.out.println("= multi-query with two loads (2) =");
+
+try {
+myPig.setBatchOn();
+
+myPig.registerQuery("a = load 'passwd'