Author: jbellis
Date: Wed Dec 23 18:56:10 2009
New Revision: 893594
URL: http://svn.apache.org/viewvc?rev=893594&view=rev
Log:
throw out uninteresting rows (those whose tokens fall outside the requested ranges) in anticompaction before collating & reducing.
patch by jbellis and Stu Hood for CASSANDRA-607
Modified:
incubator/cassandra/branches/cassandra-0.5/src/java/org/apache/cassandra/db/ColumnFamilyStore.java
incubator/cassandra/branches/cassandra-0.5/src/java/org/apache/cassandra/io/CompactionIterator.java
incubator/cassandra/branches/cassandra-0.5/src/java/org/apache/cassandra/utils/FBUtilities.java
Modified:
incubator/cassandra/branches/cassandra-0.5/src/java/org/apache/cassandra/db/ColumnFamilyStore.java
URL:
http://svn.apache.org/viewvc/incubator/cassandra/branches/cassandra-0.5/src/java/org/apache/cassandra/db/ColumnFamilyStore.java?rev=893594&r1=893593&r2=893594&view=diff
==============================================================================
--- incubator/cassandra/branches/cassandra-0.5/src/java/org/apache/cassandra/db/ColumnFamilyStore.java (original)
+++ incubator/cassandra/branches/cassandra-0.5/src/java/org/apache/cassandra/db/ColumnFamilyStore.java Wed Dec 23 18:56:10 2009
@@ -53,12 +53,12 @@
import org.apache.commons.lang.ArrayUtils;
import org.apache.commons.collections.IteratorUtils;
import org.apache.commons.collections.PredicateUtils;
+import org.apache.commons.collections.iterators.CollatingIterator;
import org.apache.commons.collections.iterators.FilterIterator;
import org.cliffc.high_scale_lib.NonBlockingHashMap;
-
-import com.google.common.base.Predicate;
import com.google.common.collect.Iterators;
+import com.google.common.base.Predicate;
public final class ColumnFamilyStore implements ColumnFamilyStoreMBean
{
@@ -655,7 +655,6 @@
// if we have too many to compact all at once, compact older ones first -- this avoids
// re-compacting files we just created.
Collections.sort(sstables);
- boolean major = sstables.size() == ssTables_.size();
filesCompacted += doFileCompaction(sstables.subList(0,
Math.min(sstables.size(), maxThreshold)));
}
logger_.debug(filesCompacted + " files compacted");
@@ -812,7 +811,7 @@
logger_.debug("Expected bloom filter size : " +
expectedBloomFilterSize);
SSTableWriter writer = null;
- CompactionIterator ci = new CompactionIterator(sstables,
getDefaultGCBefore(), sstables.size() == ssTables_.size());
+ CompactionIterator ci = new AntiCompactionIterator(sstables, ranges,
getDefaultGCBefore(), sstables.size() == ssTables_.size());
Iterator nni = new FilterIterator(ci,
PredicateUtils.notNullPredicate());
try
@@ -825,17 +824,14 @@
while (nni.hasNext())
{
CompactionIterator.CompactedRow row =
(CompactionIterator.CompactedRow) nni.next();
- if (Range.isTokenInRanges(row.key.token, ranges))
- {
- if (writer == null)
- {
- FileUtils.createDirectory(compactionFileLocation);
- String newFilename = new File(compactionFileLocation,
getTempSSTableFileName()).getAbsolutePath();
- writer = new SSTableWriter(newFilename,
expectedBloomFilterSize, StorageService.getPartitioner());
- }
- writer.append(row.key, row.buffer);
- totalkeysWritten++;
- }
+ if (writer == null)
+ {
+ FileUtils.createDirectory(compactionFileLocation);
+ String newFilename = new File(compactionFileLocation,
getTempSSTableFileName()).getAbsolutePath();
+ writer = new SSTableWriter(newFilename,
expectedBloomFilterSize, StorageService.getPartitioner());
+ }
+ writer.append(row.key, row.buffer);
+ totalkeysWritten++;
}
}
finally
@@ -1599,4 +1595,39 @@
ssTables_.clearUnsafe();
}
+ private static class AntiCompactionIterator extends CompactionIterator
+ {
+ public AntiCompactionIterator(Collection<SSTableReader> sstables,
Collection<Range> ranges, int gcBefore, boolean isMajor)
+ throws IOException
+ {
+ super(getCollatedRangeIterator(sstables, ranges), gcBefore,
isMajor);
+ }
+
+ private static Iterator
getCollatedRangeIterator(Collection<SSTableReader> sstables, final
Collection<Range> ranges)
+ throws IOException
+ {
+ org.apache.commons.collections.Predicate rangesPredicate = new
org.apache.commons.collections.Predicate()
+ {
+ public boolean evaluate(Object row)
+ {
+ return
Range.isTokenInRanges(((IteratingRow)row).getKey().token, ranges);
+ }
+ };
+ CollatingIterator iter =
FBUtilities.<IteratingRow>getCollatingIterator();
+ for (SSTableReader sstable : sstables)
+ {
+ SSTableScanner scanner = sstable.getScanner(FILE_BUFFER_SIZE);
+ iter.addIterator(new FilterIterator(scanner, rangesPredicate));
+ }
+ return iter;
+ }
+
+ public void close() throws IOException
+ {
+ for (Object o : ((CollatingIterator)source).getIterators())
+ {
+ ((SSTableScanner)((FilterIterator)o).getIterator()).close();
+ }
+ }
+ }
}
Modified:
incubator/cassandra/branches/cassandra-0.5/src/java/org/apache/cassandra/io/CompactionIterator.java
URL:
http://svn.apache.org/viewvc/incubator/cassandra/branches/cassandra-0.5/src/java/org/apache/cassandra/io/CompactionIterator.java?rev=893594&r1=893593&r2=893594&view=diff
==============================================================================
--- incubator/cassandra/branches/cassandra-0.5/src/java/org/apache/cassandra/io/CompactionIterator.java (original)
+++ incubator/cassandra/branches/cassandra-0.5/src/java/org/apache/cassandra/io/CompactionIterator.java Wed Dec 23 18:56:10 2009
@@ -26,12 +26,13 @@
import java.io.IOError;
import java.util.List;
import java.util.ArrayList;
-import java.util.Comparator;
+import java.util.Iterator;
import org.apache.log4j.Logger;
import org.apache.commons.collections.iterators.CollatingIterator;
import org.apache.cassandra.utils.ReducingIterator;
+import org.apache.cassandra.utils.FBUtilities;
import org.apache.cassandra.db.ColumnFamily;
import org.apache.cassandra.db.DecoratedKey;
import org.apache.cassandra.db.ColumnFamilyStore;
@@ -40,31 +41,29 @@
{
private static Logger logger = Logger.getLogger(CompactionIterator.class);
- private static final int FILE_BUFFER_SIZE = 1024 * 1024;
+ protected static final int FILE_BUFFER_SIZE = 1024 * 1024;
private final List<IteratingRow> rows = new ArrayList<IteratingRow>();
private final int gcBefore;
private boolean major;
- @SuppressWarnings("unchecked")
public CompactionIterator(Iterable<SSTableReader> sstables, int gcBefore,
boolean major) throws IOException
{
- super(getCollatingIterator(sstables));
+ this(getCollatingIterator(sstables), gcBefore, major);
+ }
+
+ @SuppressWarnings("unchecked")
+ protected CompactionIterator(Iterator iter, int gcBefore, boolean major)
+ {
+ super(iter);
this.gcBefore = gcBefore;
this.major = major;
}
@SuppressWarnings("unchecked")
- private static CollatingIterator
getCollatingIterator(Iterable<SSTableReader> sstables) throws IOException
+ protected static CollatingIterator
getCollatingIterator(Iterable<SSTableReader> sstables) throws IOException
{
- // CollatingIterator has a bug that causes NPE when you try to use default comparator. :(
- CollatingIterator iter = new CollatingIterator(new Comparator()
- {
- public int compare(Object o1, Object o2)
- {
- return ((Comparable)o1).compareTo(o2);
- }
- });
+ CollatingIterator iter =
FBUtilities.<IteratingRow>getCollatingIterator();
for (SSTableReader sstable : sstables)
{
iter.addIterator(sstable.getScanner(FILE_BUFFER_SIZE));
Modified:
incubator/cassandra/branches/cassandra-0.5/src/java/org/apache/cassandra/utils/FBUtilities.java
URL:
http://svn.apache.org/viewvc/incubator/cassandra/branches/cassandra-0.5/src/java/org/apache/cassandra/utils/FBUtilities.java?rev=893594&r1=893593&r2=893594&view=diff
==============================================================================
--- incubator/cassandra/branches/cassandra-0.5/src/java/org/apache/cassandra/utils/FBUtilities.java (original)
+++ incubator/cassandra/branches/cassandra-0.5/src/java/org/apache/cassandra/utils/FBUtilities.java Wed Dec 23 18:56:10 2009
@@ -30,6 +30,8 @@
import org.apache.log4j.Logger;
+import org.apache.commons.collections.iterators.CollatingIterator;
+
import org.apache.cassandra.config.DatabaseDescriptor;
public class FBUtilities
@@ -304,4 +306,16 @@
throw new IOException("rename failed of " + filename);
}
}
+
+ public static <T extends Comparable<T>> CollatingIterator
getCollatingIterator()
+ {
+ // CollatingIterator will happily NPE if you do not specify a comparator explicitly
+ return new CollatingIterator(new Comparator<T>()
+ {
+ public int compare(T o1, T o2)
+ {
+ return o1.compareTo(o2);
+ }
+ });
+ }
}