DomGarguilo commented on code in PR #267:
URL: https://github.com/apache/accumulo-testing/pull/267#discussion_r1427234075


##########
src/main/java/org/apache/accumulo/testing/continuous/ManySplits.java:
##########
@@ -0,0 +1,254 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   https://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+package org.apache.accumulo.testing.continuous;
+
+import static java.util.concurrent.TimeUnit.MILLISECONDS;
+import static java.util.concurrent.TimeUnit.NANOSECONDS;
+import static java.util.concurrent.TimeUnit.SECONDS;
+
+import java.util.Collection;
+import java.util.HashMap;
+import java.util.List;
+import java.util.Map;
+import java.util.Properties;
+import java.util.Random;
+import java.util.Set;
+import java.util.stream.Collectors;
+import java.util.stream.IntStream;
+
+import org.apache.accumulo.core.client.AccumuloClient;
+import org.apache.accumulo.core.client.AccumuloException;
+import org.apache.accumulo.core.client.AccumuloSecurityException;
+import org.apache.accumulo.core.client.NamespaceExistsException;
+import org.apache.accumulo.core.client.Scanner;
+import org.apache.accumulo.core.client.TableExistsException;
+import org.apache.accumulo.core.client.TableNotFoundException;
+import org.apache.accumulo.core.client.admin.CloneConfiguration;
+import org.apache.accumulo.core.client.admin.NewTableConfiguration;
+import org.apache.accumulo.core.conf.ConfigurationTypeHelper;
+import org.apache.accumulo.core.conf.Property;
+import org.apache.accumulo.core.data.TableId;
+import org.apache.accumulo.core.dataImpl.KeyExtent;
+import org.apache.accumulo.core.metadata.MetadataTable;
+import org.apache.accumulo.core.metadata.schema.DataFileValue;
+import org.apache.accumulo.core.metadata.schema.MetadataSchema;
+import org.apache.accumulo.testing.TestProps;
+import org.apache.hadoop.io.Text;
+import org.slf4j.Logger;
+import org.slf4j.LoggerFactory;
+
+import com.google.common.base.Preconditions;
+
+public class ManySplits {
+  private static final Logger log = LoggerFactory.getLogger(ManySplits.class);
+
+  private static final String NAMESPACE = "manysplits";
+
+  public static void main(String[] args) throws Exception {
+    try (ContinuousEnv env = new ContinuousEnv(args)) {
+
+      AccumuloClient client = env.getAccumuloClient();
+      Properties testProps = env.getTestProperties();
+      final int tableCount =
+          Integer.parseInt(testProps.getProperty(TestProps.CI_SPLIT_TABLE_COUNT));
+      final long rowMin = Long.parseLong(testProps.getProperty(TestProps.CI_SPLIT_INGEST_ROW_MIN));
+      final long rowMax = Long.parseLong(testProps.getProperty(TestProps.CI_SPLIT_INGEST_ROW_MAX));
+      final int maxColF = Integer.parseInt(testProps.getProperty(TestProps.CI_SPLIT_INGEST_MAX_CF));
+      final int maxColQ = Integer.parseInt(testProps.getProperty(TestProps.CI_SPLIT_INGEST_MAX_CQ));
+      final int initialSplits =
+          Integer.parseInt(testProps.getProperty(TestProps.CI_SPLIT_INITIAL_SPLITS));
+      final int initialData =
+          Integer.parseInt(testProps.getProperty(TestProps.CI_SPLIT_WRITE_SIZE));
+      String initialSplitThresholdStr = testProps.getProperty(TestProps.CI_SPLIT_THRESHOLD);
+      final long initialSplitThreshold =
+          ConfigurationTypeHelper.getFixedMemoryAsBytes(initialSplitThresholdStr);
+      final int splitThresholdReductionFactor =
+          Integer.parseInt(testProps.getProperty(TestProps.CI_SPLIT_THRESHOLD_REDUCTION_FACTOR));
+      final int testRounds =
+          Integer.parseInt(testProps.getProperty(TestProps.CI_SPLIT_TEST_ROUNDS));
+
+      // disable deletes for ingest
+      testProps.setProperty(TestProps.CI_INGEST_DELETE_PROBABILITY, "0.0");
+
+      final Random random = env.getRandom();
+
+      Preconditions.checkArgument(tableCount > 0, "Test cannot run without any tables");
+
+      final List<String> tableNames = IntStream.range(1, tableCount + 1)
+          .mapToObj(i -> NAMESPACE + ".table" + i).collect(Collectors.toList());
+
+      try {
+        client.namespaceOperations().create(NAMESPACE);
+      } catch (NamespaceExistsException e) {
+        log.info("The namespace '{}' already exists. Continuing with existing 
namespace.",
+            NAMESPACE);
+      }
+
+      final NewTableConfiguration ntc = new NewTableConfiguration();
+      ntc.setProperties(Map.of(Property.TABLE_SPLIT_THRESHOLD.getKey(), initialSplitThresholdStr));
+
+      log.info("Properties being used to create tables for this test: {}",
+          ntc.getProperties().toString());
+
+      final String firstTable = tableNames.get(0);
+
+      log.info("Creating initial table: {}", firstTable);
+      try {
+        client.tableOperations().create(firstTable, ntc);
+      } catch (TableExistsException e) {
+        log.info("Test probably wont work if the table already exists with 
data present", e);
+      }
+
+      log.info("Ingesting {} entries into first table, {}.", initialData, 
firstTable);
+      ContinuousIngest.doIngest(client, rowMin, rowMax, firstTable, testProps, maxColF, maxColQ,
+          initialData, false, random);
+
+      client.tableOperations().flush(firstTable);
+
+      // clone tables instead of ingesting into each; it's a lot quicker
+      log.info("Creating {} more tables by cloning the first", tableCount - 1);
+      tableNames.stream().parallel().skip(1).forEach(tableName -> {
+        try {
+          client.tableOperations().clone(firstTable, tableName,
+              CloneConfiguration.builder().build());
+        } catch (TableExistsException e) {
+          log.info(
+              "table {} already exists. Continuing with existing table. This 
might mess with the expected values",
+              tableName);
+        } catch (Exception e) {
+          throw new RuntimeException(e);
+        }
+      });
+
+      // main loop
+      // reduce the split threshold then wait for the expected file size per tablet to be reached
+      long previousSplitThreshold = initialSplitThreshold;
+      for (int i = 0; i < testRounds; i++) {
+
+        // apply the reduction factor to the previous threshold
+        final long splitThreshold = previousSplitThreshold / splitThresholdReductionFactor;
+        final String splitThresholdStr = bytesToMemoryString(splitThreshold);
+
+        log.info("Changing split threshold on all tables from {} to {}",
+            bytesToMemoryString(previousSplitThreshold), splitThresholdStr);
+
+        previousSplitThreshold = splitThreshold;
+
+        long beforeThresholdUpdate = System.nanoTime();
+
+        // update the split threshold on all tables
+        tableNames.stream().parallel().forEach(tableName -> {
+          try {
+            client.tableOperations().setProperty(tableName, Property.TABLE_SPLIT_THRESHOLD.getKey(),
+                splitThresholdStr);
+          } catch (Exception e) {
+            throw new RuntimeException(e);
+          }
+        });
+
+        log.info("Waiting for all tablets to have a sum file size <= {}", 
splitThreshold);
+
+        // wait for all tablets to reach the expected sum file size
+        tableNames.stream().parallel().forEach(tableName -> {
+          int elapsedMillis = 0;
+          long sleepMillis = SECONDS.toMillis(1);
+          try {
+            // wait for each tablet to reach the expected sum file size
+            while (true) {
+              Collection<Long> tabletFileSizes = getTabletFileSizes(client, 
tableName).values();
+              // filter out the tablets that are already the expected size
+              Set<Long> offendingTabletSizes =
+                  tabletFileSizes.stream().filter(tabletFileSize -> tabletFileSize > splitThreshold)
+                      .collect(Collectors.toSet());
+              // if all tablets are good, move on
+              if (offendingTabletSizes.isEmpty()) {
+                break;
+              }
+
+              elapsedMillis += sleepMillis;
+              // log every 3 seconds
+              if (elapsedMillis % SECONDS.toMillis(3) == 0) {
+                double averageFileSize =
+                    offendingTabletSizes.stream().mapToLong(l -> l).average().orElse(0);
+                log.info(
+                    "{} has {} tablets whose file sizes are not yet <= {}. 
Avg. offending file size: {}",
+                    tableName, offendingTabletSizes.size(), splitThreshold,
+                    String.format("%.0f", averageFileSize));
+              }
+              MILLISECONDS.sleep(sleepMillis);
+            }
+          } catch (Exception e) {
+            throw new RuntimeException(e);
+          }
+        });
+
+        long timeTaken = System.nanoTime() - beforeThresholdUpdate;
+
+        log.info(
+            "Time taken for all tables to reach expected total file size ({}): 
{} seconds ({}ms)",
+            splitThresholdStr, NANOSECONDS.toSeconds(timeTaken), 
NANOSECONDS.toMillis(timeTaken));
+      }
+
+      log.info("Deleting tables");
+      tableNames.stream().parallel().forEach(tableName -> {
+        try {
+          client.tableOperations().delete(tableName);
+        } catch (Exception e) {
+          throw new RuntimeException(e);
+        }
+      });
+      log.info("Deleting namespace");
+      client.namespaceOperations().delete(NAMESPACE);
+
+    }
+  }
+
+  /**
+   * @return a map of tablets to the sum of their file sizes
+   */
+  private static Map<Text,Long> getTabletFileSizes(AccumuloClient client, 
String tableName)
+      throws TableNotFoundException, AccumuloException, 
AccumuloSecurityException {
+    TableId tableId = TableId.of(client.tableOperations().tableIdMap().get(tableName));
+    try (Scanner scanner = client.createScanner(MetadataTable.NAME)) {

Review Comment:
   Also had an observation/question here. It seems like using a BatchScanner with a list of only the tablets whose file size sum is not yet what we want would be more efficient here. I was wondering if there is a way to supply an inverse set of ranges to use. For this case we know the tablets that have already reached that condition, so could we somehow construct a list of ranges around those tablets, as opposed to a list of ranges on those tablets?
   
   For this case I don't think it would be very practical, because we are not particularly worried about efficiency here, plus the set of tablets is expected to change frequently. But I was curious, so I thought I would ask.
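   
   To sketch what I mean (purely an illustration; `InverseRangeSketch` and `invertRanges` are hypothetical names, not anything in this PR or a ready-made Accumulo API): given the table's overall metadata range and the ranges of the tablets that have already reached the condition, `Range.mergeOverlapping` plus `Range.clip` could be used to build the gaps between them, and those gaps fed to a BatchScanner:
   
   ```java
   import java.util.ArrayList;
   import java.util.Collection;
   import java.util.List;
   
   import org.apache.accumulo.core.client.AccumuloClient;
   import org.apache.accumulo.core.client.BatchScanner;
   import org.apache.accumulo.core.data.Key;
   import org.apache.accumulo.core.data.Range;
   import org.apache.accumulo.core.metadata.MetadataTable;
   
   class InverseRangeSketch {
   
     // Hypothetical helper: given the table's full metadata range and the ranges
     // of tablets that have already reached the target size, return the gaps
     // between them. Boundary inclusivity is handled only roughly; a real version
     // would need more care around adjacent and unbounded ranges.
     static List<Range> invertRanges(Range tableRange, Collection<Range> satisfied) {
       // mergeOverlapping sorts the ranges and coalesces any that overlap
       List<Range> skip = Range.mergeOverlapping(new ArrayList<>(satisfied));
       List<Range> gaps = new ArrayList<>();
       Key cursor = tableRange.getStartKey(); // null means unbounded
       boolean cursorInclusive = tableRange.isStartKeyInclusive();
       for (Range r : skip) {
         Range overlap = tableRange.clip(r, true); // null when disjoint from tableRange
         if (overlap == null) {
           continue;
         }
         if (overlap.getStartKey() != null) { // gap before this skipped range, if any
           gaps.add(new Range(cursor, cursorInclusive, overlap.getStartKey(),
               !overlap.isStartKeyInclusive()));
         }
         cursor = overlap.getEndKey();
         cursorInclusive = !overlap.isEndKeyInclusive();
       }
       // final gap between the last skipped range and the end of the table's range
       gaps.add(new Range(cursor, cursorInclusive, tableRange.getEndKey(),
           tableRange.isEndKeyInclusive()));
       return gaps;
     }
   
     // Usage sketch: scan only the metadata rows of tablets still over the threshold
     static void scanRemaining(AccumuloClient client, Range tableRange,
         Collection<Range> satisfied) throws Exception {
       try (BatchScanner bs = client.createBatchScanner(MetadataTable.NAME)) {
         bs.setRanges(invertRanges(tableRange, satisfied));
         bs.forEach(entry -> {
           // inspect the remaining tablets' file entries here
         });
       }
     }
   }
   ```
   
   Again, hypothetical only: with the set of offending tablets changing every second, rebuilding and merging the ranges each pass would probably cost more than the plain metadata scan it replaces.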



-- 
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.

To unsubscribe, e-mail: [email protected]

For queries about this service, please contact Infrastructure at:
[email protected]
