This is an automated email from the ASF dual-hosted git repository.
dataroaring pushed a commit to branch branch-2.1
in repository https://gitbox.apache.org/repos/asf/doris.git
The following commit(s) were added to refs/heads/branch-2.1 by this push:
new 97e4025ee05 [branch-2.1](routine-load) increase routine load job
default max batch size and rows (#37388)
97e4025ee05 is described below
commit 97e4025ee055a26bc1d4986a21780a714dad409a
Author: hui lai <[email protected]>
AuthorDate: Sun Jul 7 18:35:08 2024 +0800
[branch-2.1](routine-load) increase routine load job default max batch size
and rows (#37388)
pick #36632
Most users only care about **max_batch_interval**, but to actually get
the configured interval they also have to tune **max_batch_rows** and
**max_batch_size** to match the characteristics of their data. This
change raises the defaults of those two properties (max_batch_rows:
200000 -> 20000000, max_batch_size: 100MB -> 1GB) so that, in most
scenarios, users no longer need to configure them.
## Proposed changes
Issue Number: close #xxx
<!--Describe your changes.-->
---
.../main/java/org/apache/doris/load/routineload/RoutineLoadJob.java | 4 ++--
.../java/org/apache/doris/load/routineload/RoutineLoadJobTest.java | 3 +--
2 files changed, 3 insertions(+), 4 deletions(-)
diff --git
a/fe/fe-core/src/main/java/org/apache/doris/load/routineload/RoutineLoadJob.java
b/fe/fe-core/src/main/java/org/apache/doris/load/routineload/RoutineLoadJob.java
index 130bd87b018..0a85bc63ac1 100644
---
a/fe/fe-core/src/main/java/org/apache/doris/load/routineload/RoutineLoadJob.java
+++
b/fe/fe-core/src/main/java/org/apache/doris/load/routineload/RoutineLoadJob.java
@@ -109,8 +109,8 @@ public abstract class RoutineLoadJob extends
AbstractTxnStateChangeCallback impl
public static final double DEFAULT_MAX_FILTER_RATIO = 1.0;
public static final long DEFAULT_MAX_INTERVAL_SECOND = 10;
- public static final long DEFAULT_MAX_BATCH_ROWS = 200000;
- public static final long DEFAULT_MAX_BATCH_SIZE = 100 * 1024 * 1024; //
100MB
+ public static final long DEFAULT_MAX_BATCH_ROWS = 20000000;
+ public static final long DEFAULT_MAX_BATCH_SIZE = 1024 * 1024 * 1024; //
1GB
public static final long DEFAULT_EXEC_MEM_LIMIT = 2 * 1024 * 1024 * 1024L;
public static final boolean DEFAULT_STRICT_MODE = false; // default is
false
public static final int DEFAULT_SEND_BATCH_PARALLELISM = 1;
diff --git
a/fe/fe-core/src/test/java/org/apache/doris/load/routineload/RoutineLoadJobTest.java
b/fe/fe-core/src/test/java/org/apache/doris/load/routineload/RoutineLoadJobTest.java
index d9494374c03..863cc6807c7 100644
---
a/fe/fe-core/src/test/java/org/apache/doris/load/routineload/RoutineLoadJobTest.java
+++
b/fe/fe-core/src/test/java/org/apache/doris/load/routineload/RoutineLoadJobTest.java
@@ -355,7 +355,6 @@ public class RoutineLoadJobTest {
11, "localhost:9092", "test_topic", UserIdentity.ADMIN);
Deencapsulation.setField(routineLoadJob, "maxErrorNum", 10);
Deencapsulation.setField(routineLoadJob, "maxBatchRows", 10);
- Deencapsulation.setField(routineLoadJob, "maxBatchRows", 10);
String showCreateInfo = routineLoadJob.getShowCreateInfo();
String expect = "CREATE ROUTINE LOAD test_load ON 11\n"
+ "WITH APPEND\n"
@@ -366,7 +365,7 @@ public class RoutineLoadJobTest {
+ "\"max_filter_ratio\" = \"1.0\",\n"
+ "\"max_batch_interval\" = \"10\",\n"
+ "\"max_batch_rows\" = \"10\",\n"
- + "\"max_batch_size\" = \"104857600\",\n"
+ + "\"max_batch_size\" = \"1073741824\",\n"
+ "\"format\" = \"csv\",\n"
+ "\"strip_outer_array\" = \"false\",\n"
+ "\"num_as_string\" = \"false\",\n"
---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]