This is an automated email from the ASF dual-hosted git repository. dwysakowicz pushed a commit to branch master in repository https://gitbox.apache.org/repos/asf/flink.git
commit fe3d9a42995cfee0dfd90e8031768cb130543189 Author: bvarghese1 <bvargh...@confluent.io> AuthorDate: Tue Jan 16 17:54:46 2024 -0800 [FLINK-34118] Implement restore tests for Sort node --- .../plan/nodes/exec/stream/SortRestoreTest.java | 38 +++++ .../plan/nodes/exec/stream/SortTestPrograms.java | 48 +++++- .../plan/nodes/exec/testutils/RestoreTestBase.java | 9 +- .../stream-exec-sort_1/sort-asc/plan/sort-asc.json | 164 +++++++++++++++++++++ .../sort-desc/plan/sort-desc.json | 164 +++++++++++++++++++++ 5 files changed, 421 insertions(+), 2 deletions(-) diff --git a/flink-table/flink-table-planner/src/test/java/org/apache/flink/table/planner/plan/nodes/exec/stream/SortRestoreTest.java b/flink-table/flink-table-planner/src/test/java/org/apache/flink/table/planner/plan/nodes/exec/stream/SortRestoreTest.java new file mode 100644 index 00000000000..18e9792f9ed --- /dev/null +++ b/flink-table/flink-table-planner/src/test/java/org/apache/flink/table/planner/plan/nodes/exec/stream/SortRestoreTest.java @@ -0,0 +1,38 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.flink.table.planner.plan.nodes.exec.stream; + +import org.apache.flink.table.planner.plan.nodes.exec.testutils.RestoreTestBase; +import org.apache.flink.table.test.program.TableTestProgram; + +import java.util.Arrays; +import java.util.List; + +/** Restore tests for {@link StreamExecSort}. */ +public class SortRestoreTest extends RestoreTestBase { + + public SortRestoreTest() { + super(StreamExecSort.class, AfterRestoreSource.NO_RESTORE); + } + + @Override + public List<TableTestProgram> programs() { + return Arrays.asList(SortTestPrograms.SORT_ASC, SortTestPrograms.SORT_DESC); + } +} diff --git a/flink-table/flink-table-planner/src/test/java/org/apache/flink/table/planner/plan/nodes/exec/stream/SortTestPrograms.java b/flink-table/flink-table-planner/src/test/java/org/apache/flink/table/planner/plan/nodes/exec/stream/SortTestPrograms.java index 0a6f68d4e76..2959e2e6a0e 100644 --- a/flink-table/flink-table-planner/src/test/java/org/apache/flink/table/planner/plan/nodes/exec/stream/SortTestPrograms.java +++ b/flink-table/flink-table-planner/src/test/java/org/apache/flink/table/planner/plan/nodes/exec/stream/SortTestPrograms.java @@ -18,6 +18,7 @@ package org.apache.flink.table.planner.plan.nodes.exec.stream; +import org.apache.flink.table.planner.utils.InternalConfigOptions; import org.apache.flink.table.test.program.SinkTestStep; import org.apache.flink.table.test.program.SourceTestStep; import org.apache.flink.table.test.program.TableTestProgram; @@ -25,7 +26,8 @@ import org.apache.flink.types.Row; /** * {@link TableTestProgram} definitions for testing {@link - * org.apache.flink.table.planner.plan.nodes.exec.stream.StreamExecSortLimit}. + * org.apache.flink.table.planner.plan.nodes.exec.stream.StreamExecSortLimit} and {@link + * org.apache.flink.table.planner.plan.nodes.exec.stream.StreamExecSort}. */ public class SortTestPrograms { @@ -123,4 +125,48 @@ public class SortTestPrograms { .build()) .runSql("INSERT INTO sink_t SELECT * from source_t ORDER BY a DESC LIMIT 3") .build(); + + static final TableTestProgram SORT_ASC = + TableTestProgram.of("sort-asc", "validates sort node by sorting integers in asc mode") + .setupConfig(InternalConfigOptions.TABLE_EXEC_NON_TEMPORAL_SORT_ENABLED, true) + .setupTableSource( + SourceTestStep.newBuilder("source_t") + .addSchema("a INT", "b VARCHAR", "c INT") + .producedValues(DATA) + .build()) + .setupTableSink( + SinkTestStep.newBuilder("sink_t") + .addSchema("a INT", "b VARCHAR", "c BIGINT") + .consumedValues( + "+I[1, a, 5]", + "+I[2, a, 6]", + "+I[3, b, 7]", + "+I[4, b, 8]", + "+I[5, c, 9]", + "+I[6, c, 10]") + .build()) + .runSql("INSERT INTO sink_t SELECT * from source_t ORDER BY a") + .build(); + + static final TableTestProgram SORT_DESC = + TableTestProgram.of("sort-desc", "validates sort node by sorting integers in desc mode") + .setupConfig(InternalConfigOptions.TABLE_EXEC_NON_TEMPORAL_SORT_ENABLED, true) + .setupTableSource( + SourceTestStep.newBuilder("source_t") + .addSchema("a INT", "b VARCHAR", "c INT") + .producedValues(DATA) + .build()) + .setupTableSink( + SinkTestStep.newBuilder("sink_t") + .addSchema("a INT", "b VARCHAR", "c BIGINT") + .consumedValues( + "+I[6, c, 10]", + "+I[5, c, 9]", + "+I[4, b, 8]", + "+I[3, b, 7]", + "+I[2, a, 6]", + "+I[1, a, 5]") + .build()) + .runSql("INSERT INTO sink_t SELECT * from source_t ORDER BY a DESC") + .build(); } diff --git a/flink-table/flink-table-planner/src/test/java/org/apache/flink/table/planner/plan/nodes/exec/testutils/RestoreTestBase.java b/flink-table/flink-table-planner/src/test/java/org/apache/flink/table/planner/plan/nodes/exec/testutils/RestoreTestBase.java index 5b766a62ac9..702d03370f5 100644 --- a/flink-table/flink-table-planner/src/test/java/org/apache/flink/table/planner/plan/nodes/exec/testutils/RestoreTestBase.java +++ b/flink-table/flink-table-planner/src/test/java/org/apache/flink/table/planner/plan/nodes/exec/testutils/RestoreTestBase.java @@ -43,6 +43,7 @@ import org.apache.flink.table.test.program.TableTestProgram; import org.apache.flink.table.test.program.TableTestProgramRunner; import org.apache.flink.table.test.program.TestStep.TestKind; import org.apache.flink.test.junit5.MiniClusterExtension; +import org.apache.flink.types.Row; import org.apache.commons.collections.CollectionUtils; import org.junit.jupiter.api.AfterEach; @@ -63,6 +64,7 @@ import java.nio.file.Path; import java.nio.file.Paths; import java.nio.file.StandardCopyOption; import java.util.ArrayList; +import java.util.Collection; import java.util.Collections; import java.util.EnumSet; import java.util.HashMap; @@ -118,6 +120,7 @@ public abstract class RestoreTestBase implements TableTestProgramRunner { TestKind.FUNCTION, TestKind.TEMPORAL_FUNCTION, TestKind.SOURCE_WITH_RESTORE_DATA, + TestKind.SOURCE_WITH_DATA, TestKind.SINK_WITH_RESTORE_DATA, TestKind.SINK_WITH_DATA); } @@ -264,7 +267,11 @@ public abstract class RestoreTestBase implements TableTestProgramRunner { program.getSetupConfigOptionTestSteps().forEach(s -> s.apply(tEnv)); for (SourceTestStep sourceTestStep : program.getSetupSourceTestSteps()) { - final String id = TestValuesTableFactory.registerData(sourceTestStep.dataAfterRestore); + final Collection<Row> data = + afterRestoreSource == AfterRestoreSource.NO_RESTORE + ? sourceTestStep.dataBeforeRestore + : sourceTestStep.dataAfterRestore; + final String id = TestValuesTableFactory.registerData(data); final Map<String, String> options = new HashMap<>(); options.put("connector", "values"); options.put("data-id", id); diff --git a/flink-table/flink-table-planner/src/test/resources/restore-tests/stream-exec-sort_1/sort-asc/plan/sort-asc.json b/flink-table/flink-table-planner/src/test/resources/restore-tests/stream-exec-sort_1/sort-asc/plan/sort-asc.json new file mode 100644 index 00000000000..333017882b4 --- /dev/null +++ b/flink-table/flink-table-planner/src/test/resources/restore-tests/stream-exec-sort_1/sort-asc/plan/sort-asc.json @@ -0,0 +1,164 @@ +{ + "flinkVersion" : "1.19", + "nodes" : [ { + "id" : 1, + "type" : "stream-exec-table-source-scan_1", + "scanTableSource" : { + "table" : { + "identifier" : "`default_catalog`.`default_database`.`source_t`", + "resolvedTable" : { + "schema" : { + "columns" : [ { + "name" : "a", + "dataType" : "INT" + }, { + "name" : "b", + "dataType" : "VARCHAR(2147483647)" + }, { + "name" : "c", + "dataType" : "INT" + } ], + "watermarkSpecs" : [ ] + }, + "partitionKeys" : [ ] + } + } + }, + "outputType" : "ROW<`a` INT, `b` VARCHAR(2147483647), `c` INT>", + "description" : "TableSourceScan(table=[[default_catalog, default_database, source_t]], fields=[a, b, c])", + "inputProperties" : [ ] + }, { + "id" : 2, + "type" : "stream-exec-exchange_1", + "inputProperties" : [ { + "requiredDistribution" : { + "type" : "SINGLETON" + }, + "damBehavior" : "PIPELINED", + "priority" : 0 + } ], + "outputType" : "ROW<`a` INT, `b` VARCHAR(2147483647), `c` INT>", + "description" : "Exchange(distribution=[single])" + }, { + "id" : 3, + "type" : "stream-exec-sort_1", + "orderBy" : { + "fields" : [ { + "index" : 0, + "isAscending" : true, + "nullIsLast" : false + } ] + }, + "inputProperties" : [ { + "requiredDistribution" : { + "type" : "UNKNOWN" + }, + "damBehavior" : "PIPELINED", + "priority" : 0 + } ], + "outputType" : "ROW<`a` INT, `b` VARCHAR(2147483647), `c` INT>", + "description" : "Sort(orderBy=[a ASC])" + }, { + "id" : 4, + "type" : "stream-exec-calc_1", + "projection" : [ { + "kind" : "INPUT_REF", + "inputIndex" : 0, + "type" : "INT" + }, { + "kind" : "INPUT_REF", + "inputIndex" : 1, + "type" : "VARCHAR(2147483647)" + }, { + "kind" : "CALL", + "syntax" : "SPECIAL", + "internalName" : "$CAST$1", + "operands" : [ { + "kind" : "INPUT_REF", + "inputIndex" : 2, + "type" : "INT" + } ], + "type" : "BIGINT" + } ], + "condition" : null, + "inputProperties" : [ { + "requiredDistribution" : { + "type" : "UNKNOWN" + }, + "damBehavior" : "PIPELINED", + "priority" : 0 + } ], + "outputType" : "ROW<`a` INT, `b` VARCHAR(2147483647), `c` BIGINT>", + "description" : "Calc(select=[a, b, CAST(c AS BIGINT) AS c])" + }, { + "id" : 5, + "type" : "stream-exec-sink_1", + "configuration" : { + "table.exec.sink.keyed-shuffle" : "AUTO", + "table.exec.sink.not-null-enforcer" : "ERROR", + "table.exec.sink.rowtime-inserter" : "ENABLED", + "table.exec.sink.type-length-enforcer" : "IGNORE", + "table.exec.sink.upsert-materialize" : "AUTO" + }, + "dynamicTableSink" : { + "table" : { + "identifier" : "`default_catalog`.`default_database`.`sink_t`", + "resolvedTable" : { + "schema" : { + "columns" : [ { + "name" : "a", + "dataType" : "INT" + }, { + "name" : "b", + "dataType" : "VARCHAR(2147483647)" + }, { + "name" : "c", + "dataType" : "BIGINT" + } ], + "watermarkSpecs" : [ ] + }, + "partitionKeys" : [ ] + } + } + }, + "inputChangelogMode" : [ "INSERT" ], + "inputProperties" : [ { + "requiredDistribution" : { + "type" : "UNKNOWN" + }, + "damBehavior" : "PIPELINED", + "priority" : 0 + } ], + "outputType" : "ROW<`a` INT, `b` VARCHAR(2147483647), `c` BIGINT>", + "description" : "Sink(table=[default_catalog.default_database.sink_t], fields=[a, b, c])" + } ], + "edges" : [ { + "source" : 1, + "target" : 2, + "shuffle" : { + "type" : "FORWARD" + }, + "shuffleMode" : "PIPELINED" + }, { + "source" : 2, + "target" : 3, + "shuffle" : { + "type" : "FORWARD" + }, + "shuffleMode" : "PIPELINED" + }, { + "source" : 3, + "target" : 4, + "shuffle" : { + "type" : "FORWARD" + }, + "shuffleMode" : "PIPELINED" + }, { + "source" : 4, + "target" : 5, + "shuffle" : { + "type" : "FORWARD" + }, + "shuffleMode" : "PIPELINED" + } ] +} \ No newline at end of file diff --git a/flink-table/flink-table-planner/src/test/resources/restore-tests/stream-exec-sort_1/sort-desc/plan/sort-desc.json b/flink-table/flink-table-planner/src/test/resources/restore-tests/stream-exec-sort_1/sort-desc/plan/sort-desc.json new file mode 100644 index 00000000000..6be002da6a6 --- /dev/null +++ b/flink-table/flink-table-planner/src/test/resources/restore-tests/stream-exec-sort_1/sort-desc/plan/sort-desc.json @@ -0,0 +1,164 @@ +{ + "flinkVersion" : "1.19", + "nodes" : [ { + "id" : 1, + "type" : "stream-exec-table-source-scan_1", + "scanTableSource" : { + "table" : { + "identifier" : "`default_catalog`.`default_database`.`source_t`", + "resolvedTable" : { + "schema" : { + "columns" : [ { + "name" : "a", + "dataType" : "INT" + }, { + "name" : "b", + "dataType" : "VARCHAR(2147483647)" + }, { + "name" : "c", + "dataType" : "INT" + } ], + "watermarkSpecs" : [ ] + }, + "partitionKeys" : [ ] + } + } + }, + "outputType" : "ROW<`a` INT, `b` VARCHAR(2147483647), `c` INT>", + "description" : "TableSourceScan(table=[[default_catalog, default_database, source_t]], fields=[a, b, c])", + "inputProperties" : [ ] + }, { + "id" : 2, + "type" : "stream-exec-exchange_1", + "inputProperties" : [ { + "requiredDistribution" : { + "type" : "SINGLETON" + }, + "damBehavior" : "PIPELINED", + "priority" : 0 + } ], + "outputType" : "ROW<`a` INT, `b` VARCHAR(2147483647), `c` INT>", + "description" : "Exchange(distribution=[single])" + }, { + "id" : 3, + "type" : "stream-exec-sort_1", + "orderBy" : { + "fields" : [ { + "index" : 0, + "isAscending" : false, + "nullIsLast" : true + } ] + }, + "inputProperties" : [ { + "requiredDistribution" : { + "type" : "UNKNOWN" + }, + "damBehavior" : "PIPELINED", + "priority" : 0 + } ], + "outputType" : "ROW<`a` INT, `b` VARCHAR(2147483647), `c` INT>", + "description" : "Sort(orderBy=[a DESC])" + }, { + "id" : 4, + "type" : "stream-exec-calc_1", + "projection" : [ { + "kind" : "INPUT_REF", + "inputIndex" : 0, + "type" : "INT" + }, { + "kind" : "INPUT_REF", + "inputIndex" : 1, + "type" : "VARCHAR(2147483647)" + }, { + "kind" : "CALL", + "syntax" : "SPECIAL", + "internalName" : "$CAST$1", + "operands" : [ { + "kind" : "INPUT_REF", + "inputIndex" : 2, + "type" : "INT" + } ], + "type" : "BIGINT" + } ], + "condition" : null, + "inputProperties" : [ { + "requiredDistribution" : { + "type" : "UNKNOWN" + }, + "damBehavior" : "PIPELINED", + "priority" : 0 + } ], + "outputType" : "ROW<`a` INT, `b` VARCHAR(2147483647), `c` BIGINT>", + "description" : "Calc(select=[a, b, CAST(c AS BIGINT) AS c])" + }, { + "id" : 5, + "type" : "stream-exec-sink_1", + "configuration" : { + "table.exec.sink.keyed-shuffle" : "AUTO", + "table.exec.sink.not-null-enforcer" : "ERROR", + "table.exec.sink.rowtime-inserter" : "ENABLED", + "table.exec.sink.type-length-enforcer" : "IGNORE", + "table.exec.sink.upsert-materialize" : "AUTO" + }, + "dynamicTableSink" : { + "table" : { + "identifier" : "`default_catalog`.`default_database`.`sink_t`", + "resolvedTable" : { + "schema" : { + "columns" : [ { + "name" : "a", + "dataType" : "INT" + }, { + "name" : "b", + "dataType" : "VARCHAR(2147483647)" + }, { + "name" : "c", + "dataType" : "BIGINT" + } ], + "watermarkSpecs" : [ ] + }, + "partitionKeys" : [ ] + } + } + }, + "inputChangelogMode" : [ "INSERT" ], + "inputProperties" : [ { + "requiredDistribution" : { + "type" : "UNKNOWN" + }, + "damBehavior" : "PIPELINED", + "priority" : 0 + } ], + "outputType" : "ROW<`a` INT, `b` VARCHAR(2147483647), `c` BIGINT>", + "description" : "Sink(table=[default_catalog.default_database.sink_t], fields=[a, b, c])" + } ], + "edges" : [ { + "source" : 1, + "target" : 2, + "shuffle" : { + "type" : "FORWARD" + }, + "shuffleMode" : "PIPELINED" + }, { + "source" : 2, + "target" : 3, + "shuffle" : { + "type" : "FORWARD" + }, + "shuffleMode" : "PIPELINED" + }, { + "source" : 3, + "target" : 4, + "shuffle" : { + "type" : "FORWARD" + }, + "shuffleMode" : "PIPELINED" + }, { + "source" : 4, + "target" : 5, + "shuffle" : { + "type" : "FORWARD" + }, + "shuffleMode" : "PIPELINED" + } ] +} \ No newline at end of file