[
https://issues.apache.org/jira/browse/SPARK-31928?page=com.atlassian.jira.plugin.system.issuetabpanels:all-tabpanel
]
Jungtaek Lim updated SPARK-31928:
---------------------------------
Description:
Test failed:
https://amplab.cs.berkeley.edu/jenkins/job/SparkPullRequestBuilder/123621/
{code:java}
[info] with spark.sql.streaming.noDataMicroBatches.enabled = false
[info] Assert on query failed: :
[info] Assert on query failed:
[info]
[info] == Progress ==
[info]
StartStream(ProcessingTimeTrigger(0),org.apache.spark.util.SystemClock@372edb19,Map(spark.sql.streaming.noDataMicroBatches.enabled
-> false),null)
[info] AddData to MemoryStream[value#437541]: 10,11,12,13,14,15
[info] CheckAnswer: [10],[11],[12],[13],[14],[15]
[info] AssertOnQuery(<condition>, Check total state rows = List(6),
updated state rows = List(6))
[info] AddData to MemoryStream[value#437541]: 25
[info] CheckNewAnswer: [25]
[info] AssertOnQuery(<condition>, Check total state rows = List(7),
updated state rows = List(1))
[info] => AssertOnQuery(<condition>, )
[info]
[info] == Stream ==
[info] Output Mode: Append
[info] Stream state: {MemoryStream[value#437541]: 1}
[info] Thread state: alive
[info] Thread stack trace: java.lang.Thread.sleep(Native Method)
[info]
org.apache.spark.sql.execution.streaming.MicroBatchExecution.$anonfun$runActivatedStream$1(MicroBatchExecution.scala:241)
[info]
org.apache.spark.sql.execution.streaming.MicroBatchExecution$$Lambda$1375/882607691.apply$mcZ$sp(Unknown
Source)
[info]
org.apache.spark.sql.execution.streaming.ProcessingTimeExecutor.execute(TriggerExecutor.scala:57)
[info]
org.apache.spark.sql.execution.streaming.MicroBatchExecution.runActivatedStream(MicroBatchExecution.scala:185)
[info]
org.apache.spark.sql.execution.streaming.StreamExecution.org$apache$spark$sql$execution$streaming$StreamExecution$$runStream(StreamExecution.scala:334)
[info]
org.apache.spark.sql.execution.streaming.StreamExecution$$anon$1.run(StreamExecution.scala:245)
[info]
[info]
[info] == Sink ==
[info] 0: [11] [14] [13] [10] [15] [12]
[info] 1: [25]
[info]
[info]
[info] == Plan ==
[info] == Parsed Logical Plan ==
[info] WriteToDataSourceV2
org.apache.spark.sql.execution.streaming.sources.MicroBatchWrite@158ccd13
[info] +- Project [cast(eventTime#437544-T10000ms as bigint) AS
eventTime#437548L]
[info] +- Deduplicate [value#437541, eventTime#437544-T10000ms]
[info] +- EventTimeWatermark eventTime#437544: timestamp, 10 seconds
[info] +- Project [value#437541, cast(value#437541 as timestamp) AS
eventTime#437544]
[info] +- StreamingDataSourceV2Relation [value#437541],
org.apache.spark.sql.execution.streaming.MemoryStreamScanBuilder@1802eea6,
MemoryStream[value#437541], 0, 1
[info]
[info] == Analyzed Logical Plan ==
[info]
[info] WriteToDataSourceV2
org.apache.spark.sql.execution.streaming.sources.MicroBatchWrite@158ccd13
[info] +- Project [cast(eventTime#437544-T10000ms as bigint) AS
eventTime#437548L]
[info] +- Deduplicate [value#437541, eventTime#437544-T10000ms]
[info] +- EventTimeWatermark eventTime#437544: timestamp, 10 seconds
[info] +- Project [value#437541, cast(value#437541 as timestamp) AS
eventTime#437544]
[info] +- StreamingDataSourceV2Relation [value#437541],
org.apache.spark.sql.execution.streaming.MemoryStreamScanBuilder@1802eea6,
MemoryStream[value#437541], 0, 1
[info]
[info] == Optimized Logical Plan ==
[info] WriteToDataSourceV2
org.apache.spark.sql.execution.streaming.sources.MicroBatchWrite@158ccd13
[info] +- Project [cast(eventTime#437544-T10000ms as bigint) AS
eventTime#437548L]
[info] +- Deduplicate [value#437541, eventTime#437544-T10000ms]
[info] +- EventTimeWatermark eventTime#437544: timestamp, 10 seconds
[info] +- Project [value#437541, cast(value#437541 as timestamp) AS
eventTime#437544]
[info] +- StreamingDataSourceV2Relation [value#437541],
org.apache.spark.sql.execution.streaming.MemoryStreamScanBuilder@1802eea6,
MemoryStream[value#437541], 0, 1
[info]
[info] == Physical Plan ==
[info] WriteToDataSourceV2
org.apache.spark.sql.execution.streaming.sources.MicroBatchWrite@158ccd13
[info] +- *(2) Project [cast(eventTime#437544-T10000ms as bigint) AS
eventTime#437548L]
[info] +- StreamingDeduplicate [value#437541, eventTime#437544-T10000ms],
state info [ checkpoint =
file:/home/jenkins/workspace/SparkPullRequestBuilder@2/target/tmp/streaming.metadata-e446f9e9-0afe-4b5e-b6a6-772d0debc7ee/state,
runId = 9ed21ac3-8994-4e13-8da1-db14a1f22da6, opId = 0, ver = 1, numPartitions
= 5], 5000
[info] +- Exchange hashpartitioning(value#437541,
eventTime#437544-T10000ms, 5), true, [id=#875392]
[info] +- EventTimeWatermark eventTime#437544: timestamp, 10 seconds
[info] +- *(1) Project [value#437541, cast(value#437541 as
timestamp) AS eventTime#437544]
[info] +- *(1) Project [value#437541]
[info] +- MicroBatchScan[value#437541]
MemoryStreamDataSource
[info]
[info]
[info]
[info]
org.scalatest.Assertions.newAssertionFailedException(Assertions.scala:530)
[info]
org.scalatest.Assertions.newAssertionFailedException$(Assertions.scala:529)
[info]
org.scalatest.FunSuite.newAssertionFailedException(FunSuite.scala:1560)
[info] org.scalatest.Assertions.fail(Assertions.scala:1091)
[info] org.scalatest.Assertions.fail$(Assertions.scala:1087)
[info] org.scalatest.FunSuite.fail(FunSuite.scala:1560)
[info]
org.apache.spark.sql.streaming.StreamTest.failTest$1(StreamTest.scala:452)
[info]
org.apache.spark.sql.streaming.StreamTest.verify$1(StreamTest.scala:423)
[info]
org.apache.spark.sql.streaming.StreamTest.executeAction$1(StreamTest.scala:651)
[info]
org.apache.spark.sql.streaming.StreamTest.$anonfun$testStream$56(StreamTest.scala:778)
[info]
[info]
[info] == Progress ==
[info]
StartStream(ProcessingTimeTrigger(0),org.apache.spark.util.SystemClock@372edb19,Map(spark.sql.streaming.noDataMicroBatches.enabled
-> false),null)
[info] AddData to MemoryStream[value#437541]: 10,11,12,13,14,15
[info] CheckAnswer: [10],[11],[12],[13],[14],[15]
[info] AssertOnQuery(<condition>, Check total state rows = List(6),
updated state rows = List(6))
[info] AddData to MemoryStream[value#437541]: 25
[info] CheckNewAnswer: [25]
[info] AssertOnQuery(<condition>, Check total state rows = List(7),
updated state rows = List(1))
[info] => AssertOnQuery(<condition>, )
[info]
[info] == Stream ==
[info] Output Mode: Append
[info] Stream state: {MemoryStream[value#437541]: 1}
[info] Thread state: alive
[info] Thread stack trace: java.lang.Thread.sleep(Native Method)
[info]
org.apache.spark.sql.execution.streaming.MicroBatchExecution.$anonfun$runActivatedStream$1(MicroBatchExecution.scala:241)
[info]
org.apache.spark.sql.execution.streaming.MicroBatchExecution$$Lambda$1375/882607691.apply$mcZ$sp(Unknown
Source)
[info]
org.apache.spark.sql.execution.streaming.ProcessingTimeExecutor.execute(TriggerExecutor.scala:57)
[info]
org.apache.spark.sql.execution.streaming.MicroBatchExecution.runActivatedStream(MicroBatchExecution.scala:185)
[info]
org.apache.spark.sql.execution.streaming.StreamExecution.org$apache$spark$sql$execution$streaming$StreamExecution$$runStream(StreamExecution.scala:334)
[info]
org.apache.spark.sql.execution.streaming.StreamExecution$$anon$1.run(StreamExecution.scala:245)
[info]
[info]
[info] == Sink ==
[info] 0: [11] [14] [13] [10] [15] [12]
[info] 1: [25]
[info]
[info]
[info] == Plan ==
[info] == Parsed Logical Plan ==
[info] WriteToDataSourceV2
org.apache.spark.sql.execution.streaming.sources.MicroBatchWrite@158ccd13
[info] +- Project [cast(eventTime#437544-T10000ms as bigint) AS
eventTime#437548L]
[info] +- Deduplicate [value#437541, eventTime#437544-T10000ms]
[info] +- EventTimeWatermark eventTime#437544: timestamp, 10 seconds
[info] +- Project [value#437541, cast(value#437541 as timestamp) AS
eventTime#437544]
[info] +- StreamingDataSourceV2Relation [value#437541],
org.apache.spark.sql.execution.streaming.MemoryStreamScanBuilder@1802eea6,
MemoryStream[value#437541], 0, 1
[info]
[info] == Analyzed Logical Plan ==
[info]
[info] WriteToDataSourceV2
org.apache.spark.sql.execution.streaming.sources.MicroBatchWrite@158ccd13
[info] +- Project [cast(eventTime#437544-T10000ms as bigint) AS
eventTime#437548L]
[info] +- Deduplicate [value#437541, eventTime#437544-T10000ms]
[info] +- EventTimeWatermark eventTime#437544: timestamp, 10 seconds
[info] +- Project [value#437541, cast(value#437541 as timestamp) AS
eventTime#437544]
[info] +- StreamingDataSourceV2Relation [value#437541],
org.apache.spark.sql.execution.streaming.MemoryStreamScanBuilder@1802eea6,
MemoryStream[value#437541], 0, 1
[info]
[info] == Optimized Logical Plan ==
[info] WriteToDataSourceV2
org.apache.spark.sql.execution.streaming.sources.MicroBatchWrite@158ccd13
[info] +- Project [cast(eventTime#437544-T10000ms as bigint) AS
eventTime#437548L]
[info] +- Deduplicate [value#437541, eventTime#437544-T10000ms]
[info] +- EventTimeWatermark eventTime#437544: timestamp, 10 seconds
[info] +- Project [value#437541, cast(value#437541 as timestamp) AS
eventTime#437544]
[info] +- StreamingDataSourceV2Relation [value#437541],
org.apache.spark.sql.execution.streaming.MemoryStreamScanBuilder@1802eea6,
MemoryStream[value#437541], 0, 1
[info]
[info] == Physical Plan ==
[info] WriteToDataSourceV2
org.apache.spark.sql.execution.streaming.sources.MicroBatchWrite@158ccd13
[info] +- *(2) Project [cast(eventTime#437544-T10000ms as bigint) AS
eventTime#437548L]
[info] +- StreamingDeduplicate [value#437541, eventTime#437544-T10000ms],
state info [ checkpoint =
file:/home/jenkins/workspace/SparkPullRequestBuilder@2/target/tmp/streaming.metadata-e446f9e9-0afe-4b5e-b6a6-772d0debc7ee/state,
runId = 9ed21ac3-8994-4e13-8da1-db14a1f22da6, opId = 0, ver = 1, numPartitions
= 5], 5000
[info] +- Exchange hashpartitioning(value#437541,
eventTime#437544-T10000ms, 5), true, [id=#875392]
[info] +- EventTimeWatermark eventTime#437544: timestamp, 10 seconds
[info] +- *(1) Project [value#437541, cast(value#437541 as
timestamp) AS eventTime#437544]
[info] +- *(1) Project [value#437541]
[info] +- MicroBatchScan[value#437541]
MemoryStreamDataSource (StreamTest.scala:452)
[info] org.scalatest.exceptions.TestFailedException:
[info] at
org.scalatest.Assertions.newAssertionFailedException(Assertions.scala:530)
[info] at
org.scalatest.Assertions.newAssertionFailedException$(Assertions.scala:529)
[info] at
org.scalatest.FunSuite.newAssertionFailedException(FunSuite.scala:1560)
[info] at org.scalatest.Assertions.fail(Assertions.scala:1091)
[info] at org.scalatest.Assertions.fail$(Assertions.scala:1087)
[info] at org.scalatest.FunSuite.fail(FunSuite.scala:1560)
[info] at
org.apache.spark.sql.streaming.StreamTest.failTest$1(StreamTest.scala:452)
[info] at
org.apache.spark.sql.streaming.StreamTest.executeAction$1(StreamTest.scala:654)
[info] at
org.apache.spark.sql.streaming.StreamTest.$anonfun$testStream$56(StreamTest.scala:778)
[info] at
org.apache.spark.sql.streaming.StreamTest.$anonfun$testStream$56$adapted(StreamTest.scala:765)
[info] at
scala.collection.IndexedSeqOptimized.foreach(IndexedSeqOptimized.scala:36)
[info] at
scala.collection.IndexedSeqOptimized.foreach$(IndexedSeqOptimized.scala:33)
[info] at scala.collection.mutable.WrappedArray.foreach(WrappedArray.scala:38)
[info] at
org.apache.spark.sql.streaming.StreamTest.liftedTree1$1(StreamTest.scala:765)
[info] at
org.apache.spark.sql.streaming.StreamTest.testStream(StreamTest.scala:764)
[info] at
org.apache.spark.sql.streaming.StreamTest.testStream$(StreamTest.scala:334)
[info] at
org.apache.spark.sql.streaming.StreamingDeduplicationSuite.testStream(StreamingDeduplicationSuite.scala:29)
[info] at
org.apache.spark.sql.streaming.StreamingDeduplicationSuite.$anonfun$new$19(StreamingDeduplicationSuite.scala:284)
[info] at
scala.runtime.java8.JFunction0$mcV$sp.apply(JFunction0$mcV$sp.java:23)
[info] at org.scalatest.Assertions.withClue(Assertions.scala:1223)
[info] at org.scalatest.Assertions.withClue$(Assertions.scala:1210)
[info] at org.scalatest.FunSuite.withClue(FunSuite.scala:1560)
[info] at
org.apache.spark.sql.streaming.StreamingDeduplicationSuite.testWithFlag$1(StreamingDeduplicationSuite.scala:264)
[info] at
org.apache.spark.sql.streaming.StreamingDeduplicationSuite.$anonfun$new$18(StreamingDeduplicationSuite.scala:289)
[info] at
scala.runtime.java8.JFunction0$mcV$sp.apply(JFunction0$mcV$sp.java:23)
[info] at org.scalatest.OutcomeOf.outcomeOf(OutcomeOf.scala:85)
[info] at org.scalatest.OutcomeOf.outcomeOf$(OutcomeOf.scala:83)
[info] at org.scalatest.OutcomeOf$.outcomeOf(OutcomeOf.scala:104)
[info] at org.scalatest.Transformer.apply(Transformer.scala:22)
[info] at org.scalatest.Transformer.apply(Transformer.scala:20)
[info] at org.scalatest.FunSuiteLike$$anon$1.apply(FunSuiteLike.scala:186)
[info] at org.apache.spark.SparkFunSuite.withFixture(SparkFunSuite.scala:157)
[info] at
org.scalatest.FunSuiteLike.invokeWithFixture$1(FunSuiteLike.scala:184)
[info] at
org.scalatest.FunSuiteLike.$anonfun$runTest$1(FunSuiteLike.scala:196)
[info] at org.scalatest.SuperEngine.runTestImpl(Engine.scala:286)
[info] at org.scalatest.FunSuiteLike.runTest(FunSuiteLike.scala:196)
[info] at org.scalatest.FunSuiteLike.runTest$(FunSuiteLike.scala:178)
[info] at
org.apache.spark.SparkFunSuite.org$scalatest$BeforeAndAfterEach$$super$runTest(SparkFunSuite.scala:59)
[info] at
org.scalatest.BeforeAndAfterEach.runTest(BeforeAndAfterEach.scala:221)
[info] at
org.scalatest.BeforeAndAfterEach.runTest$(BeforeAndAfterEach.scala:214)
[info] at org.apache.spark.SparkFunSuite.runTest(SparkFunSuite.scala:59)
[info] at
org.scalatest.FunSuiteLike.$anonfun$runTests$1(FunSuiteLike.scala:229)
[info] at
org.scalatest.SuperEngine.$anonfun$runTestsInBranch$1(Engine.scala:393)
[info] at scala.collection.immutable.List.foreach(List.scala:392)
[info] at org.scalatest.SuperEngine.traverseSubNodes$1(Engine.scala:381)
[info] at org.scalatest.SuperEngine.runTestsInBranch(Engine.scala:376)
[info] at org.scalatest.SuperEngine.runTestsImpl(Engine.scala:458)
[info] at org.scalatest.FunSuiteLike.runTests(FunSuiteLike.scala:229)
[info] at org.scalatest.FunSuiteLike.runTests$(FunSuiteLike.scala:228)
[info] at org.scalatest.FunSuite.runTests(FunSuite.scala:1560)
[info] at org.scalatest.Suite.run(Suite.scala:1124)
[info] at org.scalatest.Suite.run$(Suite.scala:1106)
[info] at
org.scalatest.FunSuite.org$scalatest$FunSuiteLike$$super$run(FunSuite.scala:1560)
[info] at org.scalatest.FunSuiteLike.$anonfun$run$1(FunSuiteLike.scala:233)
[info] at org.scalatest.SuperEngine.runImpl(Engine.scala:518)
[info] at org.scalatest.FunSuiteLike.run(FunSuiteLike.scala:233)
[info] at org.scalatest.FunSuiteLike.run$(FunSuiteLike.scala:232)
[info] at
org.apache.spark.SparkFunSuite.org$scalatest$BeforeAndAfterAll$$super$run(SparkFunSuite.scala:59)
[info] at
org.scalatest.BeforeAndAfterAll.liftedTree1$1(BeforeAndAfterAll.scala:213)
[info] at org.scalatest.BeforeAndAfterAll.run(BeforeAndAfterAll.scala:210)
[info] at org.scalatest.BeforeAndAfterAll.run$(BeforeAndAfterAll.scala:208)
[info] at org.apache.spark.SparkFunSuite.run(SparkFunSuite.scala:59)
[info] at
org.scalatest.tools.Framework.org$scalatest$tools$Framework$$runSuite(Framework.scala:317)
[info] at
org.scalatest.tools.Framework$ScalaTestTask.execute(Framework.scala:510)
[info] at sbt.ForkMain$Run$2.call(ForkMain.java:296)
[info] at sbt.ForkMain$Run$2.call(ForkMain.java:286)
[info] at java.util.concurrent.FutureTask.run(FutureTask.java:266)
[info] at
java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149)
[info] at
java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624)
[info] at java.lang.Thread.run(Thread.java:748)
04:06:09.061 WARN org.apache.spark.sql.streaming.StreamingDeduplicationSuite:
===== POSSIBLE THREAD LEAK IN SUITE
o.a.s.sql.streaming.StreamingDeduplicationSuite, thread names:
state-store-maintenance-task, shuffle-boss-1682-1, rpc-boss-1679-1 =====
{code}
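The failing step is the one marked with "=>" above: the bare AssertOnQuery that runs right after "Check total state rows = List(7), updated state rows = List(1)". Below is a minimal sketch of the scenario implied by the progress log and query plans (a reconstruction, not the suite's exact source; it assumes it runs inside a StreamTest-based suite, and assertNumStateRows stands in for the logged state-row checks):

{code:scala}
// Reconstructed sketch of the logged scenario; helper names (testStream,
// AddData, assertNumStateRows, ...) are assumed to come from StreamTest /
// StateStoreMetricsTest and may not match the suite's exact code.
import org.apache.spark.sql.execution.streaming.MemoryStream
import org.apache.spark.sql.streaming.OutputMode

import testImplicits._

val inputData = MemoryStream[Int]
val dedup = inputData.toDS()
  .withColumn("eventTime", $"value".cast("timestamp"))
  .withWatermark("eventTime", "10 seconds")
  .dropDuplicates()                                  // Deduplicate [value, eventTime]
  .select($"eventTime".cast("long").as[Long])

testStream(dedup, OutputMode.Append)(
  StartStream(additionalConfs =
    Map("spark.sql.streaming.noDataMicroBatches.enabled" -> "false")),
  AddData(inputData, 10, 11, 12, 13, 14, 15),
  CheckAnswer(10, 11, 12, 13, 14, 15),
  assertNumStateRows(total = 6, updated = 6),
  AddData(inputData, 25),                            // advances watermark past 10..15
  CheckNewAnswer(25),
  assertNumStateRows(total = 7, updated = 1),
  // The step that fails: expired duplicate state is only evicted when a
  // further micro-batch runs; with noDataMicroBatches.enabled = false that
  // batch may never be triggered, so a post-eviction state check can race.
  AssertOnQuery(q => q.lastProgress.stateOperators(0).numRowsTotal == 1)
)
{code}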
> Flaky test: StreamingDeduplicationSuite.test no-data flag
> ---------------------------------------------------------
>
> Key: SPARK-31928
> URL: https://issues.apache.org/jira/browse/SPARK-31928
> Project: Spark
> Issue Type: Bug
> Components: Structured Streaming, Tests
> Affects Versions: 3.1.0
> Reporter: Gabor Somogyi
> Priority: Major
>
> Test failed:
> https://amplab.cs.berkeley.edu/jenkins/job/SparkPullRequestBuilder/123621/