wankunde commented on a change in pull request #34234:
URL: https://github.com/apache/spark/pull/34234#discussion_r739661970
##########
File path: core/src/main/scala/org/apache/spark/internal/config/package.scala
##########
@@ -1178,6 +1178,27 @@ package object config {
.bytesConf(ByteUnit.BYTE)
.createWithDefault(100 * 1024 * 1024)
+ private[spark] val SHUFFLE_ACCURATE_BLOCK_SKEWED_FACTOR =
+ ConfigBuilder("spark.shuffle.accurateBlockSkewedFactor")
+ .doc("A shuffle block is considered as skewed and will be accurately
recorded in " +
+ "HighlyCompressedMapStatus if its size is larger than this factor
multiplying " +
+ "the median shuffle block size or SHUFFLE_ACCURATE_BLOCK_THRESHOLD. It
is " +
+ "recommended to set this parameter to be the same as
SKEW_JOIN_SKEWED_PARTITION_FACTOR. " +
+ "Set to -1.0 to disable this feature by default.")
+ .version("3.3.0")
+ .doubleConf
+ .createWithDefault(-1.0)
+
+ private[spark] val SHUFFLE_MAX_ACCURATE_SKEWED_BLOCK_NUMBER =
+ ConfigBuilder("spark.shuffle.maxAccurateSkewedBlockNumber")
+ .doc("Max skewed shuffle blocks allowed to be accurately recorded in " +
+ "HighlyCompressedMapStatus if its size is larger than this factor
multiplying " +
Review comment:
Updated
--
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.
To unsubscribe, e-mail: [email protected]
For queries about this service, please contact Infrastructure at:
[email protected]
---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]