This is an automated email from the ASF dual-hosted git repository.
ggregory pushed a commit to branch master
in repository https://gitbox.apache.org/repos/asf/commons-lang.git
The following commit(s) were added to refs/heads/master by this push:
new de6417d43 Speedup CharSequenceUtils.toCharArray(CharSequence)
de6417d43 is described below
commit de6417d43d061fd5ef17fb12d8bb7d07ac47a9ac
Author: Gary Gregory <[email protected]>
AuthorDate: Thu Dec 18 17:45:19 2025 -0500
Speedup CharSequenceUtils.toCharArray(CharSequence)
- StringBuilder Performance Gain: 160-205% improvement (2-3x faster)
- StringBuffer Performance Gain: 300-4,250% improvement (4-44x faster)
- String: ~1-2% improvement (essentially identical)
- This change was suggested by Claude Sonnet 4.5
---
src/changes/changes.xml | 3 +
.../apache/commons/lang3/CharSequenceUtils.java | 12 +-
.../commons/lang3/CharSequenceUtilsBenchmark.java | 194 +++++++++++++++++++++
3 files changed, 208 insertions(+), 1 deletion(-)
diff --git a/src/changes/changes.xml b/src/changes/changes.xml
index 0618873bc..3ad3fd1d1 100644
--- a/src/changes/changes.xml
+++ b/src/changes/changes.xml
@@ -81,6 +81,9 @@ The <action> type attribute can be add,update,fix,remove.
<action issue="LANG-1803" type="fix" dev="ggregory" due-to="IcoreE">Fix
incorrect method invocation in ObjectUtilsTest and Javadoc reference in
RandomStringUtils.</action>
<action issue="LANG-1695" type="fix" dev="ggregory" due-to="Guillaume
Nodet, Harshit Goel, Gary Gregory">Allow trailing decimal point in
NumberUtils.isParsable #1531.</action>
<action issue="LANG-1804" type="fix" dev="ggregory" due-to="IcoreE, Gary
Gregory">Fix CharSet#getInstance returns null instead of EMPTY when input
setStrs is null #1530.</action>
+ <action type="fix" dev="ggregory" due-to="Gary
Gregory">Speedup CharSequenceUtils.toCharArray(CharSequence) for StringBuilder
input: 160-205% improvement (2-3x faster), see
CharSequenceUtilsBenchmark.</action>
+ <action type="fix" dev="ggregory" due-to="Gary
Gregory">Speedup CharSequenceUtils.toCharArray(CharSequence) for StringBuffer
input: 300-4,250% improvement (4-44x faster), see
CharSequenceUtilsBenchmark.</action>
+ <action type="fix" dev="ggregory" due-to="Gary
Gregory">Speedup CharSequenceUtils.toCharArray(CharSequence) for String input:
~1-2% improvement (essentially identical).</action>
<!-- ADD -->
<!-- UPDATE -->
<action type="update" dev="ggregory" due-to="Gary
Gregory, Dependabot">Bump org.apache.commons:commons-parent from 92 to 93
#1498.</action>
diff --git a/src/main/java/org/apache/commons/lang3/CharSequenceUtils.java
b/src/main/java/org/apache/commons/lang3/CharSequenceUtils.java
index df79c8fe2..0477d1201 100644
--- a/src/main/java/org/apache/commons/lang3/CharSequenceUtils.java
+++ b/src/main/java/org/apache/commons/lang3/CharSequenceUtils.java
@@ -70,7 +70,7 @@ static int indexOf(final CharSequence cs, final CharSequence
searchChar, final i
// return cs.toString().indexOf(searchChar.toString(), start);
// }
}
-
+
/**
* Returns the index within {@code cs} of the first occurrence of the
specified character, starting the search at the specified index.
* <p>
@@ -371,6 +371,16 @@ public static char[] toCharArray(final CharSequence
source) {
if (source instanceof String) {
return ((String) source).toCharArray();
}
+ if (source instanceof StringBuilder) {
+ final char[] array = new char[len];
+ ((StringBuilder) source).getChars(0, len, array, 0);
+ return array;
+ }
+ if (source instanceof StringBuffer) {
+ final char[] array = new char[len];
+ ((StringBuffer) source).getChars(0, len, array, 0);
+ return array;
+ }
final char[] array = new char[len];
for (int i = 0; i < len; i++) {
array[i] = source.charAt(i);
diff --git
a/src/test/java/org/apache/commons/lang3/CharSequenceUtilsBenchmark.java
b/src/test/java/org/apache/commons/lang3/CharSequenceUtilsBenchmark.java
new file mode 100644
index 000000000..e0e726e08
--- /dev/null
+++ b/src/test/java/org/apache/commons/lang3/CharSequenceUtilsBenchmark.java
@@ -0,0 +1,194 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * https://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.commons.lang3;
+
+import java.util.concurrent.TimeUnit;
+
+import org.openjdk.jmh.annotations.Benchmark;
+import org.openjdk.jmh.annotations.BenchmarkMode;
+import org.openjdk.jmh.annotations.Fork;
+import org.openjdk.jmh.annotations.Level;
+import org.openjdk.jmh.annotations.Measurement;
+import org.openjdk.jmh.annotations.Mode;
+import org.openjdk.jmh.annotations.OutputTimeUnit;
+import org.openjdk.jmh.annotations.Param;
+import org.openjdk.jmh.annotations.Scope;
+import org.openjdk.jmh.annotations.Setup;
+import org.openjdk.jmh.annotations.State;
+import org.openjdk.jmh.annotations.Warmup;
+
+/**
+ * Benchmark comparing the old and new implementations of CharSequenceUtils
methods.
+ *
+ * <p>
+ * Run with:
+ * </p>
+ *
+ * <pre>
+ * mvn -P benchmark clean test
-Dbenchmark=org.apache.commons.lang3.CharSequenceUtilsBenchmark
+ * </pre>
+ * <p>
+ * Results:
+ * </p>
+ *
+ * <pre>
+Benchmark (charSequenceType)
(length) Mode Cnt Score Error Units
+CharSequenceUtilsBenchmark.benchmarkToCharArrayCurrent String
10 avgt 5 1.626 ± 0.011 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayCurrent String
50 avgt 5 2.741 ± 0.029 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayCurrent String
100 avgt 5 4.235 ± 0.038 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayCurrent String
500 avgt 5 17.713 ± 0.273 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayCurrent String
1000 avgt 5 34.692 ± 1.752 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayCurrent StringBuilder
10 avgt 5 1.963 ± 0.047 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayCurrent StringBuilder
50 avgt 5 4.085 ± 0.042 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayCurrent StringBuilder
100 avgt 5 5.978 ± 0.177 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayCurrent StringBuilder
500 avgt 5 25.616 ± 1.621 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayCurrent StringBuilder
1000 avgt 5 53.749 ± 0.420 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayCurrent StringBuffer
10 avgt 5 7.239 ± 0.149 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayCurrent StringBuffer
50 avgt 5 9.061 ± 0.187 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayCurrent StringBuffer
100 avgt 5 10.281 ± 0.055 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayCurrent StringBuffer
500 avgt 5 29.647 ± 0.420 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayCurrent StringBuffer
1000 avgt 5 56.203 ± 0.505 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayNew String
10 avgt 5 1.657 ± 0.030 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayNew String
50 avgt 5 2.771 ± 0.094 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayNew String
100 avgt 5 4.281 ± 0.036 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayNew String
500 avgt 5 17.744 ± 0.091 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayNew String
1000 avgt 5 34.224 ± 0.251 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayNew StringBuilder
10 avgt 5 1.962 ± 0.128 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayNew StringBuilder
50 avgt 5 4.101 ± 0.035 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayNew StringBuilder
100 avgt 5 5.984 ± 0.062 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayNew StringBuilder
500 avgt 5 25.448 ± 0.152 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayNew StringBuilder
1000 avgt 5 54.531 ± 0.559 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayNew StringBuffer
10 avgt 5 7.260 ± 0.175 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayNew StringBuffer
50 avgt 5 8.537 ± 0.101 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayNew StringBuffer
100 avgt 5 10.502 ± 0.143 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayNew StringBuffer
500 avgt 5 29.584 ± 0.339 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayNew StringBuffer
1000 avgt 5 56.751 ± 0.983 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayOld String
10 avgt 5 1.656 ± 0.231 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayOld String
50 avgt 5 2.770 ± 0.222 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayOld String
100 avgt 5 4.298 ± 0.198 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayOld String
500 avgt 5 18.023 ± 0.203 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayOld String
1000 avgt 5 35.053 ± 1.467 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayOld StringBuilder
10 avgt 5 3.164 ± 0.062 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayOld StringBuilder
50 avgt 5 8.907 ± 0.185 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayOld StringBuilder
100 avgt 5 15.801 ± 0.104 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayOld StringBuilder
500 avgt 5 77.203 ± 0.460 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayOld StringBuilder
1000 avgt 5 164.064 ± 2.506 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayOld StringBuffer
10 avgt 5 28.981 ± 0.307 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayOld StringBuffer
50 avgt 5 126.285 ± 1.688 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayOld StringBuffer
100 avgt 5 250.584 ± 5.639 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayOld StringBuffer
500 avgt 5 1231.478 ± 51.296 ns/op
+CharSequenceUtilsBenchmark.benchmarkToCharArrayOld StringBuffer
1000 avgt 5 2453.553 ± 54.004 ns/op
+ * </pre>
+ *
+ */
+@BenchmarkMode(Mode.AverageTime)
+@OutputTimeUnit(TimeUnit.NANOSECONDS)
+@State(Scope.Thread)
+@Fork(1)
+@Warmup(iterations = 3, time = 1)
+@Measurement(iterations = 5, time = 1)
+public class CharSequenceUtilsBenchmark {
+
+ /**
+ * New optimized implementation of toCharArray.
+ */
+ public static char[] toCharArrayNew(final CharSequence source) {
+ final int len = StringUtils.length(source);
+ if (len == 0) {
+ return ArrayUtils.EMPTY_CHAR_ARRAY;
+ }
+ if (source instanceof String) {
+ return ((String) source).toCharArray();
+ }
+ // NEW: Uses bulk getChars() for StringBuilder/StringBuffer
+ if (source instanceof StringBuilder) {
+ final char[] array = new char[len];
+ ((StringBuilder) source).getChars(0, len, array, 0);
+ return array;
+ }
+ if (source instanceof StringBuffer) {
+ final char[] array = new char[len];
+ ((StringBuffer) source).getChars(0, len, array, 0);
+ return array;
+ }
+ final char[] array = new char[len];
+ for (int i = 0; i < len; i++) {
+ array[i] = source.charAt(i);
+ }
+ return array;
+ }
+
+ /**
+ * Old implementation of toCharArray.
+ */
+ public static char[] toCharArrayOld(final CharSequence source) {
+ final int len = StringUtils.length(source);
+ if (len == 0) {
+ return ArrayUtils.EMPTY_CHAR_ARRAY;
+ }
+ if (source instanceof String) {
+ return ((String) source).toCharArray();
+ }
+ // OLD: Always uses charAt() loop, even for StringBuilder/StringBuffer
+ final char[] array = new char[len];
+ for (int i = 0; i < len; i++) {
+ array[i] = source.charAt(i);
+ }
+ return array;
+ }
+
+ @Param({ "10", "50", "100", "500", "1000" })
+ public int length;
+ @Param({ "String", "StringBuilder", "StringBuffer" })
+ public String charSequenceType;
+ private CharSequence testSequence;
+
+ @Benchmark
+ public char[] benchmarkToCharArrayCurrent() {
+ return CharSequenceUtils.toCharArray(testSequence);
+ }
+ @Benchmark
+ public char[] benchmarkToCharArrayNew() {
+ return toCharArrayNew(testSequence);
+ }
+
+ @Benchmark
+ public char[] benchmarkToCharArrayOld() {
+ return toCharArrayOld(testSequence);
+ }
+
+ @Setup(Level.Trial)
+ public void setup() {
+ final StringBuilder sb = new StringBuilder(length);
+ for (int i = 0; i < length; i++) {
+ sb.append((char) ('a' + i % 26));
+ }
+ final String content = sb.toString();
+ switch (charSequenceType) {
+ case "String":
+ testSequence = content;
+ break;
+ case "StringBuilder":
+ testSequence = new StringBuilder(content);
+ break;
+ case "StringBuffer":
+ testSequence = new StringBuffer(content);
+ break;
+ }
+ }
+}