Skip to content

Commit 7449e1c

Browse files
GlavoRoger Riggs
authored and
Roger Riggs
committedMar 3, 2023
8299807: newStringNoRepl should avoid copying arrays for ASCII compatible charsets
Reviewed-by: rriggs
1 parent c6de66c commit 7449e1c

File tree

2 files changed

+16
-5
lines changed

2 files changed

+16
-5
lines changed
 

‎src/java.base/share/classes/java/lang/String.java

+15-4
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
/*
2-
* Copyright (c) 1994, 2022, Oracle and/or its affiliates. All rights reserved.
2+
* Copyright (c) 1994, 2023, Oracle and/or its affiliates. All rights reserved.
33
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
44
*
55
* This code is free software; you can redistribute it and/or modify it
@@ -698,8 +698,13 @@ private String(Charset charset, byte[] bytes, int offset, int length) {
698698

699699
/*
700700
* Throws iae, instead of replacing, if malformed or unmappable.
701+
*
702+
* @param noShare
703+
* {@code true} if the resulting string MUST NOT share the byte array,
704+
* {@code false} if the byte array can be exclusively used to construct
705+
* the string and is not modified or used for any other purpose.
701706
*/
702-
static String newStringUTF8NoRepl(byte[] bytes, int offset, int length) {
707+
static String newStringUTF8NoRepl(byte[] bytes, int offset, int length, boolean noShare) {
703708
checkBoundsOffCount(offset, length, bytes.length);
704709
if (length == 0) {
705710
return "";
@@ -710,7 +715,11 @@ static String newStringUTF8NoRepl(byte[] bytes, int offset, int length) {
710715
dp = StringCoding.countPositives(bytes, offset, length);
711716
int sl = offset + length;
712717
if (dp == length) {
713-
return new String(Arrays.copyOfRange(bytes, offset, offset + length), LATIN1);
718+
if (noShare || length != bytes.length) {
719+
return new String(Arrays.copyOfRange(bytes, offset, offset + length), LATIN1);
720+
} else {
721+
return new String(bytes, LATIN1);
722+
}
714723
}
715724
dst = new byte[length];
716725
System.arraycopy(bytes, offset, dst, 0, dp);
@@ -778,7 +787,7 @@ private static String newStringNoRepl1(byte[] src, Charset cs) {
778787
return "";
779788
}
780789
if (cs == UTF_8.INSTANCE) {
781-
return newStringUTF8NoRepl(src, 0, src.length);
790+
return newStringUTF8NoRepl(src, 0, src.length, false);
782791
}
783792
if (cs == ISO_8859_1.INSTANCE) {
784793
if (COMPACT_STRINGS)
@@ -800,6 +809,8 @@ private static String newStringNoRepl1(byte[] src, Charset cs) {
800809
if (cd instanceof ArrayDecoder ad &&
801810
ad.isASCIICompatible() &&
802811
!StringCoding.hasNegatives(src, 0, src.length)) {
812+
if (COMPACT_STRINGS)
813+
return new String(src, LATIN1);
803814
return new String(src, 0, src.length, ISO_8859_1.INSTANCE);
804815
}
805816
int en = scale(len, cd.maxCharsPerByte());

‎src/java.base/share/classes/java/lang/System.java

+1-1
Original file line numberDiff line numberDiff line change
@@ -2478,7 +2478,7 @@ public byte[] getBytesNoRepl(String s, Charset cs) throws CharacterCodingExcepti
24782478
}
24792479

24802480
public String newStringUTF8NoRepl(byte[] bytes, int off, int len) {
2481-
return String.newStringUTF8NoRepl(bytes, off, len);
2481+
return String.newStringUTF8NoRepl(bytes, off, len, true);
24822482
}
24832483

24842484
public byte[] getBytesUTF8NoRepl(String s) {

0 commit comments

Comments
 (0)
Please sign in to comment.