blob: 68a1c06c60765f6c78f3f93695aabfb6e420b13c [file] [log] [blame]
/*
 * Copyright (C) 2011 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
16
Brian Carlstromfc0e3212013-07-17 14:40:12 -070017#ifndef ART_RUNTIME_MIRROR_STRING_H_
18#define ART_RUNTIME_MIRROR_STRING_H_
Ian Rogers2dd0e2c2013-01-24 12:42:14 -080019
Vladimir Marko5924a4a2018-05-29 17:40:41 +010020#include "base/bit_utils.h"
Vladimir Marko6834d342018-05-25 13:12:09 +010021#include "class.h"
Ian Rogerse63db272014-07-15 15:36:11 -070022#include "object.h"
Andreas Gampe5a0430d2019-01-04 14:33:57 -080023#include "runtime_globals.h"
Ian Rogers2dd0e2c2013-01-24 12:42:14 -080024
25namespace art {
26
// Opaque declaration of the allocator selector; it is only named as a parameter type by the
// String allocation entry points declared in this header.
namespace gc {
enum AllocatorType : char;
}  // namespace gc

// Forward declarations of types that this header only names in declarations.
template <typename T> class Handle;
template <typename MirrorType> class ObjPtr;
class StringBuilderAppend;  // Befriended by mirror::String.
struct StringOffsets;       // Befriended by mirror::String.
// NOTE(review): not referenced in the visible part of this header - confirm it is still needed.
class StubTest_ReadBarrierForRoot_Test;
Ian Rogers2dd0e2c2013-01-24 12:42:14 -080036
37namespace mirror {
38
// String compression.
//
// Compile-time switch for string compression. When it is false, the helpers in mirror::String
// treat `count_` as a plain length and report every string as uncompressed.
static constexpr bool kUseStringCompression = true;

// Value of the flag bit that mirror::String packs into the least significant bit of `count_`.
// The numeric values matter: they are OR-ed into / masked out of the count directly.
enum class StringCompressionFlag : uint32_t {
  kCompressed   = 0u,
  kUncompressed = 1u,
};
jessicahandojo3aaa37b2016-07-29 14:46:37 -070045
Ian Rogers2dd0e2c2013-01-24 12:42:14 -080046// C++ mirror of java.lang.String
Roland Levillainbbc6e7e2018-08-24 16:58:47 +010047class MANAGED String final : public Object {
Ian Rogers2dd0e2c2013-01-24 12:42:14 -080048 public:
Mingyao Yang98d1cc82014-05-15 17:02:16 -070049 // Size of java.lang.String.class.
Andreas Gampe542451c2016-07-26 09:02:02 -070050 static uint32_t ClassSize(PointerSize pointer_size);
Mingyao Yang98d1cc82014-05-15 17:02:16 -070051
52 // Size of an instance of java.lang.String not including its value array.
53 static constexpr uint32_t InstanceSize() {
54 return sizeof(String);
55 }
56
David Srbecky56de89a2018-10-01 15:32:20 +010057 static constexpr MemberOffset CountOffset() {
Ian Rogers2dd0e2c2013-01-24 12:42:14 -080058 return OFFSET_OF_OBJECT_MEMBER(String, count_);
59 }
60
David Srbecky56de89a2018-10-01 15:32:20 +010061 static constexpr MemberOffset ValueOffset() {
Jeff Hao848f70a2014-01-15 13:49:50 -080062 return OFFSET_OF_OBJECT_MEMBER(String, value_);
Ian Rogers2dd0e2c2013-01-24 12:42:14 -080063 }
64
Andreas Gampebdf7f1c2016-08-30 16:38:47 -070065 uint16_t* GetValue() REQUIRES_SHARED(Locks::mutator_lock_) {
Jeff Hao848f70a2014-01-15 13:49:50 -080066 return &value_[0];
Ian Rogers2dd0e2c2013-01-24 12:42:14 -080067 }
68
Andreas Gampebdf7f1c2016-08-30 16:38:47 -070069 uint8_t* GetValueCompressed() REQUIRES_SHARED(Locks::mutator_lock_) {
jessicahandojo3aaa37b2016-07-29 14:46:37 -070070 return &value_compressed_[0];
71 }
72
Jeff Hao848f70a2014-01-15 13:49:50 -080073 template<VerifyObjectFlags kVerifyFlags = kDefaultVerifyFlags>
Vladimir Marko5924a4a2018-05-29 17:40:41 +010074 size_t SizeOf() REQUIRES_SHARED(Locks::mutator_lock_) {
75 size_t size = sizeof(String);
76 if (IsCompressed()) {
77 size += (sizeof(uint8_t) * GetLength<kVerifyFlags>());
78 } else {
79 size += (sizeof(uint16_t) * GetLength<kVerifyFlags>());
80 }
81 // String.equals() intrinsics assume zero-padding up to kObjectAlignment,
82 // so make sure the zero-padding is actually copied around if GC compaction
83 // chooses to copy only SizeOf() bytes.
84 // http://b/23528461
85 return RoundUp(size, kObjectAlignment);
86 }
Ian Rogers2dd0e2c2013-01-24 12:42:14 -080087
jessicahandojo3aaa37b2016-07-29 14:46:37 -070088 // Taking out the first/uppermost bit because it is not part of actual length value
Jeff Hao848f70a2014-01-15 13:49:50 -080089 template<VerifyObjectFlags kVerifyFlags = kDefaultVerifyFlags>
Andreas Gampebdf7f1c2016-08-30 16:38:47 -070090 int32_t GetLength() REQUIRES_SHARED(Locks::mutator_lock_) {
jessicahandojo3aaa37b2016-07-29 14:46:37 -070091 return GetLengthFromCount(GetCount<kVerifyFlags>());
92 }
93
94 template<VerifyObjectFlags kVerifyFlags = kDefaultVerifyFlags>
Andreas Gampebdf7f1c2016-08-30 16:38:47 -070095 int32_t GetCount() REQUIRES_SHARED(Locks::mutator_lock_) {
Jeff Hao848f70a2014-01-15 13:49:50 -080096 return GetField32<kVerifyFlags>(OFFSET_OF_OBJECT_MEMBER(String, count_));
Ian Rogers2dd0e2c2013-01-24 12:42:14 -080097 }
98
Andreas Gampebdf7f1c2016-08-30 16:38:47 -070099 void SetCount(int32_t new_count) REQUIRES_SHARED(Locks::mutator_lock_) {
Jeff Hao848f70a2014-01-15 13:49:50 -0800100 // Count is invariant so use non-transactional mode. Also disable check as we may run inside
101 // a transaction.
Jeff Hao848f70a2014-01-15 13:49:50 -0800102 SetField32<false, false>(OFFSET_OF_OBJECT_MEMBER(String, count_), new_count);
103 }
Ian Rogers2dd0e2c2013-01-24 12:42:14 -0800104
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700105 int32_t GetHashCode() REQUIRES_SHARED(Locks::mutator_lock_);
Ian Rogers2dd0e2c2013-01-24 12:42:14 -0800106
Mathieu Chartiercdfd39f2014-08-29 18:16:58 -0700107 // Computes, stores, and returns the hash code.
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700108 int32_t ComputeHashCode() REQUIRES_SHARED(Locks::mutator_lock_);
Ian Rogers2dd0e2c2013-01-24 12:42:14 -0800109
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700110 int32_t GetUtfLength() REQUIRES_SHARED(Locks::mutator_lock_);
Ian Rogers2dd0e2c2013-01-24 12:42:14 -0800111
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700112 uint16_t CharAt(int32_t index) REQUIRES_SHARED(Locks::mutator_lock_);
Jeff Hao848f70a2014-01-15 13:49:50 -0800113
Vladimir Marko92907f32017-02-20 14:08:30 +0000114 // Create a new string where all occurences of `old_c` are replaced with `new_c`.
115 // String.doReplace(char, char) is called from String.replace(char, char) when there is a match.
Vladimir Marko9e57aba2017-03-16 10:45:40 +0000116 static ObjPtr<String> DoReplace(Thread* self, Handle<String> src, uint16_t old_c, uint16_t new_c)
Vladimir Marko92907f32017-02-20 14:08:30 +0000117 REQUIRES_SHARED(Locks::mutator_lock_);
Jeff Hao848f70a2014-01-15 13:49:50 -0800118
Mathieu Chartier9e868092016-10-31 14:58:04 -0700119 ObjPtr<String> Intern() REQUIRES_SHARED(Locks::mutator_lock_);
Ian Rogers2dd0e2c2013-01-24 12:42:14 -0800120
Vladimir Marko9b81ac32019-05-16 16:47:08 +0100121 template <bool kIsInstrumented = true>
Vladimir Marko179b7c62019-03-22 13:38:57 +0000122 ALWAYS_INLINE static ObjPtr<String> AllocFromByteArray(Thread* self,
123 int32_t byte_length,
124 Handle<ByteArray> array,
125 int32_t offset,
126 int32_t high_byte,
127 gc::AllocatorType allocator_type)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700128 REQUIRES_SHARED(Locks::mutator_lock_) REQUIRES(!Roles::uninterruptible_);
Jeff Hao848f70a2014-01-15 13:49:50 -0800129
Vladimir Marko9b81ac32019-05-16 16:47:08 +0100130 template <bool kIsInstrumented = true>
Vladimir Marko179b7c62019-03-22 13:38:57 +0000131 ALWAYS_INLINE static ObjPtr<String> AllocFromCharArray(Thread* self,
132 int32_t count,
133 Handle<CharArray> array,
134 int32_t offset,
135 gc::AllocatorType allocator_type)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700136 REQUIRES_SHARED(Locks::mutator_lock_) REQUIRES(!Roles::uninterruptible_);
Jeff Hao848f70a2014-01-15 13:49:50 -0800137
Vladimir Marko9b81ac32019-05-16 16:47:08 +0100138 template <bool kIsInstrumented = true>
Vladimir Marko179b7c62019-03-22 13:38:57 +0000139 ALWAYS_INLINE static ObjPtr<String> AllocFromString(Thread* self,
140 int32_t string_length,
141 Handle<String> string,
142 int32_t offset,
143 gc::AllocatorType allocator_type)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700144 REQUIRES_SHARED(Locks::mutator_lock_) REQUIRES(!Roles::uninterruptible_);
Jeff Hao848f70a2014-01-15 13:49:50 -0800145
Vladimir Marko9b81ac32019-05-16 16:47:08 +0100146 template <bool kIsInstrumented = true>
Vladimir Marko179b7c62019-03-22 13:38:57 +0000147 ALWAYS_INLINE static ObjPtr<String> AllocEmptyString(Thread* self,
148 gc::AllocatorType allocator_type)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700149 REQUIRES_SHARED(Locks::mutator_lock_) REQUIRES(!Roles::uninterruptible_);
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700150
Vladimir Marko036b0702020-10-27 10:36:06 +0000151 static ObjPtr<String> DoConcat(Thread* self, Handle<String> h_this, Handle<String> h_arg)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700152 REQUIRES_SHARED(Locks::mutator_lock_) REQUIRES(!Roles::uninterruptible_);
Jeff Hao848f70a2014-01-15 13:49:50 -0800153
Vladimir Marko179b7c62019-03-22 13:38:57 +0000154 static ObjPtr<String> AllocFromUtf16(Thread* self,
155 int32_t utf16_length,
156 const uint16_t* utf16_data_in)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700157 REQUIRES_SHARED(Locks::mutator_lock_) REQUIRES(!Roles::uninterruptible_);
Ian Rogers2dd0e2c2013-01-24 12:42:14 -0800158
Vladimir Marko179b7c62019-03-22 13:38:57 +0000159 static ObjPtr<String> AllocFromModifiedUtf8(Thread* self, const char* utf)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700160 REQUIRES_SHARED(Locks::mutator_lock_) REQUIRES(!Roles::uninterruptible_);
Ian Rogers2dd0e2c2013-01-24 12:42:14 -0800161
Vladimir Marko179b7c62019-03-22 13:38:57 +0000162 static ObjPtr<String> AllocFromModifiedUtf8(Thread* self,
163 int32_t utf16_length,
164 const char* utf8_data_in,
165 int32_t utf8_length)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700166 REQUIRES_SHARED(Locks::mutator_lock_) REQUIRES(!Roles::uninterruptible_);
Bruce Hoult1646d7a2015-10-28 15:06:12 +0300167
Vladimir Marko179b7c62019-03-22 13:38:57 +0000168 static ObjPtr<String> AllocFromModifiedUtf8(Thread* self,
169 int32_t utf16_length,
170 const char* utf8_data_in)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700171 REQUIRES_SHARED(Locks::mutator_lock_) REQUIRES(!Roles::uninterruptible_);
Ian Rogers2dd0e2c2013-01-24 12:42:14 -0800172
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700173 bool Equals(const char* modified_utf8) REQUIRES_SHARED(Locks::mutator_lock_);
Ian Rogers2dd0e2c2013-01-24 12:42:14 -0800174
Mathieu Chartier31e88222016-10-14 18:43:19 -0700175 bool Equals(ObjPtr<String> that) REQUIRES_SHARED(Locks::mutator_lock_);
Ian Rogers2dd0e2c2013-01-24 12:42:14 -0800176
Ian Rogers2dd0e2c2013-01-24 12:42:14 -0800177 // Create a modified UTF-8 encoded std::string from a java/lang/String object.
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700178 std::string ToModifiedUtf8() REQUIRES_SHARED(Locks::mutator_lock_);
Ian Rogers2dd0e2c2013-01-24 12:42:14 -0800179
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700180 int32_t FastIndexOf(int32_t ch, int32_t start) REQUIRES_SHARED(Locks::mutator_lock_);
Ian Rogers2dd0e2c2013-01-24 12:42:14 -0800181
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700182 template <typename MemoryType>
183 int32_t FastIndexOf(MemoryType* chars, int32_t ch, int32_t start)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700184 REQUIRES_SHARED(Locks::mutator_lock_);
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700185
Mathieu Chartier31e88222016-10-14 18:43:19 -0700186 int32_t CompareTo(ObjPtr<String> other) REQUIRES_SHARED(Locks::mutator_lock_);
Ian Rogers2dd0e2c2013-01-24 12:42:14 -0800187
Vladimir Marko3068d582019-05-28 16:39:29 +0100188 static ObjPtr<CharArray> ToCharArray(Handle<String> h_this, Thread* self)
189 REQUIRES_SHARED(Locks::mutator_lock_)
Mathieu Chartiered8990a2015-07-23 14:11:16 -0700190 REQUIRES(!Roles::uninterruptible_);
Mathieu Chartierfd04b6f2014-11-14 19:34:18 -0800191
Jeff Hao848f70a2014-01-15 13:49:50 -0800192 void GetChars(int32_t start, int32_t end, Handle<CharArray> array, int32_t index)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700193 REQUIRES_SHARED(Locks::mutator_lock_);
Mathieu Chartierfd04b6f2014-11-14 19:34:18 -0800194
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700195 template<VerifyObjectFlags kVerifyFlags = kDefaultVerifyFlags>
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700196 bool IsCompressed() REQUIRES_SHARED(Locks::mutator_lock_) {
Vladimir Markofdaf0f42016-10-13 19:29:53 +0100197 return kUseStringCompression && IsCompressed(GetCount());
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700198 }
199
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700200 bool IsValueNull() REQUIRES_SHARED(Locks::mutator_lock_);
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700201
202 template<typename MemoryType>
Vladimir Markoe39f14f2017-02-10 15:44:25 +0000203 static bool AllASCII(const MemoryType* chars, const int length);
204
205 static bool DexFileStringAllASCII(const char* chars, const int length);
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700206
Vladimir Markofdaf0f42016-10-13 19:29:53 +0100207 ALWAYS_INLINE static bool IsCompressed(int32_t count) {
208 return GetCompressionFlagFromCount(count) == StringCompressionFlag::kCompressed;
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700209 }
210
Vladimir Markofdaf0f42016-10-13 19:29:53 +0100211 ALWAYS_INLINE static StringCompressionFlag GetCompressionFlagFromCount(int32_t count) {
212 return kUseStringCompression
213 ? static_cast<StringCompressionFlag>(static_cast<uint32_t>(count) & 1u)
214 : StringCompressionFlag::kUncompressed;
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700215 }
216
Vladimir Markofdaf0f42016-10-13 19:29:53 +0100217 ALWAYS_INLINE static int32_t GetLengthFromCount(int32_t count) {
218 return kUseStringCompression ? static_cast<int32_t>(static_cast<uint32_t>(count) >> 1) : count;
219 }
220
221 ALWAYS_INLINE static int32_t GetFlaggedCount(int32_t length, bool compressible) {
222 return kUseStringCompression
223 ? static_cast<int32_t>((static_cast<uint32_t>(length) << 1) |
224 (static_cast<uint32_t>(compressible
225 ? StringCompressionFlag::kCompressed
226 : StringCompressionFlag::kUncompressed)))
227 : length;
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700228 }
229
David Sehr709b0702016-10-13 09:12:37 -0700230 // Returns a human-readable equivalent of 'descriptor'. So "I" would be "int",
231 // "[[I" would be "int[][]", "[Ljava/lang/String;" would be
232 // "java.lang.String[]", and so forth.
233 static std::string PrettyStringDescriptor(ObjPtr<mirror::String> descriptor)
234 REQUIRES_SHARED(Locks::mutator_lock_);
235 std::string PrettyStringDescriptor()
236 REQUIRES_SHARED(Locks::mutator_lock_);
237
Vladimir Marko92907f32017-02-20 14:08:30 +0000238 static constexpr bool IsASCII(uint16_t c) {
239 // Valid ASCII characters are in range 1..0x7f. Zero is not considered ASCII
240 // because it would complicate the detection of ASCII strings in Modified-UTF8.
241 return (c - 1u) < 0x7fu;
242 }
243
Vladimir Marko7dd48b92020-11-12 15:18:40 +0000244 private:
Vladimir Marko92907f32017-02-20 14:08:30 +0000245 static bool AllASCIIExcept(const uint16_t* chars, int32_t length, uint16_t non_ascii);
246
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700247 void SetHashCode(int32_t new_hash_code) REQUIRES_SHARED(Locks::mutator_lock_) {
Sebastien Hertzd2fe10a2014-01-15 10:20:56 +0100248 // Hash code is invariant so use non-transactional mode. Also disable check as we may run inside
249 // a transaction.
Ian Rogersb0fa5dc2014-04-28 16:47:08 -0700250 DCHECK_EQ(0, GetField32(OFFSET_OF_OBJECT_MEMBER(String, hash_code_)));
251 SetField32<false, false>(OFFSET_OF_OBJECT_MEMBER(String, hash_code_), new_hash_code);
Ian Rogers2dd0e2c2013-01-24 12:42:14 -0800252 }
253
Vladimir Marko9b81ac32019-05-16 16:47:08 +0100254 template <bool kIsInstrumented = true, typename PreFenceVisitor>
Vladimir Marko179b7c62019-03-22 13:38:57 +0000255 ALWAYS_INLINE static ObjPtr<String> Alloc(Thread* self,
256 int32_t utf16_length_with_flag,
257 gc::AllocatorType allocator_type,
258 const PreFenceVisitor& pre_fence_visitor)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700259 REQUIRES_SHARED(Locks::mutator_lock_) REQUIRES(!Roles::uninterruptible_);
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700260
Ian Rogers2dd0e2c2013-01-24 12:42:14 -0800261 // Field order required by test "ValidateFieldOrderOfJavaCppUnionClasses".
Vladimir Marko595beb32017-02-06 14:11:54 +0000262
263 // If string compression is enabled, count_ holds the StringCompressionFlag in the
264 // least significant bit and the length in the remaining bits, length = count_ >> 1.
Ian Rogers2dd0e2c2013-01-24 12:42:14 -0800265 int32_t count_;
266
267 uint32_t hash_code_;
268
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700269 // Compression of all-ASCII into 8-bit memory leads to usage one of these fields
270 union {
271 uint16_t value_[0];
272 uint8_t value_compressed_[0];
273 };
Ian Rogers2dd0e2c2013-01-24 12:42:14 -0800274
Vladimir Marko552a1342017-10-31 10:56:47 +0000275 friend class art::StringBuilderAppend;
Ian Rogers2dd0e2c2013-01-24 12:42:14 -0800276 friend struct art::StringOffsets; // for verifying offset information
Ian Rogers6f3dbba2014-10-14 17:41:57 -0700277
Ian Rogers2dd0e2c2013-01-24 12:42:14 -0800278 DISALLOW_IMPLICIT_CONSTRUCTORS(String);
279};
280
Ian Rogers2dd0e2c2013-01-24 12:42:14 -0800281} // namespace mirror
282} // namespace art
283
Brian Carlstromfc0e3212013-07-17 14:40:12 -0700284#endif // ART_RUNTIME_MIRROR_STRING_H_