blob: 95516ace9fcde16e7bea94a139ae0664df4ea742 [file] [log] [blame]
Ian Rogersb0fa5dc2014-04-28 16:47:08 -07001/*
2 * Copyright (C) 2011 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
Ian Rogersb0fa5dc2014-04-28 16:47:08 -070016#ifndef ART_RUNTIME_MIRROR_STRING_INL_H_
17#define ART_RUNTIME_MIRROR_STRING_INL_H_
18
19#include "array.h"
Vladimir Marko4ef52262015-08-26 18:12:56 +010020#include "base/bit_utils.h"
Mingyao Yang98d1cc82014-05-15 17:02:16 -070021#include "class.h"
Vladimir Marko87f3fcb2016-04-28 15:52:11 +010022#include "common_throws.h"
Jeff Hao848f70a2014-01-15 13:49:50 -080023#include "gc/heap-inl.h"
Vladimir Marko4ef52262015-08-26 18:12:56 +010024#include "globals.h"
Ian Rogersb0fa5dc2014-04-28 16:47:08 -070025#include "intern_table.h"
26#include "runtime.h"
27#include "string.h"
28#include "thread.h"
Mathieu Chartiercdfd39f2014-08-29 18:16:58 -070029#include "utf.h"
Vladimir Marko80afd022015-05-19 18:08:00 +010030#include "utils.h"
Ian Rogersb0fa5dc2014-04-28 16:47:08 -070031
32namespace art {
33namespace mirror {
34
Andreas Gampe542451c2016-07-26 09:02:02 -070035inline uint32_t String::ClassSize(PointerSize pointer_size) {
Przemyslaw Szczepaniaka4fa2e72016-06-22 13:30:36 +010036 uint32_t vtable_entries = Object::kVTableLength + 57;
Narayan Kamath5d8fa8b2016-04-13 14:17:44 +010037 return Class::ComputeClassSize(true, vtable_entries, 0, 0, 0, 1, 2, pointer_size);
Mingyao Yang98d1cc82014-05-15 17:02:16 -070038}
39
Jeff Hao848f70a2014-01-15 13:49:50 -080040// Sets string count in the allocation code path to ensure it is guarded by a CAS.
41class SetStringCountVisitor {
42 public:
43 explicit SetStringCountVisitor(int32_t count) : count_(count) {
44 }
Narayan Kamatha5afcfc2015-01-29 20:06:46 +000045
Mathieu Chartier9d156d52016-10-06 17:44:26 -070046 void operator()(ObjPtr<Object> obj, size_t usable_size ATTRIBUTE_UNUSED) const
Andreas Gampebdf7f1c2016-08-30 16:38:47 -070047 REQUIRES_SHARED(Locks::mutator_lock_) {
Jeff Hao848f70a2014-01-15 13:49:50 -080048 // Avoid AsString as object is not yet in live bitmap or allocation stack.
Mathieu Chartier9d156d52016-10-06 17:44:26 -070049 ObjPtr<String> string = ObjPtr<String>::DownCast(obj);
Jeff Hao848f70a2014-01-15 13:49:50 -080050 string->SetCount(count_);
jessicahandojo3aaa37b2016-07-29 14:46:37 -070051 DCHECK(!string->IsCompressed() || kUseStringCompression);
Jeff Hao848f70a2014-01-15 13:49:50 -080052 }
Ian Rogersb0fa5dc2014-04-28 16:47:08 -070053
Jeff Hao848f70a2014-01-15 13:49:50 -080054 private:
55 const int32_t count_;
56};
Ian Rogersb0fa5dc2014-04-28 16:47:08 -070057
Jeff Hao848f70a2014-01-15 13:49:50 -080058// Sets string count and value in the allocation code path to ensure it is guarded by a CAS.
59class SetStringCountAndBytesVisitor {
60 public:
Mathieu Chartier81aa0122015-04-28 10:01:28 -070061 SetStringCountAndBytesVisitor(int32_t count, Handle<ByteArray> src_array, int32_t offset,
62 int32_t high_byte)
63 : count_(count), src_array_(src_array), offset_(offset), high_byte_(high_byte) {
Jeff Hao848f70a2014-01-15 13:49:50 -080064 }
65
Mathieu Chartier9d156d52016-10-06 17:44:26 -070066 void operator()(ObjPtr<Object> obj, size_t usable_size ATTRIBUTE_UNUSED) const
Andreas Gampebdf7f1c2016-08-30 16:38:47 -070067 REQUIRES_SHARED(Locks::mutator_lock_) {
Jeff Hao848f70a2014-01-15 13:49:50 -080068 // Avoid AsString as object is not yet in live bitmap or allocation stack.
Mathieu Chartier9d156d52016-10-06 17:44:26 -070069 ObjPtr<String> string = ObjPtr<String>::DownCast(obj);
Jeff Hao848f70a2014-01-15 13:49:50 -080070 string->SetCount(count_);
jessicahandojo3aaa37b2016-07-29 14:46:37 -070071 DCHECK(!string->IsCompressed() || kUseStringCompression);
72 int32_t length = String::GetLengthFromCount(count_);
Mathieu Chartier81aa0122015-04-28 10:01:28 -070073 const uint8_t* const src = reinterpret_cast<uint8_t*>(src_array_->GetData()) + offset_;
jessicahandojo3aaa37b2016-07-29 14:46:37 -070074 if (string->IsCompressed()) {
75 uint8_t* valueCompressed = string->GetValueCompressed();
76 for (int i = 0; i < length; i++) {
77 valueCompressed[i] = (src[i] & 0xFF);
78 }
79 } else {
80 uint16_t* value = string->GetValue();
81 for (int i = 0; i < length; i++) {
82 value[i] = high_byte_ + (src[i] & 0xFF);
83 }
Jeff Hao848f70a2014-01-15 13:49:50 -080084 }
85 }
86
87 private:
88 const int32_t count_;
Mathieu Chartier81aa0122015-04-28 10:01:28 -070089 Handle<ByteArray> src_array_;
90 const int32_t offset_;
Jeff Hao848f70a2014-01-15 13:49:50 -080091 const int32_t high_byte_;
92};
93
94// Sets string count and value in the allocation code path to ensure it is guarded by a CAS.
Mathieu Chartier81aa0122015-04-28 10:01:28 -070095class SetStringCountAndValueVisitorFromCharArray {
Jeff Hao848f70a2014-01-15 13:49:50 -080096 public:
Mathieu Chartier81aa0122015-04-28 10:01:28 -070097 SetStringCountAndValueVisitorFromCharArray(int32_t count, Handle<CharArray> src_array,
98 int32_t offset) :
99 count_(count), src_array_(src_array), offset_(offset) {
Jeff Hao848f70a2014-01-15 13:49:50 -0800100 }
101
Mathieu Chartier9d156d52016-10-06 17:44:26 -0700102 void operator()(ObjPtr<Object> obj, size_t usable_size ATTRIBUTE_UNUSED) const
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700103 REQUIRES_SHARED(Locks::mutator_lock_) {
Jeff Hao848f70a2014-01-15 13:49:50 -0800104 // Avoid AsString as object is not yet in live bitmap or allocation stack.
Mathieu Chartier9d156d52016-10-06 17:44:26 -0700105 ObjPtr<String> string = ObjPtr<String>::DownCast(obj);
Jeff Hao848f70a2014-01-15 13:49:50 -0800106 string->SetCount(count_);
Mathieu Chartier81aa0122015-04-28 10:01:28 -0700107 const uint16_t* const src = src_array_->GetData() + offset_;
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700108 const int32_t length = String::GetLengthFromCount(count_);
Vladimir Markofdaf0f42016-10-13 19:29:53 +0100109 if (kUseStringCompression && String::IsCompressed(count_)) {
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700110 for (int i = 0; i < length; ++i) {
111 string->GetValueCompressed()[i] = static_cast<uint8_t>(src[i]);
112 }
113 } else {
114 memcpy(string->GetValue(), src, length * sizeof(uint16_t));
115 }
Jeff Hao848f70a2014-01-15 13:49:50 -0800116 }
117
118 private:
119 const int32_t count_;
Mathieu Chartier81aa0122015-04-28 10:01:28 -0700120 Handle<CharArray> src_array_;
121 const int32_t offset_;
122};
123
124// Sets string count and value in the allocation code path to ensure it is guarded by a CAS.
125class SetStringCountAndValueVisitorFromString {
126 public:
Vladimir Markofdaf0f42016-10-13 19:29:53 +0100127 SetStringCountAndValueVisitorFromString(int32_t count,
128 Handle<String> src_string,
Mathieu Chartier81aa0122015-04-28 10:01:28 -0700129 int32_t offset) :
130 count_(count), src_string_(src_string), offset_(offset) {
131 }
132
Mathieu Chartier9d156d52016-10-06 17:44:26 -0700133 void operator()(ObjPtr<Object> obj, size_t usable_size ATTRIBUTE_UNUSED) const
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700134 REQUIRES_SHARED(Locks::mutator_lock_) {
Mathieu Chartier81aa0122015-04-28 10:01:28 -0700135 // Avoid AsString as object is not yet in live bitmap or allocation stack.
Mathieu Chartier9d156d52016-10-06 17:44:26 -0700136 ObjPtr<String> string = ObjPtr<String>::DownCast(obj);
Mathieu Chartier81aa0122015-04-28 10:01:28 -0700137 string->SetCount(count_);
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700138 const int32_t length = String::GetLengthFromCount(count_);
Vladimir Markofdaf0f42016-10-13 19:29:53 +0100139 bool compressible = kUseStringCompression && String::IsCompressed(count_);
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700140 if (src_string_->IsCompressed()) {
141 const uint8_t* const src = src_string_->GetValueCompressed() + offset_;
142 memcpy(string->GetValueCompressed(), src, length * sizeof(uint8_t));
143 } else {
144 const uint16_t* const src = src_string_->GetValue() + offset_;
145 if (compressible) {
146 for (int i = 0; i < length; ++i) {
147 string->GetValueCompressed()[i] = static_cast<uint8_t>(src[i]);
148 }
149 } else {
150 memcpy(string->GetValue(), src, length * sizeof(uint16_t));
151 }
152 }
Mathieu Chartier81aa0122015-04-28 10:01:28 -0700153 }
154
155 private:
156 const int32_t count_;
157 Handle<String> src_string_;
158 const int32_t offset_;
Jeff Hao848f70a2014-01-15 13:49:50 -0800159};
Ian Rogersb0fa5dc2014-04-28 16:47:08 -0700160
Mathieu Chartier9e868092016-10-31 14:58:04 -0700161inline ObjPtr<String> String::Intern() {
Ian Rogersb0fa5dc2014-04-28 16:47:08 -0700162 return Runtime::Current()->GetInternTable()->InternWeak(this);
163}
164
Jeff Hao848f70a2014-01-15 13:49:50 -0800165inline uint16_t String::CharAt(int32_t index) {
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700166 int32_t count = GetLength();
Jeff Hao848f70a2014-01-15 13:49:50 -0800167 if (UNLIKELY((index < 0) || (index >= count))) {
Vladimir Marko87f3fcb2016-04-28 15:52:11 +0100168 ThrowStringIndexOutOfBoundsException(index, count);
Jeff Hao848f70a2014-01-15 13:49:50 -0800169 return 0;
170 }
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700171 if (IsCompressed()) {
172 return GetValueCompressed()[index];
173 } else {
174 return GetValue()[index];
175 }
176}
177
178template <typename MemoryType>
179int32_t String::FastIndexOf(MemoryType* chars, int32_t ch, int32_t start) {
180 const MemoryType* p = chars + start;
181 const MemoryType* end = chars + GetLength();
182 while (p < end) {
183 if (*p++ == ch) {
184 return (p - 1) - chars;
185 }
186 }
187 return -1;
Jeff Hao848f70a2014-01-15 13:49:50 -0800188}
189
190template<VerifyObjectFlags kVerifyFlags>
191inline size_t String::SizeOf() {
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700192 size_t size = sizeof(String);
193 if (IsCompressed()) {
194 size += (sizeof(uint8_t) * GetLength<kVerifyFlags>());
195 } else {
196 size += (sizeof(uint16_t) * GetLength<kVerifyFlags>());
197 }
Vladimir Marko4ef52262015-08-26 18:12:56 +0100198 // String.equals() intrinsics assume zero-padding up to kObjectAlignment,
Vladimir Markoc2b35d22015-08-27 11:09:29 +0100199 // so make sure the zero-padding is actually copied around if GC compaction
200 // chooses to copy only SizeOf() bytes.
Vladimir Marko4ef52262015-08-26 18:12:56 +0100201 // http://b/23528461
202 return RoundUp(size, kObjectAlignment);
Jeff Hao848f70a2014-01-15 13:49:50 -0800203}
204
205template <bool kIsInstrumented, typename PreFenceVisitor>
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700206inline String* String::Alloc(Thread* self, int32_t utf16_length_with_flag,
207 gc::AllocatorType allocator_type,
Jeff Hao848f70a2014-01-15 13:49:50 -0800208 const PreFenceVisitor& pre_fence_visitor) {
Vladimir Markoc2b35d22015-08-27 11:09:29 +0100209 constexpr size_t header_size = sizeof(String);
Vladimir Markofdaf0f42016-10-13 19:29:53 +0100210 const bool compressible = kUseStringCompression && String::IsCompressed(utf16_length_with_flag);
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700211 const size_t block_size = (compressible) ? sizeof(uint8_t) : sizeof(uint16_t);
212 size_t length = String::GetLengthFromCount(utf16_length_with_flag);
213 static_assert(sizeof(length) <= sizeof(size_t),
Vladimir Markoc2b35d22015-08-27 11:09:29 +0100214 "static_cast<size_t>(utf16_length) must not lose bits.");
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700215 size_t data_size = block_size * length;
Jeff Hao848f70a2014-01-15 13:49:50 -0800216 size_t size = header_size + data_size;
Vladimir Markoc2b35d22015-08-27 11:09:29 +0100217 // String.equals() intrinsics assume zero-padding up to kObjectAlignment,
218 // so make sure the allocator clears the padding as well.
219 // http://b/23528461
220 size_t alloc_size = RoundUp(size, kObjectAlignment);
Jeff Hao848f70a2014-01-15 13:49:50 -0800221
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700222 Class* string_class = GetJavaLangString();
Jeff Hao848f70a2014-01-15 13:49:50 -0800223 // Check for overflow and throw OutOfMemoryError if this was an unreasonable request.
Vladimir Markoc2b35d22015-08-27 11:09:29 +0100224 // Do this by comparing with the maximum length that will _not_ cause an overflow.
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700225 const size_t overflow_length = (-header_size) / block_size; // Unsigned arithmetic.
226 const size_t max_alloc_length = overflow_length - 1u;
Vladimir Markoc2b35d22015-08-27 11:09:29 +0100227 static_assert(IsAligned<sizeof(uint16_t)>(kObjectAlignment),
228 "kObjectAlignment must be at least as big as Java char alignment");
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700229 const size_t max_length = RoundDown(max_alloc_length, kObjectAlignment / block_size);
Vladimir Markoc2b35d22015-08-27 11:09:29 +0100230 if (UNLIKELY(length > max_length)) {
Jeff Hao848f70a2014-01-15 13:49:50 -0800231 self->ThrowOutOfMemoryError(StringPrintf("%s of length %d would overflow",
David Sehr709b0702016-10-13 09:12:37 -0700232 Class::PrettyDescriptor(string_class).c_str(),
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700233 static_cast<int>(length)).c_str());
Jeff Hao848f70a2014-01-15 13:49:50 -0800234 return nullptr;
235 }
Vladimir Markoc2b35d22015-08-27 11:09:29 +0100236
Jeff Hao848f70a2014-01-15 13:49:50 -0800237 gc::Heap* heap = Runtime::Current()->GetHeap();
238 return down_cast<String*>(
Vladimir Markoc2b35d22015-08-27 11:09:29 +0100239 heap->AllocObjectWithAllocator<kIsInstrumented, true>(self, string_class, alloc_size,
Jeff Haob7c8c1a2015-06-22 14:29:54 -0700240 allocator_type, pre_fence_visitor));
Jeff Hao848f70a2014-01-15 13:49:50 -0800241}
242
243template <bool kIsInstrumented>
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700244inline String* String::AllocEmptyString(Thread* self, gc::AllocatorType allocator_type) {
Vladimir Markofdaf0f42016-10-13 19:29:53 +0100245 const int32_t length_with_flag = String::GetFlaggedCount(0, /* compressible */ true);
jessicahandojo7908c8e2016-09-09 19:05:34 -0700246 SetStringCountVisitor visitor(length_with_flag);
247 return Alloc<kIsInstrumented>(self, length_with_flag, allocator_type, visitor);
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700248}
249
250template <bool kIsInstrumented>
Jeff Hao848f70a2014-01-15 13:49:50 -0800251inline String* String::AllocFromByteArray(Thread* self, int32_t byte_length,
252 Handle<ByteArray> array, int32_t offset,
253 int32_t high_byte, gc::AllocatorType allocator_type) {
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700254 const uint8_t* const src = reinterpret_cast<uint8_t*>(array->GetData()) + offset;
Vladimir Markofdaf0f42016-10-13 19:29:53 +0100255 const bool compressible =
256 kUseStringCompression && String::AllASCII<uint8_t>(src, byte_length) && (high_byte == 0);
257 const int32_t length_with_flag = String::GetFlaggedCount(byte_length, compressible);
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700258 SetStringCountAndBytesVisitor visitor(length_with_flag, array, offset, high_byte << 8);
259 String* string = Alloc<kIsInstrumented>(self, length_with_flag, allocator_type, visitor);
Jeff Hao848f70a2014-01-15 13:49:50 -0800260 return string;
261}
262
263template <bool kIsInstrumented>
Igor Murashkinc449e8b2015-06-10 15:56:42 -0700264inline String* String::AllocFromCharArray(Thread* self, int32_t count,
Jeff Hao848f70a2014-01-15 13:49:50 -0800265 Handle<CharArray> array, int32_t offset,
266 gc::AllocatorType allocator_type) {
Igor Murashkinc449e8b2015-06-10 15:56:42 -0700267 // It is a caller error to have a count less than the actual array's size.
268 DCHECK_GE(array->GetLength(), count);
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700269 const bool compressible = kUseStringCompression &&
270 String::AllASCII<uint16_t>(array->GetData() + offset, count);
Vladimir Markofdaf0f42016-10-13 19:29:53 +0100271 const int32_t length_with_flag = String::GetFlaggedCount(count, compressible);
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700272 SetStringCountAndValueVisitorFromCharArray visitor(length_with_flag, array, offset);
273 String* new_string = Alloc<kIsInstrumented>(self, length_with_flag, allocator_type, visitor);
Jeff Hao848f70a2014-01-15 13:49:50 -0800274 return new_string;
275}
276
277template <bool kIsInstrumented>
278inline String* String::AllocFromString(Thread* self, int32_t string_length, Handle<String> string,
279 int32_t offset, gc::AllocatorType allocator_type) {
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700280 const bool compressible = kUseStringCompression &&
281 ((string->IsCompressed()) ? true : String::AllASCII<uint16_t>(string->GetValue() + offset,
282 string_length));
Vladimir Markofdaf0f42016-10-13 19:29:53 +0100283 const int32_t length_with_flag = String::GetFlaggedCount(string_length, compressible);
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700284 SetStringCountAndValueVisitorFromString visitor(length_with_flag, string, offset);
285 String* new_string = Alloc<kIsInstrumented>(self, length_with_flag, allocator_type, visitor);
Jeff Hao848f70a2014-01-15 13:49:50 -0800286 return new_string;
287}
288
Mathieu Chartiercdfd39f2014-08-29 18:16:58 -0700289inline int32_t String::GetHashCode() {
290 int32_t result = GetField32(OFFSET_OF_OBJECT_MEMBER(String, hash_code_));
291 if (UNLIKELY(result == 0)) {
292 result = ComputeHashCode();
293 }
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700294 if (kIsDebugBuild) {
295 if (IsCompressed()) {
296 DCHECK(result != 0 || ComputeUtf16Hash(GetValueCompressed(), GetLength()) == 0)
297 << ToModifiedUtf8() << " " << result;
298 } else {
299 DCHECK(result != 0 || ComputeUtf16Hash(GetValue(), GetLength()) == 0)
300 << ToModifiedUtf8() << " " << result;
301 }
302 }
Mathieu Chartiercdfd39f2014-08-29 18:16:58 -0700303 return result;
304}
305
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700306template<typename MemoryType>
307bool String::AllASCII(const MemoryType* const chars, const int length) {
Vladimir Marko16850ae2016-12-09 14:01:02 +0000308 static_assert(std::is_unsigned<MemoryType>::value, "Expecting unsigned MemoryType");
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700309 for (int i = 0; i < length; ++i) {
Vladimir Marko16850ae2016-12-09 14:01:02 +0000310 // Valid ASCII characters are in range 1..0x7f. Zero is not considered ASCII
311 // because it would complicate the detection of ASCII strings in Modified-UTF8.
312 if ((chars[i] - 1u) >= 0x7fu) {
jessicahandojo3aaa37b2016-07-29 14:46:37 -0700313 return false;
314 }
315 }
316 return true;
317}
318
Ian Rogersb0fa5dc2014-04-28 16:47:08 -0700319} // namespace mirror
320} // namespace art
321
322#endif // ART_RUNTIME_MIRROR_STRING_INL_H_