1 /*
2 * Copyright (C) 2019 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17 #include "string_builder_append.h"
18
19 #include "base/casts.h"
20 #include "base/logging.h"
21 #include "common_throws.h"
22 #include "gc/heap.h"
23 #include "mirror/array-inl.h"
24 #include "mirror/string-alloc-inl.h"
25 #include "obj_ptr-inl.h"
26 #include "runtime.h"
27 #include "well_known_classes.h"
28
29 namespace art HIDDEN {
30
31 class StringBuilderAppend::Builder {
32 public:
Builder(uint32_t format,const uint32_t * args,Thread * self)33 Builder(uint32_t format, const uint32_t* args, Thread* self)
34 : format_(format),
35 args_(args),
36 hs_(self) {}
37
38 int32_t CalculateLengthWithFlag() REQUIRES_SHARED(Locks::mutator_lock_);
39
40 void operator()(ObjPtr<mirror::Object> obj, size_t usable_size) const
41 REQUIRES_SHARED(Locks::mutator_lock_);
42
43 private:
44 static size_t Uint64Length(uint64_t value);
45
Int64Length(int64_t value)46 static size_t Int64Length(int64_t value) {
47 uint64_t v = static_cast<uint64_t>(value);
48 return (value >= 0) ? Uint64Length(v) : 1u + Uint64Length(-v);
49 }
50
RemainingSpace(ObjPtr<mirror::String> new_string,const uint8_t * data)51 static size_t RemainingSpace(ObjPtr<mirror::String> new_string, const uint8_t* data)
52 REQUIRES_SHARED(Locks::mutator_lock_) {
53 DCHECK(new_string->IsCompressed());
54 DCHECK_GE(new_string->GetLength(), data - new_string->GetValueCompressed());
55 return new_string->GetLength() - (data - new_string->GetValueCompressed());
56 }
57
RemainingSpace(ObjPtr<mirror::String> new_string,const uint16_t * data)58 static size_t RemainingSpace(ObjPtr<mirror::String> new_string, const uint16_t* data)
59 REQUIRES_SHARED(Locks::mutator_lock_) {
60 DCHECK(!new_string->IsCompressed());
61 DCHECK_GE(new_string->GetLength(), data - new_string->GetValue());
62 return new_string->GetLength() - (data - new_string->GetValue());
63 }
64
65 template <typename CharType>
66 CharType* AppendFpArg(ObjPtr<mirror::String> new_string,
67 CharType* data,
68 size_t fp_arg_index) const REQUIRES_SHARED(Locks::mutator_lock_);
69
70 template <typename CharType, size_t size>
71 static CharType* AppendLiteral(ObjPtr<mirror::String> new_string,
72 CharType* data,
73 const char (&literal)[size]) REQUIRES_SHARED(Locks::mutator_lock_);
74
75 template <typename CharType>
76 static CharType* AppendString(ObjPtr<mirror::String> new_string,
77 CharType* data,
78 ObjPtr<mirror::String> str) REQUIRES_SHARED(Locks::mutator_lock_);
79
80 template <typename CharType>
81 static CharType* AppendInt64(ObjPtr<mirror::String> new_string,
82 CharType* data,
83 int64_t value) REQUIRES_SHARED(Locks::mutator_lock_);
84
85 int32_t ConvertFpArgs() REQUIRES_SHARED(Locks::mutator_lock_);
86
87 template <typename CharType>
88 void StoreData(ObjPtr<mirror::String> new_string, CharType* data) const
89 REQUIRES_SHARED(Locks::mutator_lock_);
90
91 static constexpr char kNull[] = "null";
92 static constexpr size_t kNullLength = sizeof(kNull) - 1u;
93 static constexpr char kTrue[] = "true";
94 static constexpr size_t kTrueLength = sizeof(kTrue) - 1u;
95 static constexpr char kFalse[] = "false";
96 static constexpr size_t kFalseLength = sizeof(kFalse) - 1u;
97
98 // The format and arguments to append.
99 const uint32_t format_;
100 const uint32_t* const args_;
101
102 // References are moved to the handle scope during CalculateLengthWithFlag().
103 StackHandleScope<kMaxArgs> hs_;
104
105 // We convert float/double values using jdk.internal.math.FloatingDecimal which uses
106 // a thread-local converter under the hood. As we may have more than one
107 // float/double argument, we need to copy the data out of the converter.
108 // Maximum number of characters is 26. See BinaryToASCIIBuffer.buffer in FloatingDecimal.java .
109 // (This is more than enough for the `ExceptionalBinaryToASCIIBuffer` cases.)
110 static constexpr size_t kBinaryToASCIIBufferSize = 26;
111 uint8_t converted_fp_args_[kMaxArgs][kBinaryToASCIIBufferSize];
112 int32_t converted_fp_arg_lengths_[kMaxArgs];
113
114 // The length and flag to store when the AppendBuilder is used as a pre-fence visitor.
115 int32_t length_with_flag_ = 0u;
116 };
117
Uint64Length(uint64_t value)118 inline size_t StringBuilderAppend::Builder::Uint64Length(uint64_t value) {
119 if (value == 0u) {
120 return 1u;
121 }
122 // Calculate floor(log2(value)).
123 size_t log2_value = BitSizeOf<uint64_t>() - 1u - CLZ(value);
124 // Calculate an estimate of floor(log10(value)).
125 // log10(2) = 0.301029996 > 0.296875 = 19/64
126 // floor(log10(v)) == floor(log2(v) * log10(2))
127 // >= floor(log2(v) * 19/64)
128 // >= floor(floor(log2(v)) * 19/64)
129 // This estimate is no more that one off from the actual value because log2(value) < 64 and thus
130 // log2(v) * log10(2) - log2(v) * 19/64 < 64*(log10(2) - 19/64)
131 // for the first approximation and
132 // log2(v) * 19/64 - floor(log2(v)) * 19/64 < 19/64
133 // for the second one. Together,
134 // 64*(log10(2) - 19/64) + 19/64 = 0.56278 < 1 .
135 size_t log10_value_estimate = log2_value * 19u / 64u;
136 static constexpr uint64_t bounds[] = {
137 UINT64_C(9),
138 UINT64_C(99),
139 UINT64_C(999),
140 UINT64_C(9999),
141 UINT64_C(99999),
142 UINT64_C(999999),
143 UINT64_C(9999999),
144 UINT64_C(99999999),
145 UINT64_C(999999999),
146 UINT64_C(9999999999),
147 UINT64_C(99999999999),
148 UINT64_C(999999999999),
149 UINT64_C(9999999999999),
150 UINT64_C(99999999999999),
151 UINT64_C(999999999999999),
152 UINT64_C(9999999999999999),
153 UINT64_C(99999999999999999),
154 UINT64_C(999999999999999999),
155 UINT64_C(9999999999999999999),
156 };
157 // Add 1 for the lowest digit, add another 1 if the estimate was too low.
158 DCHECK_LT(log10_value_estimate, std::size(bounds));
159 size_t adjustment = (value > bounds[log10_value_estimate]) ? 2u : 1u;
160 return log10_value_estimate + adjustment;
161 }
162
163 template <typename CharType>
AppendFpArg(ObjPtr<mirror::String> new_string,CharType * data,size_t fp_arg_index) const164 inline CharType* StringBuilderAppend::Builder::AppendFpArg(ObjPtr<mirror::String> new_string,
165 CharType* data,
166 size_t fp_arg_index) const {
167 DCHECK_LE(fp_arg_index, std::size(converted_fp_args_));
168 const uint8_t* src = converted_fp_args_[fp_arg_index];
169 size_t length = converted_fp_arg_lengths_[fp_arg_index];
170 DCHECK_LE(length, kBinaryToASCIIBufferSize);
171 DCHECK_LE(length, RemainingSpace(new_string, data));
172 return std::copy_n(src, length, data);
173 }
174
175 template <typename CharType, size_t size>
AppendLiteral(ObjPtr<mirror::String> new_string,CharType * data,const char (& literal)[size])176 inline CharType* StringBuilderAppend::Builder::AppendLiteral(ObjPtr<mirror::String> new_string,
177 CharType* data,
178 const char (&literal)[size]) {
179 static_assert(size >= 2, "We need something to append.");
180
181 // Literals are zero-terminated.
182 constexpr size_t length = size - 1u;
183 DCHECK_EQ(literal[length], '\0');
184
185 DCHECK_LE(length, RemainingSpace(new_string, data));
186 for (size_t i = 0; i != length; ++i) {
187 data[i] = literal[i];
188 }
189 return data + length;
190 }
191
192 template <typename CharType>
AppendString(ObjPtr<mirror::String> new_string,CharType * data,ObjPtr<mirror::String> str)193 inline CharType* StringBuilderAppend::Builder::AppendString(ObjPtr<mirror::String> new_string,
194 CharType* data,
195 ObjPtr<mirror::String> str) {
196 size_t length = dchecked_integral_cast<size_t>(str->GetLength());
197 DCHECK_LE(length, RemainingSpace(new_string, data));
198 if (sizeof(CharType) == sizeof(uint8_t) || str->IsCompressed()) {
199 DCHECK(str->IsCompressed());
200 const uint8_t* value = str->GetValueCompressed();
201 for (size_t i = 0; i != length; ++i) {
202 data[i] = value[i];
203 }
204 } else {
205 const uint16_t* value = str->GetValue();
206 for (size_t i = 0; i != length; ++i) {
207 data[i] = dchecked_integral_cast<CharType>(value[i]);
208 }
209 }
210 return data + length;
211 }
212
213 template <typename CharType>
AppendInt64(ObjPtr<mirror::String> new_string,CharType * data,int64_t value)214 inline CharType* StringBuilderAppend::Builder::AppendInt64(ObjPtr<mirror::String> new_string,
215 CharType* data,
216 int64_t value) {
217 DCHECK_GE(RemainingSpace(new_string, data), Int64Length(value));
218 uint64_t v = static_cast<uint64_t>(value);
219 if (value < 0) {
220 *data = '-';
221 ++data;
222 v = -v;
223 }
224 size_t length = Uint64Length(v);
225 // Write the digits from the end, do not write the most significant digit
226 // in the loop to avoid an unnecessary division.
227 for (size_t i = 1; i != length; ++i) {
228 uint64_t digit = v % UINT64_C(10);
229 v /= UINT64_C(10);
230 data[length - i] = '0' + static_cast<char>(digit);
231 }
232 DCHECK_LE(v, 10u);
233 *data = '0' + static_cast<char>(v);
234 return data + length;
235 }
236
ConvertFpArgs()237 int32_t StringBuilderAppend::Builder::ConvertFpArgs() {
238 int32_t fp_args_length = 0u;
239 const uint32_t* current_arg = args_;
240 size_t fp_arg_index = 0u;
241 for (uint32_t f = format_; f != 0u; f >>= kBitsPerArg) {
242 DCHECK_LE(f & kArgMask, static_cast<uint32_t>(Argument::kLast));
243 bool fp_arg = false;
244 ObjPtr<mirror::Object> converter;
245 switch (static_cast<Argument>(f & kArgMask)) {
246 case Argument::kString:
247 case Argument::kBoolean:
248 case Argument::kChar:
249 case Argument::kInt:
250 break;
251 case Argument::kLong: {
252 current_arg = AlignUp(current_arg, sizeof(int64_t));
253 ++current_arg; // Skip the low word, let the common code skip the high word.
254 break;
255 }
256 case Argument::kFloat: {
257 fp_arg = true;
258 float arg = bit_cast<float>(*current_arg);
259 converter = WellKnownClasses::jdk_internal_math_FloatingDecimal_getBinaryToASCIIConverter_F
260 ->InvokeStatic<'L', 'F'>(hs_.Self(), arg);
261 break;
262 }
263 case Argument::kDouble: {
264 fp_arg = true;
265 current_arg = AlignUp(current_arg, sizeof(int64_t));
266 double arg = bit_cast<double>(
267 static_cast<uint64_t>(current_arg[0]) + (static_cast<uint64_t>(current_arg[1]) << 32));
268 converter = WellKnownClasses::jdk_internal_math_FloatingDecimal_getBinaryToASCIIConverter_D
269 ->InvokeStatic<'L', 'D'>(hs_.Self(), arg);
270 ++current_arg; // Skip the low word, let the common code skip the high word.
271 break;
272 }
273 case Argument::kStringBuilder:
274 case Argument::kCharArray:
275 case Argument::kObject:
276 LOG(FATAL) << "Unimplemented arg format: 0x" << std::hex
277 << (f & kArgMask) << " full format: 0x" << std::hex << format_;
278 UNREACHABLE();
279 default:
280 LOG(FATAL) << "Unexpected arg format: 0x" << std::hex
281 << (f & kArgMask) << " full format: 0x" << std::hex << format_;
282 UNREACHABLE();
283 }
284 if (fp_arg) {
285 // If we see an exception (presumably OOME or SOE), keep it as is, even
286 // though it may be confusing to see the stack trace for FP argument
287 // conversion continue at the StringBuilder.toString() invoke location.
288 DCHECK_EQ(converter == nullptr, hs_.Self()->IsExceptionPending());
289 if (UNLIKELY(converter == nullptr)) {
290 return -1;
291 }
292 ArtField* btab_buffer_field =
293 WellKnownClasses::jdk_internal_math_FloatingDecimal_BinaryToASCIIBuffer_buffer;
294 int32_t length;
295 if (converter->GetClass() == btab_buffer_field->GetDeclaringClass()) {
296 // Call `converter.getChars(converter.buffer)`.
297 StackHandleScope<1u> hs2(hs_.Self());
298 Handle<mirror::CharArray> buffer =
299 hs2.NewHandle(btab_buffer_field->GetObj<mirror::CharArray>(converter));
300 DCHECK(buffer != nullptr);
301 length = WellKnownClasses::jdk_internal_math_FloatingDecimal_BinaryToASCIIBuffer_getChars
302 ->InvokeInstance<'I', 'L'>(hs_.Self(), converter, buffer.Get());
303 if (UNLIKELY(hs_.Self()->IsExceptionPending())) {
304 return -1;
305 }
306 // The converted string is now at the front of the buffer.
307 DCHECK_GT(length, 0);
308 DCHECK_LE(length, buffer->GetLength());
309 DCHECK_LE(static_cast<size_t>(length), std::size(converted_fp_args_[0]));
310 DCHECK(mirror::String::AllASCII(buffer->GetData(), length));
311 std::copy_n(buffer->GetData(), length, converted_fp_args_[fp_arg_index]);
312 } else {
313 ArtField* ebtab_image_field = WellKnownClasses::
314 jdk_internal_math_FloatingDecimal_ExceptionalBinaryToASCIIBuffer_image;
315 DCHECK(converter->GetClass() == ebtab_image_field->GetDeclaringClass());
316 ObjPtr<mirror::String> converted = ebtab_image_field->GetObj<mirror::String>(converter);
317 DCHECK(converted != nullptr);
318 length = converted->GetLength();
319 if (mirror::kUseStringCompression) {
320 DCHECK(converted->IsCompressed());
321 memcpy(converted_fp_args_[fp_arg_index], converted->GetValueCompressed(), length);
322 } else {
323 DCHECK(mirror::String::AllASCII(converted->GetValue(), length));
324 std::copy_n(converted->GetValue(), length, converted_fp_args_[fp_arg_index]);
325 }
326 }
327 converted_fp_arg_lengths_[fp_arg_index] = length;
328 fp_args_length += length;
329 ++fp_arg_index;
330 }
331 ++current_arg;
332 DCHECK_LE(fp_arg_index, kMaxArgs);
333 }
334 return fp_args_length;
335 }
336
CalculateLengthWithFlag()337 inline int32_t StringBuilderAppend::Builder::CalculateLengthWithFlag() {
338 static_assert(static_cast<size_t>(Argument::kEnd) == 0u, "kEnd must be 0.");
339 bool compressible = mirror::kUseStringCompression;
340 uint64_t length = 0u;
341 bool has_fp_args = false;
342 const uint32_t* current_arg = args_;
343 for (uint32_t f = format_; f != 0u; f >>= kBitsPerArg) {
344 DCHECK_LE(f & kArgMask, static_cast<uint32_t>(Argument::kLast));
345 switch (static_cast<Argument>(f & kArgMask)) {
346 case Argument::kString: {
347 Handle<mirror::String> str =
348 hs_.NewHandle(reinterpret_cast32<mirror::String*>(*current_arg));
349 if (str != nullptr) {
350 length += str->GetLength();
351 compressible = compressible && str->IsCompressed();
352 } else {
353 length += kNullLength;
354 }
355 break;
356 }
357 case Argument::kBoolean: {
358 length += (*current_arg != 0u) ? kTrueLength : kFalseLength;
359 break;
360 }
361 case Argument::kChar: {
362 length += 1u;
363 compressible = compressible &&
364 mirror::String::IsASCII(reinterpret_cast<const uint16_t*>(current_arg)[0]);
365 break;
366 }
367 case Argument::kInt: {
368 length += Int64Length(static_cast<int32_t>(*current_arg));
369 break;
370 }
371 case Argument::kLong: {
372 current_arg = AlignUp(current_arg, sizeof(int64_t));
373 length += Int64Length(*reinterpret_cast<const int64_t*>(current_arg));
374 ++current_arg; // Skip the low word, let the common code skip the high word.
375 break;
376 }
377 case Argument::kDouble:
378 current_arg = AlignUp(current_arg, sizeof(int64_t));
379 ++current_arg; // Skip the low word, let the common code skip the high word.
380 FALLTHROUGH_INTENDED;
381 case Argument::kFloat:
382 // Conversion shall be performed in a separate pass because it calls back to
383 // managed code and we need to convert reference arguments to `Handle<>`s first.
384 has_fp_args = true;
385 break;
386
387 case Argument::kStringBuilder:
388 case Argument::kCharArray:
389 case Argument::kObject:
390 LOG(FATAL) << "Unimplemented arg format: 0x" << std::hex
391 << (f & kArgMask) << " full format: 0x" << std::hex << format_;
392 UNREACHABLE();
393 default:
394 LOG(FATAL) << "Unexpected arg format: 0x" << std::hex
395 << (f & kArgMask) << " full format: 0x" << std::hex << format_;
396 UNREACHABLE();
397 }
398 ++current_arg;
399 }
400
401 if (UNLIKELY(has_fp_args)) {
402 // Call Java helpers to convert FP args.
403 int32_t fp_args_length = ConvertFpArgs();
404 if (fp_args_length == -1) {
405 return -1;
406 }
407 DCHECK_GT(fp_args_length, 0);
408 length += fp_args_length;
409 }
410
411 if (length > std::numeric_limits<int32_t>::max()) {
412 // We cannot allocate memory for the entire result.
413 hs_.Self()->ThrowNewException("Ljava/lang/OutOfMemoryError;",
414 "Out of memory for StringBuilder append.");
415 return -1;
416 }
417
418 length_with_flag_ = mirror::String::GetFlaggedCount(length, compressible);
419 return length_with_flag_;
420 }
421
422 template <typename CharType>
StoreData(ObjPtr<mirror::String> new_string,CharType * data) const423 inline void StringBuilderAppend::Builder::StoreData(ObjPtr<mirror::String> new_string,
424 CharType* data) const {
425 size_t handle_index = 0u;
426 size_t fp_arg_index = 0u;
427 const uint32_t* current_arg = args_;
428 for (uint32_t f = format_; f != 0u; f >>= kBitsPerArg) {
429 DCHECK_LE(f & kArgMask, static_cast<uint32_t>(Argument::kLast));
430 switch (static_cast<Argument>(f & kArgMask)) {
431 case Argument::kString: {
432 DCHECK_LT(handle_index, hs_.Size());
433 ObjPtr<mirror::String> str =
434 ObjPtr<mirror::String>::DownCast(hs_.GetReference(handle_index));
435 ++handle_index;
436 if (str != nullptr) {
437 data = AppendString(new_string, data, str);
438 } else {
439 data = AppendLiteral(new_string, data, kNull);
440 }
441 break;
442 }
443 case Argument::kBoolean: {
444 if (*current_arg != 0u) {
445 data = AppendLiteral(new_string, data, kTrue);
446 } else {
447 data = AppendLiteral(new_string, data, kFalse);
448 }
449 break;
450 }
451 case Argument::kChar: {
452 DCHECK_GE(RemainingSpace(new_string, data), 1u);
453 *data = *reinterpret_cast<const CharType*>(current_arg);
454 ++data;
455 break;
456 }
457 case Argument::kInt: {
458 data = AppendInt64(new_string, data, static_cast<int32_t>(*current_arg));
459 break;
460 }
461 case Argument::kLong: {
462 current_arg = AlignUp(current_arg, sizeof(int64_t));
463 data = AppendInt64(new_string, data, *reinterpret_cast<const int64_t*>(current_arg));
464 ++current_arg; // Skip the low word, let the common code skip the high word.
465 break;
466 }
467 case Argument::kDouble:
468 current_arg = AlignUp(current_arg, sizeof(int64_t));
469 ++current_arg; // Skip the low word, let the common code skip the high word.
470 FALLTHROUGH_INTENDED;
471 case Argument::kFloat: {
472 data = AppendFpArg(new_string, data, fp_arg_index);
473 ++fp_arg_index;
474 break;
475 }
476
477 case Argument::kStringBuilder:
478 case Argument::kCharArray:
479 LOG(FATAL) << "Unimplemented arg format: 0x" << std::hex
480 << (f & kArgMask) << " full format: 0x" << std::hex << format_;
481 UNREACHABLE();
482 default:
483 LOG(FATAL) << "Unexpected arg format: 0x" << std::hex
484 << (f & kArgMask) << " full format: 0x" << std::hex << format_;
485 UNREACHABLE();
486 }
487 ++current_arg;
488 DCHECK_LE(fp_arg_index, std::size(converted_fp_args_));
489 }
490 DCHECK_EQ(RemainingSpace(new_string, data), 0u) << std::hex << format_;
491 }
492
operator ()(ObjPtr<mirror::Object> obj,size_t usable_size) const493 inline void StringBuilderAppend::Builder::operator()(ObjPtr<mirror::Object> obj,
494 [[maybe_unused]] size_t usable_size) const {
495 ObjPtr<mirror::String> new_string = ObjPtr<mirror::String>::DownCast(obj);
496 new_string->SetCount(length_with_flag_);
497 if (mirror::String::IsCompressed(length_with_flag_)) {
498 StoreData(new_string, new_string->GetValueCompressed());
499 } else {
500 StoreData(new_string, new_string->GetValue());
501 }
502 }
503
AppendF(uint32_t format,const uint32_t * args,Thread * self)504 ObjPtr<mirror::String> StringBuilderAppend::AppendF(uint32_t format,
505 const uint32_t* args,
506 Thread* self) {
507 Builder builder(format, args, self);
508 self->AssertNoPendingException();
509 int32_t length_with_flag = builder.CalculateLengthWithFlag();
510 if (self->IsExceptionPending()) {
511 return nullptr;
512 }
513 gc::AllocatorType allocator_type = Runtime::Current()->GetHeap()->GetCurrentAllocator();
514 ObjPtr<mirror::String> result = mirror::String::Alloc(
515 self, length_with_flag, allocator_type, builder);
516
517 return result;
518 }
519
520 } // namespace art
521