| 
									
										
										
										
											2020-03-11 18:55:01 +01:00
										 |  |  | /*
 | 
					
						
							|  |  |  |  * Copyright (c) 2020, Andreas Kling <kling@serenityos.org> | 
					
						
							| 
									
										
										
										
											2022-12-06 22:17:27 +00:00
										 |  |  |  * Copyright (c) 2022, Linus Groh <linusg@serenityos.org> | 
					
						
							| 
									
										
										
										
											2020-03-11 18:55:01 +01:00
										 |  |  |  * | 
					
						
							| 
									
										
										
										
											2021-04-22 01:24:48 -07:00
										 |  |  |  * SPDX-License-Identifier: BSD-2-Clause | 
					
						
							| 
									
										
										
										
											2020-03-11 18:55:01 +01:00
										 |  |  |  */ | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-07-20 10:46:53 -04:00
										 |  |  | #include <AK/CharacterTypes.h>
 | 
					
						
							|  |  |  | #include <AK/Utf16View.h>
 | 
					
						
							| 
									
										
										
										
											2022-11-23 13:41:50 +01:00
										 |  |  | #include <AK/Utf8View.h>
 | 
					
						
							| 
									
										
										
										
											2022-02-12 00:48:23 -08:00
										 |  |  | #include <LibJS/Runtime/AbstractOperations.h>
 | 
					
						
							|  |  |  | #include <LibJS/Runtime/GlobalObject.h>
 | 
					
						
							| 
									
										
										
										
											2020-03-16 14:20:30 +01:00
										 |  |  | #include <LibJS/Runtime/PrimitiveString.h>
 | 
					
						
							| 
									
										
										
										
											2022-02-12 00:48:23 -08:00
										 |  |  | #include <LibJS/Runtime/PropertyKey.h>
 | 
					
						
							| 
									
										
										
										
											2023-01-07 15:33:15 -05:00
										 |  |  | #include <LibJS/Runtime/ThrowableStringBuilder.h>
 | 
					
						
							| 
									
										
										
										
											2020-09-27 20:03:42 +02:00
										 |  |  | #include <LibJS/Runtime/VM.h>
 | 
					
						
							| 
									
										
										
										
											2022-02-14 15:06:16 +01:00
										 |  |  | #include <LibJS/Runtime/Value.h>
 | 
					
						
							| 
									
										
										
										
											2020-03-11 18:55:01 +01:00
										 |  |  | 
 | 
					
						
							|  |  |  | namespace JS { | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  | PrimitiveString::PrimitiveString(PrimitiveString& lhs, PrimitiveString& rhs) | 
					
						
							| 
									
										
										
										
											2022-08-06 01:06:02 +01:00
										 |  |  |     : m_is_rope(true) | 
					
						
							|  |  |  |     , m_lhs(&lhs) | 
					
						
							|  |  |  |     , m_rhs(&rhs) | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  | { | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-01-13 12:24:02 -05:00
										 |  |  | PrimitiveString::PrimitiveString(String string) | 
					
						
							|  |  |  |     : m_utf8_string(move(string)) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-12-04 18:02:33 +00:00
										 |  |  | PrimitiveString::PrimitiveString(DeprecatedString string) | 
					
						
							| 
									
										
										
										
											2023-01-13 09:36:12 -05:00
										 |  |  |     : m_deprecated_string(move(string)) | 
					
						
							| 
									
										
										
										
											2021-08-01 19:02:19 -04:00
										 |  |  | { | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-08-09 09:06:45 -04:00
										 |  |  | PrimitiveString::PrimitiveString(Utf16String string) | 
					
						
							| 
									
										
										
										
											2023-01-07 12:24:05 -05:00
										 |  |  |     : m_utf16_string(move(string)) | 
					
						
							| 
									
										
										
										
											2020-03-11 18:55:01 +01:00
										 |  |  | { | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | PrimitiveString::~PrimitiveString() | 
					
						
							|  |  |  | { | 
					
						
							| 
									
										
										
										
											2023-01-13 12:24:02 -05:00
										 |  |  |     if (has_utf8_string()) | 
					
						
							|  |  |  |         vm().string_cache().remove(*m_utf8_string); | 
					
						
							| 
									
										
										
										
											2023-01-13 09:36:12 -05:00
										 |  |  |     if (has_deprecated_string()) | 
					
						
							| 
									
										
										
										
											2023-01-13 09:41:24 -05:00
										 |  |  |         vm().deprecated_string_cache().remove(*m_deprecated_string); | 
					
						
							| 
									
										
										
										
											2020-03-11 18:55:01 +01:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  | void PrimitiveString::visit_edges(Cell::Visitor& visitor) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     Cell::visit_edges(visitor); | 
					
						
							|  |  |  |     if (m_is_rope) { | 
					
						
							| 
									
										
										
										
											2022-08-06 01:06:02 +01:00
										 |  |  |         visitor.visit(m_lhs); | 
					
						
							|  |  |  |         visitor.visit(m_rhs); | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  |     } | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-07-17 21:08:53 +02:00
										 |  |  | bool PrimitiveString::is_empty() const | 
					
						
							|  |  |  | { | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  |     if (m_is_rope) { | 
					
						
							|  |  |  |         // NOTE: We never make an empty rope string.
 | 
					
						
							|  |  |  |         return false; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-01-07 12:24:05 -05:00
										 |  |  |     if (has_utf16_string()) | 
					
						
							|  |  |  |         return m_utf16_string->is_empty(); | 
					
						
							| 
									
										
										
										
											2023-01-13 12:24:02 -05:00
										 |  |  |     if (has_utf8_string()) | 
					
						
							|  |  |  |         return m_utf8_string->is_empty(); | 
					
						
							| 
									
										
										
										
											2023-01-13 09:36:12 -05:00
										 |  |  |     if (has_deprecated_string()) | 
					
						
							|  |  |  |         return m_deprecated_string->is_empty(); | 
					
						
							| 
									
										
										
										
											2022-07-17 21:08:53 +02:00
										 |  |  |     VERIFY_NOT_REACHED(); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-01-13 12:24:02 -05:00
										 |  |  | ThrowCompletionOr<String> PrimitiveString::utf8_string() const | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     auto& vm = this->vm(); | 
					
						
							|  |  |  |     TRY(resolve_rope_if_needed()); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if (!has_utf8_string()) { | 
					
						
							|  |  |  |         if (has_deprecated_string()) | 
					
						
							|  |  |  |             m_utf8_string = TRY_OR_THROW_OOM(vm, String::from_utf8(*m_deprecated_string)); | 
					
						
							|  |  |  |         else if (has_utf16_string()) | 
					
						
							|  |  |  |             m_utf8_string = TRY(m_utf16_string->to_utf8(vm)); | 
					
						
							|  |  |  |         else | 
					
						
							|  |  |  |             VERIFY_NOT_REACHED(); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     return *m_utf8_string; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-01-15 09:37:32 -05:00
										 |  |  | ThrowCompletionOr<StringView> PrimitiveString::utf8_string_view() const | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     (void)TRY(utf8_string()); | 
					
						
							|  |  |  |     return m_utf8_string->bytes_as_string_view(); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-01-13 15:33:31 -05:00
										 |  |  | ThrowCompletionOr<DeprecatedString> PrimitiveString::deprecated_string() const | 
					
						
							| 
									
										
										
										
											2021-08-01 19:02:19 -04:00
										 |  |  | { | 
					
						
							| 
									
										
										
										
											2023-01-07 12:24:05 -05:00
										 |  |  |     TRY(resolve_rope_if_needed()); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-01-13 09:36:12 -05:00
										 |  |  |     if (!has_deprecated_string()) { | 
					
						
							| 
									
										
										
										
											2023-01-13 12:24:02 -05:00
										 |  |  |         if (has_utf8_string()) | 
					
						
							|  |  |  |             m_deprecated_string = m_utf8_string->to_deprecated_string(); | 
					
						
							|  |  |  |         else if (has_utf16_string()) | 
					
						
							|  |  |  |             m_deprecated_string = TRY(m_utf16_string->to_deprecated_string(vm())); | 
					
						
							|  |  |  |         else | 
					
						
							|  |  |  |             VERIFY_NOT_REACHED(); | 
					
						
							| 
									
										
										
										
											2021-08-01 19:02:19 -04:00
										 |  |  |     } | 
					
						
							| 
									
										
										
										
											2023-01-07 12:24:05 -05:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-01-13 09:36:12 -05:00
										 |  |  |     return *m_deprecated_string; | 
					
						
							| 
									
										
										
										
											2021-08-01 19:02:19 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-01-13 15:33:31 -05:00
										 |  |  | ThrowCompletionOr<Utf16String> PrimitiveString::utf16_string() const | 
					
						
							| 
									
										
										
										
											2021-07-20 10:46:53 -04:00
										 |  |  | { | 
					
						
							| 
									
										
										
										
											2023-01-07 12:24:05 -05:00
										 |  |  |     TRY(resolve_rope_if_needed()); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if (!has_utf16_string()) { | 
					
						
							| 
									
										
										
										
											2023-01-13 12:24:02 -05:00
										 |  |  |         if (has_utf8_string()) { | 
					
						
							|  |  |  |             m_utf16_string = TRY(Utf16String::create(vm(), m_utf8_string->bytes_as_string_view())); | 
					
						
							|  |  |  |         } else { | 
					
						
							|  |  |  |             VERIFY(has_deprecated_string()); | 
					
						
							|  |  |  |             m_utf16_string = TRY(Utf16String::create(vm(), *m_deprecated_string)); | 
					
						
							|  |  |  |         } | 
					
						
							| 
									
										
										
										
											2021-08-01 19:02:19 -04:00
										 |  |  |     } | 
					
						
							| 
									
										
										
										
											2023-01-07 12:24:05 -05:00
										 |  |  | 
 | 
					
						
							|  |  |  |     return *m_utf16_string; | 
					
						
							| 
									
										
										
										
											2021-07-20 10:46:53 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-01-07 12:24:05 -05:00
										 |  |  | ThrowCompletionOr<Utf16View> PrimitiveString::utf16_string_view() const | 
					
						
							| 
									
										
										
										
											2021-07-20 10:46:53 -04:00
										 |  |  | { | 
					
						
							| 
									
										
										
										
											2023-01-13 15:33:31 -05:00
										 |  |  |     (void)TRY(utf16_string()); | 
					
						
							|  |  |  |     return m_utf16_string->view(); | 
					
						
							| 
									
										
										
										
											2021-07-20 10:46:53 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-01-07 12:24:05 -05:00
										 |  |  | ThrowCompletionOr<Optional<Value>> PrimitiveString::get(VM& vm, PropertyKey const& property_key) const | 
					
						
							| 
									
										
										
										
											2022-02-12 00:48:23 -08:00
										 |  |  | { | 
					
						
							|  |  |  |     if (property_key.is_symbol()) | 
					
						
							| 
									
										
										
										
											2023-01-07 12:24:05 -05:00
										 |  |  |         return Optional<Value> {}; | 
					
						
							| 
									
										
										
										
											2022-02-12 00:48:23 -08:00
										 |  |  |     if (property_key.is_string()) { | 
					
						
							| 
									
										
										
										
											2022-08-21 20:38:35 +01:00
										 |  |  |         if (property_key.as_string() == vm.names.length.as_string()) { | 
					
						
							| 
									
										
										
										
											2023-01-07 12:24:05 -05:00
										 |  |  |             auto length = TRY(utf16_string()).length_in_code_units(); | 
					
						
							| 
									
										
										
										
											2022-02-12 00:48:23 -08:00
										 |  |  |             return Value(static_cast<double>(length)); | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2022-02-14 01:17:07 -08:00
										 |  |  |     auto index = canonical_numeric_index_string(property_key, CanonicalIndexMode::IgnoreNumericRoundtrip); | 
					
						
							|  |  |  |     if (!index.is_index()) | 
					
						
							| 
									
										
										
										
											2023-01-07 12:24:05 -05:00
										 |  |  |         return Optional<Value> {}; | 
					
						
							|  |  |  |     auto str = TRY(utf16_string_view()); | 
					
						
							| 
									
										
										
										
											2022-02-12 00:48:23 -08:00
										 |  |  |     auto length = str.length_in_code_units(); | 
					
						
							| 
									
										
										
										
											2022-02-14 01:17:07 -08:00
										 |  |  |     if (length <= index.as_index()) | 
					
						
							| 
									
										
										
										
											2023-01-07 12:24:05 -05:00
										 |  |  |         return Optional<Value> {}; | 
					
						
							|  |  |  |     return create(vm, TRY(Utf16String::create(vm, str.substring_view(index.as_index(), 1)))); | 
					
						
							| 
									
										
										
										
											2021-08-01 19:02:19 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-12-06 22:17:27 +00:00
										 |  |  | NonnullGCPtr<PrimitiveString> PrimitiveString::create(VM& vm, Utf16String string) | 
					
						
							| 
									
										
										
										
											2021-07-20 10:46:53 -04:00
										 |  |  | { | 
					
						
							|  |  |  |     if (string.is_empty()) | 
					
						
							| 
									
										
										
										
											2022-12-06 22:17:27 +00:00
										 |  |  |         return vm.empty_string(); | 
					
						
							| 
									
										
										
										
											2021-07-20 10:46:53 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-08-09 09:06:45 -04:00
										 |  |  |     if (string.length_in_code_units() == 1) { | 
					
						
							|  |  |  |         u16 code_unit = string.code_unit_at(0); | 
					
						
							| 
									
										
										
										
											2021-07-20 10:46:53 -04:00
										 |  |  |         if (is_ascii(code_unit)) | 
					
						
							| 
									
										
										
										
											2022-12-06 22:17:27 +00:00
										 |  |  |             return vm.single_ascii_character_string(static_cast<u8>(code_unit)); | 
					
						
							| 
									
										
										
										
											2021-07-20 10:46:53 -04:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-12-14 17:40:33 +00:00
										 |  |  |     return vm.heap().allocate_without_realm<PrimitiveString>(move(string)); | 
					
						
							| 
									
										
										
										
											2021-07-20 10:46:53 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-01-13 12:24:02 -05:00
										 |  |  | NonnullGCPtr<PrimitiveString> PrimitiveString::create(VM& vm, String string) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     if (string.is_empty()) | 
					
						
							|  |  |  |         return vm.empty_string(); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if (auto bytes = string.bytes_as_string_view(); bytes.length() == 1) { | 
					
						
							|  |  |  |         auto ch = static_cast<u8>(bytes[0]); | 
					
						
							|  |  |  |         if (is_ascii(ch)) | 
					
						
							|  |  |  |             return vm.single_ascii_character_string(ch); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     auto& string_cache = vm.string_cache(); | 
					
						
							|  |  |  |     if (auto it = string_cache.find(string); it != string_cache.end()) | 
					
						
							|  |  |  |         return *it->value; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     auto new_string = vm.heap().allocate_without_realm<PrimitiveString>(string); | 
					
						
							|  |  |  |     string_cache.set(move(string), new_string); | 
					
						
							|  |  |  |     return *new_string; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-02-09 09:00:14 -05:00
										 |  |  | ThrowCompletionOr<NonnullGCPtr<PrimitiveString>> PrimitiveString::create(VM& vm, StringView string) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     return create(vm, TRY_OR_THROW_OOM(vm, String::from_utf8(string))); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-12-06 22:17:27 +00:00
										 |  |  | NonnullGCPtr<PrimitiveString> PrimitiveString::create(VM& vm, DeprecatedString string) | 
					
						
							| 
									
										
										
										
											2020-03-11 18:55:01 +01:00
										 |  |  | { | 
					
						
							| 
									
										
										
										
											2020-09-22 16:36:33 +02:00
										 |  |  |     if (string.is_empty()) | 
					
						
							| 
									
										
										
										
											2022-12-06 22:17:27 +00:00
										 |  |  |         return vm.empty_string(); | 
					
						
							| 
									
										
										
										
											2020-10-22 17:43:48 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-07-20 10:46:53 -04:00
										 |  |  |     if (string.length() == 1) { | 
					
						
							|  |  |  |         auto ch = static_cast<u8>(string.characters()[0]); | 
					
						
							|  |  |  |         if (is_ascii(ch)) | 
					
						
							| 
									
										
										
										
											2022-12-06 22:17:27 +00:00
										 |  |  |             return vm.single_ascii_character_string(ch); | 
					
						
							| 
									
										
										
										
											2021-07-20 10:46:53 -04:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-01-13 09:41:24 -05:00
										 |  |  |     auto& string_cache = vm.deprecated_string_cache(); | 
					
						
							| 
									
										
										
										
											2021-10-02 01:36:57 +02:00
										 |  |  |     auto it = string_cache.find(string); | 
					
						
							|  |  |  |     if (it == string_cache.end()) { | 
					
						
							| 
									
										
										
										
											2022-12-14 17:40:33 +00:00
										 |  |  |         auto new_string = vm.heap().allocate_without_realm<PrimitiveString>(string); | 
					
						
							| 
									
										
										
										
											2021-10-02 01:36:57 +02:00
										 |  |  |         string_cache.set(move(string), new_string); | 
					
						
							| 
									
										
										
										
											2022-12-06 22:17:27 +00:00
										 |  |  |         return *new_string; | 
					
						
							| 
									
										
										
										
											2021-10-02 01:36:57 +02:00
										 |  |  |     } | 
					
						
							| 
									
										
										
										
											2022-12-06 22:17:27 +00:00
										 |  |  |     return *it->value; | 
					
						
							| 
									
										
										
										
											2020-04-04 12:57:37 +02:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-02-09 09:00:14 -05:00
										 |  |  | NonnullGCPtr<PrimitiveString> PrimitiveString::create(VM& vm, DeprecatedFlyString const& string) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     return create(vm, string.impl()); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-12-06 22:17:27 +00:00
										 |  |  | NonnullGCPtr<PrimitiveString> PrimitiveString::create(VM& vm, PrimitiveString& lhs, PrimitiveString& rhs) | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  | { | 
					
						
							|  |  |  |     // We're here to concatenate two strings into a new rope string.
 | 
					
						
							|  |  |  |     // However, if any of them are empty, no rope is required.
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     bool lhs_empty = lhs.is_empty(); | 
					
						
							|  |  |  |     bool rhs_empty = rhs.is_empty(); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if (lhs_empty && rhs_empty) | 
					
						
							| 
									
										
										
										
											2022-12-06 22:17:27 +00:00
										 |  |  |         return vm.empty_string(); | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  |     if (lhs_empty) | 
					
						
							| 
									
										
										
										
											2022-12-06 22:17:27 +00:00
										 |  |  |         return rhs; | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  |     if (rhs_empty) | 
					
						
							| 
									
										
										
										
											2022-12-06 22:17:27 +00:00
										 |  |  |         return lhs; | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-12-14 17:40:33 +00:00
										 |  |  |     return vm.heap().allocate_without_realm<PrimitiveString>(lhs, rhs); | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-01-07 12:24:05 -05:00
										 |  |  | ThrowCompletionOr<void> PrimitiveString::resolve_rope_if_needed() const | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  | { | 
					
						
							|  |  |  |     if (!m_is_rope) | 
					
						
							| 
									
										
										
										
											2023-01-07 12:24:05 -05:00
										 |  |  |         return {}; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     auto& vm = this->vm(); | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  |     // NOTE: Special case for two concatenated UTF-16 strings.
 | 
					
						
							|  |  |  |     //       This is here as an optimization, although I'm unsure how valuable it is.
 | 
					
						
							| 
									
										
										
										
											2022-08-06 01:06:02 +01:00
										 |  |  |     if (m_lhs->has_utf16_string() && m_rhs->has_utf16_string()) { | 
					
						
							| 
									
										
										
										
											2023-01-13 15:33:31 -05:00
										 |  |  |         auto const& lhs_string = m_lhs->m_utf16_string.value(); | 
					
						
							|  |  |  |         auto const& rhs_string = m_rhs->m_utf16_string.value(); | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-01-06 11:00:24 -05:00
										 |  |  |         Utf16Data combined; | 
					
						
							| 
									
										
										
										
											2023-01-07 15:33:15 -05:00
										 |  |  |         TRY_OR_THROW_OOM(vm, combined.try_ensure_capacity(lhs_string.length_in_code_units() + rhs_string.length_in_code_units())); | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  |         combined.extend(lhs_string.string()); | 
					
						
							|  |  |  |         combined.extend(rhs_string.string()); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-01-07 12:24:05 -05:00
										 |  |  |         m_utf16_string = TRY(Utf16String::create(vm, move(combined))); | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  |         m_is_rope = false; | 
					
						
							| 
									
										
										
										
											2022-08-06 01:06:02 +01:00
										 |  |  |         m_lhs = nullptr; | 
					
						
							|  |  |  |         m_rhs = nullptr; | 
					
						
							| 
									
										
										
										
											2023-01-07 12:24:05 -05:00
										 |  |  |         return {}; | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     // This vector will hold all the pieces of the rope that need to be assembled
 | 
					
						
							|  |  |  |     // into the resolved string.
 | 
					
						
							|  |  |  |     Vector<PrimitiveString const*> pieces; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     // NOTE: We traverse the rope tree without using recursion, since we'd run out of
 | 
					
						
							|  |  |  |     //       stack space quickly when handling a long sequence of unresolved concatenations.
 | 
					
						
							|  |  |  |     Vector<PrimitiveString const*> stack; | 
					
						
							| 
									
										
										
										
											2023-01-07 15:33:15 -05:00
										 |  |  |     TRY_OR_THROW_OOM(vm, stack.try_append(m_rhs)); | 
					
						
							|  |  |  |     TRY_OR_THROW_OOM(vm, stack.try_append(m_lhs)); | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  |     while (!stack.is_empty()) { | 
					
						
							| 
									
										
										
										
											2023-01-07 15:33:15 -05:00
										 |  |  |         auto const* current = stack.take_last(); | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  |         if (current->m_is_rope) { | 
					
						
							| 
									
										
										
										
											2023-01-07 15:33:15 -05:00
										 |  |  |             TRY_OR_THROW_OOM(vm, stack.try_append(current->m_rhs)); | 
					
						
							|  |  |  |             TRY_OR_THROW_OOM(vm, stack.try_append(current->m_lhs)); | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  |             continue; | 
					
						
							|  |  |  |         } | 
					
						
							| 
									
										
										
										
											2023-01-07 15:33:15 -05:00
										 |  |  |         TRY_OR_THROW_OOM(vm, pieces.try_append(current)); | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     // Now that we have all the pieces, we can concatenate them using a StringBuilder.
 | 
					
						
							| 
									
										
										
										
											2023-01-07 15:33:15 -05:00
										 |  |  |     ThrowableStringBuilder builder(vm); | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  |     // We keep track of the previous piece in order to handle surrogate pairs spread across two pieces.
 | 
					
						
							|  |  |  |     PrimitiveString const* previous = nullptr; | 
					
						
							|  |  |  |     for (auto const* current : pieces) { | 
					
						
							|  |  |  |         if (!previous) { | 
					
						
							|  |  |  |             // This is the very first piece, just append it and continue.
 | 
					
						
							| 
									
										
										
										
											2023-01-14 10:31:18 -05:00
										 |  |  |             TRY(builder.append(TRY(current->utf8_string()))); | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  |             previous = current; | 
					
						
							|  |  |  |             continue; | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         // Get the UTF-8 representations for both strings.
 | 
					
						
							| 
									
										
										
										
											2023-01-15 09:37:32 -05:00
										 |  |  |         auto current_string_as_utf8 = TRY(current->utf8_string_view()); | 
					
						
							|  |  |  |         auto previous_string_as_utf8 = TRY(previous->utf8_string_view()); | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  |         // NOTE: Now we need to look at the end of the previous string and the start
 | 
					
						
							|  |  |  |         //       of the current string, to see if they should be combined into a surrogate.
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         // Surrogates encoded as UTF-8 are 3 bytes.
 | 
					
						
							|  |  |  |         if ((previous_string_as_utf8.length() < 3) || (current_string_as_utf8.length() < 3)) { | 
					
						
							| 
									
										
										
										
											2023-01-14 10:31:18 -05:00
										 |  |  |             TRY(builder.append(current_string_as_utf8)); | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  |             previous = current; | 
					
						
							|  |  |  |             continue; | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         // Might the previous string end with a UTF-8 encoded surrogate?
 | 
					
						
							|  |  |  |         if ((static_cast<u8>(previous_string_as_utf8[previous_string_as_utf8.length() - 3]) & 0xf0) != 0xe0) { | 
					
						
							|  |  |  |             // If not, just append the current string and continue.
 | 
					
						
							| 
									
										
										
										
											2023-01-14 10:31:18 -05:00
										 |  |  |             TRY(builder.append(current_string_as_utf8)); | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  |             previous = current; | 
					
						
							|  |  |  |             continue; | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         // Might the current string begin with a UTF-8 encoded surrogate?
 | 
					
						
							|  |  |  |         if ((static_cast<u8>(current_string_as_utf8[0]) & 0xf0) != 0xe0) { | 
					
						
							|  |  |  |             // If not, just append the current string and continue.
 | 
					
						
							| 
									
										
										
										
											2023-01-14 10:31:18 -05:00
										 |  |  |             TRY(builder.append(current_string_as_utf8)); | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  |             previous = current; | 
					
						
							|  |  |  |             continue; | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         auto high_surrogate = *Utf8View(previous_string_as_utf8.substring_view(previous_string_as_utf8.length() - 3)).begin(); | 
					
						
							|  |  |  |         auto low_surrogate = *Utf8View(current_string_as_utf8).begin(); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         if (!Utf16View::is_high_surrogate(high_surrogate) || !Utf16View::is_low_surrogate(low_surrogate)) { | 
					
						
							| 
									
										
										
										
											2023-01-14 10:31:18 -05:00
										 |  |  |             TRY(builder.append(current_string_as_utf8)); | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  |             previous = current; | 
					
						
							|  |  |  |             continue; | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         // Remove 3 bytes from the builder and replace them with the UTF-8 encoded code point.
 | 
					
						
							|  |  |  |         builder.trim(3); | 
					
						
							| 
									
										
										
										
											2023-01-07 15:33:15 -05:00
										 |  |  |         TRY(builder.append_code_point(Utf16View::decode_surrogate_pair(high_surrogate, low_surrogate))); | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  |         // Append the remaining part of the current string.
 | 
					
						
							| 
									
										
										
										
											2023-01-07 15:33:15 -05:00
										 |  |  |         TRY(builder.append(current_string_as_utf8.substring_view(3))); | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  |         previous = current; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-01-14 10:31:18 -05:00
										 |  |  |     m_utf8_string = TRY(builder.to_string()); | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  |     m_is_rope = false; | 
					
						
							| 
									
										
										
										
											2022-08-06 01:06:02 +01:00
										 |  |  |     m_lhs = nullptr; | 
					
						
							|  |  |  |     m_rhs = nullptr; | 
					
						
							| 
									
										
										
										
											2023-01-07 12:24:05 -05:00
										 |  |  |     return {}; | 
					
						
							| 
									
										
										
										
											2022-08-05 23:58:47 +02:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-03-11 18:55:01 +01:00
										 |  |  | } |