2020-01-18 09:38:21 +01:00
|
|
|
|
/*
|
2024-10-04 13:19:50 +02:00
|
|
|
|
* Copyright (c) 2018-2022, Andreas Kling <andreas@ladybird.org>
|
2025-05-14 12:56:03 +02:00
|
|
|
|
* Copyright (c) 2025, Jelle Raaijmakers <jelle@ladybird.org>
|
2020-01-18 09:38:21 +01:00
|
|
|
|
*
|
2021-04-22 01:24:48 -07:00
|
|
|
|
* SPDX-License-Identifier: BSD-2-Clause
|
2020-01-18 09:38:21 +01:00
|
|
|
|
*/
|
|
|
|
|
|
2024-09-18 11:09:07 +01:00
|
|
|
|
#include <LibUnicode/CharacterTypes.h>
|
2022-09-25 16:15:49 -06:00
|
|
|
|
#include <LibWeb/Bindings/Intrinsics.h>
|
2024-04-27 12:09:58 +12:00
|
|
|
|
#include <LibWeb/Bindings/TextPrototype.h>
|
2022-03-21 20:05:25 +01:00
|
|
|
|
#include <LibWeb/DOM/Range.h>
|
2020-03-07 10:32:51 +01:00
|
|
|
|
#include <LibWeb/DOM/Text.h>
|
2022-09-25 16:15:49 -06:00
|
|
|
|
#include <LibWeb/HTML/Scripting/Environments.h>
|
2022-03-07 23:08:26 +01:00
|
|
|
|
#include <LibWeb/HTML/Window.h>
|
2020-11-22 15:53:01 +01:00
|
|
|
|
#include <LibWeb/Layout/TextNode.h>
|
2019-06-15 18:55:47 +02:00
|
|
|
|
|
2020-07-26 19:37:56 +02:00
|
|
|
|
namespace Web::DOM {
|
2020-03-07 10:27:02 +01:00
|
|
|
|
|
2024-11-15 04:01:23 +13:00
|
|
|
|
// Defines the GC allocator for Text.
// NOTE(review): presumably paired with a matching allocator declaration in Text.h — confirm.
GC_DEFINE_ALLOCATOR(Text);
|
2023-11-19 19:47:52 +01:00
|
|
|
|
|
2025-07-24 12:05:52 -04:00
|
|
|
|
// Creates a Text node belonging to `document` whose character data is `data`.
// The node type is always NodeType::TEXT_NODE; the work is forwarded to the constructor that accepts an explicit
// node type.
Text::Text(Document& document, Utf16String data)
    : Text(document, NodeType::TEXT_NODE, move(data))
{
}
|
|
|
|
|
|
2025-07-24 12:05:52 -04:00
|
|
|
|
// Creates a Text node belonging to `document` with an explicitly chosen node `type` and character data `data`.
// All three arguments are passed straight through to the CharacterData base class.
Text::Text(Document& document, NodeType type, Utf16String data)
    : CharacterData(document, type, move(data))
{
}
|
|
|
|
|
|
2023-08-07 08:41:28 +02:00
|
|
|
|
// Performs realm-dependent initialization of this node.
void Text::initialize(JS::Realm& realm)
{
    // Install the prototype for the Text interface before handing over to the base class.
    // NOTE(review): the macro presumably picks up `realm` from the enclosing scope — confirm.
    WEB_SET_PROTOTYPE_FOR_INTERFACE(Text);

    Base::initialize(realm);
}
|
|
|
|
|
|
|
|
|
|
// Forwards `visitor` to both the base class and the SlottableMixin so that each can report the edges it holds.
void Text::visit_edges(Cell::Visitor& visitor)
{
    Base::visit_edges(visitor);
    SlottableMixin::visit_edges(visitor);
}
|
|
|
|
|
|
2021-09-06 01:07:11 +01:00
|
|
|
|
// https://dom.spec.whatwg.org/#dom-text-text
|
2025-07-24 12:05:52 -04:00
|
|
|
|
WebIDL::ExceptionOr<GC::Ref<Text>> Text::construct_impl(JS::Realm& realm, Utf16String data)
|
2021-09-06 01:07:11 +01:00
|
|
|
|
{
|
2022-09-25 16:15:49 -06:00
|
|
|
|
// The new Text(data) constructor steps are to set this’s data to data and this’s node document to current global object’s associated Document.
|
2025-01-21 09:12:05 -05:00
|
|
|
|
auto& window = as<HTML::Window>(HTML::current_principal_global_object());
|
2025-07-24 12:05:52 -04:00
|
|
|
|
return realm.create<Text>(window.associated_document(), move(data));
|
2021-09-06 01:07:11 +01:00
|
|
|
|
}
|
|
|
|
|
|
2022-03-21 18:57:10 +01:00
|
|
|
|
// https://dom.spec.whatwg.org/#dom-text-splittext
|
|
|
|
|
// https://dom.spec.whatwg.org/#concept-text-split
|
2024-11-15 04:01:23 +13:00
|
|
|
|
WebIDL::ExceptionOr<GC::Ref<Text>> Text::split_text(size_t offset)
|
2022-03-21 18:57:10 +01:00
|
|
|
|
{
|
|
|
|
|
// 1. Let length be node’s length.
|
|
|
|
|
auto length = this->length();
|
|
|
|
|
|
|
|
|
|
// 2. If offset is greater than length, then throw an "IndexSizeError" DOMException.
|
|
|
|
|
if (offset > length)
|
2025-08-07 19:31:52 -04:00
|
|
|
|
return WebIDL::IndexSizeError::create(realm(), "Split offset is greater than length"_utf16);
|
2022-03-21 18:57:10 +01:00
|
|
|
|
|
|
|
|
|
// 3. Let count be length minus offset.
|
|
|
|
|
auto count = length - offset;
|
|
|
|
|
|
|
|
|
|
// 4. Let new data be the result of substringing data with node node, offset offset, and count count.
|
2022-03-22 12:40:24 +00:00
|
|
|
|
auto new_data = TRY(substring_data(offset, count));
|
2022-03-21 18:57:10 +01:00
|
|
|
|
|
|
|
|
|
// 5. Let new node be a new Text node, with the same node document as node. Set new node’s data to new data.
|
2024-11-14 05:50:17 +13:00
|
|
|
|
auto new_node = realm().create<Text>(document(), new_data);
|
2022-03-21 18:57:10 +01:00
|
|
|
|
|
|
|
|
|
// 6. Let parent be node’s parent.
|
2024-11-15 04:01:23 +13:00
|
|
|
|
GC::Ptr<Node> parent = this->parent();
|
2022-03-21 18:57:10 +01:00
|
|
|
|
|
|
|
|
|
// 7. If parent is not null, then:
|
|
|
|
|
if (parent) {
|
|
|
|
|
// 1. Insert new node into parent before node’s next sibling.
|
2022-08-28 13:42:07 +02:00
|
|
|
|
parent->insert_before(*new_node, next_sibling());
|
2022-03-21 18:57:10 +01:00
|
|
|
|
|
2025-05-14 12:56:03 +02:00
|
|
|
|
// 2. For each live range whose start node is node and start offset is greater than offset, set its start node
|
|
|
|
|
// to new node and decrease its start offset by offset.
|
|
|
|
|
for (auto* range : Range::live_ranges()) {
|
|
|
|
|
if (range->start_container() == this && range->start_offset() > offset) {
|
|
|
|
|
range->set_start_node(*new_node);
|
|
|
|
|
range->decrease_start_offset(offset);
|
|
|
|
|
}
|
2022-03-21 20:05:25 +01:00
|
|
|
|
}
|
|
|
|
|
|
2025-05-14 12:56:03 +02:00
|
|
|
|
// 3. For each live range whose end node is node and end offset is greater than offset, set its end node to new
|
|
|
|
|
// node and decrease its end offset by offset.
|
|
|
|
|
for (auto* range : Range::live_ranges()) {
|
|
|
|
|
if (range->end_container() == this && range->end_offset() > offset) {
|
|
|
|
|
range->set_end_node(*new_node);
|
|
|
|
|
range->decrease_end_offset(offset);
|
|
|
|
|
}
|
2022-03-21 20:05:25 +01:00
|
|
|
|
}
|
|
|
|
|
|
2025-05-14 12:56:03 +02:00
|
|
|
|
// 4. For each live range whose start node is parent and start offset is equal to the index of node plus 1,
|
|
|
|
|
// increase its start offset by 1.
|
|
|
|
|
for (auto* range : Range::live_ranges()) {
|
2024-08-27 10:45:11 +02:00
|
|
|
|
if (range->start_container() == parent.ptr() && range->start_offset() == index() + 1)
|
2025-05-14 12:56:03 +02:00
|
|
|
|
range->increase_start_offset(1);
|
2022-03-21 20:05:25 +01:00
|
|
|
|
}
|
|
|
|
|
|
2025-05-14 12:56:03 +02:00
|
|
|
|
// 5. For each live range whose end node is parent and end offset is equal to the index of node plus 1, increase
|
|
|
|
|
// its end offset by 1.
|
|
|
|
|
for (auto* range : Range::live_ranges()) {
|
|
|
|
|
if (range->end_container() == parent.ptr() && range->end_offset() == index() + 1)
|
|
|
|
|
range->increase_end_offset(1);
|
2022-03-21 20:05:25 +01:00
|
|
|
|
}
|
2022-03-21 18:57:10 +01:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// 8. Replace data with node node, offset offset, count count, and data the empty string.
|
2025-07-24 12:05:52 -04:00
|
|
|
|
TRY(replace_data(offset, count, {}));
|
2022-03-21 18:57:10 +01:00
|
|
|
|
|
|
|
|
|
// 9. Return new node.
|
|
|
|
|
return new_node;
|
|
|
|
|
}
|
|
|
|
|
|
2024-07-19 13:57:24 -06:00
|
|
|
|
// https://dom.spec.whatwg.org/#dom-text-wholetext
|
2025-07-24 12:05:52 -04:00
|
|
|
|
Utf16String Text::whole_text()
|
2024-07-19 13:57:24 -06:00
|
|
|
|
{
|
|
|
|
|
// https://dom.spec.whatwg.org/#contiguous-text-nodes
|
|
|
|
|
// The contiguous Text nodes of a node node are node, node’s previous sibling Text node, if any, and its contiguous
|
|
|
|
|
// Text nodes, and node’s next sibling Text node, if any, and its contiguous Text nodes, avoiding any duplicates.
|
|
|
|
|
Vector<Text*> nodes;
|
|
|
|
|
|
|
|
|
|
nodes.append(this);
|
|
|
|
|
|
|
|
|
|
auto* current_node = previous_sibling();
|
|
|
|
|
while (current_node && (current_node->is_text() || current_node->is_cdata_section())) {
|
|
|
|
|
nodes.append(static_cast<Text*>(current_node));
|
|
|
|
|
current_node = current_node->previous_sibling();
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// Reverse nodes so they are in tree order
|
|
|
|
|
nodes.reverse();
|
|
|
|
|
|
|
|
|
|
current_node = next_sibling();
|
|
|
|
|
while (current_node && (current_node->is_text() || current_node->is_cdata_section())) {
|
|
|
|
|
nodes.append(static_cast<Text*>(current_node));
|
|
|
|
|
current_node = current_node->next_sibling();
|
|
|
|
|
}
|
|
|
|
|
|
2025-07-24 12:05:52 -04:00
|
|
|
|
StringBuilder builder(StringBuilder::Mode::UTF16);
|
2024-07-19 13:57:24 -06:00
|
|
|
|
for (auto const& text_node : nodes)
|
|
|
|
|
builder.append(text_node->data());
|
|
|
|
|
|
2025-07-24 12:05:52 -04:00
|
|
|
|
return builder.to_utf16_string();
|
2024-07-19 13:57:24 -06:00
|
|
|
|
}
|
|
|
|
|
|
2024-09-18 11:09:07 +01:00
|
|
|
|
// https://html.spec.whatwg.org/multipage/dom.html#text-node-directionality
|
|
|
|
|
Optional<Element::Directionality> Text::directionality() const
|
|
|
|
|
{
|
|
|
|
|
// 1. If text's data does not contain a code point whose bidirectional character type is L, AL, or R, then return null.
|
|
|
|
|
// 2. Let codePoint be the first code point in text's data whose bidirectional character type is L, AL, or R.
|
|
|
|
|
Optional<Unicode::BidiClass> found_character_bidi_class;
|
2025-07-24 12:05:52 -04:00
|
|
|
|
for (auto code_point : data()) {
|
2024-09-18 11:09:07 +01:00
|
|
|
|
auto bidi_class = Unicode::bidirectional_class(code_point);
|
|
|
|
|
if (first_is_one_of(bidi_class, Unicode::BidiClass::LeftToRight, Unicode::BidiClass::RightToLeftArabic, Unicode::BidiClass::RightToLeft)) {
|
|
|
|
|
found_character_bidi_class = bidi_class;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
if (!found_character_bidi_class.has_value())
|
|
|
|
|
return {};
|
|
|
|
|
|
|
|
|
|
// 3. If codePoint is of bidirectional character type AL or R, then return 'rtl'.
|
|
|
|
|
if (first_is_one_of(*found_character_bidi_class, Unicode::BidiClass::RightToLeftArabic, Unicode::BidiClass::RightToLeft))
|
|
|
|
|
return Element::Directionality::Rtl;
|
|
|
|
|
|
|
|
|
|
// 4. If codePoint is of bidirectional character type L, then return 'ltr'.
|
|
|
|
|
// NOTE: codePoint should always be of bidirectional character type L by this point, so we can just return 'ltr' here.
|
|
|
|
|
VERIFY(*found_character_bidi_class == Unicode::BidiClass::LeftToRight);
|
|
|
|
|
return Element::Directionality::Ltr;
|
|
|
|
|
}
|
|
|
|
|
|
2020-03-07 10:27:02 +01:00
|
|
|
|
}
|