ladybird/Libraries/LibWeb/CSS/StyleValues/UnresolvedStyleValue.cpp
Andreas Kling ff13ac2b79 LibWeb: Avoid copying ASF argument component values
Parse arbitrary substitution function arguments as spans into the
existing component value list. This avoids copying each argument into a
new vector for var(), attr(), env(), if(), and inherit() parsing.

Expose a span-returning declaration-value parser that shares the same
walker as the existing vector-returning API, so the argument parser does
not duplicate declaration-value grammar logic. Substitution output still
uses owned vectors, and the unresolved Typed OM reifier now consumes
spans too.
2026-06-03 22:28:54 +02:00

225 lines
9.7 KiB
C++
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

/*
* Copyright (c) 2018-2020, Andreas Kling <andreas@ladybird.org>
* Copyright (c) 2021, Tobias Christiansen <tobyase@serenityos.org>
* Copyright (c) 2021-2025, Sam Atkins <sam@ladybird.org>
* Copyright (c) 2022-2023, MacDue <macdue@dueutil.tech>
*
* SPDX-License-Identifier: BSD-2-Clause
*/
#include <AK/StringBuilder.h>
#include <LibWeb/CSS/CSSUnparsedValue.h>
#include <LibWeb/CSS/CSSVariableReferenceValue.h>
#include <LibWeb/CSS/Parser/ArbitrarySubstitutionFunctions.h>
#include <LibWeb/CSS/Parser/Parser.h>
#include <LibWeb/CSS/Parser/TokenStream.h>
#include <LibWeb/CSS/PropertyName.h>
#include <LibWeb/CSS/Serialize.h>
#include <LibWeb/CSS/StyleValues/UnresolvedStyleValue.h>
namespace Web::CSS {
static String source_text_from_component_values(Vector<Parser::ComponentValue> const& values, UnresolvedStyleValue::SourceTextMode source_text_mode)
{
StringBuilder builder;
for (auto const& value : values) {
auto original_source_text = value.original_source_text();
if (original_source_text.is_empty()) {
auto serialized_values = serialize_a_series_of_component_values(values);
if (source_text_mode == UnresolvedStyleValue::SourceTextMode::Trim)
return MUST(serialized_values.trim_ascii_whitespace());
return serialized_values;
}
builder.append(original_source_text);
}
auto source_text = builder.to_string_without_validation();
if (source_text_mode == UnresolvedStyleValue::SourceTextMode::Trim)
return MUST(source_text.trim_ascii_whitespace());
return source_text;
}
static void mark_as_attr_tainted(Vector<Parser::ComponentValue>& values)
{
for (auto& value : values)
value.set_attr_tainted();
}
StringView UnresolvedStyleValue::comparison_text() const
{
if (!m_value_comparison_text.is_empty())
return m_value_comparison_text.bytes_as_string_view();
return m_source_text.bytes_as_string_view().trim_whitespace();
}
ValueComparingNonnullRefPtr<UnresolvedStyleValue const> UnresolvedStyleValue::create(Vector<Parser::ComponentValue>&& values, Parser::SubstitutionFunctionsPresence substitution_presence, Optional<String> original_source_text, SourceTextMode source_text_mode, bool contains_attr_tainted_values)
{
auto has_original_source_text = original_source_text.has_value();
auto serialized_values = serialize_a_series_of_component_values(values);
auto source_text = [&] {
if (has_original_source_text)
return MUST(original_source_text.release_value().trim_ascii_whitespace());
if (source_text_mode == SourceTextMode::Trim)
return MUST(serialize_a_series_of_component_values_preserving_original_source_text(values).trim_ascii_whitespace());
return source_text_from_component_values(values, source_text_mode);
}();
auto value_comparison_text = has_original_source_text ? MUST(serialized_values.trim_ascii_whitespace()) : String {};
return adopt_ref(*new (nothrow) UnresolvedStyleValue(move(source_text), move(value_comparison_text), substitution_presence, contains_attr_tainted_values));
}
UnresolvedStyleValue::UnresolvedStyleValue(String source_text, String value_comparison_text, Parser::SubstitutionFunctionsPresence substitution_presence, bool contains_attr_tainted_values)
: StyleValue(Type::Unresolved)
, m_source_text(move(source_text))
, m_value_comparison_text(move(value_comparison_text))
, m_substitution_functions_presence(substitution_presence)
, m_contains_attr_tainted_values(contains_attr_tainted_values)
{
}
void UnresolvedStyleValue::serialize(StringBuilder& builder, SerializationMode) const
{
builder.append(m_source_text);
}
Vector<Parser::ComponentValue> UnresolvedStyleValue::values() const
{
auto parser = Parser::Parser::create(Parser::ParsingParams {}, m_value_comparison_text.is_empty() ? m_source_text : m_value_comparison_text);
auto values = parser.parse_as_list_of_component_values();
if (m_contains_attr_tainted_values)
mark_as_attr_tainted(values);
return values;
}
Vector<Parser::ComponentValue> UnresolvedStyleValue::tokenize() const
{
return values();
}
bool UnresolvedStyleValue::equals(StyleValue const& other) const
{
if (type() != other.type())
return false;
auto const& other_unresolved = other.as_unresolved();
return comparison_text() == other_unresolved.comparison_text();
}
static GC::Ref<CSSUnparsedValue> reify_a_list_of_component_values(JS::Realm&, ReadonlySpan<Parser::ComponentValue>);
// https://drafts.css-houdini.org/css-typed-om-1/#reify-var
static GC::Ptr<CSSVariableReferenceValue> reify_a_var_reference(JS::Realm& realm, Parser::Function function)
{
// NB: A var() might not be representable as a CSSVariableReferenceValue, for example if it has invalid syntax or
// it contains an ASF in its variable-name slot. In those cases, we return null here, so it's treated like a
// regular function.
auto maybe_var_arguments = Parser::parse_according_to_argument_grammar(Parser::ArbitrarySubstitutionFunction::Var, function.value);
if (!maybe_var_arguments.has_value())
return nullptr;
auto var_arguments = maybe_var_arguments.release_value().get<Parser::DeclarationValueList>();
// NB: Try to parse the variable name. If we can't, return null as above.
Parser::TokenStream tokens { var_arguments.first() };
tokens.discard_whitespace();
auto& maybe_variable = tokens.consume_a_token();
tokens.discard_whitespace();
if (tokens.has_next_token()
|| !maybe_variable.is(Parser::Token::Type::Ident)
|| !is_a_custom_property_name_string(maybe_variable.token().ident()))
return nullptr;
// To reify a var() reference var:
// 1. Let object be a new CSSVariableReferenceValue.
// 2. Set objects variable internal slot to the serialization of the <custom-ident> providing the variable name.
FlyString variable = maybe_variable.token().ident();
// 3. If var has a fallback value, set objects fallback internal slot to the result of reifying the fallbacks
// component values. Otherwise, set it to null.
GC::Ptr<CSSUnparsedValue> fallback;
if (var_arguments.size() > 1)
fallback = reify_a_list_of_component_values(realm, var_arguments[1]);
// 4. Return object.
return CSSVariableReferenceValue::create(realm, move(variable), move(fallback));
}
class Reifier {
public:
static Vector<CSSUnparsedSegment> reify(JS::Realm& realm, ReadonlySpan<Parser::ComponentValue> source_values)
{
Reifier reifier;
reifier.process_values(realm, source_values);
if (!reifier.m_unserialized_values.is_empty())
reifier.serialize_unserialized_values();
return move(reifier.m_reified_values);
}
private:
void process_values(JS::Realm& realm, ReadonlySpan<Parser::ComponentValue> source_values)
{
// NB: var() could be arbitrarily nested within other functions and blocks, so we have to walk the tree.
// Also, a var() might not be representable, if it has an ASF in place of its name, so those will be part
// of a string instead.
for (auto const& component_value : source_values) {
if (component_value.is_function("var"sv)) {
// First parse the var() to see if it is representable as a CSSVariableReferenceValue. It might not be,
// for example if it has an ASF in the place of its variable name. In that case we fall back to
// serializing it like a regular function.
if (auto var_reference = reify_a_var_reference(realm, component_value.function())) {
serialize_unserialized_values();
m_reified_values.append(GC::Ref { *var_reference });
continue;
}
}
if (component_value.is_function()) {
auto& function = component_value.function();
m_unserialized_values.append(function.name_token);
process_values(realm, function.value);
m_unserialized_values.append(function.end_token);
continue;
}
if (component_value.is_block()) {
auto& block = component_value.block();
m_unserialized_values.append(block.token);
process_values(realm, block.value);
m_unserialized_values.append(block.end_token);
continue;
}
m_unserialized_values.append(component_value);
}
}
void serialize_unserialized_values()
{
m_reified_values.append(serialize_a_series_of_component_values(m_unserialized_values));
m_unserialized_values.clear_with_capacity();
}
Vector<CSSUnparsedSegment> m_reified_values {};
Vector<Parser::ComponentValue> m_unserialized_values {};
};
static GC::Ref<CSSUnparsedValue> reify_a_list_of_component_values(JS::Realm& realm, ReadonlySpan<Parser::ComponentValue> component_values)
{
// To reify a list of component values from a list:
// 1. Replace all var() references in list with CSSVariableReferenceValue objects, as described in §5.4 var() References.
// 2. Replace each remaining maximal subsequence of component values in list with a single string of their concatenated serializations.
auto reified_values = Reifier::reify(realm, component_values);
// 3. Return a new CSSUnparsedValue whose [[tokens]] slot is set to list.
return CSSUnparsedValue::create(realm, move(reified_values));
}
// https://drafts.css-houdini.org/css-typed-om-1/#reify-a-list-of-component-values
GC::Ref<CSSStyleValue> UnresolvedStyleValue::reify(JS::Realm& realm, FlyString const&) const
{
auto component_values = values();
return reify_a_list_of_component_values(realm, component_values);
}
}