mirror of
https://github.com/LadybirdBrowser/ladybird.git
synced 2025-12-08 06:09:58 +00:00
Now that we don't remove whitespace when parsing, we don't need to artificially insert it back in again when serializing. We do now need to trim leading and trailing whitespace from UnresolvedStyleValues, as this previously was done as part of the whitespace insertion. This makes our serialization of UnresolvedStyleValues more correct and gets us a few WPT passes for each property in the Typed OM tests.
208 lines
7.9 KiB
C++
208 lines
7.9 KiB
C++
/*
|
|
* Copyright (c) 2021-2025, Sam Atkins <sam@ladybird.org>
|
|
*
|
|
* SPDX-License-Identifier: BSD-2-Clause
|
|
*/
|
|
|
|
#include <AK/StringBuilder.h>
|
|
#include <AK/Utf8View.h>
|
|
#include <LibWeb/CSS/Parser/ComponentValue.h>
|
|
#include <LibWeb/CSS/Serialize.h>
|
|
#include <LibWeb/Infra/Strings.h>
|
|
|
|
namespace Web::CSS {
|
|
|
|
// https://www.w3.org/TR/cssom-1/#escape-a-character
|
|
void escape_a_character(StringBuilder& builder, u32 character)
|
|
{
|
|
builder.append('\\');
|
|
builder.append_code_point(character);
|
|
}
|
|
|
|
// https://www.w3.org/TR/cssom-1/#escape-a-character-as-code-point
|
|
void escape_a_character_as_code_point(StringBuilder& builder, u32 character)
|
|
{
|
|
builder.appendff("\\{:x} ", character);
|
|
}
|
|
|
|
// https://www.w3.org/TR/cssom-1/#serialize-an-identifier
|
|
void serialize_an_identifier(StringBuilder& builder, StringView ident)
|
|
{
|
|
Utf8View characters { ident };
|
|
auto first_character = characters.is_empty() ? 0 : *characters.begin();
|
|
|
|
// To serialize an identifier means to create a string represented by the concatenation of,
|
|
// for each character of the identifier:
|
|
for (auto character : characters) {
|
|
// If the character is NULL (U+0000), then the REPLACEMENT CHARACTER (U+FFFD).
|
|
if (character == 0) {
|
|
builder.append_code_point(0xFFFD);
|
|
continue;
|
|
}
|
|
// If the character is in the range [\1-\1f] (U+0001 to U+001F) or is U+007F,
|
|
// then the character escaped as code point.
|
|
if ((character >= 0x0001 && character <= 0x001F) || (character == 0x007F)) {
|
|
escape_a_character_as_code_point(builder, character);
|
|
continue;
|
|
}
|
|
// If the character is the first character and is in the range [0-9] (U+0030 to U+0039),
|
|
// then the character escaped as code point.
|
|
if (builder.is_empty() && character >= '0' && character <= '9') {
|
|
escape_a_character_as_code_point(builder, character);
|
|
continue;
|
|
}
|
|
// If the character is the second character and is in the range [0-9] (U+0030 to U+0039)
|
|
// and the first character is a "-" (U+002D), then the character escaped as code point.
|
|
if (builder.length() == 1 && first_character == '-' && character >= '0' && character <= '9') {
|
|
escape_a_character_as_code_point(builder, character);
|
|
continue;
|
|
}
|
|
// If the character is the first character and is a "-" (U+002D), and there is no second
|
|
// character, then the escaped character.
|
|
if (builder.is_empty() && character == '-' && characters.length() == 1) {
|
|
escape_a_character(builder, character);
|
|
continue;
|
|
}
|
|
// If the character is not handled by one of the above rules and is greater than or equal to U+0080, is "-" (U+002D) or "_" (U+005F), or is in one of the ranges [0-9] (U+0030 to U+0039), [A-Z] (U+0041 to U+005A), or \[a-z] (U+0061 to U+007A), then the character itself.
|
|
if ((character >= 0x0080)
|
|
|| (character == '-') || (character == '_')
|
|
|| (character >= '0' && character <= '9')
|
|
|| (character >= 'A' && character <= 'Z')
|
|
|| (character >= 'a' && character <= 'z')) {
|
|
builder.append_code_point(character);
|
|
continue;
|
|
}
|
|
// Otherwise, the escaped character.
|
|
escape_a_character(builder, character);
|
|
}
|
|
}
|
|
|
|
// https://www.w3.org/TR/cssom-1/#serialize-a-string
|
|
void serialize_a_string(StringBuilder& builder, StringView string)
|
|
{
|
|
Utf8View characters { string };
|
|
|
|
// To serialize a string means to create a string represented by '"' (U+0022), followed by the result
|
|
// of applying the rules below to each character of the given string, followed by '"' (U+0022):
|
|
builder.append('"');
|
|
|
|
for (auto character : characters) {
|
|
// If the character is NULL (U+0000), then the REPLACEMENT CHARACTER (U+FFFD).
|
|
if (character == 0) {
|
|
builder.append_code_point(0xFFFD);
|
|
continue;
|
|
}
|
|
// If the character is in the range [\1-\1f] (U+0001 to U+001F) or is U+007F, the character escaped as code point.
|
|
if ((character >= 0x0001 && character <= 0x001F) || (character == 0x007F)) {
|
|
escape_a_character_as_code_point(builder, character);
|
|
continue;
|
|
}
|
|
// If the character is '"' (U+0022) or "\" (U+005C), the escaped character.
|
|
if (character == 0x0022 || character == 0x005C) {
|
|
escape_a_character(builder, character);
|
|
continue;
|
|
}
|
|
// Otherwise, the character itself.
|
|
builder.append_code_point(character);
|
|
}
|
|
|
|
builder.append('"');
|
|
}
|
|
|
|
// https://www.w3.org/TR/cssom-1/#serialize-a-url
|
|
void serialize_a_url(StringBuilder& builder, StringView url)
|
|
{
|
|
// To serialize a URL means to create a string represented by "url(",
|
|
// followed by the serialization of the URL as a string, followed by ")".
|
|
builder.append("url("sv);
|
|
serialize_a_string(builder, url);
|
|
builder.append(')');
|
|
}
|
|
|
|
// NOTE: No spec currently exists for serializing a <'unicode-range'>.
|
|
void serialize_unicode_ranges(StringBuilder& builder, Vector<Gfx::UnicodeRange> const& unicode_ranges)
|
|
{
|
|
serialize_a_comma_separated_list(builder, unicode_ranges, [](auto& builder, Gfx::UnicodeRange unicode_range) -> void {
|
|
return serialize_a_string(builder, unicode_range.to_string());
|
|
});
|
|
}
|
|
|
|
// https://drafts.csswg.org/cssom/#serialize-a-css-value
// Appends `value` to `builder` as a CSS <number>.
void serialize_a_number(StringBuilder& builder, double value)
{
    // -> <number>
    // A base-ten number using digits 0-9 (U+0030 to U+0039) in the shortest form possible, using "." to separate
    // decimals (if any), rounding the value if necessary to not produce more than 6 decimals, preceded by "-" (U+002D)
    // if it is negative.
    // The ".6" precision is what limits the output to six decimals.
    // NOTE(review): "shortest form" additionally depends on the formatter omitting trailing zeros - confirm.
    builder.appendff("{:.6}", value);
}
|
|
|
|
// Convenience overload: serializes `ident` into a fresh builder and returns the result as a String.
String serialize_an_identifier(StringView ident)
{
    StringBuilder serialized;
    serialize_an_identifier(serialized, ident);
    return serialized.to_string_without_validation();
}
|
|
|
|
// Convenience overload: serializes `string` into a fresh builder and returns the quoted result as a String.
String serialize_a_string(StringView string)
{
    StringBuilder serialized;
    serialize_a_string(serialized, string);
    return serialized.to_string_without_validation();
}
|
|
|
|
// Convenience overload: serializes `url` into a fresh builder and returns the url("...") form as a String.
String serialize_a_url(StringView url)
{
    StringBuilder serialized;
    serialize_a_url(serialized, url);
    return serialized.to_string_without_validation();
}
|
|
|
|
// Convenience overload: serializes `value` into a fresh builder and returns the result as a String.
String serialize_a_number(double value)
{
    StringBuilder serialized;
    serialize_a_number(serialized, value);
    return serialized.to_string_without_validation();
}
|
|
|
|
// https://drafts.csswg.org/cssom/#serialize-a-css-declaration
|
|
String serialize_a_css_declaration(StringView property, StringView value, Important important)
|
|
{
|
|
// 1. Let s be the empty string.
|
|
StringBuilder builder;
|
|
|
|
// 2. Append property to s.
|
|
// AD-HOC: There's no place currently on the spec where the property name properly escaped,
|
|
// and this needs to be done when custom properties have special characters.
|
|
// Related spec issues:
|
|
// - https://github.com/w3c/csswg-drafts/issues/11729
|
|
// - https://github.com/w3c/csswg-drafts/issues/12258
|
|
serialize_an_identifier(builder, property);
|
|
|
|
// 3. Append ": " (U+003A U+0020) to s.
|
|
builder.append(": "sv);
|
|
|
|
// 4. If value contains any non-whitespace characters, append value to s.
|
|
if (!value.is_whitespace())
|
|
builder.append(value);
|
|
|
|
// 5. If the important flag is set, append " !important" (U+0020 U+0021 U+0069 U+006D U+0070 U+006F U+0072 U+0074
|
|
// U+0061 U+006E U+0074) to s.
|
|
if (important == Important::Yes)
|
|
builder.append(" !important"sv);
|
|
|
|
// 6. Append ";" (U+003B) to s.
|
|
builder.append(';');
|
|
|
|
// 7. Return s.
|
|
return builder.to_string_without_validation();
|
|
}
|
|
|
|
// https://drafts.csswg.org/css-syntax/#serialization
|
|
String serialize_a_series_of_component_values(ReadonlySpan<Parser::ComponentValue> component_values)
|
|
{
|
|
// FIXME: There are special rules here where we should insert a comment between certain tokens. Do that!
|
|
return MUST(String::join(""sv, component_values));
|
|
}
|
|
|
|
}
|