ladybird/Libraries/LibHTTP/Header.cpp

/*
 * Copyright (c) 2024, Andreas Kling <andreas@ladybird.org>
 * Copyright (c) 2022-2023, Linus Groh <linusg@serenityos.org>
 * Copyright (c) 2026, Shannon Booth <shannon@serenityos.org>
 *
 * SPDX-License-Identifier: BSD-2-Clause
 */

#include <AK/AllOf.h>
#include <AK/AnyOf.h>
#include <AK/GenericLexer.h>
#include <AK/QuickSort.h>
#include <LibHTTP/HTTP.h>
#include <LibHTTP/Header.h>
#include <LibHTTP/Method.h>
#include <LibIPC/Decoder.h>
#include <LibIPC/Encoder.h>
#include <LibTextCodec/Decoder.h>
#include <LibTextCodec/Encoder.h>

namespace HTTP {

// Builds a Header from a name/value pair by isomorphic-encoding each of them.
Header Header::isomorphic_encode(StringView name, StringView value)
{
    auto encoded_name = TextCodec::isomorphic_encode(name);
    auto encoded_value = TextCodec::isomorphic_encode(value);
    return { move(encoded_name), move(encoded_value) };
}

// https://www.rfc-editor.org/rfc/rfc9110.html#name-recipient-requirements
// Splits a comma-separated header value into its list elements.
// Elements that are empty once surrounding HTTP whitespace is trimmed are ignored. If any remaining element is
// not a valid header name (token), the whole parse fails and an empty Optional is returned.
static Optional<Vector<ByteString>> extract_token_headers(ByteString const& value)
{
    Vector<ByteString> tokens;

    auto const elements = value.split(',', SplitBehavior::Nothing);
    for (auto const& element : elements) {
        auto token = element.trim(HTTP_WHITESPACE, TrimMode::Both);

        // Whitespace-only list elements carry no token; skip them rather than failing.
        if (!token.is_empty()) {
            if (!is_header_name(token))
                return {};
            tokens.append(move(token));
        }
    }

    return tokens;
}

// https://fetch.spec.whatwg.org/#extract-header-values
// Parses this header's value according to the ABNF associated with its name.
// Returns the parsed values, or an empty Optional if the value does not match the ABNF.
Optional<Vector<ByteString>> Header::extract_header_values() const
{
    // NB: There is some specification work to try and rework this function, see: https://github.com/whatwg/fetch/issues/814

    // 1. If parsing header’s value, per the ABNF for header’s name, fails, then return failure.
    // 2. Return one or more values resulting from parsing header’s value, per the ABNF for header’s name.

    // ABNF taken from:
    //  * https://fetch.spec.whatwg.org/#http-new-header-syntax
    //  * https://httpwg.org/specs/rfc9110.html#field.accept-ranges

    // Token lists that may be empty:
    //   Access-Control-Expose-Headers = #field-name (field-name = token)
    //   Access-Control-Allow-Headers  = #field-name (field-name = token)
    //   Access-Control-Allow-Methods  = #method     (method = token)
    bool const is_possibly_empty_token_list = name.is_one_of_ignoring_ascii_case(
        "Access-Control-Expose-Headers"sv,
        "Access-Control-Allow-Headers"sv,
        "Access-Control-Allow-Methods"sv);
    if (is_possibly_empty_token_list)
        return extract_token_headers(value);

    // Token lists that need at least one element:
    //   Access-Control-Request-Headers = 1#field-name      (field-name = token)
    //   Accept-Ranges                  = acceptable-ranges (acceptable-ranges = 1#range-unit, range-unit = token)
    bool const is_non_empty_token_list = name.is_one_of_ignoring_ascii_case(
        "Access-Control-Request-Headers"sv,
        "Accept-Ranges"sv);
    if (is_non_empty_token_list) {
        auto tokens = extract_token_headers(value);

        // Both a failed parse and a list without any element count as failure here.
        if (!tokens.has_value() || tokens->is_empty())
            return {};
        return tokens;
    }

    // FIXME: What other headers should we handle here (or elsewhere?)
    // Any other header is returned as a single, unparsed value.
    return Vector { value };
}

// https://fetch.spec.whatwg.org/#header-name
// Returns true if header_name is non-empty and consists solely of HTTP token code points.
bool is_header_name(StringView header_name)
{
    // A header name is a byte sequence that matches the field-name token production.
    if (header_name.is_empty())
        return false;

    return all_of(header_name, is_http_token_code_point);
}

// https://fetch.spec.whatwg.org/#header-value
// Returns true if header_value satisfies the header value conditions listed below. The empty value is valid.
bool is_header_value(StringView header_value)
{
    // A header value is a byte sequence that matches the following conditions:
    // - Has no leading or trailing HTTP tab or space bytes.
    // - Contains no 0x00 (NUL) or HTTP newline bytes.

    // An empty value trivially satisfies both conditions.
    if (header_value.is_empty())
        return true;

    if (is_http_tab_or_space(header_value[0]))
        return false;
    if (is_http_tab_or_space(header_value[header_value.length() - 1]))
        return false;

    for (auto byte : header_value) {
        if (byte == 0x00 || is_http_newline(byte))
            return false;
    }

    return true;
}

// https://fetch.spec.whatwg.org/#concept-header-value-normalize
// Returns potential_value with leading and trailing HTTP whitespace removed.
// An empty input yields a default-constructed StringView.
StringView normalize_header_value(StringView potential_value)
{
    // To normalize a byte sequence potentialValue, remove any leading and trailing HTTP whitespace bytes from
    // potentialValue.
    return potential_value.is_empty()
        ? StringView {}
        : potential_value.trim(HTTP_WHITESPACE, TrimMode::Both);
}

// https://fetch.spec.whatwg.org/#forbidden-header-name
// Returns true if the given header (name and value) is a forbidden request-header.
bool is_forbidden_request_header(Header const& header)
{
    auto const& header_name = header.name;

    // 1. If name is a byte-case-insensitive match for one of:
    // [...]
    // then return true.
    bool const is_always_forbidden = header_name.is_one_of_ignoring_ascii_case(
        "Accept-Charset"sv,
        "Accept-Encoding"sv,
        "Access-Control-Request-Headers"sv,
        "Access-Control-Request-Method"sv,
        "Connection"sv,
        "Content-Length"sv,
        "Cookie"sv,
        "Cookie2"sv,
        "Date"sv,
        "DNT"sv,
        "Expect"sv,
        "Host"sv,
        "Keep-Alive"sv,
        "Origin"sv,
        "Referer"sv,
        "Set-Cookie"sv,
        "TE"sv,
        "Trailer"sv,
        "Transfer-Encoding"sv,
        "Upgrade"sv,
        "Via"sv);
    if (is_always_forbidden)
        return true;

    // 2. If name when byte-lowercased starts with `proxy-` or `sec-`, then return true.
    if (header_name.starts_with("proxy-"sv, CaseSensitivity::CaseInsensitive))
        return true;
    if (header_name.starts_with("sec-"sv, CaseSensitivity::CaseInsensitive))
        return true;

    // 3. If name is a byte-case-insensitive match for one of:
    // - `X-HTTP-Method`
    // - `X-HTTP-Method-Override`
    // - `X-Method-Override`
    // then:
    bool const is_method_override = header_name.is_one_of_ignoring_ascii_case(
        "X-HTTP-Method"sv,
        "X-HTTP-Method-Override"sv,
        "X-Method-Override"sv);

    // 4. Return false.
    // NB: Headers that are not method overrides have nothing further to check.
    if (!is_method_override)
        return false;

    // 3.1. Let parsedValues be the result of getting, decoding, and splitting value.
    auto parsed_values = get_decode_and_split_header_value(header.value);

    // 3.2. For each method of parsedValues: if the isomorphic encoding of method is a forbidden method, then return true.
    // NB: The values returned from get_decode_and_split_header_value have already been decoded.
    for (auto const& method : parsed_values) {
        if (is_forbidden_method(method))
            return true;
    }

    // 4. Return false.
    return false;
}

// https://fetch.spec.whatwg.org/#forbidden-response-header-name
// Returns true if header_name is a forbidden response-header name.
bool is_forbidden_response_header_name(StringView header_name)
{
    // A forbidden response-header name is a header name that is a byte-case-insensitive match for one of:
    // - `Set-Cookie`
    // - `Set-Cookie2`
    bool const is_forbidden = header_name.is_one_of_ignoring_ascii_case(
        "Set-Cookie"sv,
        "Set-Cookie2"sv);
    return is_forbidden;
}

// https://fetch.spec.whatwg.org/#header-value-get-decode-and-split
// Isomorphic-decodes value and splits it on commas that are outside of HTTP quoted strings.
// Each resulting element has HTTP tabs and spaces trimmed from both ends; elements may be empty strings.
Vector<String> get_decode_and_split_header_value(StringView value)
{
    // 1. Let input be the result of isomorphic decoding value.
    auto input = TextCodec::isomorphic_decode(value);

    // 2. Let position be a position variable for input, initially pointing at the start of input.
    GenericLexer lexer { input };

    // 3. Let values be a list of strings, initially « ».
    Vector<String> values;

    // 4. Let temporaryValue be the empty string.
    StringBuilder builder;

    // 5. While true:
    for (;;) {
        // 1. Append the result of collecting a sequence of code points that are not U+0022 (") or U+002C (,) from
        //    input, given position, to temporaryValue.
        // NOTE: The result might be the empty string.
        builder.append(lexer.consume_until(is_any_of("\","sv)));

        // 2. If position is not past the end of input and the code point at position within input is U+0022 ("):
        bool const is_at_quote = !lexer.is_eof() && lexer.peek() == '"';
        if (is_at_quote) {
            // 1. Append the result of collecting an HTTP quoted string from input, given position, to temporaryValue.
            builder.append(collect_an_http_quoted_string(lexer));

            // 2. If position is not past the end of input, then continue.
            if (!lexer.is_eof())
                continue;
        }

        // 3. Remove all HTTP tab or space from the start and end of temporaryValue.
        auto trimmed_value = builder.string_view().trim(HTTP_TAB_OR_SPACE, TrimMode::Both);

        // 4. Append temporaryValue to values.
        // NB: The String is created before the builder backing trimmed_value is cleared below.
        values.append(MUST(String::from_utf8(trimmed_value)));

        // 5. Set temporaryValue to the empty string.
        builder.clear();

        // 6. If position is past the end of input, then return values.
        if (lexer.is_eof())
            break;

        // 7. Assert: the code point at position within input is U+002C (,).
        VERIFY(lexer.peek() == ',');

        // 8. Advance position by 1.
        lexer.ignore(1);
    }

    return values;
}

// https://fetch.spec.whatwg.org/#convert-header-names-to-a-sorted-lowercase-set
// Returns the given header names lowercased, de-duplicated ASCII-case-insensitively, and sorted ascending.
Vector<ByteString> convert_header_names_to_a_sorted_lowercase_set(ReadonlySpan<ByteString> header_names)
{
    // 1. Let headerNamesSet be a new ordered set.
    // NB: The hash table only tracks which names were already added; it holds views into header_names.
    HashTable<StringView, CaseInsensitiveASCIIStringTraits> seen_names;
    Vector<ByteString> lowercase_names;

    // 2. For each name of headerNames, append the result of byte-lowercasing name to headerNamesSet.
    for (auto const& header_name : header_names) {
        if (!seen_names.contains(header_name)) {
            seen_names.set(header_name);
            lowercase_names.append(header_name.to_lowercase());
        }
    }

    // 3. Return the result of sorting headerNamesSet in ascending order with byte less than.
    quick_sort(lowercase_names);
    return lowercase_names;
}

// https://fetch.spec.whatwg.org/#build-a-content-range
// Formats the three numbers as `bytes <range_start>-<range_end>/<full_length>`.
ByteString build_content_range(u64 range_start, u64 range_end, u64 full_length)
{
    // 1. Let contentRange be `bytes `.
    // 2. Append rangeStart, serialized and isomorphic encoded, to contentRange.
    // 3. Append 0x2D (-) to contentRange.
    // 4. Append rangeEnd, serialized and isomorphic encoded to contentRange.
    // 5. Append 0x2F (/) to contentRange.
    // 6. Append fullLength, serialized and isomorphic encoded to contentRange.
    // NB: All of the steps above are carried out by a single format call.
    auto content_range = ByteString::formatted("bytes {}-{}/{}", range_start, range_end, full_length);

    // 7. Return contentRange.
    return content_range;
}

// https://fetch.spec.whatwg.org/#simple-range-header-value
// Parses a single-range header value of the form `bytes=<start>-<end>`, where either bound (but not both) may be
// omitted. When allow_whitespace is true, HTTP tabs and spaces are skipped before and after the `=` and `-`
// separators. Returns an empty Optional on failure, including when a bound is present but cannot be represented
// as a u64.
Optional<RangeHeaderValue> parse_single_range_header_value(StringView value, bool allow_whitespace)
{
    // 1. Let data be the isomorphic decoding of value.
    auto data = TextCodec::isomorphic_decode(value);

    // 2. If data does not start with "bytes", then return failure.
    if (!data.starts_with_bytes("bytes"sv))
        return {};

    // 3. Let position be a position variable for data, initially pointing at the 5th code point of data.
    GenericLexer lexer { data };
    lexer.ignore(5);

    // Shared implementation of steps 4, 7, 10 and 13:
    // If allowWhitespace is true, collect a sequence of code points that are HTTP tab or space, from data given position.
    auto skip_optional_whitespace = [&] {
        if (allow_whitespace)
            lexer.consume_while(is_http_tab_or_space);
    };

    // 4. (See skip_optional_whitespace.)
    skip_optional_whitespace();

    // 5. If the code point at position within data is not U+003D (=), then return failure.
    // 6. Advance position by 1.
    if (!lexer.consume_specific('='))
        return {};

    // 7. (See skip_optional_whitespace.)
    skip_optional_whitespace();

    // 8. Let rangeStart be the result of collecting a sequence of code points that are ASCII digits, from data given position.
    auto range_start = lexer.consume_while(is_ascii_digit);

    // 9. Let rangeStartValue be rangeStart, interpreted as decimal number, if rangeStart is not the empty string;
    //    otherwise null.
    auto range_start_value = range_start.to_number<u64>();

    // NB: rangeStart consists solely of ASCII digits, so a non-empty rangeStart without a value means the number
    //     could not be represented as a u64. Treating that as null would change the meaning of the range (a
    //     missing start is not the same as a huge one), so we fail instead.
    if (!range_start.is_empty() && !range_start_value.has_value())
        return {};

    // 10. (See skip_optional_whitespace.)
    skip_optional_whitespace();

    // 11. If the code point at position within data is not U+002D (-), then return failure.
    // 12. Advance position by 1.
    if (!lexer.consume_specific('-'))
        return {};

    // 13. (See skip_optional_whitespace.)
    skip_optional_whitespace();

    // 14. Let rangeEnd be the result of collecting a sequence of code points that are ASCII digits, from data given position.
    auto range_end = lexer.consume_while(is_ascii_digit);

    // 15. Let rangeEndValue be rangeEnd, interpreted as decimal number, if rangeEnd is not the empty string; otherwise null.
    auto range_end_value = range_end.to_number<u64>();

    // NB: Same reasoning as for rangeStart: an unrepresentable end must not be mistaken for an absent one.
    if (!range_end.is_empty() && !range_end_value.has_value())
        return {};

    // 16. If position is not past the end of data, then return failure.
    if (!lexer.is_eof())
        return {};

    // 17. If rangeEndValue and rangeStartValue are null, then return failure.
    if (!range_end_value.has_value() && !range_start_value.has_value())
        return {};

    // 18. If rangeStartValue and rangeEndValue are numbers, and rangeStartValue is greater than rangeEndValue, then
    //     return failure.
    if (range_start_value.has_value() && range_end_value.has_value() && *range_start_value > *range_end_value)
        return {};

    // 19. Return (rangeStartValue, rangeEndValue).
    return RangeHeaderValue { range_start_value, range_end_value };
}

}

namespace IPC {

// Serializes an HTTP header for IPC: the name is encoded first, then the value.
template<>
ErrorOr<void> encode(Encoder& encoder, HTTP::Header const& header)
{
    auto const& [name, value] = header;

    TRY(encoder.encode(name));
    TRY(encoder.encode(value));

    return {};
}

// Deserializes an HTTP header from IPC, reading the name and then the value as ByteStrings.
// A decoding error for either field is propagated to the caller.
template<>
ErrorOr<HTTP::Header> decode(Decoder& decoder)
{
    auto decoded_name = TRY(decoder.decode<ByteString>());
    auto decoded_value = TRY(decoder.decode<ByteString>());

    HTTP::Header header { move(decoded_name), move(decoded_value) };
    return header;
}

}
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
+								/*
-												LibHTTP+LibWeb+RequestServer: Move Fetch's HTTP header infra to LibHTTP

The end goal here is for LibHTTP to be the home of our RFC 9111 (HTTP
caching) implementation. We currently have one implementation in LibWeb
for our in-memory cache and another in RequestServer for our disk cache.

The implementations both largely revolve around interacting with HTTP
headers. But in LibWeb, we are using Fetch's header infra, and in RS we
are using our home-grown header infra from LibHTTP.

So to give these a common denominator, this patch replaces the LibHTTP
implementation with Fetch's infra. Our existing LibHTTP implementation
was not particularly compliant with any spec, so this at least gives us
a standards-based common implementation.

This migration also required moving a handful of other Fetch AOs over
to LibHTTP. (It turns out these AOs were all from the Fetch/Infra/HTTP
folder, so perhaps it makes sense for LibHTTP to be the implementation
of that entire set of facilities.)

											
										
										
											2025-11-26 14:13:23 -05:00
+								 * Copyright (c) 2024, Andreas Kling <andreas@ladybird.org>
-												LibWeb: Implement Headers.getSetCookie()

This is a normative change in the Fetch spec.
See: https://github.com/whatwg/fetch/commit/e4d3480

This also implements the changes to the 'sort and combine' algorithm,
which now treats "set-cookie" headers differently, and is exposed to JS
via the Headers' iterator.

Passes all 21 WPT tests :^)
http://wpt.live/fetch/api/headers/header-setcookie.any.html

											
										
										
											2023-02-10 22:02:18 +00:00
+								 * Copyright (c) 2022-2023, Linus Groh <linusg@serenityos.org>
-												LibHTTP: Parse token-list headers according to their ABNF

The previous implementation did not fully align with each
headers ABNF, so would not reject some headers as we should
have been doing.

Fixes 6 WPT subtests for

https://wpt.live/cors/access-control-expose-headers-parsing.window.html

											
										
										
											2026-02-28 18:36:44 +01:00
+								 * Copyright (c) 2026, Shannon Booth <shannon@serenityos.org>
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
+								 *
 								 * SPDX-License-Identifier: BSD-2-Clause
 								 */
-												LibRegex: Add ECMAScriptRegex and migrate callers

Add `ECMAScriptRegex`, LibRegex's C++ facade for ECMAScript regexes.

The facade owns compilation, execution, captures, named groups, and
error translation for the Rust backend, which lets callers stop
depending on the legacy parser and matcher types directly. Use it in the
remaining non-LibJS callers: URLPattern, HTML input pattern handling,
and the places in LibHTTP that only needed token validation.

Where a full regex engine was unnecessary, replace those call sites with
direct character checks. Also update focused LibURL, LibHTTP, and WPT
coverage for the migrated callers and corrected surrogate handling.

											
										
										
											2026-03-25 10:52:20 +01:00
+								#include <AK/AllOf.h>
 								#include <AK/AnyOf.h>
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
+								#include <AK/GenericLexer.h>
 								#include <AK/QuickSort.h>
-												LibHTTP+LibWeb+RequestServer: Move Fetch's HTTP header infra to LibHTTP

The end goal here is for LibHTTP to be the home of our RFC 9111 (HTTP
caching) implementation. We currently have one implementation in LibWeb
for our in-memory cache and another in RequestServer for our disk cache.

The implementations both largely revolve around interacting with HTTP
headers. But in LibWeb, we are using Fetch's header infra, and in RS we
are using our home-grown header infra from LibHTTP.

So to give these a common denominator, this patch replaces the LibHTTP
implementation with Fetch's infra. Our existing LibHTTP implementation
was not particularly compliant with any spec, so this at least gives us
a standards-based common implementation.

This migration also required moving a handful of other Fetch AOs over
to LibHTTP. (It turns out these AOs were all from the Fetch/Infra/HTTP
folder, so perhaps it makes sense for LibHTTP to be the implementation
of that entire set of facilities.)

											
										
										
											2025-11-26 14:13:23 -05:00
+								#include <LibHTTP/HTTP.h>
 								#include <LibHTTP/Header.h>
 								#include <LibHTTP/Method.h>
 								#include <LibIPC/Decoder.h>
 								#include <LibIPC/Encoder.h>
-												LibWeb: Implement the legacy extracting an encoding AO

											
										
										
											2023-05-10 16:26:51 -04:00
+								#include <LibTextCodec/Decoder.h>
-												LibTextCodec+LibWeb: Move isomorphic coders to LibTextCodec

This will be used outside of LibWeb.

											
										
										
											2025-11-24 12:20:51 -05:00
+								#include <LibTextCodec/Encoder.h>
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
-												LibHTTP+LibWeb+RequestServer: Move Fetch's HTTP header infra to LibHTTP

The end goal here is for LibHTTP to be the home of our RFC 9111 (HTTP
caching) implementation. We currently have one implementation in LibWeb
for our in-memory cache and another in RequestServer for our disk cache.

The implementations both largely revolve around interacting with HTTP
headers. But in LibWeb, we are using Fetch's header infra, and in RS we
are using our home-grown header infra from LibHTTP.

So to give these a common denominator, this patch replaces the LibHTTP
implementation with Fetch's infra. Our existing LibHTTP implementation
was not particularly compliant with any spec, so this at least gives us
a standards-based common implementation.

This migration also required moving a handful of other Fetch AOs over
to LibHTTP. (It turns out these AOs were all from the Fetch/Infra/HTTP
folder, so perhaps it makes sense for LibHTTP to be the implementation
of that entire set of facilities.)

											
										
										
											2025-11-26 14:13:23 -05:00
+								namespace HTTP {
-												LibWeb: Add calls to JS_{DECLARE,DEFINE}_ALLOCATOR()

											
										
										
											2024-04-06 10:16:04 -07:00
-												LibWeb: Store HTTP methods and headers as ByteString

The spec declares these as a byte sequence, which we then implemented as
a ByteBuffer. This has become pretty awkward to deal with, as evidenced
by the plethora of `MUST(ByteBuffer::copy(...))` and `.bytes()` calls
everywhere inside Fetch. We would then treat the bytes as a string
anyways by wrapping them in StringView everywhere.

We now store these as a ByteString. This is more comfortable to deal
with, and we no longer need to continually copy underlying storage (as
ByteString is ref-counted).

This work is largely preparatory for an upcoming HTTP header refactor.

											
										
										
											2025-11-24 18:35:55 -05:00
+								Header Header::isomorphic_encode(StringView name, StringView value)
-												LibWeb/Fetch: Do not clone stored responses

Reading the RFC9111 spec makes it clear that the stored response was
not intended to be cloned. This is because there is a "clone response"
operation that is used in other places, but never for stored responses.

											
										
										
											2024-10-22 11:47:22 +02:00
+								{
-												LibHTTP+LibWeb+RequestServer: Move Fetch's HTTP header infra to LibHTTP

The end goal here is for LibHTTP to be the home of our RFC 9111 (HTTP
caching) implementation. We currently have one implementation in LibWeb
for our in-memory cache and another in RequestServer for our disk cache.

The implementations both largely revolve around interacting with HTTP
headers. But in LibWeb, we are using Fetch's header infra, and in RS we
are using our home-grown header infra from LibHTTP.

So to give these a common denominator, this patch replaces the LibHTTP
implementation with Fetch's infra. Our existing LibHTTP implementation
was not particularly compliant with any spec, so this at least gives us
a standards-based common implementation.

This migration also required moving a handful of other Fetch AOs over
to LibHTTP. (It turns out these AOs were all from the Fetch/Infra/HTTP
folder, so perhaps it makes sense for LibHTTP to be the implementation
of that entire set of facilities.)

											
										
										
											2025-11-26 14:13:23 -05:00
+								    return { TextCodec::isomorphic_encode(name), TextCodec::isomorphic_encode(value) };
-												LibWeb: Add Fetch::Infrastructure::Header::from_string_pair() helper

This allows us to use this:

```cpp
auto header = TRY_OR_RETURN_OOM(realm,
    Infrastructure::Header::from_string_pair(name, value));
```

Instead of the somewhat unwieldy:

```cpp
auto header = Infrastructure::Header {
    .name = TRY_OR_RETURN_OOM(realm, ByteBuffer::copy(name.bytes())),
    .value = TRY_OR_RETURN_OOM(realm, ByteBuffer::copy(value.bytes())),
};
```

											
										
										
											2022-10-24 09:16:32 +01:00
+								}
-												LibHTTP: Ignore empty list elements when extracting token headers

It turns out that the validation of header values in db5f16f042
was a bit over aggressive. extract_token_headers previously treated
empty list elements (empty or whitespace-only after trimming) as parse
failures. This is incorrect per RFC 9110, which specifies that
recipients must ignore empty list elements in comma-separated header
values.

> A recipient MUST parse and ignore a reasonable number of empty
> list elements

											
										
										
											2026-03-15 19:39:29 +01:00
+								// https://www.rfc-editor.org/rfc/rfc9110.html#name-recipient-requirements
-												LibHTTP: Parse token-list headers according to their ABNF

The previous implementation did not fully align with each
headers ABNF, so would not reject some headers as we should
have been doing.

Fixes 6 WPT subtests for

https://wpt.live/cors/access-control-expose-headers-parsing.window.html

											
										
										
											2026-02-28 18:36:44 +01:00
+								static Optional<Vector<ByteString>> extract_token_headers(ByteString const& value)
 								{
-												LibHTTP: Ignore empty list elements when extracting token headers

It turns out that the validation of header values in db5f16f042
was a bit over aggressive. extract_token_headers previously treated
empty list elements (empty or whitespace-only after trimming) as parse
failures. This is incorrect per RFC 9110, which specifies that
recipients must ignore empty list elements in comma-separated header
values.

> A recipient MUST parse and ignore a reasonable number of empty
> list elements

											
										
										
											2026-03-15 19:39:29 +01:00
+								    Vector<ByteString> result;
 								    for (auto& part : value.split(',', SplitBehavior::Nothing)) {
 								        auto trimmed = part.trim(HTTP_WHITESPACE, TrimMode::Both);
 								        if (trimmed.is_empty())
 								            continue;
 								        if (!is_header_name(trimmed))
-												LibHTTP: Parse token-list headers according to their ABNF

The previous implementation did not fully align with each
headers ABNF, so would not reject some headers as we should
have been doing.

Fixes 6 WPT subtests for

https://wpt.live/cors/access-control-expose-headers-parsing.window.html

											
										
										
											2026-02-28 18:36:44 +01:00
+								            return {};
-												LibHTTP: Ignore empty list elements when extracting token headers

It turns out that the validation of header values in db5f16f042
was a bit over aggressive. extract_token_headers previously treated
empty list elements (empty or whitespace-only after trimming) as parse
failures. This is incorrect per RFC 9110, which specifies that
recipients must ignore empty list elements in comma-separated header
values.

> A recipient MUST parse and ignore a reasonable number of empty
> list elements

											
										
										
											2026-03-15 19:39:29 +01:00
+								        result.append(move(trimmed));
-												LibHTTP: Parse token-list headers according to their ABNF

The previous implementation did not fully align with each
headers ABNF, so would not reject some headers as we should
have been doing.

Fixes 6 WPT subtests for

https://wpt.live/cors/access-control-expose-headers-parsing.window.html

											
										
										
											2026-02-28 18:36:44 +01:00
+								    }
-												LibHTTP: Ignore empty list elements when extracting token headers

It turns out that the validation of header values in db5f16f042
was a bit over aggressive. extract_token_headers previously treated
empty list elements (empty or whitespace-only after trimming) as parse
failures. This is incorrect per RFC 9110, which specifies that
recipients must ignore empty list elements in comma-separated header
values.

> A recipient MUST parse and ignore a reasonable number of empty
> list elements

											
										
										
											2026-03-15 19:39:29 +01:00
+								    return result;
-												LibHTTP: Parse token-list headers according to their ABNF

The previous implementation did not fully align with each
headers ABNF, so would not reject some headers as we should
have been doing.

Fixes 6 WPT subtests for

https://wpt.live/cors/access-control-expose-headers-parsing.window.html

											
										
										
											2026-02-28 18:36:44 +01:00
+								}
-												LibWeb: Organize Fetch Headers.h/Headers.cpp a bit

Generally just define things in the order they are declared (will make a
change to use ByteString in this file a bit easier to follow). Also make
a couple of free functions be class methods on Header / HeaderList.

											
										
										
											2025-11-25 10:57:32 -05:00
+								// https://fetch.spec.whatwg.org/#extract-header-values
-												LibWeb: Store HTTP methods and headers as ByteString

The spec declares these as a byte sequence, which we then implemented as
a ByteBuffer. This has become pretty awkward to deal with, as evidenced
by the plethora of `MUST(ByteBuffer::copy(...))` and `.bytes()` calls
everywhere inside Fetch. We would then treat the bytes as a string
anyways by wrapping them in StringView everywhere.

We now store these as a ByteString. This is more comfortable to deal
with, and we no longer need to continually copy underlying storage (as
ByteString is ref-counted).

This work is largely preparatory for an upcoming HTTP header refactor.

											
										
										
											2025-11-24 18:35:55 -05:00
+								Optional<Vector<ByteString>> Header::extract_header_values() const
-												LibWeb: Make Fetch::Infrastructure::{Request,Response,HeaderList} GC'd

This is the way.

On a more serious note, there's no reason to keep adding ref-counted
classes to LibWeb now that the majority of classes is GC'd - it only
adds the risk of discovering some cycle down the line, and forces us to
use handles as we can't visit().

											
										
										
											2022-10-30 01:52:07 +00:00
+								{
-												LibHTTP: Parse token-list headers according to their ABNF

The previous implementation did not fully align with each
headers ABNF, so would not reject some headers as we should
have been doing.

Fixes 6 WPT subtests for

https://wpt.live/cors/access-control-expose-headers-parsing.window.html

											
										
										
											2026-02-28 18:36:44 +01:00
+								    // NB: There is some specification work to try and rework this function, see: https://github.com/whatwg/fetch/issues/814
 								    // 1. If parsing header’s value, per the ABNF for header’s name, fails, then return failure.
 								    // 2. Return one or more values resulting from parsing header’s value, per the ABNF for header’s name.
 								    // ABNF taken from:
 								    //  * https://fetch.spec.whatwg.org/#http-new-header-syntax
 								    //  * https://httpwg.org/specs/rfc9110.html#field.accept-ranges
-												LibWeb: Make Fetch::Infrastructure::{Request,Response,HeaderList} GC'd

This is the way.

On a more serious note, there's no reason to keep adding ref-counted
classes to LibWeb now that the majority of classes is GC'd - it only
adds the risk of discovering some cycle down the line, and forces us to
use handles as we can't visit().

											
										
										
											2022-10-30 01:52:07 +00:00
-												LibHTTP: Parse token-list headers according to their ABNF

The previous implementation did not fully align with each
headers ABNF, so would not reject some headers as we should
have been doing.

Fixes 6 WPT subtests for

https://wpt.live/cors/access-control-expose-headers-parsing.window.html

											
										
										
											2026-02-28 18:36:44 +01:00
+								    // Access-Control-Expose-Headers = #field-name (field-name = token)
 								    // Access-Control-Allow-Headers  = #field-name (field-name = token)
 								    // Access-Control-Allow-Methods  = #method     (method = token)
-												LibWeb: Store HTTP methods and headers as ByteString

The spec declares these as a byte sequence, which we then implemented as
a ByteBuffer. This has become pretty awkward to deal with, as evidenced
by the plethora of `MUST(ByteBuffer::copy(...))` and `.bytes()` calls
everywhere inside Fetch. We would then treat the bytes as a string
anyways by wrapping them in StringView everywhere.

We now store these as a ByteString. This is more comfortable to deal
with, and we no longer need to continually copy underlying storage (as
ByteString is ref-counted).

This work is largely preparatory for an upcoming HTTP header refactor.

											
										
										
											2025-11-24 18:35:55 -05:00
+								    if (name.is_one_of_ignoring_ascii_case(
-												LibWeb: Organize Fetch Headers.h/Headers.cpp a bit

Generally just define things in the order they are declared (will make a
change to use ByteString in this file a bit easier to follow). Also make
a couple of free functions be class methods on Header / HeaderList.

											
										
										
											2025-11-25 10:57:32 -05:00
+								            "Access-Control-Expose-Headers"sv,
 								            "Access-Control-Allow-Headers"sv,
-												LibHTTP: Parse token-list headers according to their ABNF

The previous implementation did not fully align with each
headers ABNF, so would not reject some headers as we should
have been doing.

Fixes 6 WPT subtests for

https://wpt.live/cors/access-control-expose-headers-parsing.window.html

											
										
										
											2026-02-28 18:36:44 +01:00
+								            "Access-Control-Allow-Methods"sv)) {
 								        return extract_token_headers(value);
 								    }
-												LibWeb: Organize Fetch Headers.h/Headers.cpp a bit

Generally just define things in the order they are declared (will make a
change to use ByteString in this file a bit easier to follow). Also make
a couple of free functions be class methods on Header / HeaderList.

											
										
										
											2025-11-25 10:57:32 -05:00
-												LibHTTP: Parse token-list headers according to their ABNF

The previous implementation did not fully align with each
headers ABNF, so would not reject some headers as we should
have been doing.

Fixes 6 WPT subtests for

https://wpt.live/cors/access-control-expose-headers-parsing.window.html

											
										
										
											2026-02-28 18:36:44 +01:00
+								    // Access-Control-Request-Headers = 1#field-name      (field-name = token)
 								    // Accept-Ranges                  = acceptable-ranges (acceptable-ranges = 1#range-unit, range-unit = token)
 								    if (name.is_one_of_ignoring_ascii_case(
 								            "Access-Control-Request-Headers"sv,
 								            "Accept-Ranges"sv)) {
 								        if (auto headers = extract_token_headers(value); headers.has_value()) {
 								            if (headers->is_empty())
 								                return {};
 								            return headers;
 								        }
 								        return {};
-												LibWeb: Support for Access-Control-Expose-Headers in Fetch

This adds the headers named in Access-Control-Expose-Headers to the
response's CORS-exposed header-name list which allows those headers to
be accessed from JS.

											
										
										
											2023-08-01 21:40:30 +12:00
+								    }
-												LibHTTP: Parse token-list headers according to their ABNF

The previous implementation did not fully align with each
headers ABNF, so would not reject some headers as we should
have been doing.

Fixes 6 WPT subtests for

https://wpt.live/cors/access-control-expose-headers-parsing.window.html

											
										
										
											2026-02-28 18:36:44 +01:00
+								    // FIXME: What other headers should we handle here (or elsewhere?)
-												LibWeb: Store HTTP methods and headers as ByteString

The spec declares these as a byte sequence, which we then implemented as
a ByteBuffer. This has become pretty awkward to deal with, as evidenced
by the plethora of `MUST(ByteBuffer::copy(...))` and `.bytes()` calls
everywhere inside Fetch. We would then treat the bytes as a string
anyways by wrapping them in StringView everywhere.

We now store these as a ByteString. This is more comfortable to deal
with, and we no longer need to continually copy underlying storage (as
ByteString is ref-counted).

This work is largely preparatory for an upcoming HTTP header refactor.

											
										
										
											2025-11-24 18:35:55 -05:00
+								    return Vector { value };
-												LibWeb: Organize Fetch Headers.h/Headers.cpp a bit

Generally just define things in the order they are declared (will make a
change to use ByteString in this file a bit easier to follow). Also make
a couple of free functions be class methods on Header / HeaderList.

											
										
										
											2025-11-25 10:57:32 -05:00
+								}
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
+								// https://fetch.spec.whatwg.org/#header-name
-												LibWeb: Store HTTP methods and headers as ByteString

The spec declares these as a byte sequence, which we then implemented as
a ByteBuffer. This has become pretty awkward to deal with, as evidenced
by the plethora of `MUST(ByteBuffer::copy(...))` and `.bytes()` calls
everywhere inside Fetch. We would then treat the bytes as a string
anyways by wrapping them in StringView everywhere.

We now store these as a ByteString. This is more comfortable to deal
with, and we no longer need to continually copy underlying storage (as
ByteString is ref-counted).

This work is largely preparatory for an upcoming HTTP header refactor.

											
										
										
											2025-11-24 18:35:55 -05:00
+								bool is_header_name(StringView header_name)
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
+								{
 								    // A header name is a byte sequence that matches the field-name token production.
-												LibRegex: Add ECMAScriptRegex and migrate callers

Add `ECMAScriptRegex`, LibRegex's C++ facade for ECMAScript regexes.

The facade owns compilation, execution, captures, named groups, and
error translation for the Rust backend, which lets callers stop
depending on the legacy parser and matcher types directly. Use it in the
remaining non-LibJS callers: URLPattern, HTML input pattern handling,
and the places in LibHTTP that only needed token validation.

Where a full regex engine was unnecessary, replace those call sites with
direct character checks. Also update focused LibURL, LibHTTP, and WPT
coverage for the migrated callers and corrected surrogate handling.

											
										
										
											2026-03-25 10:52:20 +01:00
+								    return !header_name.is_empty() && all_of(header_name, is_http_token_code_point);
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
+								}
 								// https://fetch.spec.whatwg.org/#header-value
-												LibWeb: Store HTTP methods and headers as ByteString

The spec declares these as a byte sequence, which we then implemented as
a ByteBuffer. This has become pretty awkward to deal with, as evidenced
by the plethora of `MUST(ByteBuffer::copy(...))` and `.bytes()` calls
everywhere inside Fetch. We would then treat the bytes as a string
anyways by wrapping them in StringView everywhere.

We now store these as a ByteString. This is more comfortable to deal
with, and we no longer need to continually copy underlying storage (as
ByteString is ref-counted).

This work is largely preparatory for an upcoming HTTP header refactor.

											
										
										
											2025-11-24 18:35:55 -05:00
+								bool is_header_value(StringView header_value)
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
+								{
 								    // A header value is a byte sequence that matches the following conditions:
 								    // - Has no leading or trailing HTTP tab or space bytes.
 								    // - Contains no 0x00 (NUL) or HTTP newline bytes.
 								    if (header_value.is_empty())
 								        return true;
-												LibWeb: Store HTTP methods and headers as ByteString

The spec declares these as a byte sequence, which we then implemented as
a ByteBuffer. This has become pretty awkward to deal with, as evidenced
by the plethora of `MUST(ByteBuffer::copy(...))` and `.bytes()` calls
everywhere inside Fetch. We would then treat the bytes as a string
anyways by wrapping them in StringView everywhere.

We now store these as a ByteString. This is more comfortable to deal
with, and we no longer need to continually copy underlying storage (as
ByteString is ref-counted).

This work is largely preparatory for an upcoming HTTP header refactor.

											
										
										
											2025-11-24 18:35:55 -05:00
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
+								    auto first_byte = header_value[0];
-												LibWeb: Store HTTP methods and headers as ByteString

The spec declares these as a byte sequence, which we then implemented as
a ByteBuffer. This has become pretty awkward to deal with, as evidenced
by the plethora of `MUST(ByteBuffer::copy(...))` and `.bytes()` calls
everywhere inside Fetch. We would then treat the bytes as a string
anyways by wrapping them in StringView everywhere.

We now store these as a ByteString. This is more comfortable to deal
with, and we no longer need to continually copy underlying storage (as
ByteString is ref-counted).

This work is largely preparatory for an upcoming HTTP header refactor.

											
										
										
											2025-11-24 18:35:55 -05:00
+								    auto last_byte = header_value[header_value.length() - 1];
 								    if (is_http_tab_or_space(first_byte) || is_http_tab_or_space(last_byte))
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
+								        return false;
-												LibWeb: Store HTTP methods and headers as ByteString

The spec declares these as a byte sequence, which we then implemented as
a ByteBuffer. This has become pretty awkward to deal with, as evidenced
by the plethora of `MUST(ByteBuffer::copy(...))` and `.bytes()` calls
everywhere inside Fetch. We would then treat the bytes as a string
anyways by wrapping them in StringView everywhere.

We now store these as a ByteString. This is more comfortable to deal
with, and we no longer need to continually copy underlying storage (as
ByteString is ref-counted).

This work is largely preparatory for an upcoming HTTP header refactor.

											
										
										
											2025-11-24 18:35:55 -05:00
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
+								    return !any_of(header_value, [](auto byte) {
-												LibWeb: Store HTTP methods and headers as ByteString

The spec declares these as a byte sequence, which we then implemented as
a ByteBuffer. This has become pretty awkward to deal with, as evidenced
by the plethora of `MUST(ByteBuffer::copy(...))` and `.bytes()` calls
everywhere inside Fetch. We would then treat the bytes as a string
anyways by wrapping them in StringView everywhere.

We now store these as a ByteString. This is more comfortable to deal
with, and we no longer need to continually copy underlying storage (as
ByteString is ref-counted).

This work is largely preparatory for an upcoming HTTP header refactor.

											
										
										
											2025-11-24 18:35:55 -05:00
+								        return byte == 0x00 || is_http_newline(byte);
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
+								    });
 								}
 								// https://fetch.spec.whatwg.org/#concept-header-value-normalize
-												LibHTTP: Return a StringView from HTTP::normalize_header_value

This lets callers that do not need a string avoid a needless allocation.
All callers that do need a string will already either:

* Turn it into a ByteString themselves
* Pass this along to the isomorphic encoder

											
										
										
											2026-02-26 14:51:41 -05:00
+								StringView normalize_header_value(StringView potential_value)
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
+								{
-												LibWeb: Store HTTP methods and headers as ByteString

The spec declares these as a byte sequence, which we then implemented as
a ByteBuffer. This has become pretty awkward to deal with, as evidenced
by the plethora of `MUST(ByteBuffer::copy(...))` and `.bytes()` calls
everywhere inside Fetch. We would then treat the bytes as a string
anyways by wrapping them in StringView everywhere.

We now store these as a ByteString. This is more comfortable to deal
with, and we no longer need to continually copy underlying storage (as
ByteString is ref-counted).

This work is largely preparatory for an upcoming HTTP header refactor.

											
										
										
											2025-11-24 18:35:55 -05:00
+								    // To normalize a byte sequence potentialValue, remove any leading and trailing HTTP whitespace bytes from
 								    // potentialValue.
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
+								    if (potential_value.is_empty())
-												LibWeb: Remove OOM propagation from Fetch::Infrastructure::Headers

											
										
										
											2024-04-26 13:24:20 -04:00
+								        return {};
-												LibWeb: Store HTTP methods and headers as ByteString

The spec declares these as a byte sequence, which we then implemented as
a ByteBuffer. This has become pretty awkward to deal with, as evidenced
by the plethora of `MUST(ByteBuffer::copy(...))` and `.bytes()` calls
everywhere inside Fetch. We would then treat the bytes as a string
anyways by wrapping them in StringView everywhere.

We now store these as a ByteString. This is more comfortable to deal
with, and we no longer need to continually copy underlying storage (as
ByteString is ref-counted).

This work is largely preparatory for an upcoming HTTP header refactor.

											
										
										
											2025-11-24 18:35:55 -05:00
+								    return potential_value.trim(HTTP_WHITESPACE, TrimMode::Both);
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
+								}
-												LibWeb: Organize Fetch Headers.h/Headers.cpp a bit

Generally just define things in the order they are declared (will make a
change to use ByteString in this file a bit easier to follow). Also make
a couple of free functions be class methods on Header / HeaderList.

											
										
										
											2025-11-25 10:57:32 -05:00
+								// https://fetch.spec.whatwg.org/#forbidden-header-name
 								bool is_forbidden_request_header(Header const& header)
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
+								{
-												LibWeb: Store HTTP methods and headers as ByteString

The spec declares these as a byte sequence, which we then implemented as
a ByteBuffer. This has become pretty awkward to deal with, as evidenced
by the plethora of `MUST(ByteBuffer::copy(...))` and `.bytes()` calls
everywhere inside Fetch. We would then treat the bytes as a string
anyways by wrapping them in StringView everywhere.

We now store these as a ByteString. This is more comfortable to deal
with, and we no longer need to continually copy underlying storage (as
ByteString is ref-counted).

This work is largely preparatory for an upcoming HTTP header refactor.

											
										
										
											2025-11-24 18:35:55 -05:00
+								    auto const& [name, value] = header;
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
-												LibWeb: Organize Fetch Headers.h/Headers.cpp a bit

Generally just define things in the order they are declared (will make a
change to use ByteString in this file a bit easier to follow). Also make
a couple of free functions be class methods on Header / HeaderList.

											
										
										
											2025-11-25 10:57:32 -05:00
+								    // 1. If name is a byte-case-insensitive match for one of:
 								    // [...]
 								    // then return true.
 								    if (name.is_one_of_ignoring_ascii_case(
 								            "Accept-Charset"sv,
 								            "Accept-Encoding"sv,
 								            "Access-Control-Request-Headers"sv,
 								            "Access-Control-Request-Method"sv,
 								            "Connection"sv,
 								            "Content-Length"sv,
 								            "Cookie"sv,
 								            "Cookie2"sv,
 								            "Date"sv,
 								            "DNT"sv,
 								            "Expect"sv,
 								            "Host"sv,
 								            "Keep-Alive"sv,
 								            "Origin"sv,
 								            "Referer"sv,
 								            "Set-Cookie"sv,
 								            "TE"sv,
 								            "Trailer"sv,
 								            "Transfer-Encoding"sv,
 								            "Upgrade"sv,
 								            "Via"sv)) {
 								        return true;
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
+								    }
-												LibWeb: Organize Fetch Headers.h/Headers.cpp a bit

Generally just define things in the order they are declared (will make a
change to use ByteString in this file a bit easier to follow). Also make
a couple of free functions be class methods on Header / HeaderList.

											
										
										
											2025-11-25 10:57:32 -05:00
+								    // 2. If name when byte-lowercased starts with `proxy-` or `sec-`, then return true.
 								    if (name.starts_with("proxy-"sv, CaseSensitivity::CaseInsensitive)
 								        || name.starts_with("sec-"sv, CaseSensitivity::CaseInsensitive)) {
 								        return true;
-												LibWeb/Fetch: Refactor forbidden request-headers

This is a change in the Fetch spec.

See:
- https://github.com/whatwg/fetch/commit/92e6c91
- https://github.com/whatwg/xhr/commit/494431a

											
										
										
											2022-12-07 18:16:32 +00:00
+								    }
 								    // 3. If name is a byte-case-insensitive match for one of:
 								    // - `X-HTTP-Method`
 								    // - `X-HTTP-Method-Override`
 								    // - `X-Method-Override`
 								    // then:
-												Everywhere: Rename equals_ignoring_case => equals_ignoring_ascii_case

Let's make it clear that these functions deal with ASCII case only.

											
										
										
											2023-03-10 08:48:54 +01:00
+								    if (name.is_one_of_ignoring_ascii_case(
-												LibWeb/Fetch: Refactor forbidden request-headers

This is a change in the Fetch spec.

See:
- https://github.com/whatwg/fetch/commit/92e6c91
- https://github.com/whatwg/xhr/commit/494431a

											
										
										
											2022-12-07 18:16:32 +00:00
+								            "X-HTTP-Method"sv,
 								            "X-HTTP-Method-Override"sv,
-												LibWeb/Fetch: Correct check for X-Method-Override

Previously the code was checking for X-Method.

See:
 - http://wpt.live/fetch/api/basic/request-forbidden-headers.any.html

											
										
										
											2024-08-04 11:53:52 +01:00
+								            "X-Method-Override"sv)) {
-												LibWeb/Fetch: Refactor forbidden request-headers

This is a change in the Fetch spec.

See:
- https://github.com/whatwg/fetch/commit/92e6c91
- https://github.com/whatwg/xhr/commit/494431a

											
										
										
											2022-12-07 18:16:32 +00:00
+								        // 1. Let parsedValues be the result of getting, decoding, and splitting value.
-												LibWeb: Store HTTP methods and headers as ByteString

The spec declares these as a byte sequence, which we then implemented as
a ByteBuffer. This has become pretty awkward to deal with, as evidenced
by the plethora of `MUST(ByteBuffer::copy(...))` and `.bytes()` calls
everywhere inside Fetch. We would then treat the bytes as a string
anyways by wrapping them in StringView everywhere.

We now store these as a ByteString. This is more comfortable to deal
with, and we no longer need to continually copy underlying storage (as
ByteString is ref-counted).

This work is largely preparatory for an upcoming HTTP header refactor.

											
										
										
											2025-11-24 18:35:55 -05:00
+								        auto parsed_values = get_decode_and_split_header_value(value);
-												LibWeb/Fetch: Refactor forbidden request-headers

This is a change in the Fetch spec.

See:
- https://github.com/whatwg/fetch/commit/92e6c91
- https://github.com/whatwg/xhr/commit/494431a

											
										
										
											2022-12-07 18:16:32 +00:00
-												LibWeb/Fetch: Tweak wording in some spec comments

This is a change in the Fetch spec.

See: https://github.com/whatwg/fetch/commit/223ca89

											
										
										
											2022-12-07 18:29:17 +00:00
+								        // 2. For each method of parsedValues: if the isomorphic encoding of method is a forbidden method, then return true.
-												LibWeb: Store HTTP methods and headers as ByteString

The spec declares these as a byte sequence, which we then implemented as
a ByteBuffer. This has become pretty awkward to deal with, as evidenced
by the plethora of `MUST(ByteBuffer::copy(...))` and `.bytes()` calls
everywhere inside Fetch. We would then treat the bytes as a string
anyways by wrapping them in StringView everywhere.

We now store these as a ByteString. This is more comfortable to deal
with, and we no longer need to continually copy underlying storage (as
ByteString is ref-counted).

This work is largely preparatory for an upcoming HTTP header refactor.

											
										
										
											2025-11-24 18:35:55 -05:00
+								        // NB: The values returned from get_decode_and_split_header_value have already been decoded.
 								        if (any_of(parsed_values, [](auto const& method) { return is_forbidden_method(method); }))
-												LibWeb/Fetch: Refactor forbidden request-headers

This is a change in the Fetch spec.

See:
- https://github.com/whatwg/fetch/commit/92e6c91
- https://github.com/whatwg/xhr/commit/494431a

											
										
										
											2022-12-07 18:16:32 +00:00
+								            return true;
 								    }
 								    // 4. Return false.
 								    return false;
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
+								}
 								// https://fetch.spec.whatwg.org/#forbidden-response-header-name
-												LibWeb: Store HTTP methods and headers as ByteString

The spec declares these as a byte sequence, which we then implemented as
a ByteBuffer. This has become pretty awkward to deal with, as evidenced
by the plethora of `MUST(ByteBuffer::copy(...))` and `.bytes()` calls
everywhere inside Fetch. We would then treat the bytes as a string
anyways by wrapping them in StringView everywhere.

We now store these as a ByteString. This is more comfortable to deal
with, and we no longer need to continually copy underlying storage (as
ByteString is ref-counted).

This work is largely preparatory for an upcoming HTTP header refactor.

											
										
										
											2025-11-24 18:35:55 -05:00
+								bool is_forbidden_response_header_name(StringView header_name)
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
+								{
 								    // A forbidden response-header name is a header name that is a byte-case-insensitive match for one of:
 								    // - `Set-Cookie`
 								    // - `Set-Cookie2`
-												LibWeb: Store HTTP methods and headers as ByteString

The spec declares these as a byte sequence, which we then implemented as
a ByteBuffer. This has become pretty awkward to deal with, as evidenced
by the plethora of `MUST(ByteBuffer::copy(...))` and `.bytes()` calls
everywhere inside Fetch. We would then treat the bytes as a string
anyways by wrapping them in StringView everywhere.

We now store these as a ByteString. This is more comfortable to deal
with, and we no longer need to continually copy underlying storage (as
ByteString is ref-counted).

This work is largely preparatory for an upcoming HTTP header refactor.

											
										
										
											2025-11-24 18:35:55 -05:00
+								    return header_name.is_one_of_ignoring_ascii_case(
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
+								        "Set-Cookie"sv,
 								        "Set-Cookie2"sv);
 								}
-												LibWeb: Organize Fetch Headers.h/Headers.cpp a bit

Generally just define things in the order they are declared (will make a
change to use ByteString in this file a bit easier to follow). Also make
a couple of free functions be class methods on Header / HeaderList.

											
										
										
											2025-11-25 10:57:32 -05:00
+								// https://fetch.spec.whatwg.org/#header-value-get-decode-and-split
-												LibWeb: Store HTTP methods and headers as ByteString

The spec declares these as a byte sequence, which we then implemented as
a ByteBuffer. This has become pretty awkward to deal with, as evidenced
by the plethora of `MUST(ByteBuffer::copy(...))` and `.bytes()` calls
everywhere inside Fetch. We would then treat the bytes as a string
anyways by wrapping them in StringView everywhere.

We now store these as a ByteString. This is more comfortable to deal
with, and we no longer need to continually copy underlying storage (as
ByteString is ref-counted).

This work is largely preparatory for an upcoming HTTP header refactor.

											
										
										
											2025-11-24 18:35:55 -05:00
+								Vector<String> get_decode_and_split_header_value(StringView value)
-												LibWeb: Partially implement 'Extract header (list) values' AOs

The header-specific ABNF rules are completely ignored for now, but we
can at least extract a single header value, which at least works for
simple cases like `Location`-based redirects.

											
										
										
											2022-10-25 23:02:47 +01:00
+								{
-												LibWeb: Organize Fetch Headers.h/Headers.cpp a bit

Generally just define things in the order they are declared (will make a
change to use ByteString in this file a bit easier to follow). Also make
a couple of free functions be class methods on Header / HeaderList.

											
										
										
											2025-11-25 10:57:32 -05:00
+								    // 1. Let input be the result of isomorphic decoding value.
-												LibTextCodec+LibWeb: Move isomorphic coders to LibTextCodec

This will be used outside of LibWeb.

											
										
										
											2025-11-24 12:20:51 -05:00
+								    auto input = TextCodec::isomorphic_decode(value);
-												LibWeb: Parse header value lists for some CORS headers

This adds a simple and incomplete implementation for extracting some
specific CORS headers that are used by fetch. This unifies the existing
ad-hoc parsing that already existed for Access-Control-Allow-Headers
and Access-Control-Allow-Methods, as well as adding
Access-control-Expose-Headers.

											
										
										
											2023-08-01 22:00:28 +12:00
-												LibWeb: Organize Fetch Headers.h/Headers.cpp a bit

Generally just define things in the order they are declared (will make a
change to use ByteString in this file a bit easier to follow). Also make
a couple of free functions be class methods on Header / HeaderList.

											
										
										
											2025-11-25 10:57:32 -05:00
+								    // 2. Let position be a position variable for input, initially pointing at the start of input.
 								    GenericLexer lexer { input };
 								    // 3. Let values be a list of strings, initially « ».
 								    Vector<String> values;
 								    // 4. Let temporaryValue be the empty string.
 								    StringBuilder temporary_value_builder;
 								    // 5. While true:
 								    while (true) {
-												LibWeb: Store HTTP methods and headers as ByteString

The spec declares these as a byte sequence, which we then implemented as
a ByteBuffer. This has become pretty awkward to deal with, as evidenced
by the plethora of `MUST(ByteBuffer::copy(...))` and `.bytes()` calls
everywhere inside Fetch. We would then treat the bytes as a string
anyways by wrapping them in StringView everywhere.

We now store these as a ByteString. This is more comfortable to deal
with, and we no longer need to continually copy underlying storage (as
ByteString is ref-counted).

This work is largely preparatory for an upcoming HTTP header refactor.

											
										
										
											2025-11-24 18:35:55 -05:00
+								        // 1. Append the result of collecting a sequence of code points that are not U+0022 (") or U+002C (,) from
 								        //    input, given position, to temporaryValue.
-												LibWeb: Organize Fetch Headers.h/Headers.cpp a bit

Generally just define things in the order they are declared (will make a
change to use ByteString in this file a bit easier to follow). Also make
a couple of free functions be class methods on Header / HeaderList.

											
										
										
											2025-11-25 10:57:32 -05:00
+								        // NOTE: The result might be the empty string.
 								        temporary_value_builder.append(lexer.consume_until(is_any_of("\","sv)));
 								        // 2. If position is not past the end of input and the code point at position within input is U+0022 ("):
 								        if (!lexer.is_eof() && lexer.peek() == '"') {
 								            // 1. Append the result of collecting an HTTP quoted string from input, given position, to temporaryValue.
 								            temporary_value_builder.append(collect_an_http_quoted_string(lexer));
 								            // 2. If position is not past the end of input, then continue.
 								            if (!lexer.is_eof())
 								                continue;
-												LibWeb: Parse header value lists for some CORS headers

This adds a simple and incomplete implementation for extracting some
specific CORS headers that are used by fetch. This unifies the existing
ad-hoc parsing that already existed for Access-Control-Allow-Headers
and Access-Control-Allow-Methods, as well as adding
Access-Control-Expose-Headers.

											
										
										
											2023-08-01 22:00:28 +12:00
+								        }
-												LibWeb: Organize Fetch Headers.h/Headers.cpp a bit

Generally just define things in the order they are declared (will make a
change to use ByteString in this file a bit easier to follow). Also make
a couple of free functions be class methods on Header / HeaderList.

											
										
										
											2025-11-25 10:57:32 -05:00
+								        // 3. Remove all HTTP tab or space from the start and end of temporaryValue.
 								        auto temporary_value = MUST(String::from_utf8(temporary_value_builder.string_view().trim(HTTP_TAB_OR_SPACE, TrimMode::Both)));
-												LibWeb: Parse header value lists for some CORS headers

This adds a simple and incomplete implementation for extracting some
specific CORS headers that are used by fetch. This unifies the existing
ad-hoc parsing that already existed for Access-Control-Allow-Headers
and Access-Control-Allow-Methods, as well as adding
Access-Control-Expose-Headers.

											
										
										
											2023-08-01 22:00:28 +12:00
-												LibWeb: Organize Fetch Headers.h/Headers.cpp a bit

Generally just define things in the order they are declared (will make a
change to use ByteString in this file a bit easier to follow). Also make
a couple of free functions be class methods on Header / HeaderList.

											
										
										
											2025-11-25 10:57:32 -05:00
+								        // 4. Append temporaryValue to values.
 								        values.append(move(temporary_value));
-												LibWeb: Partially implement 'Extract header (list) values' AOs

The header-specific ABNF rules are completely ignored for now, but we
can at least extract a single header value, which at least works for
simple cases like `Location`-based redirects.

											
										
										
											2022-10-25 23:02:47 +01:00
-												LibWeb: Organize Fetch Headers.h/Headers.cpp a bit

Generally just define things in the order they are declared (will make a
change to use ByteString in this file a bit easier to follow). Also make
a couple of free functions be class methods on Header / HeaderList.

											
										
										
											2025-11-25 10:57:32 -05:00
+								        // 5. Set temporaryValue to the empty string.
 								        temporary_value_builder.clear();
-												LibWeb: Partially implement 'Extract header (list) values' AOs

The header-specific ABNF rules are completely ignored for now, but we
can at least extract a single header value, which at least works for
simple cases like `Location`-based redirects.

											
										
										
											2022-10-25 23:02:47 +01:00
-												LibWeb: Organize Fetch Headers.h/Headers.cpp a bit

Generally just define things in the order they are declared (will make a
change to use ByteString in this file a bit easier to follow). Also make
a couple of free functions be class methods on Header / HeaderList.

											
										
										
											2025-11-25 10:57:32 -05:00
+								        // 6. If position is past the end of input, then return values.
 								        if (lexer.is_eof())
 								            return values;
-												LibWeb: Partially implement 'Extract header (list) values' AOs

The header-specific ABNF rules are completely ignored for now, but we
can at least extract a single header value, which at least works for
simple cases like `Location`-based redirects.

											
										
										
											2022-10-25 23:02:47 +01:00
-												LibWeb: Organize Fetch Headers.h/Headers.cpp a bit

Generally just define things in the order they are declared (will make a
change to use ByteString in this file a bit easier to follow). Also make
a couple of free functions be class methods on Header / HeaderList.

											
										
										
											2025-11-25 10:57:32 -05:00
+								        // 7. Assert: the code point at position within input is U+002C (,).
 								        VERIFY(lexer.peek() == ',');
-												LibWeb: Partially implement 'Extract header (list) values' AOs

The header-specific ABNF rules are completely ignored for now, but we
can at least extract a single header value, which at least works for
simple cases like `Location`-based redirects.

											
										
										
											2022-10-25 23:02:47 +01:00
-												LibWeb: Organize Fetch Headers.h/Headers.cpp a bit

Generally just define things in the order they are declared (will make a
change to use ByteString in this file a bit easier to follow). Also make
a couple of free functions be class methods on Header / HeaderList.

											
										
										
											2025-11-25 10:57:32 -05:00
+								        // 8. Advance position by 1.
 								        lexer.ignore(1);
 								    }
 								}
-												LibWeb: Partially implement 'Extract header (list) values' AOs

The header-specific ABNF rules are completely ignored for now, but we
can at least extract a single header value, which at least works for
simple cases like `Location`-based redirects.

											
										
										
											2022-10-25 23:02:47 +01:00
-												LibWeb: Organize Fetch Headers.h/Headers.cpp a bit

Generally just define things in the order they are declared (will make a
change to use ByteString in this file a bit easier to follow). Also make
a couple of free functions be class methods on Header / HeaderList.

											
										
										
											2025-11-25 10:57:32 -05:00
+								// https://fetch.spec.whatwg.org/#convert-header-names-to-a-sorted-lowercase-set
-												LibWeb: Store HTTP methods and headers as ByteString

The spec declares these as a byte sequence, which we then implemented as
a ByteBuffer. This has become pretty awkward to deal with, as evidenced
by the plethora of `MUST(ByteBuffer::copy(...))` and `.bytes()` calls
everywhere inside Fetch. We would then treat the bytes as a string
anyways by wrapping them in StringView everywhere.

We now store these as a ByteString. This is more comfortable to deal
with, and we no longer need to continually copy underlying storage (as
ByteString is ref-counted).

This work is largely preparatory for an upcoming HTTP header refactor.

											
										
										
											2025-11-24 18:35:55 -05:00
+								Vector<ByteString> convert_header_names_to_a_sorted_lowercase_set(ReadonlySpan<ByteString> header_names)
-												LibWeb: Organize Fetch Headers.h/Headers.cpp a bit

Generally just define things in the order they are declared (will make a
change to use ByteString in this file a bit easier to follow). Also make
a couple of free functions be class methods on Header / HeaderList.

											
										
										
											2025-11-25 10:57:32 -05:00
+								{
 								    // 1. Let headerNamesSet be a new ordered set.
-												AK: Rename CaseInsensitiveStringTraits

To CaseInsensitiveASCIIStringTraits. This change indicates that these
traits are about ASCII-only insensitivity.

											
										
										
											2025-12-21 23:31:17 -06:00
+								    HashTable<StringView, CaseInsensitiveASCIIStringTraits> header_names_seen;
-												LibWeb: Store HTTP methods and headers as ByteString

The spec declares these as a byte sequence, which we then implemented as
a ByteBuffer. This has become pretty awkward to deal with, as evidenced
by the plethora of `MUST(ByteBuffer::copy(...))` and `.bytes()` calls
everywhere inside Fetch. We would then treat the bytes as a string
anyways by wrapping them in StringView everywhere.

We now store these as a ByteString. This is more comfortable to deal
with, and we no longer need to continually copy underlying storage (as
ByteString is ref-counted).

This work is largely preparatory for an upcoming HTTP header refactor.

											
										
										
											2025-11-24 18:35:55 -05:00
+								    Vector<ByteString> header_names_set;
-												LibWeb: Partially implement 'Extract header (list) values' AOs

The header-specific ABNF rules are completely ignored for now, but we
can at least extract a single header value, which at least works for
simple cases like `Location`-based redirects.

											
										
										
											2022-10-25 23:02:47 +01:00
-												LibWeb: Organize Fetch Headers.h/Headers.cpp a bit

Generally just define things in the order they are declared (will make a
change to use ByteString in this file a bit easier to follow). Also make
a couple of free functions be class methods on Header / HeaderList.

											
										
										
											2025-11-25 10:57:32 -05:00
+								    // 2. For each name of headerNames, append the result of byte-lowercasing name to headerNamesSet.
-												LibWeb: Store HTTP methods and headers as ByteString

The spec declares these as a byte sequence, which we then implemented as
a ByteBuffer. This has become pretty awkward to deal with, as evidenced
by the plethora of `MUST(ByteBuffer::copy(...))` and `.bytes()` calls
everywhere inside Fetch. We would then treat the bytes as a string
anyways by wrapping them in StringView everywhere.

We now store these as a ByteString. This is more comfortable to deal
with, and we no longer need to continually copy underlying storage (as
ByteString is ref-counted).

This work is largely preparatory for an upcoming HTTP header refactor.

											
										
										
											2025-11-24 18:35:55 -05:00
+								    for (auto const& name : header_names) {
-												LibWeb: Organize Fetch Headers.h/Headers.cpp a bit

Generally just define things in the order they are declared (will make a
change to use ByteString in this file a bit easier to follow). Also make
a couple of free functions be class methods on Header / HeaderList.

											
										
										
											2025-11-25 10:57:32 -05:00
+								        if (header_names_seen.contains(name))
 								            continue;
-												LibWeb: Store HTTP methods and headers as ByteString

The spec declares these as a byte sequence, which we then implemented as
a ByteBuffer. This has become pretty awkward to deal with, as evidenced
by the plethora of `MUST(ByteBuffer::copy(...))` and `.bytes()` calls
everywhere inside Fetch. We would then treat the bytes as a string
anyways by wrapping them in StringView everywhere.

We now store these as a ByteString. This is more comfortable to deal
with, and we no longer need to continually copy underlying storage (as
ByteString is ref-counted).

This work is largely preparatory for an upcoming HTTP header refactor.

											
										
										
											2025-11-24 18:35:55 -05:00
-												LibWeb: Organize Fetch Headers.h/Headers.cpp a bit

Generally just define things in the order they are declared (will make a
change to use ByteString in this file a bit easier to follow). Also make
a couple of free functions be class methods on Header / HeaderList.

											
										
										
											2025-11-25 10:57:32 -05:00
+								        header_names_seen.set(name);
-												LibWeb: Store HTTP methods and headers as ByteString

The spec declares these as a byte sequence, which we then implemented as
a ByteBuffer. This has become pretty awkward to deal with, as evidenced
by the plethora of `MUST(ByteBuffer::copy(...))` and `.bytes()` calls
everywhere inside Fetch. We would then treat the bytes as a string
anyways by wrapping them in StringView everywhere.

We now store these as a ByteString. This is more comfortable to deal
with, and we no longer need to continually copy underlying storage (as
ByteString is ref-counted).

This work is largely preparatory for an upcoming HTTP header refactor.

											
										
										
											2025-11-24 18:35:55 -05:00
+								        header_names_set.append(name.to_lowercase());
-												LibWeb: Partially implement 'Extract header (list) values' AOs

The header-specific ABNF rules are completely ignored for now, but we
can at least extract a single header value, which at least works for
simple cases like `Location`-based redirects.

											
										
										
											2022-10-25 23:02:47 +01:00
+								    }
-												LibWeb: Organize Fetch Headers.h/Headers.cpp a bit

Generally just define things in the order they are declared (will make a
change to use ByteString in this file a bit easier to follow). Also make
a couple of free functions be class methods on Header / HeaderList.

											
										
										
											2025-11-25 10:57:32 -05:00
+								    // 3. Return the result of sorting headerNamesSet in ascending order with byte less than.
-												LibWeb: Store HTTP methods and headers as ByteString

The spec declares these as a byte sequence, which we then implemented as
a ByteBuffer. This has become pretty awkward to deal with, as evidenced
by the plethora of `MUST(ByteBuffer::copy(...))` and `.bytes()` calls
everywhere inside Fetch. We would then treat the bytes as a string
anyways by wrapping them in StringView everywhere.

We now store these as a ByteString. This is more comfortable to deal
with, and we no longer need to continually copy underlying storage (as
ByteString is ref-counted).

This work is largely preparatory for an upcoming HTTP header refactor.

											
										
										
											2025-11-24 18:35:55 -05:00
+								    quick_sort(header_names_set);
 								    return header_names_set;
-												LibWeb: Partially implement 'Extract header (list) values' AOs

The header-specific ABNF rules are completely ignored for now, but we
can at least extract a single header value, which at least works for
simple cases like `Location`-based redirects.

											
										
										
											2022-10-25 23:02:47 +01:00
+								}
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
-												LibWeb/Fetch: Implement `build_content_range(start, end, full_length)`

											
										
										
											2024-11-18 17:20:33 -06:00
+								// https://fetch.spec.whatwg.org/#build-a-content-range
-												LibWeb: Simplify Fetch's build-content-range implementation

* Don't pass u64 by reference
* Don't double-format the range numbers

											
										
										
											2025-11-25 11:02:12 -05:00
+								ByteString build_content_range(u64 range_start, u64 range_end, u64 full_length)
-												LibWeb/Fetch: Implement `build_content_range(start, end, full_length)`

											
										
										
											2024-11-18 17:20:33 -06:00
+								{
 								    // 1. Let contentRange be `bytes `.
 								    // 2. Append rangeStart, serialized and isomorphic encoded, to contentRange.
 								    // 3. Append 0x2D (-) to contentRange.
 								    // 4. Append rangeEnd, serialized and isomorphic encoded to contentRange.
 								    // 5. Append 0x2F (/) to contentRange.
 								    // 6. Append fullLength, serialized and isomorphic encoded to contentRange.
 								    // 7. Return contentRange.
-												LibWeb: Simplify Fetch's build-content-range implementation

* Don't pass u64 by reference
* Don't double-format the range numbers

											
										
										
											2025-11-25 11:02:12 -05:00
+								    return ByteString::formatted("bytes {}-{}/{}", range_start, range_end, full_length);
-												LibWeb/Fetch: Implement `build_content_range(start, end, full_length)`

											
										
										
											2024-11-18 17:20:33 -06:00
+								}
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
+								// https://fetch.spec.whatwg.org/#simple-range-header-value
-												LibHTTP+LibWeb+RequestServer: Move Fetch's HTTP header infra to LibHTTP

The end goal here is for LibHTTP to be the home of our RFC 9111 (HTTP
caching) implementation. We currently have one implementation in LibWeb
for our in-memory cache and another in RequestServer for our disk cache.

The implementations both largely revolve around interacting with HTTP
headers. But in LibWeb, we are using Fetch's header infra, and in RS we
are using our home-grown header infra from LibHTTP.

So to give these a common denominator, this patch replaces the LibHTTP
implementation with Fetch's infra. Our existing LibHTTP implementation
was not particularly compliant with any spec, so this at least gives us
a standards-based common implementation.

This migration also required moving a handful of other Fetch AOs over
to LibHTTP. (It turns out these AOs were all from the Fetch/Infra/HTTP
folder, so perhaps it makes sense for LibHTTP to be the implementation
of that entire set of facilities.)

											
										
										
											2025-11-26 14:13:23 -05:00
+								Optional<RangeHeaderValue> parse_single_range_header_value(StringView value, bool allow_whitespace)
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
+								{
 								    // 1. Let data be the isomorphic decoding of value.
-												LibHTTP+LibWeb+RequestServer: Move Fetch's HTTP header infra to LibHTTP

The end goal here is for LibHTTP to be the home of our RFC 9111 (HTTP
caching) implementation. We currently have one implementation in LibWeb
for our in-memory cache and another in RequestServer for our disk cache.

The implementations both largely revolve around interacting with HTTP
headers. But in LibWeb, we are using Fetch's header infra, and in RS we
are using are home-grown header infra from LibHTTP.

So to give these a common denominator, this patch replaces the LibHTTP
implementation with Fetch's infra. Our existing LibHTTP implementation
was not particularly compliant with any spec, so this at least gives us
a standards-based common implementation.

This migration also required moving a handful of other Fetch AOs over
to LibHTTP. (It turns out these AOs were all from the Fetch/Infra/HTTP
folder, so perhaps it makes sense for LibHTTP to be the implementation
of that entire set of facilities.)

											
										
										
											2025-11-26 14:13:23 -05:00
+								    auto data = TextCodec::isomorphic_decode(value);
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
-												LibWeb/Fetch: Bring `parse_single_range_header_value()` up to spec

The previous implementation wasn't using the latest specification steps.

											
										
										
											2024-11-18 17:18:26 -06:00
+								    // 2. If data does not start with "bytes", then return failure.
 								    if (!data.starts_with_bytes("bytes"sv))
-												LibWeb/Fetch: Add support for parsing a single range header value

This is a change in the Fetch spec.

See:
- https://github.com/whatwg/fetch/commit/2d080d7
- https://github.com/whatwg/fetch/commit/a18fb3e

											
										
										
											2022-10-15 00:39:40 +02:00
+								        return {};
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
-												LibWeb/Fetch: Bring `parse_single_range_header_value()` up to spec

The previous implementation wasn't using the latest specification steps.

											
										
										
											2024-11-18 17:18:26 -06:00
+								    // 3. Let position be a position variable for data, initially pointing at the 5th code point of data.
-												LibWeb: Organize Fetch Headers.h/Headers.cpp a bit

Generally just define things in the order they are declared (will make a
change to use ByteString in this file a bit easier to follow). Also make
a couple of free functions be class methods on Header / HeaderList.

											
										
										
											2025-11-25 10:57:32 -05:00
+								    GenericLexer lexer { data };
-												LibWeb/Fetch: Bring `parse_single_range_header_value()` up to spec

The previous implementation wasn't using the latest specification steps.

											
										
										
											2024-11-18 17:18:26 -06:00
+								    lexer.ignore(5);
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
-												LibWeb/Fetch: Bring `parse_single_range_header_value()` up to spec

The previous implementation wasn't using the latest specification steps.

											
										
										
											2024-11-18 17:18:26 -06:00
+								    // 4. If allowWhitespace is true, collect a sequence of code points that are HTTP tab or space, from data given position.
 								    if (allow_whitespace)
 								        lexer.consume_while(is_http_tab_or_space);
 								    // 5. If the code point at position within data is not U+003D (=), then return failure.
 								    // 6. Advance position by 1.
 								    if (!lexer.consume_specific('='))
 								        return {};
 								    // 7. If allowWhitespace is true, collect a sequence of code points that are HTTP tab or space, from data given position.
 								    if (allow_whitespace)
 								        lexer.consume_while(is_http_tab_or_space);
 								    // 8. Let rangeStart be the result of collecting a sequence of code points that are ASCII digits, from data given position.
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
+								    auto range_start = lexer.consume_while(is_ascii_digit);
-												LibHTTP+LibWeb+RequestServer: Move Fetch's HTTP header infra to LibHTTP

The end goal here is for LibHTTP to be the home of our RFC 9111 (HTTP
caching) implementation. We currently have one implementation in LibWeb
for our in-memory cache and another in RequestServer for our disk cache.

The implementations both largely revolve around interacting with HTTP
headers. But in LibWeb, we are using Fetch's header infra, and in RS we
are using are home-grown header infra from LibHTTP.

So to give these a common denominator, this patch replaces the LibHTTP
implementation with Fetch's infra. Our existing LibHTTP implementation
was not particularly compliant with any spec, so this at least gives us
a standards-based common implementation.

This migration also required moving a handful of other Fetch AOs over
to LibHTTP. (It turns out these AOs were all from the Fetch/Infra/HTTP
folder, so perhaps it makes sense for LibHTTP to be the implementation
of that entire set of facilities.)

											
										
										
											2025-11-26 14:13:23 -05:00
+								    // 9. Let rangeStartValue be rangeStart, interpreted as decimal number, if rangeStart is not the empty string;
 								    //    otherwise null.
-												Everywhere: Use to_number<T> instead of to_{int,uint,float,double}

In a bunch of cases, this actually ends up simplifying the code as
to_number will handle something such as:

```
Optional<I> opt;
if constexpr (IsSigned<I>)
    opt = view.to_int<I>();
else
    opt = view.to_uint<I>();
```

For us.

The main goal here however is to have a single generic number conversion
API between all of the String classes.

											
										
										
											2023-12-23 15:59:14 +13:00
+								    auto range_start_value = range_start.to_number<u64>();
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
-												LibWeb/Fetch: Bring `parse_single_range_header_value()` up to spec

The previous implementation wasn't using the latest specification steps.

											
										
										
											2024-11-18 17:18:26 -06:00
+								    // 10. If allowWhitespace is true, collect a sequence of code points that are HTTP tab or space, from data given position.
 								    if (allow_whitespace)
 								        lexer.consume_while(is_http_tab_or_space);
 								    // 11. If the code point at position within data is not U+002D (-), then return failure.
 								    // 12. Advance position by 1.
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
+								    if (!lexer.consume_specific('-'))
-												LibWeb/Fetch: Add support for parsing a single range header value

This is a change in the Fetch spec.

See:
- https://github.com/whatwg/fetch/commit/2d080d7
- https://github.com/whatwg/fetch/commit/a18fb3e

											
										
										
											2022-10-15 00:39:40 +02:00
+								        return {};
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
-												LibWeb/Fetch: Bring `parse_single_range_header_value()` up to spec

The previous implementation wasn't using the latest specification steps.

											
										
										
											2024-11-18 17:18:26 -06:00
+								    // 13. If allowWhitespace is true, collect a sequence of code points that are HTTP tab or space, from data given position.
 								    if (allow_whitespace)
 								        lexer.consume_while(is_http_tab_or_space);
 								    // 14. Let rangeEnd be the result of collecting a sequence of code points that are ASCII digits, from data given position.
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
+								    auto range_end = lexer.consume_while(is_ascii_digit);
-												LibWeb/Fetch: Bring `parse_single_range_header_value()` up to spec

The previous implementation wasn't using the latest specification steps.

											
										
										
											2024-11-18 17:18:26 -06:00
+								    // 15. Let rangeEndValue be rangeEnd, interpreted as decimal number, if rangeEnd is not the empty string; otherwise null.
-												Everywhere: Use to_number<T> instead of to_{int,uint,float,double}

In a bunch of cases, this actually ends up simplifying the code as
to_number will handle something such as:

```
Optional<I> opt;
if constexpr (IsSigned<I>)
    opt = view.to_int<I>();
else
    opt = view.to_uint<I>();
```

For us.

The main goal here however is to have a single generic number conversion
API between all of the String classes.

											
										
										
											2023-12-23 15:59:14 +13:00
+								    auto range_end_value = range_end.to_number<u64>();
-												LibWeb/Fetch: Add support for parsing a single range header value

This is a change in the Fetch spec.

See:
- https://github.com/whatwg/fetch/commit/2d080d7
- https://github.com/whatwg/fetch/commit/a18fb3e

											
										
										
											2022-10-15 00:39:40 +02:00
-												LibWeb/Fetch: Bring `parse_single_range_header_value()` up to spec

The previous implementation wasn't using the latest specification steps.

											
										
										
											2024-11-18 17:18:26 -06:00
+								    // 16. If position is not past the end of data, then return failure.
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
+								    if (!lexer.is_eof())
-												LibWeb/Fetch: Add support for parsing a single range header value

This is a change in the Fetch spec.

See:
- https://github.com/whatwg/fetch/commit/2d080d7
- https://github.com/whatwg/fetch/commit/a18fb3e

											
										
										
											2022-10-15 00:39:40 +02:00
+								        return {};
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
-												LibWeb/Fetch: Bring `parse_single_range_header_value()` up to spec

The previous implementation wasn't using the latest specification steps.

											
										
										
											2024-11-18 17:18:26 -06:00
+								    // 17. If rangeEndValue and rangeStartValue are null, then return failure.
-												LibWeb/Fetch: Add support for parsing a single range header value

This is a change in the Fetch spec.

See:
- https://github.com/whatwg/fetch/commit/2d080d7
- https://github.com/whatwg/fetch/commit/a18fb3e

											
										
										
											2022-10-15 00:39:40 +02:00
+								    if (!range_end_value.has_value() && !range_start_value.has_value())
 								        return {};
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
-												LibHTTP+LibWeb+RequestServer: Move Fetch's HTTP header infra to LibHTTP

The end goal here is for LibHTTP to be the home of our RFC 9111 (HTTP
caching) implementation. We currently have one implementation in LibWeb
for our in-memory cache and another in RequestServer for our disk cache.

The implementations both largely revolve around interacting with HTTP
headers. But in LibWeb, we are using Fetch's header infra, and in RS we
are using are home-grown header infra from LibHTTP.

So to give these a common denominator, this patch replaces the LibHTTP
implementation with Fetch's infra. Our existing LibHTTP implementation
was not particularly compliant with any spec, so this at least gives us
a standards-based common implementation.

This migration also required moving a handful of other Fetch AOs over
to LibHTTP. (It turns out these AOs were all from the Fetch/Infra/HTTP
folder, so perhaps it makes sense for LibHTTP to be the implementation
of that entire set of facilities.)

											
										
										
											2025-11-26 14:13:23 -05:00
+								    // 18. If rangeStartValue and rangeEndValue are numbers, and rangeStartValue is greater than rangeEndValue, then
 								    //     return failure.
-												LibWeb/Fetch: Add support for parsing a single range header value

This is a change in the Fetch spec.

See:
- https://github.com/whatwg/fetch/commit/2d080d7
- https://github.com/whatwg/fetch/commit/a18fb3e

											
										
										
											2022-10-15 00:39:40 +02:00
+								    if (range_start_value.has_value() && range_end_value.has_value() && *range_start_value > *range_end_value)
 								        return {};
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
-												LibWeb/Fetch: Bring `parse_single_range_header_value()` up to spec

The previous implementation wasn't using the latest specification steps.

											
										
										
											2024-11-18 17:18:26 -06:00
+								    // 19. Return (rangeStartValue, rangeEndValue).
-												LibHTTP+LibWeb+RequestServer: Move Fetch's HTTP header infra to LibHTTP

The end goal here is for LibHTTP to be the home of our RFC 9111 (HTTP
caching) implementation. We currently have one implementation in LibWeb
for our in-memory cache and another in RequestServer for our disk cache.

The implementations both largely revolve around interacting with HTTP
headers. But in LibWeb, we are using Fetch's header infra, and in RS we
are using are home-grown header infra from LibHTTP.

So to give these a common denominator, this patch replaces the LibHTTP
implementation with Fetch's infra. Our existing LibHTTP implementation
was not particularly compliant with any spec, so this at least gives us
a standards-based common implementation.

This migration also required moving a handful of other Fetch AOs over
to LibHTTP. (It turns out these AOs were all from the Fetch/Infra/HTTP
folder, so perhaps it makes sense for LibHTTP to be the implementation
of that entire set of facilities.)

											
										
										
											2025-11-26 14:13:23 -05:00
+								    return RangeHeaderValue { range_start_value, range_end_value };
 								}
 								}
 								namespace IPC {
 								template<>
 								ErrorOr<void> encode(Encoder& encoder, HTTP::Header const& header)
 								{
 								    TRY(encoder.encode(header.name));
 								    TRY(encoder.encode(header.value));
 								    return {};
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
+								}
-												LibHTTP+LibWeb+RequestServer: Move Fetch's HTTP header infra to LibHTTP

The end goal here is for LibHTTP to be the home of our RFC 9111 (HTTP
caching) implementation. We currently have one implementation in LibWeb
for our in-memory cache and another in RequestServer for our disk cache.

The implementations both largely revolve around interacting with HTTP
headers. But in LibWeb, we are using Fetch's header infra, and in RS we
are using our home-grown header infra from LibHTTP.

So to give these a common denominator, this patch replaces the LibHTTP
implementation with Fetch's infra. Our existing LibHTTP implementation
was not particularly compliant with any spec, so this at least gives us
a standards-based common implementation.

This migration also required moving a handful of other Fetch AOs over
to LibHTTP. (It turns out these AOs were all from the Fetch/Infra/HTTP
folder, so perhaps it makes sense for LibHTTP to be the implementation
of that entire set of facilities.)

											
										
										
											2025-11-26 14:13:23 -05:00
+								template<>
 								ErrorOr<HTTP::Header> decode(Decoder& decoder)
-												LibWeb: Implement 'Default `User-Agent` value' AO

											
										
										
											2022-10-24 09:23:18 +01:00
+								{
-												LibHTTP+LibWeb+RequestServer: Move Fetch's HTTP header infra to LibHTTP

The end goal here is for LibHTTP to be the home of our RFC 9111 (HTTP
caching) implementation. We currently have one implementation in LibWeb
for our in-memory cache and another in RequestServer for our disk cache.

The implementations both largely revolve around interacting with HTTP
headers. But in LibWeb, we are using Fetch's header infra, and in RS we
are using our home-grown header infra from LibHTTP.

So to give these a common denominator, this patch replaces the LibHTTP
implementation with Fetch's infra. Our existing LibHTTP implementation
was not particularly compliant with any spec, so this at least gives us
a standards-based common implementation.

This migration also required moving a handful of other Fetch AOs over
to LibHTTP. (It turns out these AOs were all from the Fetch/Infra/HTTP
folder, so perhaps it makes sense for LibHTTP to be the implementation
of that entire set of facilities.)

											
										
										
											2025-11-26 14:13:23 -05:00
+								    auto name = TRY(decoder.decode<ByteString>());
 								    auto value = TRY(decoder.decode<ByteString>());
 								    return HTTP::Header { move(name), move(value) };
-												LibWeb: Implement 'Default `User-Agent` value' AO

											
										
										
											2022-10-24 09:23:18 +01:00
+								}
-												LibWeb: Add definitions from '2.2.2. Headers' in the Fetch spec

											
										
										
											2022-07-11 21:42:14 +01:00
+								}