ladybird/Libraries/LibJS/Bytecode/Executable.cpp
Andreas Kling bc4379983f LibJS: Improve bytecode executable dump format
Add a metadata header showing register count, block count, local
variable names, and the constants table. Resolve jump targets to
block labels (e.g. "block1") instead of raw hex addresses, and add
visual separation between basic blocks.

Make identifier and property key formatting more concise by using
backtick quoting and showing base_identifier as a trailing
parenthetical hint that joins the base and property names.

Generate a stable name for each executable by hashing the source
text it covers (stable across codegen changes). Named functions
show as "foo$9beb91ec", anonymous ones as "$43362f3f". Also show
the source filename, line, and column.
2026-03-20 00:51:23 -05:00

360 lines
13 KiB
C++

/*
* Copyright (c) 2021-2025, Andreas Kling <andreas@ladybird.org>
*
* SPDX-License-Identifier: BSD-2-Clause
*/
#include <AK/BinarySearch.h>
#include <LibJS/Bytecode/BasicBlock.h>
#include <LibJS/Bytecode/Executable.h>
#include <LibJS/Bytecode/FormatOperand.h>
#include <LibJS/Bytecode/Instruction.h>
#include <LibJS/Bytecode/Op.h>
#include <LibJS/Bytecode/RegexTable.h>
#include <LibJS/Runtime/Array.h>
#include <LibJS/Runtime/SharedFunctionInstanceData.h>
#include <LibJS/Runtime/Value.h>
#include <LibJS/SourceCode.h>
namespace JS::Bytecode {
GC_DEFINE_ALLOCATOR(Executable);
Executable::Executable(
Vector<u8> bytecode,
NonnullOwnPtr<IdentifierTable> identifier_table,
NonnullOwnPtr<PropertyKeyTable> property_key_table,
NonnullOwnPtr<StringTable> string_table,
NonnullOwnPtr<RegexTable> regex_table,
Vector<Value> constants,
NonnullRefPtr<SourceCode const> source_code,
size_t number_of_property_lookup_caches,
size_t number_of_global_variable_caches,
size_t number_of_template_object_caches,
size_t number_of_object_shape_caches,
size_t number_of_registers,
Strict strict)
: GC::WeakContainer(heap())
, bytecode(move(bytecode))
, string_table(move(string_table))
, identifier_table(move(identifier_table))
, property_key_table(move(property_key_table))
, regex_table(move(regex_table))
, constants(move(constants))
, source_code(move(source_code))
, number_of_registers(number_of_registers)
, is_strict_mode(strict == Strict::Yes)
{
property_lookup_caches.resize(number_of_property_lookup_caches);
global_variable_caches.resize(number_of_global_variable_caches);
template_object_caches.resize(number_of_template_object_caches);
object_shape_caches.resize(number_of_object_shape_caches);
}
Executable::~Executable() = default;
void Executable::fixup_cache_pointers()
{
for (auto it = InstructionStreamIterator(bytecode); !it.at_end(); ++it) {
fixup_instruction_cache(
const_cast<Instruction&>(*it),
property_lookup_caches.span(),
global_variable_caches.span(),
template_object_caches.span(),
object_shape_caches.span());
}
}
static void dump_header(StringBuilder& output, Executable const& executable, bool use_color)
{
auto const white_bold = use_color ? "\033[37;1m"sv : ""sv;
auto const reset = use_color ? "\033[0m"sv : ""sv;
// Generate a stable hash from the source text for identification.
// We hash source code rather than bytecode so the ID is stable
// across changes to bytecode generation.
// Find the overall source range covered by this executable.
u32 source_start = NumericLimits<u32>::max();
u32 source_end = 0;
for (auto const& entry : executable.source_map) {
if (entry.source_record.source_start_offset < entry.source_record.source_end_offset) {
source_start = min(source_start, entry.source_record.source_start_offset);
source_end = max(source_end, entry.source_record.source_end_offset);
}
}
u32 hash = 2166136261u; // FNV-1a offset basis
auto code_view = executable.source_code->code_view();
for (auto i = source_start; i < source_end && i < code_view.length_in_code_units(); ++i) {
auto code_unit = code_view.code_unit_at(i);
hash ^= code_unit & 0xFF;
hash *= 16777619u;
hash ^= (code_unit >> 8) & 0xFF;
hash *= 16777619u;
}
if (executable.name.is_empty())
output.appendff("{}${:08x}{}", white_bold, hash, reset);
else
output.appendff("{}{}${:08x}{}", white_bold, executable.name, hash, reset);
// Show source location if available.
if (source_start < source_end) {
auto range = executable.source_code->range_from_offsets(source_start, source_end);
auto filename = executable.source_code->filename();
if (!filename.is_empty()) {
// Show just the basename to keep output portable across machines.
auto last_slash = filename.bytes_as_string_view().find_last('/');
if (last_slash.has_value())
filename = MUST(filename.substring_from_byte_offset(last_slash.value() + 1));
output.appendff(" {}:{}:{}", filename, range.start.line, range.start.column);
} else {
output.appendff(" line {}, column {}", range.start.line, range.start.column);
}
}
output.append('\n');
}
static void dump_metadata(StringBuilder& output, Executable const& executable, bool use_color)
{
auto const green = use_color ? "\033[32m"sv : ""sv;
auto const yellow = use_color ? "\033[33m"sv : ""sv;
auto const blue = use_color ? "\033[34m"sv : ""sv;
auto const cyan = use_color ? "\033[36m"sv : ""sv;
auto const reset = use_color ? "\033[0m"sv : ""sv;
output.appendff(" {}Registers{}: {}\n", green, reset, executable.number_of_registers);
output.appendff(" {}Blocks{}: {}\n", green, reset, executable.basic_block_start_offsets.size());
if (!executable.local_variable_names.is_empty()) {
output.appendff(" {}Locals{}: ", green, reset);
for (size_t i = 0; i < executable.local_variable_names.size(); ++i) {
if (i != 0)
output.append(", "sv);
output.appendff("{}{}~{}{}", blue, executable.local_variable_names[i].name, i, reset);
}
output.append('\n');
}
if (!executable.constants.is_empty()) {
output.appendff(" {}Constants{}:\n", green, reset);
for (size_t i = 0; i < executable.constants.size(); ++i) {
auto value = executable.constants[i];
output.append(" "sv);
output.appendff("{}[{}]{} = ", yellow, i, reset);
output.append(cyan);
if (value.is_special_empty_value())
output.append("<Empty>"sv);
else if (value.is_boolean())
output.appendff("Bool({})", value.as_bool() ? "true"sv : "false"sv);
else if (value.is_int32())
output.appendff("Int32({})", value.as_i32());
else if (value.is_double())
output.appendff("Double({})", value.as_double());
else if (value.is_bigint())
output.appendff("BigInt({})", MUST(value.as_bigint().to_string()));
else if (value.is_string())
output.appendff("String(\"{}\")", value.as_string().utf8_string_view());
else if (value.is_undefined())
output.append("Undefined"sv);
else if (value.is_null())
output.append("Null"sv);
else
output.appendff("Value({})", value);
output.append(reset);
output.append('\n');
}
}
}
static void dump_bytecode(StringBuilder& output, Executable const& executable, bool use_color)
{
auto const magenta = use_color ? "\033[35;1m"sv : ""sv;
auto const reset = use_color ? "\033[0m"sv : ""sv;
InstructionStreamIterator it(executable.bytecode, &executable);
size_t basic_block_offset_index = 0;
while (!it.at_end()) {
if (basic_block_offset_index < executable.basic_block_start_offsets.size()
&& it.offset() == executable.basic_block_start_offsets[basic_block_offset_index]) {
if (basic_block_offset_index > 0)
output.append('\n');
output.appendff("{}block{}{}:\n", magenta, basic_block_offset_index, reset);
++basic_block_offset_index;
}
output.appendff(" [{:4x}] {}\n", it.offset(), (*it).to_byte_string(executable));
++it;
}
}
void Executable::dump() const
{
StringBuilder output;
dump_header(output, *this, true);
dump_metadata(output, *this, true);
output.append('\n');
dump_bytecode(output, *this, true);
if (!exception_handlers.is_empty()) {
output.append("\nException handlers:\n"sv);
for (auto const& handler : exception_handlers) {
output.appendff(" [{:4x} .. {:4x}] => handler ", handler.start_offset, handler.end_offset);
Label handler_label(static_cast<u32>(handler.handler_offset));
output.appendff("{}\n", format_label(""sv, handler_label, *this));
}
}
output.append('\n');
warnln("{}", output.string_view());
}
String Executable::dump_to_string() const
{
StringBuilder output;
dump_header(output, *this, false);
dump_metadata(output, *this, false);
output.append('\n');
dump_bytecode(output, *this, false);
if (!exception_handlers.is_empty()) {
output.append("\nException handlers:\n"sv);
for (auto const& handler : exception_handlers) {
output.appendff(" [{:4x} .. {:4x}] => handler ", handler.start_offset, handler.end_offset);
Label handler_label(static_cast<u32>(handler.handler_offset));
output.appendff("{}\n", format_label(""sv, handler_label, *this));
}
}
return output.to_string_without_validation();
}
void Executable::visit_edges(Visitor& visitor)
{
Base::visit_edges(visitor);
visitor.visit(constants);
for (auto& cache : template_object_caches)
visitor.visit(cache.cached_template_object);
for (auto& data : shared_function_data)
visitor.visit(data);
for (auto& blueprint : class_blueprints) {
for (auto& element : blueprint.elements) {
if (element.literal_value.has_value() && element.literal_value->is_cell())
visitor.visit(element.literal_value->as_cell());
}
}
property_key_table->visit_edges(visitor);
}
static Vector<PropertyLookupCache*>& static_property_lookup_caches()
{
static Vector<PropertyLookupCache*> caches;
return caches;
}
StaticPropertyLookupCache::StaticPropertyLookupCache()
{
static_property_lookup_caches().append(this);
}
static void clear_cache_entry_if_dead(PropertyLookupCache::Entry& entry)
{
if (entry.from_shape && entry.from_shape->state() != Cell::State::Live)
entry.from_shape = nullptr;
if (entry.shape && entry.shape->state() != Cell::State::Live)
entry.shape = nullptr;
if (entry.prototype && entry.prototype->state() != Cell::State::Live)
entry.prototype = nullptr;
if (entry.prototype_chain_validity && entry.prototype_chain_validity->state() != Cell::State::Live)
entry.prototype_chain_validity = nullptr;
}
void StaticPropertyLookupCache::sweep_all()
{
for (auto* cache : static_property_lookup_caches()) {
for (auto& entry : cache->entries)
clear_cache_entry_if_dead(entry);
}
}
void Executable::remove_dead_cells(Badge<GC::Heap>)
{
for (auto& cache : property_lookup_caches) {
for (auto& entry : cache.entries)
clear_cache_entry_if_dead(entry);
}
for (auto& cache : global_variable_caches) {
for (auto& entry : cache.entries)
clear_cache_entry_if_dead(entry);
}
for (auto& cache : object_shape_caches) {
if (cache.shape && cache.shape->state() != Cell::State::Live)
cache.shape = nullptr;
}
}
Optional<Executable::ExceptionHandlers const&> Executable::exception_handlers_for_offset(size_t offset) const
{
// NB: exception_handlers is sorted by start_offset.
auto* entry = binary_search(exception_handlers, offset, nullptr, [](size_t needle, ExceptionHandlers const& entry) -> int {
if (needle < entry.start_offset)
return -1;
if (needle >= entry.end_offset)
return 1;
return 0;
});
if (!entry)
return {};
return *entry;
}
UnrealizedSourceRange Executable::source_range_at(size_t offset) const
{
if (offset >= bytecode.size())
return {};
auto it = InstructionStreamIterator(bytecode.span().slice(offset), this);
VERIFY(!it.at_end());
auto* entry = binary_search(source_map, offset, nullptr, [](size_t needle, SourceMapEntry const& entry) -> int {
if (needle < entry.bytecode_offset)
return -1;
if (needle > entry.bytecode_offset)
return 1;
return 0;
});
if (!entry)
return {};
return UnrealizedSourceRange {
.source_code = source_code,
.start_offset = entry->source_record.source_start_offset,
.end_offset = entry->source_record.source_end_offset,
};
}
SourceRange const& Executable::get_source_range(u32 program_counter)
{
return m_source_range_cache.ensure(program_counter, [&] {
auto unrealized = source_range_at(program_counter);
if (unrealized.source_code)
return unrealized.realize();
static SourceRange dummy { SourceCode::create({}, {}), {}, {} };
return dummy;
});
}
Operand Executable::original_operand_from_raw(u32 raw) const
{
// NB: Layout is [registers | locals | constants | arguments]
if (raw < number_of_registers)
return Operand { Operand::Type::Register, raw };
if (raw < registers_and_locals_count)
return Operand { Operand::Type::Local, raw - local_index_base };
if (raw < argument_index_base)
return Operand { Operand::Type::Constant, raw - registers_and_locals_count };
return Operand { Operand::Type::Argument, raw - argument_index_base };
}
}