ladybird/Libraries/LibJS/Runtime/VM.h
Luke Wilde 3d43462ccd LibJS: Implement the Dynamic Code Brand Checks stage 3 proposal
This is an active proposal at stage 3 of the TC39 proposal process.
See: https://tc39.es/proposal-dynamic-code-brand-checks/
See: https://github.com/tc39/proposal-dynamic-code-brand-checks

This proposal essentially adds support for the TrustedScript type from
the Trusted Types specification to eval and Function. This in turn
pipes support for the type into the CSP hook to check if the CSP allows
dynamic code compilation.

However, it currently doesn't support ShadowRealms, so the
implementation here is a close approximation, using PerformEval as the
basis.
See: https://github.com/tc39/proposal-dynamic-code-brand-checks/issues/19

This is required to support the new function signature for the CSP
hook, and will allow us to slot in Trusted Types support in the future.
2025-07-09 15:52:54 -06:00

380 lines
14 KiB
C++

/*
* Copyright (c) 2020-2023, Andreas Kling <andreas@ladybird.org>
* Copyright (c) 2020-2023, Linus Groh <linusg@serenityos.org>
* Copyright (c) 2021-2022, David Tuin <davidot@serenityos.org>
* Copyright (c) 2023, networkException <networkexception@serenityos.org>
*
* SPDX-License-Identifier: BSD-2-Clause
*/
#pragma once
#include <AK/FlyString.h>
#include <AK/Function.h>
#include <AK/HashMap.h>
#include <AK/RefCounted.h>
#include <AK/StackInfo.h>
#include <AK/Variant.h>
#include <LibCrypto/Forward.h>
#include <LibGC/Function.h>
#include <LibGC/Heap.h>
#include <LibGC/RootVector.h>
#include <LibJS/CyclicModule.h>
#include <LibJS/ModuleLoading.h>
#include <LibJS/Runtime/Agent.h>
#include <LibJS/Runtime/CommonPropertyNames.h>
#include <LibJS/Runtime/Completion.h>
#include <LibJS/Runtime/Error.h>
#include <LibJS/Runtime/ErrorTypes.h>
#include <LibJS/Runtime/ExecutionContext.h>
#include <LibJS/Runtime/Promise.h>
#include <LibJS/Runtime/Value.h>
namespace JS {
class Identifier;
struct BindingPattern;
enum class HandledByHost {
Handled,
Unhandled,
};
enum class EvalMode {
Direct,
Indirect
};
enum class CompilationType {
DirectEval,
IndirectEval,
Function,
};
class JS_API VM : public RefCounted<VM> {
public:
static NonnullRefPtr<VM> create();
~VM();
GC::Heap& heap() { return m_heap; }
GC::Heap const& heap() const { return m_heap; }
Bytecode::Interpreter& bytecode_interpreter() { return *m_bytecode_interpreter; }
void dump_backtrace() const;
void gather_roots(HashMap<GC::Cell*, GC::HeapRoot>&);
#define __JS_ENUMERATE(SymbolName, snake_name) \
GC::Ref<Symbol> well_known_symbol_##snake_name() const \
{ \
return *m_well_known_symbols.snake_name; \
}
JS_ENUMERATE_WELL_KNOWN_SYMBOLS
#undef __JS_ENUMERATE
HashMap<String, GC::Ptr<PrimitiveString>>& string_cache()
{
return m_string_cache;
}
HashMap<Utf16String, GC::Ptr<PrimitiveString>>& utf16_string_cache()
{
return m_utf16_string_cache;
}
PrimitiveString& empty_string() { return *m_empty_string; }
PrimitiveString& single_ascii_character_string(u8 character)
{
VERIFY(character < 0x80);
return *m_single_ascii_character_strings[character];
}
// This represents the list of errors from ErrorTypes.h whose messages are used in contexts which
// must not fail to allocate when they are used. For example, we cannot allocate when we raise an
// out-of-memory error, thus we pre-allocate that error string at VM creation time.
enum class ErrorMessage {
OutOfMemory,
// Keep this last:
__Count,
};
String const& error_message(ErrorMessage) const;
bool did_reach_stack_space_limit() const
{
#if defined(AK_OS_MACOS) && defined(HAS_ADDRESS_SANITIZER)
// We hit stack limits sooner on macOS 14 arm64 with ASAN enabled.
return m_stack_info.size_free() < 96 * KiB;
#else
return m_stack_info.size_free() < 32 * KiB;
#endif
}
// TODO: Rename this function instead of providing a second argument, now that the global object is no longer passed in.
struct CheckStackSpaceLimitTag { };
ThrowCompletionOr<void> push_execution_context(ExecutionContext& context, CheckStackSpaceLimitTag)
{
// Ensure we got some stack space left, so the next function call doesn't kill us.
if (did_reach_stack_space_limit()) [[unlikely]] {
return throw_completion<InternalError>(ErrorType::CallStackSizeExceeded);
}
m_execution_context_stack.append(&context);
return {};
}
void push_execution_context(ExecutionContext& context)
{
m_execution_context_stack.append(&context);
}
void pop_execution_context()
{
m_execution_context_stack.take_last();
}
// https://tc39.es/ecma262/#running-execution-context
// At any point in time, there is at most one execution context per agent that is actually executing code.
// This is known as the agent's running execution context.
ExecutionContext& running_execution_context()
{
VERIFY(!m_execution_context_stack.is_empty());
return *m_execution_context_stack.last();
}
ExecutionContext const& running_execution_context() const
{
VERIFY(!m_execution_context_stack.is_empty());
return *m_execution_context_stack.last();
}
// https://tc39.es/ecma262/#execution-context-stack
// The execution context stack is used to track execution contexts.
Vector<ExecutionContext*> const& execution_context_stack() const { return m_execution_context_stack; }
Vector<ExecutionContext*>& execution_context_stack() { return m_execution_context_stack; }
Environment const* lexical_environment() const { return running_execution_context().lexical_environment; }
Environment* lexical_environment() { return running_execution_context().lexical_environment; }
Environment const* variable_environment() const { return running_execution_context().variable_environment; }
Environment* variable_environment() { return running_execution_context().variable_environment; }
// https://tc39.es/ecma262/#current-realm
// The value of the Realm component of the running execution context is also called the current Realm Record.
Realm const* current_realm() const { return running_execution_context().realm; }
Realm* current_realm() { return running_execution_context().realm; }
// https://tc39.es/ecma262/#active-function-object
// The value of the Function component of the running execution context is also called the active function object.
FunctionObject const* active_function_object() const { return running_execution_context().function; }
FunctionObject* active_function_object() { return running_execution_context().function; }
bool in_strict_mode() const
{
return running_execution_context().is_strict_mode;
}
size_t argument_count() const
{
return running_execution_context().arguments.size();
}
Value argument(size_t index) const
{
return running_execution_context().argument(index);
}
Value this_value() const
{
return running_execution_context().this_value.value();
}
ThrowCompletionOr<Value> resolve_this_binding();
StackInfo const& stack_info() const { return m_stack_info; }
HashMap<String, GC::Ref<Symbol>> const& global_symbol_registry() const { return m_global_symbol_registry; }
HashMap<String, GC::Ref<Symbol>>& global_symbol_registry() { return m_global_symbol_registry; }
u32 execution_generation() const { return m_execution_generation; }
void finish_execution_generation() { ++m_execution_generation; }
ThrowCompletionOr<Reference> resolve_binding(FlyString const&, Environment* = nullptr);
ThrowCompletionOr<Reference> get_identifier_reference(Environment*, FlyString, bool strict, size_t hops = 0);
// 5.2.3.2 Throw an Exception, https://tc39.es/ecma262/#sec-throw-an-exception
template<typename T, typename... Args>
Completion throw_completion(Args&&... args)
{
auto& realm = *current_realm();
auto completion = T::create(realm, forward<Args>(args)...);
return JS::throw_completion(completion);
}
template<typename T>
Completion throw_completion(ErrorType type)
{
return throw_completion<T>(String::from_utf8_without_validation(type.message().bytes()));
}
template<typename T, typename... Args>
Completion throw_completion(ErrorType type, Args&&... args)
{
return throw_completion<T>(MUST(String::formatted(type.message(), forward<Args>(args)...)));
}
Value get_new_target();
Object* get_import_meta();
Object& get_global_object();
CommonPropertyNames names;
struct {
GC::Ptr<PrimitiveString> number;
GC::Ptr<PrimitiveString> undefined;
GC::Ptr<PrimitiveString> object;
GC::Ptr<PrimitiveString> string;
GC::Ptr<PrimitiveString> symbol;
GC::Ptr<PrimitiveString> boolean;
GC::Ptr<PrimitiveString> bigint;
GC::Ptr<PrimitiveString> function;
GC::Ptr<PrimitiveString> object_Object;
} cached_strings;
void run_queued_promise_jobs()
{
if (m_promise_jobs.is_empty())
return;
run_queued_promise_jobs_impl();
}
void enqueue_promise_job(GC::Ref<GC::Function<ThrowCompletionOr<Value>()>> job, Realm*);
void run_queued_finalization_registry_cleanup_jobs();
void enqueue_finalization_registry_cleanup_job(FinalizationRegistry&);
void promise_rejection_tracker(Promise&, Promise::RejectionOperation) const;
Function<void(Promise&)> on_promise_unhandled_rejection;
Function<void(Promise&)> on_promise_rejection_handled;
Function<void(Object const&, PropertyKey const&)> on_unimplemented_property_access;
void set_agent(OwnPtr<Agent> agent) { m_agent = move(agent); }
Agent* agent() { return m_agent; }
Agent const* agent() const { return m_agent; }
void save_execution_context_stack();
void clear_execution_context_stack();
void restore_execution_context_stack();
// Do not call this method unless you are sure this is the only and first module to be loaded in this vm.
ThrowCompletionOr<void> link_and_eval_module(Badge<Bytecode::Interpreter>, SourceTextModule& module);
ScriptOrModule get_active_script_or_module() const;
// 16.2.1.10 HostLoadImportedModule ( referrer, moduleRequest, hostDefined, payload ), https://tc39.es/ecma262/#sec-HostLoadImportedModule
Function<void(ImportedModuleReferrer, ModuleRequest const&, GC::Ptr<GraphLoadingState::HostDefined>, ImportedModulePayload)> host_load_imported_module;
Function<HashMap<PropertyKey, Value>(SourceTextModule&)> host_get_import_meta_properties;
Function<void(Object*, SourceTextModule const&)> host_finalize_import_meta;
Function<Vector<String>()> host_get_supported_import_attributes;
void set_dynamic_imports_allowed(bool value) { m_dynamic_imports_allowed = value; }
Function<void(Promise&, Promise::RejectionOperation)> host_promise_rejection_tracker;
Function<ThrowCompletionOr<Value>(JobCallback&, Value, ReadonlySpan<Value>)> host_call_job_callback;
Function<void(FinalizationRegistry&)> host_enqueue_finalization_registry_cleanup_job;
Function<void(GC::Ref<GC::Function<ThrowCompletionOr<Value>()>>, Realm*)> host_enqueue_promise_job;
Function<GC::Ref<JobCallback>(FunctionObject&)> host_make_job_callback;
Function<GC::Ptr<PrimitiveString>(Object const&)> host_get_code_for_eval;
Function<ThrowCompletionOr<void>(Realm&, ReadonlySpan<String>, StringView, StringView, CompilationType, ReadonlySpan<Value>, Value)> host_ensure_can_compile_strings;
Function<ThrowCompletionOr<void>(Object&)> host_ensure_can_add_private_element;
Function<ThrowCompletionOr<HandledByHost>(ArrayBuffer&, size_t)> host_resize_array_buffer;
Function<void(StringView)> host_unrecognized_date_string;
Function<ThrowCompletionOr<void>(Realm&, NonnullOwnPtr<ExecutionContext>, ShadowRealm&)> host_initialize_shadow_realm;
Function<Crypto::SignedBigInteger(Object const& global)> host_system_utc_epoch_nanoseconds;
Vector<StackTraceElement> stack_trace() const;
private:
using ErrorMessages = AK::Array<String, to_underlying(ErrorMessage::__Count)>;
struct WellKnownSymbols {
#define __JS_ENUMERATE(SymbolName, snake_name) \
GC::Ptr<Symbol> snake_name;
JS_ENUMERATE_WELL_KNOWN_SYMBOLS
#undef __JS_ENUMERATE
};
explicit VM(ErrorMessages);
void load_imported_module(ImportedModuleReferrer, ModuleRequest const&, GC::Ptr<GraphLoadingState::HostDefined>, ImportedModulePayload);
ThrowCompletionOr<void> link_and_eval_module(CyclicModule&);
void set_well_known_symbols(WellKnownSymbols well_known_symbols) { m_well_known_symbols = move(well_known_symbols); }
void run_queued_promise_jobs_impl();
HashMap<String, GC::Ptr<PrimitiveString>> m_string_cache;
HashMap<Utf16String, GC::Ptr<PrimitiveString>> m_utf16_string_cache;
GC::Heap m_heap;
Vector<ExecutionContext*> m_execution_context_stack;
Vector<Vector<ExecutionContext*>> m_saved_execution_context_stacks;
StackInfo m_stack_info;
// GlobalSymbolRegistry, https://tc39.es/ecma262/#table-globalsymbolregistry-record-fields
HashMap<String, GC::Ref<Symbol>> m_global_symbol_registry;
Vector<GC::Ref<GC::Function<ThrowCompletionOr<Value>()>>> m_promise_jobs;
Vector<GC::Ptr<FinalizationRegistry>> m_finalization_registry_cleanup_jobs;
GC::Ptr<PrimitiveString> m_empty_string;
GC::Ptr<PrimitiveString> m_single_ascii_character_strings[128] {};
ErrorMessages m_error_messages;
struct StoredModule {
ImportedModuleReferrer referrer;
ByteString filename;
String type;
GC::Root<Module> module;
bool has_once_started_linking { false };
};
StoredModule* get_stored_module(ImportedModuleReferrer const& script_or_module, ByteString const& filename, String const& type);
Vector<StoredModule> m_loaded_modules;
WellKnownSymbols m_well_known_symbols;
u32 m_execution_generation { 0 };
OwnPtr<Agent> m_agent;
OwnPtr<Bytecode::Interpreter> m_bytecode_interpreter;
bool m_dynamic_imports_allowed { false };
};
template<typename GlobalObjectType, typename... Args>
[[nodiscard]] static NonnullOwnPtr<ExecutionContext> create_simple_execution_context(VM& vm, Args&&... args)
{
auto root_execution_context = MUST(Realm::initialize_host_defined_realm(
vm,
[&](Realm& realm_) -> GlobalObject* {
return vm.heap().allocate<GlobalObjectType>(realm_, forward<Args>(args)...);
},
nullptr));
return root_execution_context;
}
}