// Copyright 2017 the V8 project authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.

#include "src/wasm/module-compiler.h"

#include <algorithm>
#include <memory>
#include <queue>

#include "src/api/api-inl.h"
#include "src/base/enum-set.h"
#include "src/base/optional.h"
#include "src/base/platform/mutex.h"
#include "src/base/platform/semaphore.h"
#include "src/base/platform/time.h"
#include "src/codegen/compiler.h"
#include "src/compiler/wasm-compiler.h"
#include "src/debug/debug.h"
#include "src/handles/global-handles-inl.h"
#include "src/logging/counters-scopes.h"
#include "src/logging/metrics.h"
#include "src/tracing/trace-event.h"
#include "src/wasm/code-space-access.h"
#include "src/wasm/module-decoder.h"
#include "src/wasm/pgo.h"
#include "src/wasm/std-object-sizes.h"
#include "src/wasm/streaming-decoder.h"
#include "src/wasm/wasm-code-manager.h"
#include "src/wasm/wasm-engine.h"
#include "src/wasm/wasm-import-wrapper-cache.h"
#include "src/wasm/wasm-js.h"
#include "src/wasm/wasm-limits.h"
#include "src/wasm/wasm-objects-inl.h"
#include "src/wasm/wasm-result.h"
#include "src/wasm/wasm-serialization.h"

#define TRACE_COMPILE(...)                                 \
  do {                                                     \
    if (v8_flags.trace_wasm_compiler) PrintF(__VA_ARGS__); \
  } while (false)

#define TRACE_STREAMING(...)                                \
  do {                                                      \
    if (v8_flags.trace_wasm_streaming) PrintF(__VA_ARGS__); \
  } while (false)

#define TRACE_LAZY(...)                                            \
  do {                                                             \
    if (v8_flags.trace_wasm_lazy_compilation) PrintF(__VA_ARGS__); \
  } while (false)

namespace v8 {
namespace internal {
namespace wasm {

namespace {

enum class CompileStrategy : uint8_t {
  // Compiles functions on first use. In this case, execution will block until
  // the function's baseline is reached and top tier compilation starts in
  // background (if applicable).
  // Lazy compilation can help to reduce startup time and code size at the risk
  // of blocking execution.
  kLazy,
  // Compiles baseline ahead of execution and starts top tier compilation in
  // background (if applicable).
  kEager,
  // Triggers baseline compilation on first use (just like {kLazy}) with the
  // difference that top tier compilation is started eagerly.
  // This strategy can help to reduce startup time at the risk of blocking
  // execution, but only in its early phase (until top tier compilation
  // finishes).
  kLazyBaselineEagerTopTier,
  // Marker for default strategy.
  kDefault = kEager,
};

class CompilationStateImpl;
class CompilationUnitBuilder;

class V8_NODISCARD BackgroundCompileScope {
 public:
  explicit BackgroundCompileScope(std::weak_ptr<NativeModule> native_module)
      : native_module_(native_module.lock()) {}

  NativeModule* native_module() const {
    DCHECK(native_module_);
    return native_module_.get();
  }
  inline CompilationStateImpl* compilation_state() const;

  bool cancelled() const;

 private:
  // Keep the native module alive while in this scope.
  std::shared_ptr<NativeModule> native_module_;
};

enum CompilationTier { kBaseline = 0, kTopTier = 1, kNumTiers = kTopTier + 1 };

// A set of work-stealing queues (vectors of units). Each background compile
// task owns one of the queues and steals from all others once its own queue
// runs empty.
class CompilationUnitQueues {
 public:
  // Public API for QueueImpl.
  struct Queue {
    bool ShouldPublish(int num_processed_units) const;
  };

  explicit CompilationUnitQueues(int num_declared_functions)
      : num_declared_functions_(num_declared_functions) {
    // Add one first queue, to add units to.
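    // Further queues are created lazily in {GetQueueForTask} as compile tasks
    // show up; starting with one queue ensures {AddUnits} always has a queue
    // to append to.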
queues_.emplace_back(std::make_unique(0)); #if !defined(__cpp_lib_atomic_value_initialization) || \ __cpp_lib_atomic_value_initialization < 201911L for (auto& atomic_counter : num_units_) { std::atomic_init(&atomic_counter, size_t{0}); } #endif top_tier_compiled_ = std::make_unique[]>(num_declared_functions); #if !defined(__cpp_lib_atomic_value_initialization) || \ __cpp_lib_atomic_value_initialization < 201911L for (int i = 0; i < num_declared_functions; i++) { std::atomic_init(&top_tier_compiled_.get()[i], false); } #endif } Queue* GetQueueForTask(int task_id) { int required_queues = task_id + 1; { base::SharedMutexGuard queues_guard{&queues_mutex_}; if (V8_LIKELY(static_cast(queues_.size()) >= required_queues)) { return queues_[task_id].get(); } } // Otherwise increase the number of queues. base::SharedMutexGuard queues_guard{&queues_mutex_}; int num_queues = static_cast(queues_.size()); while (num_queues < required_queues) { int steal_from = num_queues + 1; queues_.emplace_back(std::make_unique(steal_from)); ++num_queues; } // Update the {publish_limit}s of all queues. // We want background threads to publish regularly (to avoid contention when // they are all publishing at the end). On the other side, each publishing // has some overhead (part of it for synchronizing between threads), so it // should not happen *too* often. Thus aim for 4-8 publishes per thread, but // distribute it such that publishing is likely to happen at different // times. int units_per_thread = num_declared_functions_ / num_queues; int min = std::max(10, units_per_thread / 8); int queue_id = 0; for (auto& queue : queues_) { // Set a limit between {min} and {2*min}, but not smaller than {10}. int limit = min + (min * queue_id / num_queues); queue->publish_limit.store(limit, std::memory_order_relaxed); ++queue_id; } return queues_[task_id].get(); } base::Optional GetNextUnit(Queue* queue, CompilationTier tier) { DCHECK_LT(tier, CompilationTier::kNumTiers); if (auto unit = GetNextUnitOfTier(queue, tier)) { size_t old_units_count = num_units_[tier].fetch_sub(1, std::memory_order_relaxed); DCHECK_LE(1, old_units_count); USE(old_units_count); return unit; } return {}; } void AddUnits(base::Vector baseline_units, base::Vector top_tier_units, const WasmModule* module) { DCHECK_LT(0, baseline_units.size() + top_tier_units.size()); // Add to the individual queues in a round-robin fashion. No special care is // taken to balance them; they will be balanced by work stealing. QueueImpl* queue; { int queue_to_add = next_queue_to_add.load(std::memory_order_relaxed); base::SharedMutexGuard queues_guard{&queues_mutex_}; while (!next_queue_to_add.compare_exchange_weak( queue_to_add, next_task_id(queue_to_add, queues_.size()), std::memory_order_relaxed)) { // Retry with updated {queue_to_add}. 
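        // On failure, {compare_exchange_weak} reloads the current value into
        // {queue_to_add}, so each retry advances the round-robin index based
        // on the latest value; spurious failures merely cause one more
        // (harmless) iteration.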
} queue = queues_[queue_to_add].get(); } base::MutexGuard guard(&queue->mutex); base::Optional big_units_guard; for (auto pair : {std::make_pair(CompilationTier::kBaseline, baseline_units), std::make_pair(CompilationTier::kTopTier, top_tier_units)}) { int tier = pair.first; base::Vector units = pair.second; if (units.empty()) continue; num_units_[tier].fetch_add(units.size(), std::memory_order_relaxed); for (WasmCompilationUnit unit : units) { size_t func_size = module->functions[unit.func_index()].code.length(); if (func_size <= kBigUnitsLimit) { queue->units[tier].push_back(unit); } else { if (!big_units_guard) { big_units_guard.emplace(&big_units_queue_.mutex); } big_units_queue_.has_units[tier].store(true, std::memory_order_relaxed); big_units_queue_.units[tier].emplace(func_size, unit); } } } } void AddTopTierPriorityUnit(WasmCompilationUnit unit, size_t priority) { base::SharedMutexGuard queues_guard{&queues_mutex_}; // Add to the individual queues in a round-robin fashion. No special care is // taken to balance them; they will be balanced by work stealing. // Priorities should only be seen as a hint here; without balancing, we // might pop a unit with lower priority from one queue while other queues // still hold higher-priority units. // Since updating priorities in a std::priority_queue is difficult, we just // add new units with higher priorities, and use the // {CompilationUnitQueues::top_tier_compiled_} array to discard units for // functions which are already being compiled. int queue_to_add = next_queue_to_add.load(std::memory_order_relaxed); while (!next_queue_to_add.compare_exchange_weak( queue_to_add, next_task_id(queue_to_add, queues_.size()), std::memory_order_relaxed)) { // Retry with updated {queue_to_add}. } { auto* queue = queues_[queue_to_add].get(); base::MutexGuard guard(&queue->mutex); queue->top_tier_priority_units.emplace(priority, unit); num_priority_units_.fetch_add(1, std::memory_order_relaxed); num_units_[CompilationTier::kTopTier].fetch_add( 1, std::memory_order_relaxed); } } // Get the current number of units in the queue for |tier|. This is only a // momentary snapshot, it's not guaranteed that {GetNextUnit} returns a unit // if this method returns non-zero. size_t GetSizeForTier(CompilationTier tier) const { DCHECK_LT(tier, CompilationTier::kNumTiers); return num_units_[tier].load(std::memory_order_relaxed); } void AllowAnotherTopTierJob(uint32_t func_index) { top_tier_compiled_[func_index].store(false, std::memory_order_relaxed); } void AllowAnotherTopTierJobForAllFunctions() { for (int i = 0; i < num_declared_functions_; i++) { AllowAnotherTopTierJob(i); } } size_t EstimateCurrentMemoryConsumption() const; private: // Functions bigger than {kBigUnitsLimit} will be compiled first, in ascending // order of their function body size. 
static constexpr size_t kBigUnitsLimit = 4096; struct BigUnit { BigUnit(size_t func_size, WasmCompilationUnit unit) : func_size{func_size}, unit(unit) {} size_t func_size; WasmCompilationUnit unit; bool operator<(const BigUnit& other) const { return func_size < other.func_size; } }; struct TopTierPriorityUnit { TopTierPriorityUnit(int priority, WasmCompilationUnit unit) : priority(priority), unit(unit) {} size_t priority; WasmCompilationUnit unit; bool operator<(const TopTierPriorityUnit& other) const { return priority < other.priority; } }; struct BigUnitsQueue { BigUnitsQueue() { #if !defined(__cpp_lib_atomic_value_initialization) || \ __cpp_lib_atomic_value_initialization < 201911L for (auto& atomic : has_units) std::atomic_init(&atomic, false); #endif } mutable base::Mutex mutex; // Can be read concurrently to check whether any elements are in the queue. std::atomic has_units[CompilationTier::kNumTiers]; // Protected by {mutex}: std::priority_queue units[CompilationTier::kNumTiers]; }; struct QueueImpl : public Queue { explicit QueueImpl(int next_steal_task_id) : next_steal_task_id(next_steal_task_id) {} // Number of units after which the task processing this queue should publish // compilation results. Updated (reduced, using relaxed ordering) when new // queues are allocated. If there is only one thread running, we can delay // publishing arbitrarily. std::atomic publish_limit{kMaxInt}; base::Mutex mutex; // All fields below are protected by {mutex}. std::vector units[CompilationTier::kNumTiers]; std::priority_queue top_tier_priority_units; int next_steal_task_id; }; int next_task_id(int task_id, size_t num_queues) const { int next = task_id + 1; return next == static_cast(num_queues) ? 0 : next; } base::Optional GetNextUnitOfTier(Queue* public_queue, int tier) { QueueImpl* queue = static_cast(public_queue); // First check whether there is a priority unit. Execute that first. if (tier == CompilationTier::kTopTier) { if (auto unit = GetTopTierPriorityUnit(queue)) { return unit; } } // Then check whether there is a big unit of that tier. if (auto unit = GetBigUnitOfTier(tier)) return unit; // Finally check whether our own queue has a unit of the wanted tier. If // so, return it, otherwise get the task id to steal from. int steal_task_id; { base::MutexGuard mutex_guard(&queue->mutex); if (!queue->units[tier].empty()) { auto unit = queue->units[tier].back(); queue->units[tier].pop_back(); return unit; } steal_task_id = queue->next_steal_task_id; } // Try to steal from all other queues. If this succeeds, return one of the // stolen units. { base::SharedMutexGuard guard{&queues_mutex_}; for (size_t steal_trials = 0; steal_trials < queues_.size(); ++steal_trials, ++steal_task_id) { if (steal_task_id >= static_cast(queues_.size())) { steal_task_id = 0; } if (auto unit = StealUnitsAndGetFirst(queue, steal_task_id, tier)) { return unit; } } } // If we reach here, we didn't find any unit of the requested tier. return {}; } base::Optional GetBigUnitOfTier(int tier) { // Fast path without locking. 
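    // A relaxed read of {has_units} can race with a concurrent insertion;
    // missing a just-added big unit is benign, because the caller falls
    // through to the regular and steal queues and the big unit is picked up
    // by a later call.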
if (!big_units_queue_.has_units[tier].load(std::memory_order_relaxed)) { return {}; } base::MutexGuard guard(&big_units_queue_.mutex); if (big_units_queue_.units[tier].empty()) return {}; WasmCompilationUnit unit = big_units_queue_.units[tier].top().unit; big_units_queue_.units[tier].pop(); if (big_units_queue_.units[tier].empty()) { big_units_queue_.has_units[tier].store(false, std::memory_order_relaxed); } return unit; } base::Optional GetTopTierPriorityUnit(QueueImpl* queue) { // Fast path without locking. if (num_priority_units_.load(std::memory_order_relaxed) == 0) { return {}; } int steal_task_id; { base::MutexGuard mutex_guard(&queue->mutex); while (!queue->top_tier_priority_units.empty()) { auto unit = queue->top_tier_priority_units.top().unit; queue->top_tier_priority_units.pop(); num_priority_units_.fetch_sub(1, std::memory_order_relaxed); if (!top_tier_compiled_[unit.func_index()].exchange( true, std::memory_order_relaxed)) { return unit; } num_units_[CompilationTier::kTopTier].fetch_sub( 1, std::memory_order_relaxed); } steal_task_id = queue->next_steal_task_id; } // Try to steal from all other queues. If this succeeds, return one of the // stolen units. { base::SharedMutexGuard guard{&queues_mutex_}; for (size_t steal_trials = 0; steal_trials < queues_.size(); ++steal_trials, ++steal_task_id) { if (steal_task_id >= static_cast(queues_.size())) { steal_task_id = 0; } if (auto unit = StealTopTierPriorityUnit(queue, steal_task_id)) { return unit; } } } return {}; } // Steal units of {wanted_tier} from {steal_from_task_id} to {queue}. Return // first stolen unit (rest put in queue of {task_id}), or {nullopt} if // {steal_from_task_id} had no units of {wanted_tier}. // Hold a shared lock on {queues_mutex_} when calling this method. base::Optional StealUnitsAndGetFirst( QueueImpl* queue, int steal_from_task_id, int wanted_tier) { auto* steal_queue = queues_[steal_from_task_id].get(); // Cannot steal from own queue. if (steal_queue == queue) return {}; std::vector stolen; base::Optional returned_unit; { base::MutexGuard guard(&steal_queue->mutex); auto* steal_from_vector = &steal_queue->units[wanted_tier]; if (steal_from_vector->empty()) return {}; size_t remaining = steal_from_vector->size() / 2; auto steal_begin = steal_from_vector->begin() + remaining; returned_unit = *steal_begin; stolen.assign(steal_begin + 1, steal_from_vector->end()); steal_from_vector->erase(steal_begin, steal_from_vector->end()); } base::MutexGuard guard(&queue->mutex); auto* target_queue = &queue->units[wanted_tier]; target_queue->insert(target_queue->end(), stolen.begin(), stolen.end()); queue->next_steal_task_id = steal_from_task_id + 1; return returned_unit; } // Steal one priority unit from {steal_from_task_id} to {task_id}. Return // stolen unit, or {nullopt} if {steal_from_task_id} had no priority units. // Hold a shared lock on {queues_mutex_} when calling this method. base::Optional StealTopTierPriorityUnit( QueueImpl* queue, int steal_from_task_id) { auto* steal_queue = queues_[steal_from_task_id].get(); // Cannot steal from own queue. 
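    // Unlike {StealUnitsAndGetFirst}, which moves half of the victim's vector
    // in one go, priority units are stolen one at a time; units whose function
    // already has a top-tier job in flight (see {top_tier_compiled_}) are
    // discarded rather than returned.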
    if (steal_queue == queue) return {};
    base::Optional<WasmCompilationUnit> returned_unit;
    {
      base::MutexGuard guard(&steal_queue->mutex);
      while (true) {
        if (steal_queue->top_tier_priority_units.empty()) return {};

        auto unit = steal_queue->top_tier_priority_units.top().unit;
        steal_queue->top_tier_priority_units.pop();
        num_priority_units_.fetch_sub(1, std::memory_order_relaxed);

        if (!top_tier_compiled_[unit.func_index()].exchange(
                true, std::memory_order_relaxed)) {
          returned_unit = unit;
          break;
        }
        num_units_[CompilationTier::kTopTier].fetch_sub(
            1, std::memory_order_relaxed);
      }
    }
    base::MutexGuard guard(&queue->mutex);
    queue->next_steal_task_id = steal_from_task_id + 1;
    return returned_unit;
  }

  // {queues_mutex_} protects {queues_}.
  mutable base::SharedMutex queues_mutex_;
  std::vector<std::unique_ptr<QueueImpl>> queues_;

  const int num_declared_functions_;

  BigUnitsQueue big_units_queue_;

  std::atomic<size_t> num_units_[CompilationTier::kNumTiers];
  std::atomic<size_t> num_priority_units_{0};
  std::unique_ptr<std::atomic<bool>[]> top_tier_compiled_;
  std::atomic<int> next_queue_to_add{0};
};

size_t CompilationUnitQueues::EstimateCurrentMemoryConsumption() const {
  UPDATE_WHEN_CLASS_CHANGES(CompilationUnitQueues, 248);
  UPDATE_WHEN_CLASS_CHANGES(QueueImpl, 144);
  UPDATE_WHEN_CLASS_CHANGES(BigUnitsQueue, 120);
  // Not including sizeof(CompilationUnitQueues) because that's included in
  // sizeof(CompilationStateImpl).
  size_t result = 0;
  {
    base::SharedMutexGuard<base::kShared> lock(&queues_mutex_);
    result += ContentSize(queues_) + queues_.size() * sizeof(QueueImpl);
    for (const auto& q : queues_) {
      result += ContentSize(*q->units);
      result += q->top_tier_priority_units.size() * sizeof(TopTierPriorityUnit);
    }
  }
  {
    base::MutexGuard lock(&big_units_queue_.mutex);
    result += big_units_queue_.units[0].size() * sizeof(BigUnit);
    result += big_units_queue_.units[1].size() * sizeof(BigUnit);
  }
  // For {top_tier_compiled_}.
  result += sizeof(std::atomic<bool>) * num_declared_functions_;
  return result;
}

bool CompilationUnitQueues::Queue::ShouldPublish(
    int num_processed_units) const {
  auto* queue = static_cast<const QueueImpl*>(this);
  return num_processed_units >=
         queue->publish_limit.load(std::memory_order_relaxed);
}

// The {CompilationStateImpl} keeps track of the compilation state of the
// owning NativeModule, i.e. which functions are left to be compiled.
// It contains a task manager to allow parallel and asynchronous background
// compilation of functions.
// Its public interface {CompilationState} lives in compilation-environment.h.
class CompilationStateImpl {
 public:
  CompilationStateImpl(const std::shared_ptr<NativeModule>& native_module,
                       std::shared_ptr<Counters> async_counters,
                       DynamicTiering dynamic_tiering);
  ~CompilationStateImpl() {
    if (js_to_wasm_wrapper_job_ && js_to_wasm_wrapper_job_->IsValid())
      js_to_wasm_wrapper_job_->CancelAndDetach();
    if (baseline_compile_job_->IsValid())
      baseline_compile_job_->CancelAndDetach();
    if (top_tier_compile_job_->IsValid())
      top_tier_compile_job_->CancelAndDetach();
  }

  // Call right after the constructor, after the {compilation_state_} field in
  // the {NativeModule} has been initialized.
  void InitCompileJob();

  // {kCancelUnconditionally}: Cancel all compilation.
  // {kCancelInitialCompilation}: Cancel all compilation if initial (baseline)
  // compilation is not finished yet.
  enum CancellationPolicy { kCancelUnconditionally, kCancelInitialCompilation };
  void CancelCompilation(CancellationPolicy);

  bool cancelled() const;

  // Apply a compilation hint to the initial compilation progress, updating all
  // internal fields accordingly.
void ApplyCompilationHintToInitialProgress(const WasmCompilationHint& hint, size_t hint_idx); // Use PGO information to choose a better initial compilation progress // (tiering decisions). void ApplyPgoInfoToInitialProgress(ProfileInformation* pgo_info); // Apply PGO information to a fully initialized compilation state. Also // trigger compilation as needed. void ApplyPgoInfoLate(ProfileInformation* pgo_info); // Initialize compilation progress. Set compilation tiers to expect for // baseline and top tier compilation. Must be set before // {CommitCompilationUnits} is invoked which triggers background compilation. void InitializeCompilationProgress(int num_import_wrappers, int num_export_wrappers, ProfileInformation* pgo_info); void InitializeCompilationProgressAfterDeserialization( base::Vector lazy_functions, base::Vector eager_functions); // Initializes compilation units based on the information encoded in the // {compilation_progress_}. void InitializeCompilationUnits( std::unique_ptr builder); // Adds compilation units for another function to the // {CompilationUnitBuilder}. This function is the streaming compilation // equivalent to {InitializeCompilationUnits}. void AddCompilationUnit(CompilationUnitBuilder* builder, int func_index); // Add the callback to be called on compilation events. Needs to be // set before {CommitCompilationUnits} is run to ensure that it receives all // events. The callback object must support being deleted from any thread. void AddCallback(std::unique_ptr callback); // Inserts new functions to compile and kicks off compilation. void CommitCompilationUnits( base::Vector baseline_units, base::Vector top_tier_units, base::Vector> js_to_wasm_wrapper_units); void CommitTopTierCompilationUnit(WasmCompilationUnit); void AddTopTierPriorityCompilationUnit(WasmCompilationUnit, size_t); CompilationUnitQueues::Queue* GetQueueForCompileTask(int task_id); base::Optional GetNextCompilationUnit( CompilationUnitQueues::Queue*, CompilationTier tier); std::shared_ptr GetJSToWasmWrapperCompilationUnit(size_t index); void FinalizeJSToWasmWrappers(Isolate* isolate, const WasmModule* module); void OnFinishedUnits(base::Vector); void OnFinishedJSToWasmWrapperUnits(); void OnCompilationStopped(WasmFeatures detected); void PublishDetectedFeatures(Isolate*); void SchedulePublishCompilationResults( std::vector> unpublished_code, CompilationTier tier); size_t NumOutstandingCompilations(CompilationTier tier) const; void SetError(); void WaitForCompilationEvent(CompilationEvent event); void TierUpAllFunctions(); void AllowAnotherTopTierJob(uint32_t func_index) { compilation_unit_queues_.AllowAnotherTopTierJob(func_index); } void AllowAnotherTopTierJobForAllFunctions() { compilation_unit_queues_.AllowAnotherTopTierJobForAllFunctions(); } bool failed() const { return compile_failed_.load(std::memory_order_relaxed); } bool baseline_compilation_finished() const { base::MutexGuard guard(&callbacks_mutex_); return outstanding_baseline_units_ == 0 && !has_outstanding_export_wrappers_; } DynamicTiering dynamic_tiering() const { return dynamic_tiering_; } Counters* counters() const { return async_counters_.get(); } void SetWireBytesStorage( std::shared_ptr wire_bytes_storage) { base::MutexGuard guard(&mutex_); wire_bytes_storage_ = std::move(wire_bytes_storage); } std::shared_ptr GetWireBytesStorage() const { base::MutexGuard guard(&mutex_); DCHECK_NOT_NULL(wire_bytes_storage_); return wire_bytes_storage_; } void set_compilation_id(int compilation_id) { DCHECK_EQ(compilation_id_, 
kInvalidCompilationID); compilation_id_ = compilation_id; } std::weak_ptr const native_module_weak() const { return native_module_weak_; } size_t EstimateCurrentMemoryConsumption() const; private: void AddCompilationUnitInternal(CompilationUnitBuilder* builder, int function_index, uint8_t function_progress); // Trigger callbacks according to the internal counters below // (outstanding_...). // Hold the {callbacks_mutex_} when calling this method. void TriggerCallbacks(); void PublishCompilationResults( std::vector> unpublished_code); void PublishCode(base::Vector> codes); NativeModule* const native_module_; std::weak_ptr const native_module_weak_; const std::shared_ptr async_counters_; // Compilation error, atomically updated. This flag can be updated and read // using relaxed semantics. std::atomic compile_failed_{false}; // True if compilation was cancelled and worker threads should return. This // flag can be updated and read using relaxed semantics. std::atomic compile_cancelled_{false}; CompilationUnitQueues compilation_unit_queues_; // Wrapper compilation units are stored in shared_ptrs so that they are kept // alive by the tasks even if the NativeModule dies. std::vector> js_to_wasm_wrapper_units_; // Cache the dynamic tiering configuration to be consistent for the whole // compilation. const DynamicTiering dynamic_tiering_; // This mutex protects all information of this {CompilationStateImpl} which is // being accessed concurrently. mutable base::Mutex mutex_; // The compile job handles, initialized right after construction of // {CompilationStateImpl}. std::unique_ptr js_to_wasm_wrapper_job_; std::unique_ptr baseline_compile_job_; std::unique_ptr top_tier_compile_job_; // The compilation id to identify trace events linked to this compilation. static constexpr int kInvalidCompilationID = -1; int compilation_id_ = kInvalidCompilationID; ////////////////////////////////////////////////////////////////////////////// // Protected by {mutex_}: // Features detected to be used in this module. Features can be detected // as a module is being compiled. WasmFeatures detected_features_ = WasmFeatures::None(); // Abstraction over the storage of the wire bytes. Held in a shared_ptr so // that background compilation jobs can keep the storage alive while // compiling. std::shared_ptr wire_bytes_storage_; // End of fields protected by {mutex_}. ////////////////////////////////////////////////////////////////////////////// // This mutex protects the callbacks vector, and the counters used to // determine which callbacks to call. The counters plus the callbacks // themselves need to be synchronized to ensure correct order of events. mutable base::Mutex callbacks_mutex_; ////////////////////////////////////////////////////////////////////////////// // Protected by {callbacks_mutex_}: // Callbacks to be called on compilation events. std::vector> callbacks_; // Events that already happened. base::EnumSet finished_events_; int outstanding_baseline_units_ = 0; bool has_outstanding_export_wrappers_ = false; // The amount of generated top tier code since the last // {kFinishedCompilationChunk} event. size_t bytes_since_last_chunk_ = 0; std::vector compilation_progress_; // End of fields protected by {callbacks_mutex_}. ////////////////////////////////////////////////////////////////////////////// struct PublishState { // {mutex_} protects {publish_queue_} and {publisher_running_}. 
base::Mutex mutex_; std::vector> publish_queue_; bool publisher_running_ = false; }; PublishState publish_state_[CompilationTier::kNumTiers]; // Encoding of fields in the {compilation_progress_} vector. using RequiredBaselineTierField = base::BitField8; using RequiredTopTierField = base::BitField8; using ReachedTierField = base::BitField8; }; CompilationStateImpl* Impl(CompilationState* compilation_state) { return reinterpret_cast(compilation_state); } const CompilationStateImpl* Impl(const CompilationState* compilation_state) { return reinterpret_cast(compilation_state); } CompilationStateImpl* BackgroundCompileScope::compilation_state() const { DCHECK(native_module_); return Impl(native_module_->compilation_state()); } size_t CompilationStateImpl::EstimateCurrentMemoryConsumption() const { UPDATE_WHEN_CLASS_CHANGES(CompilationStateImpl, 704); UPDATE_WHEN_CLASS_CHANGES(JSToWasmWrapperCompilationUnit, 40); size_t result = sizeof(CompilationStateImpl); result += compilation_unit_queues_.EstimateCurrentMemoryConsumption(); result += ContentSize(js_to_wasm_wrapper_units_); result += js_to_wasm_wrapper_units_.size() * (sizeof(JSToWasmWrapperCompilationUnit) + sizeof(TurbofanCompilationJob)); { base::MutexGuard lock(&callbacks_mutex_); result += ContentSize(callbacks_); // Concrete subclasses of CompilationEventCallback will be bigger, but we // can't know that here. result += callbacks_.size() * sizeof(CompilationEventCallback); result += ContentSize(compilation_progress_); } if (v8_flags.trace_wasm_offheap_memory) { PrintF("CompilationStateImpl: %zu\n", result); } return result; } bool BackgroundCompileScope::cancelled() const { return native_module_ == nullptr || Impl(native_module_->compilation_state())->cancelled(); } void UpdateFeatureUseCounts(Isolate* isolate, WasmFeatures detected) { using Feature = v8::Isolate::UseCounterFeature; constexpr static std::pair kUseCounters[] = { {kFeature_reftypes, Feature::kWasmRefTypes}, {kFeature_simd, Feature::kWasmSimdOpcodes}, {kFeature_threads, Feature::kWasmThreadOpcodes}, {kFeature_eh, Feature::kWasmExceptionHandling}, {kFeature_memory64, Feature::kWasmMemory64}, {kFeature_multi_memory, Feature::kWasmMultiMemory}, {kFeature_gc, Feature::kWasmGC}}; for (auto& feature : kUseCounters) { if (detected.contains(feature.first)) isolate->CountUsage(feature.second); } } } // namespace ////////////////////////////////////////////////////// // PIMPL implementation of {CompilationState}. 
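// The public {CompilationState} carries no state of its own: {Impl} simply
// reinterpret_casts it to the private {CompilationStateImpl}, {New} allocates
// a {CompilationStateImpl} and casts it back, and the destructor forwards
// explicitly so that the impl object is destroyed correctly.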
CompilationState::~CompilationState() { Impl(this)->~CompilationStateImpl(); }

void CompilationState::InitCompileJob() { Impl(this)->InitCompileJob(); }

void CompilationState::CancelCompilation() {
  Impl(this)->CancelCompilation(CompilationStateImpl::kCancelUnconditionally);
}

void CompilationState::CancelInitialCompilation() {
  Impl(this)->CancelCompilation(
      CompilationStateImpl::kCancelInitialCompilation);
}

void CompilationState::SetError() { Impl(this)->SetError(); }

void CompilationState::SetWireBytesStorage(
    std::shared_ptr<WireBytesStorage> wire_bytes_storage) {
  Impl(this)->SetWireBytesStorage(std::move(wire_bytes_storage));
}

std::shared_ptr<WireBytesStorage> CompilationState::GetWireBytesStorage()
    const {
  return Impl(this)->GetWireBytesStorage();
}

void CompilationState::AddCallback(
    std::unique_ptr<CompilationEventCallback> callback) {
  return Impl(this)->AddCallback(std::move(callback));
}

void CompilationState::TierUpAllFunctions() {
  Impl(this)->TierUpAllFunctions();
}

void CompilationState::AllowAnotherTopTierJob(uint32_t func_index) {
  Impl(this)->AllowAnotherTopTierJob(func_index);
}

void CompilationState::AllowAnotherTopTierJobForAllFunctions() {
  Impl(this)->AllowAnotherTopTierJobForAllFunctions();
}

void CompilationState::InitializeAfterDeserialization(
    base::Vector<const int> lazy_functions,
    base::Vector<const int> eager_functions) {
  Impl(this)->InitializeCompilationProgressAfterDeserialization(
      lazy_functions, eager_functions);
}

bool CompilationState::failed() const { return Impl(this)->failed(); }

bool CompilationState::baseline_compilation_finished() const {
  return Impl(this)->baseline_compilation_finished();
}

void CompilationState::set_compilation_id(int compilation_id) {
  Impl(this)->set_compilation_id(compilation_id);
}

DynamicTiering CompilationState::dynamic_tiering() const {
  return Impl(this)->dynamic_tiering();
}

size_t CompilationState::EstimateCurrentMemoryConsumption() const {
  return Impl(this)->EstimateCurrentMemoryConsumption();
}

// static
std::unique_ptr<CompilationState> CompilationState::New(
    const std::shared_ptr<NativeModule>& native_module,
    std::shared_ptr<Counters> async_counters,
    DynamicTiering dynamic_tiering) {
  return std::unique_ptr<CompilationState>(reinterpret_cast<CompilationState*>(
      new CompilationStateImpl(std::move(native_module),
                               std::move(async_counters), dynamic_tiering)));
}

// End of PIMPL implementation of {CompilationState}.
////////////////////////////////////////////////////// namespace { ExecutionTier ApplyHintToExecutionTier(WasmCompilationHintTier hint, ExecutionTier default_tier) { switch (hint) { case WasmCompilationHintTier::kDefault: return default_tier; case WasmCompilationHintTier::kBaseline: return ExecutionTier::kLiftoff; case WasmCompilationHintTier::kOptimized: return ExecutionTier::kTurbofan; } UNREACHABLE(); } const WasmCompilationHint* GetCompilationHint(const WasmModule* module, uint32_t func_index) { DCHECK_LE(module->num_imported_functions, func_index); uint32_t hint_index = declared_function_index(module, func_index); const std::vector& compilation_hints = module->compilation_hints; if (hint_index < compilation_hints.size()) { return &compilation_hints[hint_index]; } return nullptr; } CompileStrategy GetCompileStrategy(const WasmModule* module, WasmFeatures enabled_features, uint32_t func_index, bool lazy_module) { if (lazy_module) return CompileStrategy::kLazy; if (!enabled_features.has_compilation_hints()) { return CompileStrategy::kDefault; } auto* hint = GetCompilationHint(module, func_index); if (hint == nullptr) return CompileStrategy::kDefault; switch (hint->strategy) { case WasmCompilationHintStrategy::kLazy: return CompileStrategy::kLazy; case WasmCompilationHintStrategy::kEager: return CompileStrategy::kEager; case WasmCompilationHintStrategy::kLazyBaselineEagerTopTier: return CompileStrategy::kLazyBaselineEagerTopTier; case WasmCompilationHintStrategy::kDefault: return CompileStrategy::kDefault; } } struct ExecutionTierPair { ExecutionTier baseline_tier; ExecutionTier top_tier; }; // Pass the debug state as a separate parameter to avoid data races: the debug // state may change between its use here and its use at the call site. To have // a consistent view on the debug state, the caller reads the debug state once // and then passes it to this function. ExecutionTierPair GetDefaultTiersPerModule(NativeModule* native_module, DynamicTiering dynamic_tiering, DebugState is_in_debug_state, bool lazy_module) { const WasmModule* module = native_module->module(); if (is_asmjs_module(module)) { return {ExecutionTier::kTurbofan, ExecutionTier::kTurbofan}; } if (lazy_module) { return {ExecutionTier::kNone, ExecutionTier::kNone}; } if (is_in_debug_state) { return {ExecutionTier::kLiftoff, ExecutionTier::kLiftoff}; } ExecutionTier baseline_tier = v8_flags.liftoff ? ExecutionTier::kLiftoff : ExecutionTier::kTurbofan; bool eager_tier_up = !dynamic_tiering && v8_flags.wasm_tier_up; ExecutionTier top_tier = eager_tier_up ? ExecutionTier::kTurbofan : baseline_tier; return {baseline_tier, top_tier}; } ExecutionTierPair GetLazyCompilationTiers(NativeModule* native_module, uint32_t func_index, DebugState is_in_debug_state) { DynamicTiering dynamic_tiering = Impl(native_module->compilation_state())->dynamic_tiering(); // For lazy compilation, get the tiers we would use if lazy compilation is // disabled. constexpr bool kNotLazy = false; ExecutionTierPair tiers = GetDefaultTiersPerModule( native_module, dynamic_tiering, is_in_debug_state, kNotLazy); // If we are in debug mode, we ignore compilation hints. if (is_in_debug_state) return tiers; // Check if compilation hints override default tiering behaviour. 
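  // For example, a {kOptimized} baseline hint lifts the baseline tier to
  // Turbofan; if the module-wide default left the top tier at Liftoff, the
  // correction below raises the top tier to Turbofan as well, so the top tier
  // is never below the baseline tier.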
if (native_module->enabled_features().has_compilation_hints()) { if (auto* hint = GetCompilationHint(native_module->module(), func_index)) { tiers.baseline_tier = ApplyHintToExecutionTier(hint->baseline_tier, tiers.baseline_tier); tiers.top_tier = ApplyHintToExecutionTier(hint->top_tier, tiers.top_tier); } } if (V8_UNLIKELY(v8_flags.wasm_tier_up_filter >= 0 && func_index != static_cast(v8_flags.wasm_tier_up_filter))) { tiers.top_tier = tiers.baseline_tier; } // Correct top tier if necessary. static_assert(ExecutionTier::kLiftoff < ExecutionTier::kTurbofan, "Assume an order on execution tiers"); if (tiers.baseline_tier > tiers.top_tier) { tiers.top_tier = tiers.baseline_tier; } return tiers; } // The {CompilationUnitBuilder} builds compilation units and stores them in an // internal buffer. The buffer is moved into the working queue of the // {CompilationStateImpl} when {Commit} is called. class CompilationUnitBuilder { public: explicit CompilationUnitBuilder(NativeModule* native_module) : native_module_(native_module) {} void AddImportUnit(uint32_t func_index) { DCHECK_GT(native_module_->module()->num_imported_functions, func_index); baseline_units_.emplace_back(func_index, ExecutionTier::kNone, kNotForDebugging); } void AddJSToWasmWrapperUnit( std::shared_ptr unit) { js_to_wasm_wrapper_units_.emplace_back(std::move(unit)); } void AddBaselineUnit(int func_index, ExecutionTier tier) { baseline_units_.emplace_back(func_index, tier, kNotForDebugging); } void AddTopTierUnit(int func_index, ExecutionTier tier) { tiering_units_.emplace_back(func_index, tier, kNotForDebugging); } void Commit() { if (baseline_units_.empty() && tiering_units_.empty() && js_to_wasm_wrapper_units_.empty()) { return; } compilation_state()->CommitCompilationUnits( base::VectorOf(baseline_units_), base::VectorOf(tiering_units_), base::VectorOf(js_to_wasm_wrapper_units_)); Clear(); } void Clear() { baseline_units_.clear(); tiering_units_.clear(); js_to_wasm_wrapper_units_.clear(); } const WasmModule* module() { return native_module_->module(); } private: CompilationStateImpl* compilation_state() const { return Impl(native_module_->compilation_state()); } NativeModule* const native_module_; std::vector baseline_units_; std::vector tiering_units_; std::vector> js_to_wasm_wrapper_units_; }; DecodeResult ValidateSingleFunction(const WasmModule* module, int func_index, base::Vector code, WasmFeatures enabled_features) { // Sometimes functions get validated unpredictably in the background, for // debugging or when inlining one function into another. We check here if that // is the case, and exit early if so. 
if (module->function_was_validated(func_index)) return {}; const WasmFunction* func = &module->functions[func_index]; FunctionBody body{func->sig, func->code.offset(), code.begin(), code.end()}; WasmFeatures detected_features; DecodeResult result = ValidateFunctionBody(enabled_features, module, &detected_features, body); if (result.ok()) module->set_function_validated(func_index); return result; } enum OnlyLazyFunctions : bool { kAllFunctions = false, kOnlyLazyFunctions = true, }; bool IsLazyModule(const WasmModule* module) { return v8_flags.wasm_lazy_compilation || (v8_flags.asm_wasm_lazy_compilation && is_asmjs_module(module)); } class CompileLazyTimingScope { public: CompileLazyTimingScope(Counters* counters, NativeModule* native_module) : counters_(counters), native_module_(native_module) { timer_.Start(); } ~CompileLazyTimingScope() { base::TimeDelta elapsed = timer_.Elapsed(); native_module_->AddLazyCompilationTimeSample(elapsed.InMicroseconds()); counters_->wasm_lazy_compile_time()->AddTimedSample(elapsed); } private: Counters* counters_; NativeModule* native_module_; base::ElapsedTimer timer_; }; } // namespace bool CompileLazy(Isolate* isolate, Tagged instance, int func_index) { DisallowGarbageCollection no_gc; Tagged module_object = instance->module_object(); NativeModule* native_module = module_object->native_module(); Counters* counters = isolate->counters(); // Put the timer scope around everything, including the {CodeSpaceWriteScope} // and its destruction, to measure complete overhead (apart from the runtime // function itself, which has constant overhead). base::Optional lazy_compile_time_scope; if (base::TimeTicks::IsHighResolution()) { lazy_compile_time_scope.emplace(counters, native_module); } DCHECK(!native_module->lazy_compile_frozen()); TRACE_LAZY("Compiling wasm-function#%d.\n", func_index); CompilationStateImpl* compilation_state = Impl(native_module->compilation_state()); DebugState is_in_debug_state = native_module->IsInDebugState(); ExecutionTierPair tiers = GetLazyCompilationTiers(native_module, func_index, is_in_debug_state); DCHECK_LE(native_module->num_imported_functions(), func_index); DCHECK_LT(func_index, native_module->num_functions()); WasmCompilationUnit baseline_unit{ func_index, tiers.baseline_tier, is_in_debug_state ? kForDebugging : kNotForDebugging}; CompilationEnv env = native_module->CreateCompilationEnv(); WasmFeatures detected_features; WasmCompilationResult result = baseline_unit.ExecuteCompilation( &env, compilation_state->GetWireBytesStorage().get(), counters, &detected_features); compilation_state->OnCompilationStopped(detected_features); // During lazy compilation, we can only get compilation errors when // {--wasm-lazy-validation} is enabled. Otherwise, the module was fully // verified before starting its execution. CHECK_IMPLIES(result.failed(), v8_flags.wasm_lazy_validation); if (result.failed()) { return false; } WasmCodeRefScope code_ref_scope; WasmCode* code = native_module->PublishCode(native_module->AddCompiledCode(result)); DCHECK_EQ(func_index, code->index()); if (V8_UNLIKELY(native_module->log_code())) { GetWasmEngine()->LogCode(base::VectorOf(&code, 1)); // Log the code immediately in the current isolate. 
GetWasmEngine()->LogOutstandingCodesForIsolate(isolate); } counters->wasm_lazily_compiled_functions()->Increment(); const WasmModule* module = native_module->module(); const bool lazy_module = IsLazyModule(module); if (GetCompileStrategy(module, native_module->enabled_features(), func_index, lazy_module) == CompileStrategy::kLazy && tiers.baseline_tier < tiers.top_tier) { WasmCompilationUnit tiering_unit{func_index, tiers.top_tier, kNotForDebugging}; compilation_state->CommitTopTierCompilationUnit(tiering_unit); } return true; } void ThrowLazyCompilationError(Isolate* isolate, const NativeModule* native_module, int func_index) { const WasmModule* module = native_module->module(); CompilationStateImpl* compilation_state = Impl(native_module->compilation_state()); const WasmFunction* func = &module->functions[func_index]; base::Vector code = compilation_state->GetWireBytesStorage()->GetCode(func->code); auto enabled_features = native_module->enabled_features(); DecodeResult decode_result = ValidateSingleFunction(module, func_index, code, enabled_features); CHECK(decode_result.failed()); wasm::ErrorThrower thrower(isolate, nullptr); thrower.CompileFailed(GetWasmErrorWithName(native_module->wire_bytes(), func_index, module, std::move(decode_result).error())); } class TransitiveTypeFeedbackProcessor { public: static void Process(Tagged instance, int func_index) { TransitiveTypeFeedbackProcessor{instance, func_index}.ProcessQueue(); } private: TransitiveTypeFeedbackProcessor(Tagged instance, int func_index) : instance_(instance), module_(instance->module()), mutex_guard(&module_->type_feedback.mutex), feedback_for_function_(module_->type_feedback.feedback_for_function) { queue_.insert(func_index); } ~TransitiveTypeFeedbackProcessor() { DCHECK(queue_.empty()); } void ProcessQueue() { while (!queue_.empty()) { auto next = queue_.cbegin(); ProcessFunction(*next); queue_.erase(next); } } void ProcessFunction(int func_index); void EnqueueCallees(const std::vector& feedback) { for (size_t i = 0; i < feedback.size(); i++) { const CallSiteFeedback& csf = feedback[i]; for (int j = 0; j < csf.num_cases(); j++) { int func = csf.function_index(j); // Don't spend time on calls that have never been executed. if (csf.call_count(j) == 0) continue; // Don't recompute feedback that has already been processed. auto existing = feedback_for_function_.find(func); if (existing != feedback_for_function_.end() && existing->second.feedback_vector.size() > 0) { continue; } queue_.insert(func); } } } DisallowGarbageCollection no_gc_scope_; WasmInstanceObject instance_; const WasmModule* const module_; // TODO(jkummerow): Check if it makes a difference to apply any updates // as a single batch at the end. base::SharedMutexGuard mutex_guard; std::unordered_map& feedback_for_function_; std::set queue_; }; class FeedbackMaker { public: FeedbackMaker(Tagged instance, int func_index, int num_calls) : instance_(instance), num_imported_functions_( static_cast(instance->module()->num_imported_functions)), func_index_(func_index) { result_.reserve(num_calls); } void AddCandidate(Tagged maybe_function, int count) { if (!IsWasmInternalFunction(maybe_function)) return; Tagged function = WasmInternalFunction::cast(maybe_function); if (function->ref() != instance_) { // Not a wasm function, or not a function declared in this instance. 
return; } if (function->function_index() < num_imported_functions_) return; AddCall(function->function_index(), count); } void AddCall(int target, int count) { // Keep the cache sorted (using insertion-sort), highest count first. int insertion_index = 0; while (insertion_index < cache_usage_ && counts_cache_[insertion_index] >= count) { insertion_index++; } for (int shifted_index = cache_usage_ - 1; shifted_index >= insertion_index; shifted_index--) { targets_cache_[shifted_index + 1] = targets_cache_[shifted_index]; counts_cache_[shifted_index + 1] = counts_cache_[shifted_index]; } targets_cache_[insertion_index] = target; counts_cache_[insertion_index] = count; cache_usage_++; } void FinalizeCall() { if (cache_usage_ == 0) { result_.emplace_back(); } else if (cache_usage_ == 1) { if (v8_flags.trace_wasm_inlining) { PrintF("[function %d: call_ref #%zu inlineable (monomorphic)]\n", func_index_, result_.size()); } result_.emplace_back(targets_cache_[0], counts_cache_[0]); } else { if (v8_flags.trace_wasm_inlining) { PrintF("[function %d: call_ref #%zu inlineable (polymorphic %d)]\n", func_index_, result_.size(), cache_usage_); } CallSiteFeedback::PolymorphicCase* polymorphic = new CallSiteFeedback::PolymorphicCase[cache_usage_]; for (int i = 0; i < cache_usage_; i++) { polymorphic[i].function_index = targets_cache_[i]; polymorphic[i].absolute_call_frequency = counts_cache_[i]; } result_.emplace_back(polymorphic, cache_usage_); } cache_usage_ = 0; } // {GetResult} can only be called on a r-value reference to make it more // obvious at call sites that {this} should not be used after this operation. std::vector&& GetResult() && { return std::move(result_); } private: const WasmInstanceObject instance_; std::vector result_; const int num_imported_functions_; const int func_index_; int cache_usage_{0}; int targets_cache_[kMaxPolymorphism]; int counts_cache_[kMaxPolymorphism]; }; void TransitiveTypeFeedbackProcessor::ProcessFunction(int func_index) { int which_vector = declared_function_index(module_, func_index); Tagged maybe_feedback = instance_->feedback_vectors()->get(which_vector); if (!IsFixedArray(maybe_feedback)) return; Tagged feedback = FixedArray::cast(maybe_feedback); base::Vector call_direct_targets = module_->type_feedback.feedback_for_function[func_index] .call_targets.as_vector(); int checked_feedback_length = feedback->length(); DCHECK_EQ(checked_feedback_length, call_direct_targets.size() * 2); FeedbackMaker fm(instance_, func_index, checked_feedback_length / 2); for (int i = 0; i < checked_feedback_length; i += 2) { Tagged value = feedback->get(i); if (IsWasmInternalFunction(value)) { // Monomorphic. int count = Smi::cast(feedback->get(i + 1)).value(); fm.AddCandidate(value, count); } else if (IsFixedArray(value)) { // Polymorphic. Tagged polymorphic = FixedArray::cast(value); int checked_polymorphic_length = polymorphic->length(); DCHECK_LE(checked_polymorphic_length, 2 * kMaxPolymorphism); for (int j = 0; j < checked_polymorphic_length; j += 2) { Tagged function = polymorphic->get(j); int count = Smi::cast(polymorphic->get(j + 1)).value(); fm.AddCandidate(function, count); } } else if (IsSmi(value)) { // Uninitialized, or a direct call collecting call count. 
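      // For a direct call the Smi holds the accumulated call count for the
      // statically known target; for a non-direct call site a Smi means the
      // site has not been executed yet.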
uint32_t target = call_direct_targets[i / 2]; if (target != FunctionTypeFeedback::kNonDirectCall) { int count = Smi::cast(value).value(); fm.AddCall(static_cast(target), count); } else if (v8_flags.trace_wasm_inlining) { PrintF("[function %d: call #%d: uninitialized]\n", func_index, i / 2); } } else if (v8_flags.trace_wasm_inlining) { if (value == ReadOnlyRoots(instance_->GetIsolate()).megamorphic_symbol()) { PrintF("[function %d: call #%d: megamorphic]\n", func_index, i / 2); } } fm.FinalizeCall(); } std::vector result = std::move(fm).GetResult(); EnqueueCallees(result); feedback_for_function_[func_index].feedback_vector = std::move(result); } void TriggerTierUp(Tagged instance, int func_index) { NativeModule* native_module = instance->module_object()->native_module(); CompilationStateImpl* compilation_state = Impl(native_module->compilation_state()); WasmCompilationUnit tiering_unit{func_index, ExecutionTier::kTurbofan, kNotForDebugging}; const WasmModule* module = native_module->module(); int priority; { base::SharedMutexGuard mutex_guard( &module->type_feedback.mutex); int array_index = wasm::declared_function_index(instance->module(), func_index); instance->tiering_budget_array()[array_index] = v8_flags.wasm_tiering_budget; int& stored_priority = module->type_feedback.feedback_for_function[func_index].tierup_priority; if (stored_priority < kMaxInt) ++stored_priority; priority = stored_priority; } // Only create a compilation unit if this is the first time we detect this // function as hot (priority == 1), or if the priority increased // significantly. The latter is assumed to be the case if the priority // increased at least to four, and is a power of two. if (priority == 2 || !base::bits::IsPowerOfTwo(priority)) return; // Before adding the tier-up unit or increasing priority, do process type // feedback for best code generation. if (native_module->enabled_features().has_inlining()) { // TODO(jkummerow): we could have collisions here if different instances // of the same module have collected different feedback. If that ever // becomes a problem, figure out a solution. 
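    // Feedback processing is transitive: {TransitiveTypeFeedbackProcessor}
    // also enqueues the callees seen in this function's feedback, so that
    // Turbofan sees call-site feedback for the whole call tree it may inline.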
TransitiveTypeFeedbackProcessor::Process(instance, func_index); } compilation_state->AddTopTierPriorityCompilationUnit(tiering_unit, priority); } void TierUpNowForTesting(Isolate* isolate, Tagged instance, int func_index) { NativeModule* native_module = instance->module_object()->native_module(); if (native_module->enabled_features().has_inlining()) { TransitiveTypeFeedbackProcessor::Process(instance, func_index); } wasm::GetWasmEngine()->CompileFunction(isolate->counters(), native_module, func_index, wasm::ExecutionTier::kTurbofan); CHECK(!native_module->compilation_state()->failed()); } namespace { void RecordStats(Tagged code, Counters* counters) { if (!code->has_instruction_stream()) return; counters->wasm_generated_code_size()->Increment(code->body_size()); counters->wasm_reloc_size()->Increment(code->relocation_size()); } enum CompilationExecutionResult : int8_t { kNoMoreUnits, kYield }; namespace { const char* GetCompilationEventName(const WasmCompilationUnit& unit, const CompilationEnv& env) { ExecutionTier tier = unit.tier(); if (tier == ExecutionTier::kLiftoff) { return "wasm.BaselineCompilation"; } if (tier == ExecutionTier::kTurbofan) { return "wasm.TopTierCompilation"; } if (unit.func_index() < static_cast(env.module->num_imported_functions)) { return "wasm.WasmToJSWrapperCompilation"; } return "wasm.OtherCompilation"; } } // namespace constexpr uint8_t kMainTaskId = 0; // Run by the {BackgroundCompileJob} (on any thread). CompilationExecutionResult ExecuteCompilationUnits( std::weak_ptr native_module, Counters* counters, JobDelegate* delegate, CompilationTier tier) { TRACE_EVENT0("v8.wasm", "wasm.ExecuteCompilationUnits"); // These fields are initialized in a {BackgroundCompileScope} before // starting compilation. base::Optional env; std::shared_ptr wire_bytes; std::shared_ptr module; // Task 0 is any main thread (there might be multiple from multiple isolates), // worker threads start at 1 (thus the "+ 1"). static_assert(kMainTaskId == 0); int task_id = delegate ? (int{delegate->GetTaskId()} + 1) : kMainTaskId; DCHECK_LE(0, task_id); CompilationUnitQueues::Queue* queue; base::Optional unit; WasmFeatures global_detected_features = WasmFeatures::None(); // Preparation (synchronized): Initialize the fields above and get the first // compilation unit. { BackgroundCompileScope compile_scope(native_module); if (compile_scope.cancelled()) return kYield; env.emplace(compile_scope.native_module()->CreateCompilationEnv()); wire_bytes = compile_scope.compilation_state()->GetWireBytesStorage(); module = compile_scope.native_module()->shared_module(); queue = compile_scope.compilation_state()->GetQueueForCompileTask(task_id); unit = compile_scope.compilation_state()->GetNextCompilationUnit(queue, tier); if (!unit) return kNoMoreUnits; } TRACE_COMPILE("ExecuteCompilationUnits (task id %d)\n", task_id); std::vector results_to_publish; while (true) { ExecutionTier current_tier = unit->tier(); const char* event_name = GetCompilationEventName(unit.value(), env.value()); TRACE_EVENT0("v8.wasm", event_name); while (unit->tier() == current_tier) { // Track detected features on a per-function basis before collecting them // into {global_detected_features}. WasmFeatures per_function_detected_features = WasmFeatures::None(); // (asynchronous): Execute the compilation. 
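      // Neither a lock nor a {BackgroundCompileScope} is held while compiling,
      // so the {NativeModule} may die concurrently; the result is only
      // published after re-entering a {BackgroundCompileScope} below and
      // checking for cancellation.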
WasmCompilationResult result = unit->ExecuteCompilation(&env.value(), wire_bytes.get(), counters, &per_function_detected_features); global_detected_features.Add(per_function_detected_features); results_to_publish.emplace_back(std::move(result)); bool yield = delegate && delegate->ShouldYield(); // (synchronized): Publish the compilation result and get the next unit. BackgroundCompileScope compile_scope(native_module); if (compile_scope.cancelled()) return kYield; if (!results_to_publish.back().succeeded()) { compile_scope.compilation_state()->SetError(); return kNoMoreUnits; } if (!unit->for_debugging() && result.result_tier != current_tier) { compile_scope.native_module()->AddLiftoffBailout(); } // Yield or get next unit. if (yield || !(unit = compile_scope.compilation_state()->GetNextCompilationUnit( queue, tier))) { std::vector> unpublished_code = compile_scope.native_module()->AddCompiledCode( base::VectorOf(results_to_publish)); results_to_publish.clear(); compile_scope.compilation_state()->SchedulePublishCompilationResults( std::move(unpublished_code), tier); compile_scope.compilation_state()->OnCompilationStopped( global_detected_features); return yield ? kYield : kNoMoreUnits; } // Publish after finishing a certain amount of units, to avoid contention // when all threads publish at the end. bool batch_full = queue->ShouldPublish(static_cast(results_to_publish.size())); // Also publish each time the compilation tier changes from Liftoff to // TurboFan, such that we immediately publish the baseline compilation // results to start execution, and do not wait for a batch to fill up. bool liftoff_finished = unit->tier() != current_tier && unit->tier() == ExecutionTier::kTurbofan; if (batch_full || liftoff_finished) { std::vector> unpublished_code = compile_scope.native_module()->AddCompiledCode( base::VectorOf(results_to_publish)); results_to_publish.clear(); compile_scope.compilation_state()->SchedulePublishCompilationResults( std::move(unpublished_code), tier); } } } UNREACHABLE(); } // (function is imported, canonical type index) using JSToWasmWrapperKey = std::pair; // Returns the number of units added. int AddExportWrapperUnits(Isolate* isolate, NativeModule* native_module, CompilationUnitBuilder* builder) { std::unordered_set> keys; for (auto exp : native_module->module()->export_table) { if (exp.kind != kExternalFunction) continue; auto& function = native_module->module()->functions[exp.index]; uint32_t canonical_type_index = native_module->module() ->isorecursive_canonical_type_ids[function.sig_index]; int wrapper_index = GetExportWrapperIndex(canonical_type_index, function.imported); if (wrapper_index < isolate->heap()->js_to_wasm_wrappers()->length()) { MaybeObject existing_wrapper = isolate->heap()->js_to_wasm_wrappers()->Get(wrapper_index); if (existing_wrapper.IsStrongOrWeak() && !IsUndefined(existing_wrapper.GetHeapObject())) { // Skip wrapper compilation as the wrapper is already cached. // Note that this does not guarantee that the wrapper is still cached // at the moment at which the WasmInternalFunction is instantiated. continue; } } JSToWasmWrapperKey key(function.imported, canonical_type_index); if (keys.insert(key).second) { auto unit = std::make_shared( isolate, function.sig, canonical_type_index, native_module->module(), function.imported, native_module->enabled_features(), JSToWasmWrapperCompilationUnit::kAllowGeneric); builder->AddJSToWasmWrapperUnit(std::move(unit)); } } return static_cast(keys.size()); } // Returns the number of units added. 
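// The count is the number of distinct wrapper cache keys, i.e. imports that
// share a canonicalized signature (and call kind / suspend mode) share a
// single compilation unit.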
int AddImportWrapperUnits(NativeModule* native_module, CompilationUnitBuilder* builder) { std::unordered_set keys; int num_imported_functions = native_module->num_imported_functions(); for (int func_index = 0; func_index < num_imported_functions; func_index++) { const WasmFunction& function = native_module->module()->functions[func_index]; if (!IsJSCompatibleSignature(function.sig)) continue; if (UseGenericWasmToJSWrapper(kDefaultImportCallKind, function.sig, kNoSuspend)) { continue; } uint32_t canonical_type_index = native_module->module() ->isorecursive_canonical_type_ids[function.sig_index]; WasmImportWrapperCache::CacheKey key( kDefaultImportCallKind, canonical_type_index, static_cast(function.sig->parameter_count()), kNoSuspend); auto it = keys.insert(key); if (it.second) { // Ensure that all keys exist in the cache, so that we can populate the // cache later without locking. (*native_module->import_wrapper_cache())[key] = nullptr; builder->AddImportUnit(func_index); } } return static_cast(keys.size()); } std::unique_ptr InitializeCompilation( Isolate* isolate, NativeModule* native_module, ProfileInformation* pgo_info) { CompilationStateImpl* compilation_state = Impl(native_module->compilation_state()); auto builder = std::make_unique(native_module); int num_import_wrappers = AddImportWrapperUnits(native_module, builder.get()); int num_export_wrappers = AddExportWrapperUnits(isolate, native_module, builder.get()); compilation_state->InitializeCompilationProgress( num_import_wrappers, num_export_wrappers, pgo_info); return builder; } bool MayCompriseLazyFunctions(const WasmModule* module, WasmFeatures enabled_features) { if (IsLazyModule(module)) return true; if (enabled_features.has_compilation_hints()) return true; #ifdef ENABLE_SLOW_DCHECKS int start = module->num_imported_functions; int end = start + module->num_declared_functions; for (int func_index = start; func_index < end; func_index++) { SLOW_DCHECK(GetCompileStrategy(module, enabled_features, func_index, false) != CompileStrategy::kLazy); } #endif return false; } class CompilationTimeCallback : public CompilationEventCallback { public: enum CompileMode { kSynchronous, kAsync, kStreaming }; explicit CompilationTimeCallback( std::shared_ptr async_counters, std::shared_ptr metrics_recorder, v8::metrics::Recorder::ContextId context_id, std::weak_ptr native_module, CompileMode compile_mode) : start_time_(base::TimeTicks::Now()), async_counters_(std::move(async_counters)), metrics_recorder_(std::move(metrics_recorder)), context_id_(context_id), native_module_(std::move(native_module)), compile_mode_(compile_mode) {} void call(CompilationEvent compilation_event) override { DCHECK(base::TimeTicks::IsHighResolution()); std::shared_ptr native_module = native_module_.lock(); if (!native_module) return; auto now = base::TimeTicks::Now(); auto duration = now - start_time_; if (compilation_event == CompilationEvent::kFinishedBaselineCompilation) { // Reset {start_time_} to measure tier-up time. start_time_ = now; if (compile_mode_ != kSynchronous) { TimedHistogram* histogram = compile_mode_ == kAsync ? 
                ? async_counters_->wasm_async_compile_wasm_module_time()
                : async_counters_->wasm_streaming_compile_wasm_module_time();
        histogram->AddSample(static_cast<int>(duration.InMicroseconds()));
      }
      v8::metrics::WasmModuleCompiled event{
          (compile_mode_ != kSynchronous),         // async
          (compile_mode_ == kStreaming),           // streamed
          false,                                   // cached
          false,                                   // deserialized
          v8_flags.wasm_lazy_compilation,          // lazy
          true,                                    // success
          native_module->liftoff_code_size(),      // code_size_in_bytes
          native_module->liftoff_bailout_count(),  // liftoff_bailout_count
          duration.InMicroseconds()};              // wall_clock_duration_in_us
      metrics_recorder_->DelayMainThreadEvent(event, context_id_);
    }
    if (compilation_event == CompilationEvent::kFailedCompilation) {
      v8::metrics::WasmModuleCompiled event{
          (compile_mode_ != kSynchronous),         // async
          (compile_mode_ == kStreaming),           // streamed
          false,                                   // cached
          false,                                   // deserialized
          v8_flags.wasm_lazy_compilation,          // lazy
          false,                                   // success
          native_module->liftoff_code_size(),      // code_size_in_bytes
          native_module->liftoff_bailout_count(),  // liftoff_bailout_count
          duration.InMicroseconds()};              // wall_clock_duration_in_us
      metrics_recorder_->DelayMainThreadEvent(event, context_id_);
    }
  }

 private:
  base::TimeTicks start_time_;
  const std::shared_ptr<Counters> async_counters_;
  std::shared_ptr<metrics::Recorder> metrics_recorder_;
  v8::metrics::Recorder::ContextId context_id_;
  std::weak_ptr<NativeModule> native_module_;
  const CompileMode compile_mode_;
};

WasmError ValidateFunctions(const WasmModule* module,
                            base::Vector<const uint8_t> wire_bytes,
                            WasmFeatures enabled_features,
                            OnlyLazyFunctions only_lazy_functions) {
  DCHECK_EQ(module->origin, kWasmOrigin);
  if (only_lazy_functions &&
      !MayCompriseLazyFunctions(module, enabled_features)) {
    return {};
  }
  std::function<bool(int)> filter;  // Initially empty for "all functions".
  if (only_lazy_functions) {
    const bool is_lazy_module = IsLazyModule(module);
    filter = [module, enabled_features, is_lazy_module](int func_index) {
      CompileStrategy strategy = GetCompileStrategy(
          module, enabled_features, func_index, is_lazy_module);
      return strategy == CompileStrategy::kLazy ||
             strategy == CompileStrategy::kLazyBaselineEagerTopTier;
    };
  }
  // Call {ValidateFunctions} in the module decoder.
  return ValidateFunctions(module, enabled_features, wire_bytes, filter);
}

WasmError ValidateFunctions(const NativeModule& native_module,
                            OnlyLazyFunctions only_lazy_functions) {
  return ValidateFunctions(native_module.module(), native_module.wire_bytes(),
                           native_module.enabled_features(),
                           only_lazy_functions);
}

void CompileNativeModule(Isolate* isolate,
                         v8::metrics::Recorder::ContextId context_id,
                         ErrorThrower* thrower,
                         std::shared_ptr<NativeModule> native_module,
                         ProfileInformation* pgo_info) {
  CHECK(!v8_flags.jitless);
  const WasmModule* module = native_module->module();

  // The callback captures a shared ptr to the semaphore.
  auto* compilation_state = Impl(native_module->compilation_state());
  if (base::TimeTicks::IsHighResolution()) {
    compilation_state->AddCallback(std::make_unique<CompilationTimeCallback>(
        isolate->async_counters(), isolate->metrics_recorder(), context_id,
        native_module, CompilationTimeCallback::kSynchronous));
  }

  // Initialize the compilation units and kick off background compile tasks.
  std::unique_ptr<CompilationUnitBuilder> builder =
      InitializeCompilation(isolate, native_module.get(), pgo_info);
  compilation_state->InitializeCompilationUnits(std::move(builder));

  // Validate wasm modules for lazy compilation if requested. Never validate
  // asm.js modules as these are valid by construction (additionally a CHECK
  // will catch this during lazy compilation).
  if (!v8_flags.wasm_lazy_validation && module->origin == kWasmOrigin) {
    DCHECK(!thrower->error());
    if (WasmError validation_error =
            ValidateFunctions(*native_module, kOnlyLazyFunctions)) {
      thrower->CompileFailed(std::move(validation_error));
      return;
    }
  }

  compilation_state->WaitForCompilationEvent(
      CompilationEvent::kFinishedExportWrappers);

  if (!compilation_state->failed()) {
    compilation_state->FinalizeJSToWasmWrappers(isolate, module);
    compilation_state->WaitForCompilationEvent(
        CompilationEvent::kFinishedBaselineCompilation);
    compilation_state->PublishDetectedFeatures(isolate);
  }

  if (compilation_state->failed()) {
    DCHECK_IMPLIES(IsLazyModule(module), !v8_flags.wasm_lazy_validation);
    WasmError validation_error =
        ValidateFunctions(*native_module, kAllFunctions);
    CHECK(validation_error.has_error());
    thrower->CompileFailed(std::move(validation_error));
  }
}

class BaseCompileJSToWasmWrapperJob : public JobTask {
 public:
  explicit BaseCompileJSToWasmWrapperJob(size_t compilation_units)
      : outstanding_units_(compilation_units),
        total_units_(compilation_units) {}

  size_t GetMaxConcurrency(size_t worker_count) const override {
    size_t flag_limit = static_cast<size_t>(
        std::max(1, v8_flags.wasm_num_compilation_tasks.value()));
    // {outstanding_units_} includes the units that other workers are currently
    // working on, so we can safely ignore the {worker_count} and just return
    // the current number of outstanding units.
    return std::min(flag_limit,
                    outstanding_units_.load(std::memory_order_relaxed));
  }

 protected:
  // Returns {true} and places the index of the next unit to process in
  // {index_out} if there are still units to be processed. Returns {false}
  // otherwise.
  bool GetNextUnitIndex(size_t* index_out) {
    size_t next_index = unit_index_.fetch_add(1, std::memory_order_relaxed);
    if (next_index >= total_units_) {
      // {unit_index_} may exceed {total_units_}, but only by the number of
      // workers at worst, thus it can't exceed 2 * {total_units_} and overflow
      // shouldn't happen.
      DCHECK_GE(2 * total_units_, next_index);
      return false;
    }
    *index_out = next_index;
    return true;
  }

  // Returns true if the last unit was completed.
  bool CompleteUnit() {
    size_t outstanding_units =
        outstanding_units_.fetch_sub(1, std::memory_order_relaxed);
    DCHECK_GE(outstanding_units, 1);
    return outstanding_units == 1;
  }

  // When external cancellation is detected, call this method to bump
  // {unit_index_} and reset {outstanding_units_} such that no more tasks are
  // being scheduled for this job and all tasks exit as soon as possible.
  void FlushRemainingUnits() {
    // After being cancelled, make sure to reduce outstanding_units_ to
    // *basically* zero, but leave the count positive if other workers are
    // still running, to avoid underflow in {CompleteUnit}.
    size_t next_undone_unit =
        unit_index_.exchange(total_units_, std::memory_order_relaxed);
    size_t undone_units =
        next_undone_unit >= total_units_ ? 0 : total_units_ - next_undone_unit;
    // Note that the caller requested one unit that we also still need to
    // remove from {outstanding_units_}.
    ++undone_units;
    size_t previous_outstanding_units =
        outstanding_units_.fetch_sub(undone_units, std::memory_order_relaxed);
    CHECK_LE(undone_units, previous_outstanding_units);
  }

 private:
  std::atomic<size_t> unit_index_{0};
  std::atomic<size_t> outstanding_units_;
  const size_t total_units_;
};

class AsyncCompileJSToWasmWrapperJob final
    : public BaseCompileJSToWasmWrapperJob {
 public:
  explicit AsyncCompileJSToWasmWrapperJob(
      std::weak_ptr<NativeModule> native_module, size_t compilation_units)
      : BaseCompileJSToWasmWrapperJob(compilation_units),
        native_module_(std::move(native_module)),
        engine_barrier_(GetWasmEngine()->GetBarrierForBackgroundCompile()) {}

  void Run(JobDelegate* delegate) override {
    auto engine_scope = engine_barrier_->TryLock();
    if (!engine_scope) return;

    std::shared_ptr<JSToWasmWrapperCompilationUnit> wrapper_unit = nullptr;
    OperationsBarrier::Token wrapper_compilation_token;
    Isolate* isolate;

    size_t index;
    if (!GetNextUnitIndex(&index)) return;
    {
      BackgroundCompileScope compile_scope(native_module_);
      if (compile_scope.cancelled()) return FlushRemainingUnits();
      wrapper_unit =
          compile_scope.compilation_state()->GetJSToWasmWrapperCompilationUnit(
              index);
      isolate = wrapper_unit->isolate();
      wrapper_compilation_token =
          wasm::GetWasmEngine()->StartWrapperCompilation(isolate);
      if (!wrapper_compilation_token) return FlushRemainingUnits();
    }

    TRACE_EVENT0("v8.wasm", "wasm.JSToWasmWrapperCompilation");
    while (true) {
      DCHECK_EQ(isolate, wrapper_unit->isolate());
      wrapper_unit->Execute();
      bool complete_last_unit = CompleteUnit();
      bool yield = delegate && delegate->ShouldYield();
      if (yield && !complete_last_unit) return;

      BackgroundCompileScope compile_scope(native_module_);
      if (compile_scope.cancelled()) return;
      if (complete_last_unit) {
        compile_scope.compilation_state()->OnFinishedJSToWasmWrapperUnits();
      }
      if (yield) return;
      if (!GetNextUnitIndex(&index)) return;
      wrapper_unit =
          compile_scope.compilation_state()->GetJSToWasmWrapperCompilationUnit(
              index);
    }
  }

 private:
  std::weak_ptr<NativeModule> native_module_;
  std::shared_ptr<OperationsBarrier> engine_barrier_;
};

class BackgroundCompileJob final : public JobTask {
 public:
  explicit BackgroundCompileJob(std::weak_ptr<NativeModule> native_module,
                                std::shared_ptr<Counters> async_counters,
                                CompilationTier tier)
      : native_module_(std::move(native_module)),
        engine_barrier_(GetWasmEngine()->GetBarrierForBackgroundCompile()),
        async_counters_(std::move(async_counters)),
        tier_(tier) {}

  void Run(JobDelegate* delegate) override {
    auto engine_scope = engine_barrier_->TryLock();
    if (!engine_scope) return;
    ExecuteCompilationUnits(native_module_, async_counters_.get(), delegate,
                            tier_);
  }

  size_t GetMaxConcurrency(size_t worker_count) const override {
    BackgroundCompileScope compile_scope(native_module_);
    if (compile_scope.cancelled()) return 0;
    size_t flag_limit = static_cast<size_t>(
        std::max(1, v8_flags.wasm_num_compilation_tasks.value()));
    // NumOutstandingCompilations() does not reflect the units that running
    // workers are processing, thus add the current worker count to that
    // number.
    return std::min(flag_limit,
                    worker_count + compile_scope.compilation_state()
                                       ->NumOutstandingCompilations(tier_));
  }

 private:
  std::weak_ptr<NativeModule> native_module_;
  std::shared_ptr<OperationsBarrier> engine_barrier_;
  const std::shared_ptr<Counters> async_counters_;
  const CompilationTier tier_;
};

}  // namespace

std::shared_ptr<NativeModule> CompileToNativeModule(
    Isolate* isolate, WasmFeatures enabled_features, ErrorThrower* thrower,
    std::shared_ptr<const WasmModule> module, ModuleWireBytes wire_bytes,
    int compilation_id, v8::metrics::Recorder::ContextId context_id,
    ProfileInformation* pgo_info) {
  WasmEngine* engine = GetWasmEngine();
  base::OwnedVector<uint8_t> wire_bytes_copy =
      base::OwnedVector<uint8_t>::Of(wire_bytes.module_bytes());
  // Prefer {wire_bytes_copy} to {wire_bytes.module_bytes()} for the temporary
  // cache key. When we eventually install the module in the cache, the wire
  // bytes of the temporary key and the new key have the same base pointer and
  // we can skip the full bytes comparison.
  std::shared_ptr<NativeModule> native_module = engine->MaybeGetNativeModule(
      module->origin, wire_bytes_copy.as_vector(), isolate);
  if (native_module) {
    CompileJsToWasmWrappers(isolate, module.get());
    return native_module;
  }

  base::Optional<TimedHistogramScope> wasm_compile_module_time_scope;
  if (base::TimeTicks::IsHighResolution()) {
    wasm_compile_module_time_scope.emplace(SELECT_WASM_COUNTER(
        isolate->counters(), module->origin, wasm_compile, module_time));
  }

  // Embedder usage count for declared shared memories.
  const bool has_shared_memory =
      std::any_of(module->memories.begin(), module->memories.end(),
                  [](auto& memory) { return memory.is_shared; });
  if (has_shared_memory) {
    isolate->CountUsage(v8::Isolate::UseCounterFeature::kWasmSharedMemory);
  }

  // Create a new {NativeModule} first.
  const bool include_liftoff =
      module->origin == kWasmOrigin && v8_flags.liftoff;
  size_t code_size_estimate =
      wasm::WasmCodeManager::EstimateNativeModuleCodeSize(
          module.get(), include_liftoff,
          DynamicTiering{v8_flags.wasm_dynamic_tiering.value()});
  native_module = engine->NewNativeModule(isolate, enabled_features, module,
                                          code_size_estimate);
  native_module->SetWireBytes(std::move(wire_bytes_copy));
  native_module->compilation_state()->set_compilation_id(compilation_id);

  CompileNativeModule(isolate, context_id, thrower, native_module, pgo_info);

  if (thrower->error()) {
    engine->UpdateNativeModuleCache(true, std::move(native_module), isolate);
    return {};
  }

  std::shared_ptr<NativeModule> cached_native_module =
      engine->UpdateNativeModuleCache(false, native_module, isolate);

  if (cached_native_module != native_module) {
    // Do not use {module} or {native_module} any more; use
    // {cached_native_module} instead.
    module.reset();
    native_module.reset();
    return cached_native_module;
  }

  // Ensure that the code objects are logged before returning.
  engine->LogOutstandingCodesForIsolate(isolate);

  return native_module;
}

AsyncCompileJob::AsyncCompileJob(
    Isolate* isolate, WasmFeatures enabled_features,
    base::OwnedVector<const uint8_t> bytes, Handle<Context> context,
    Handle<NativeContext> incumbent_context, const char* api_method_name,
    std::shared_ptr<CompilationResultResolver> resolver, int compilation_id)
    : isolate_(isolate),
      api_method_name_(api_method_name),
      enabled_features_(enabled_features),
      dynamic_tiering_(DynamicTiering{v8_flags.wasm_dynamic_tiering.value()}),
      start_time_(base::TimeTicks::Now()),
      bytes_copy_(std::move(bytes)),
      wire_bytes_(bytes_copy_.as_vector()),
      resolver_(std::move(resolver)),
      compilation_id_(compilation_id) {
  TRACE_EVENT0(TRACE_DISABLED_BY_DEFAULT("v8.wasm.detailed"),
               "wasm.AsyncCompileJob");
  CHECK(v8_flags.wasm_async_compilation);
  CHECK(!v8_flags.jitless);
  v8::Isolate* v8_isolate = reinterpret_cast<v8::Isolate*>(isolate);
  v8::Platform* platform = V8::GetCurrentPlatform();
  foreground_task_runner_ = platform->GetForegroundTaskRunner(v8_isolate);
  native_context_ =
      isolate->global_handles()->Create(context->native_context());
  incumbent_context_ = isolate->global_handles()->Create(*incumbent_context);
  DCHECK(IsNativeContext(*native_context_));
  context_id_ = isolate->GetOrRegisterRecorderContextId(native_context_);
  metrics_event_.async = true;
}

void AsyncCompileJob::Start() {
  DoAsync<DecodeModule>(isolate_->counters(),
                        isolate_->metrics_recorder());  // --
}

void AsyncCompileJob::Abort() {
  // Removing this job will trigger the destructor, which will cancel all
  // compilation.
  GetWasmEngine()->RemoveCompileJob(this);
}

// {ValidateFunctionsStreamingJobData} holds information that is shared between
// the {AsyncStreamingProcessor} and the {ValidateFunctionsStreamingJob}. It
// lives in the {AsyncStreamingProcessor} and is updated from both classes.
struct ValidateFunctionsStreamingJobData {
  struct Unit {
    // {func_index == -1} represents an "invalid" unit.
    int func_index = -1;
    base::Vector<const uint8_t> code;

    // Check whether the unit is valid.
    operator bool() const {
      DCHECK_LE(-1, func_index);
      return func_index >= 0;
    }
  };

  void Initialize(int num_declared_functions) {
    DCHECK_NULL(units);
    units = base::OwnedVector<Unit>::NewForOverwrite(num_declared_functions);
    // Initially {next == end}.
    next_available_unit.store(units.begin(), std::memory_order_relaxed);
    end_of_available_units.store(units.begin(), std::memory_order_relaxed);
  }

  void AddUnit(int declared_func_index, base::Vector<const uint8_t> code,
               JobHandle* job_handle) {
    DCHECK_NOT_NULL(units);
    // Write new unit to {*end}, then increment {end}. There is only one
    // thread adding new units, so no further synchronization needed.
    Unit* ptr = end_of_available_units.load(std::memory_order_relaxed);
    // Check invariant: {next <= end}.
    DCHECK_LE(next_available_unit.load(std::memory_order_relaxed), ptr);
    *ptr++ = {declared_func_index, code};
    // Use release semantics, so whoever loads this pointer (using acquire
    // semantics) sees all our previous stores.
    end_of_available_units.store(ptr, std::memory_order_release);
    size_t total_units_added = ptr - units.begin();
    // Periodically notify concurrency increase. This has overhead, so avoid
    // calling it too often. As long as threads are still running they will
    // continue processing new units anyway, and if background threads validate
    // faster than we can add units, then only notifying after increasingly
    // long delays is the right thing to do to avoid too many small validation
    // tasks. We notify on each power of two after 16 units, and every 16k
    // units (just to have *some* upper limit and avoid piling up too many
    // units).
    // Additionally, notify after receiving the last unit of the module.
    if ((total_units_added >= 16 &&
         base::bits::IsPowerOfTwo(total_units_added)) ||
        (total_units_added % (16 * 1024)) == 0 || ptr == units.end()) {
      job_handle->NotifyConcurrencyIncrease();
    }
  }

  size_t NumOutstandingUnits() const {
    Unit* next = next_available_unit.load(std::memory_order_relaxed);
    Unit* end = end_of_available_units.load(std::memory_order_relaxed);
    DCHECK_LE(next, end);
    return end - next;
  }

  // Retrieve one unit to validate; returns an "invalid" unit if nothing is in
  // the queue.
  Unit GetUnit() {
    // Use an acquire load to synchronize with the store in {AddUnit}. All
    // units before this {end} are fully initialized and ready to execute.
    Unit* end = end_of_available_units.load(std::memory_order_acquire);
    Unit* next = next_available_unit.load(std::memory_order_relaxed);
    while (next < end) {
      if (next_available_unit.compare_exchange_weak(
              next, next + 1, std::memory_order_relaxed)) {
        return *next;
      }
      // Otherwise retry with updated {next} pointer.
    }
    return {};
  }

  base::OwnedVector<Unit> units;
  std::atomic<Unit*> next_available_unit;
  std::atomic<Unit*> end_of_available_units;
  std::atomic<bool> found_error{false};
};

class ValidateFunctionsStreamingJob final : public JobTask {
 public:
  ValidateFunctionsStreamingJob(const WasmModule* module,
                                WasmFeatures enabled_features,
                                ValidateFunctionsStreamingJobData* data)
      : module_(module), enabled_features_(enabled_features), data_(data) {}

  void Run(JobDelegate* delegate) override {
    TRACE_EVENT0("v8.wasm", "wasm.ValidateFunctionsStreaming");
    using Unit = ValidateFunctionsStreamingJobData::Unit;
    while (Unit unit = data_->GetUnit()) {
      DecodeResult result = ValidateSingleFunction(
          module_, unit.func_index, unit.code, enabled_features_);
      if (result.failed()) {
        data_->found_error.store(true, std::memory_order_relaxed);
        break;
      }
      // After validating one function, check if we should yield.
      if (delegate->ShouldYield()) break;
    }
  }

  size_t GetMaxConcurrency(size_t worker_count) const override {
    return worker_count + data_->NumOutstandingUnits();
  }

 private:
  const WasmModule* const module_;
  const WasmFeatures enabled_features_;
  ValidateFunctionsStreamingJobData* data_;
};

class AsyncStreamingProcessor final : public StreamingProcessor {
 public:
  explicit AsyncStreamingProcessor(AsyncCompileJob* job);

  bool ProcessModuleHeader(base::Vector<const uint8_t> bytes) override;

  bool ProcessSection(SectionCode section_code,
                      base::Vector<const uint8_t> bytes,
                      uint32_t offset) override;

  bool ProcessCodeSectionHeader(int num_functions,
                                uint32_t functions_mismatch_error_offset,
                                std::shared_ptr<WireBytesStorage>,
                                int code_section_start,
                                int code_section_length) override;

  bool ProcessFunctionBody(base::Vector<const uint8_t> bytes,
                           uint32_t offset) override;

  void OnFinishedChunk() override;

  void OnFinishedStream(base::OwnedVector<const uint8_t> bytes,
                        bool after_error) override;

  void OnAbort() override;

  bool Deserialize(base::Vector<const uint8_t> wire_bytes,
                   base::Vector<const uint8_t> module_bytes) override;

 private:
  void CommitCompilationUnits();

  ModuleDecoder decoder_;
  AsyncCompileJob* job_;
  std::unique_ptr<CompilationUnitBuilder> compilation_unit_builder_;
  int num_functions_ = 0;
  bool prefix_cache_hit_ = false;
  bool before_code_section_ = true;
  ValidateFunctionsStreamingJobData validate_functions_job_data_;
  std::unique_ptr<JobHandle> validate_functions_job_handle_;

  // Running hash of the wire bytes up to code section size, but excluding the
  // code section itself. Used by the {NativeModuleCache} to detect potential
  // duplicate modules.
  size_t prefix_hash_ = 0;
};

std::shared_ptr<StreamingDecoder> AsyncCompileJob::CreateStreamingDecoder() {
  DCHECK_NULL(stream_);
  stream_ = StreamingDecoder::CreateAsyncStreamingDecoder(
      std::make_unique<AsyncStreamingProcessor>(this));
  return stream_;
}

AsyncCompileJob::~AsyncCompileJob() {
  // Note: This destructor always runs on the foreground thread of the isolate.
  background_task_manager_.CancelAndWait();
  // If initial compilation did not finish yet we can abort it.
  if (native_module_) {
    Impl(native_module_->compilation_state())
        ->CancelCompilation(CompilationStateImpl::kCancelInitialCompilation);
  }
  // Tell the streaming decoder that the AsyncCompileJob is not available
  // anymore.
  if (stream_) stream_->NotifyCompilationDiscarded();
  CancelPendingForegroundTask();
  isolate_->global_handles()->Destroy(native_context_.location());
  isolate_->global_handles()->Destroy(incumbent_context_.location());
  if (!module_object_.is_null()) {
    isolate_->global_handles()->Destroy(module_object_.location());
  }
}

void AsyncCompileJob::CreateNativeModule(
    std::shared_ptr<const WasmModule> module, size_t code_size_estimate) {
  // Embedder usage count for declared shared memories.
  const bool has_shared_memory =
      std::any_of(module->memories.begin(), module->memories.end(),
                  [](auto& memory) { return memory.is_shared; });
  if (has_shared_memory) {
    isolate_->CountUsage(v8::Isolate::UseCounterFeature::kWasmSharedMemory);
  }

  // Create the module object and populate with compiled functions and
  // information needed at instantiation time.
  native_module_ = GetWasmEngine()->NewNativeModule(
      isolate_, enabled_features_, std::move(module), code_size_estimate);
  native_module_->SetWireBytes(std::move(bytes_copy_));
  native_module_->compilation_state()->set_compilation_id(compilation_id_);
}

bool AsyncCompileJob::GetOrCreateNativeModule(
    std::shared_ptr<const WasmModule> module, size_t code_size_estimate) {
  native_module_ = GetWasmEngine()->MaybeGetNativeModule(
      module->origin, wire_bytes_.module_bytes(), isolate_);
  if (native_module_ == nullptr) {
    CreateNativeModule(std::move(module), code_size_estimate);
    return false;
  }
  return true;
}

void AsyncCompileJob::PrepareRuntimeObjects() {
  // Create heap objects for script and module bytes to be stored in the
  // module object. Asm.js is not compiled asynchronously.
  DCHECK(module_object_.is_null());
  auto source_url =
      stream_ ? base::VectorOf(stream_->url()) : base::Vector<const char>();
  auto script =
      GetWasmEngine()->GetOrCreateScript(isolate_, native_module_, source_url);
  Handle<WasmModuleObject> module_object =
      WasmModuleObject::New(isolate_, native_module_, script);

  module_object_ = isolate_->global_handles()->Create(*module_object);
}

// This function assumes that it is executed in a HandleScope, and that a
// context is set on the isolate.
void AsyncCompileJob::FinishCompile(bool is_after_cache_hit) {
  TRACE_EVENT0(TRACE_DISABLED_BY_DEFAULT("v8.wasm.detailed"),
               "wasm.FinishAsyncCompile");
  if (stream_) {
    stream_->NotifyNativeModuleCreated(native_module_);
  }
  const WasmModule* module = native_module_->module();
  auto compilation_state = Impl(native_module_->compilation_state());

  // If experimental PGO via files is enabled, load profile information now
  // that we have all wire bytes and know that the module is valid.
  if (V8_UNLIKELY(v8_flags.experimental_wasm_pgo_from_file)) {
    std::unique_ptr<ProfileInformation> pgo_info =
        LoadProfileFromFile(module, native_module_->wire_bytes());
    if (pgo_info) {
      compilation_state->ApplyPgoInfoLate(pgo_info.get());
    }
  }

  bool is_after_deserialization = !module_object_.is_null();
  if (!is_after_deserialization) {
    PrepareRuntimeObjects();
  }

  // Measure duration of baseline compilation or deserialization from cache.
  if (base::TimeTicks::IsHighResolution()) {
    base::TimeDelta duration = base::TimeTicks::Now() - start_time_;
    int duration_usecs = static_cast<int>(duration.InMicroseconds());
    isolate_->counters()->wasm_streaming_finish_wasm_module_time()->AddSample(
        duration_usecs);

    if (is_after_cache_hit || is_after_deserialization) {
      v8::metrics::WasmModuleCompiled event{
          true,                                     // async
          true,                                     // streamed
          is_after_cache_hit,                       // cached
          is_after_deserialization,                 // deserialized
          v8_flags.wasm_lazy_compilation,           // lazy
          !compilation_state->failed(),             // success
          native_module_->turbofan_code_size(),     // code_size_in_bytes
          native_module_->liftoff_bailout_count(),  // liftoff_bailout_count
          duration.InMicroseconds()};               // wall_clock_duration_in_us
      isolate_->metrics_recorder()->DelayMainThreadEvent(event, context_id_);
    }
  }

  DCHECK(!isolate_->context().is_null());
  // Finish the wasm script now and make it public to the debugger.
  Handle