| // Copyright 2017 the V8 project authors. All rights reserved. |
| // Use of this source code is governed by a BSD-style license that can be |
| // found in the LICENSE file. |
| |
| #include "src/wasm/module-compiler.h" |
| |
| #include <algorithm> |
| #include <queue> |
| |
| #include "src/api/api-inl.h" |
| #include "src/asmjs/asm-js.h" |
| #include "src/base/enum-set.h" |
| #include "src/base/optional.h" |
| #include "src/base/platform/mutex.h" |
| #include "src/base/platform/semaphore.h" |
| #include "src/base/platform/time.h" |
| #include "src/base/utils/random-number-generator.h" |
| #include "src/compiler/wasm-compiler.h" |
| #include "src/heap/heap-inl.h" // For CodeSpaceMemoryModificationScope. |
| #include "src/logging/counters.h" |
| #include "src/logging/metrics.h" |
| #include "src/objects/property-descriptor.h" |
| #include "src/tasks/task-utils.h" |
| #include "src/tracing/trace-event.h" |
| #include "src/trap-handler/trap-handler.h" |
| #include "src/utils/identity-map.h" |
| #include "src/wasm/module-decoder.h" |
| #include "src/wasm/streaming-decoder.h" |
| #include "src/wasm/wasm-code-manager.h" |
| #include "src/wasm/wasm-engine.h" |
| #include "src/wasm/wasm-import-wrapper-cache.h" |
| #include "src/wasm/wasm-js.h" |
| #include "src/wasm/wasm-limits.h" |
| #include "src/wasm/wasm-objects-inl.h" |
| #include "src/wasm/wasm-opcodes.h" |
| #include "src/wasm/wasm-result.h" |
| #include "src/wasm/wasm-serialization.h" |
| |
| #define TRACE_COMPILE(...) \ |
| do { \ |
| if (FLAG_trace_wasm_compiler) PrintF(__VA_ARGS__); \ |
| } while (false) |
| |
| #define TRACE_STREAMING(...) \ |
| do { \ |
| if (FLAG_trace_wasm_streaming) PrintF(__VA_ARGS__); \ |
| } while (false) |
| |
| #define TRACE_LAZY(...) \ |
| do { \ |
| if (FLAG_trace_wasm_lazy_compilation) PrintF(__VA_ARGS__); \ |
| } while (false) |
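
// Example use of these macros (this exact call appears in
// {ExecuteCompilationUnits} below):
//   TRACE_COMPILE("ExecuteCompilationUnits (task id %d)\n", task_id);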
| |
| namespace v8 { |
| namespace internal { |
| namespace wasm { |
| |
| namespace { |
| |
| enum class CompileMode : uint8_t { kRegular, kTiering }; |
| |
| enum class CompileStrategy : uint8_t { |
  // Compiles functions on first use. In this case, execution will block until
  // the function's baseline tier has been compiled; top tier compilation then
  // starts in the background (if applicable).
| // Lazy compilation can help to reduce startup time and code size at the risk |
| // of blocking execution. |
| kLazy, |
| // Compiles baseline ahead of execution and starts top tier compilation in |
| // background (if applicable). |
| kEager, |
| // Triggers baseline compilation on first use (just like {kLazy}) with the |
| // difference that top tier compilation is started eagerly. |
| // This strategy can help to reduce startup time at the risk of blocking |
| // execution, but only in its early phase (until top tier compilation |
| // finishes). |
| kLazyBaselineEagerTopTier, |
| // Marker for default strategy. |
| kDefault = kEager, |
| }; |
| |
| class CompilationStateImpl; |
| |
| class BackgroundCompileScope { |
| public: |
| explicit BackgroundCompileScope(std::weak_ptr<NativeModule> native_module) |
| : native_module_(native_module.lock()) {} |
| |
| NativeModule* native_module() const { |
| DCHECK(native_module_); |
| return native_module_.get(); |
| } |
| inline CompilationStateImpl* compilation_state() const; |
| |
| bool cancelled() const; |
| |
| private: |
| // Keep the native module alive while in this scope. |
| std::shared_ptr<NativeModule> native_module_; |
| }; |
| |
| enum CompileBaselineOnly : bool { |
| kBaselineOnly = true, |
| kBaselineOrTopTier = false |
| }; |
| |
| // A set of work-stealing queues (vectors of units). Each background compile |
| // task owns one of the queues and steals from all others once its own queue |
| // runs empty. |
| class CompilationUnitQueues { |
| public: |
| // Public API for QueueImpl. |
| struct Queue { |
| bool ShouldPublish(int num_processed_units) const; |
| }; |
| |
| #if !defined(DISABLE_WASM_STARBOARD) |
| explicit CompilationUnitQueues(int num_declared_functions) |
| : num_declared_functions_(num_declared_functions) { |
    // Eagerly add the first queue, so that units can be added to it right
    // away.
| queues_.emplace_back(std::make_unique<QueueImpl>(0)); |
| |
| for (auto& atomic_counter : num_units_) { |
| std::atomic_init(&atomic_counter, size_t{0}); |
| } |
| |
| top_tier_compiled_ = |
| std::make_unique<std::atomic<bool>[]>(num_declared_functions); |
| |
| for (int i = 0; i < num_declared_functions; i++) { |
| std::atomic_init(&top_tier_compiled_.get()[i], false); |
| } |
| } |
| #else |
| explicit CompilationUnitQueues(int /*max_tasks*/) {} |
| #endif |
| |
| Queue* GetQueueForTask(int task_id) { |
| int required_queues = task_id + 1; |
| { |
| base::SharedMutexGuard<base::kShared> queues_guard(&queues_mutex_); |
| if (V8_LIKELY(static_cast<int>(queues_.size()) >= required_queues)) { |
| return queues_[task_id].get(); |
| } |
| } |
| |
| // Otherwise increase the number of queues. |
| base::SharedMutexGuard<base::kExclusive> queues_guard(&queues_mutex_); |
| int num_queues = static_cast<int>(queues_.size()); |
| while (num_queues < required_queues) { |
| int steal_from = num_queues + 1; |
| queues_.emplace_back(std::make_unique<QueueImpl>(steal_from)); |
| ++num_queues; |
| } |
| |
| // Update the {publish_limit}s of all queues. |
| |
| // We want background threads to publish regularly (to avoid contention when |
    // they are all publishing at the end). On the other hand, each publish
| // has some overhead (part of it for synchronizing between threads), so it |
| // should not happen *too* often. Thus aim for 4-8 publishes per thread, but |
| // distribute it such that publishing is likely to happen at different |
| // times. |
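    // Illustrative numbers (not from the original source): with 4000 declared
    // functions and 4 queues, {units_per_thread} is 1000 and {min} is 125,
    // giving per-queue limits of 125, 156, 187, and 218.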
| int units_per_thread = num_declared_functions_ / num_queues; |
| int min = std::max(10, units_per_thread / 8); |
| int queue_id = 0; |
| for (auto& queue : queues_) { |
| // Set a limit between {min} and {2*min}, but not smaller than {10}. |
| int limit = min + (min * queue_id / num_queues); |
| queue->publish_limit.store(limit, std::memory_order_relaxed); |
| ++queue_id; |
| } |
| |
| return queues_[task_id].get(); |
| } |
| |
| base::Optional<WasmCompilationUnit> GetNextUnit( |
| Queue* queue, CompileBaselineOnly baseline_only) { |
    // As long as any lower-tier units are outstanding, we need to steal them
    // before executing our own higher-tier units.
| int max_tier = baseline_only ? kBaseline : kTopTier; |
| for (int tier = GetLowestTierWithUnits(); tier <= max_tier; ++tier) { |
| if (auto unit = GetNextUnitOfTier(queue, tier)) { |
| size_t old_units_count = |
| num_units_[tier].fetch_sub(1, std::memory_order_relaxed); |
| DCHECK_LE(1, old_units_count); |
| USE(old_units_count); |
| return unit; |
| } |
| } |
| return {}; |
| } |
| |
| void AddUnits(Vector<WasmCompilationUnit> baseline_units, |
| Vector<WasmCompilationUnit> top_tier_units, |
| const WasmModule* module) { |
| DCHECK_LT(0, baseline_units.size() + top_tier_units.size()); |
| #if !defined(DISABLE_WASM_STARBOARD) |
| // Add to the individual queues in a round-robin fashion. No special care is |
| // taken to balance them; they will be balanced by work stealing. |
| QueueImpl* queue; |
| { |
| int queue_to_add = next_queue_to_add.load(std::memory_order_relaxed); |
| base::SharedMutexGuard<base::kShared> queues_guard(&queues_mutex_); |
| while (!next_queue_to_add.compare_exchange_weak( |
| queue_to_add, next_task_id(queue_to_add, queues_.size()), |
| std::memory_order_relaxed)) { |
| // Retry with updated {queue_to_add}. |
| } |
| queue = queues_[queue_to_add].get(); |
| } |
| |
| base::MutexGuard guard(&queue->mutex); |
| base::Optional<base::MutexGuard> big_units_guard; |
| for (auto pair : {std::make_pair(int{kBaseline}, baseline_units), |
| std::make_pair(int{kTopTier}, top_tier_units)}) { |
| int tier = pair.first; |
| Vector<WasmCompilationUnit> units = pair.second; |
| if (units.empty()) continue; |
| num_units_[tier].fetch_add(units.size(), std::memory_order_relaxed); |
| for (WasmCompilationUnit unit : units) { |
| size_t func_size = module->functions[unit.func_index()].code.length(); |
| if (func_size <= kBigUnitsLimit) { |
| queue->units[tier].push_back(unit); |
| } else { |
| if (!big_units_guard) { |
| big_units_guard.emplace(&big_units_queue_.mutex); |
| } |
| big_units_queue_.has_units[tier].store(true, |
| std::memory_order_relaxed); |
| big_units_queue_.units[tier].emplace(func_size, unit); |
| } |
| } |
| } |
| #endif |
| } |
| |
| void AddTopTierPriorityUnit(WasmCompilationUnit unit, size_t priority) { |
| base::SharedMutexGuard<base::kShared> queues_guard(&queues_mutex_); |
| // Add to the individual queues in a round-robin fashion. No special care is |
| // taken to balance them; they will be balanced by work stealing. We use |
| // the same counter for this reason. |
| int queue_to_add = next_queue_to_add.load(std::memory_order_relaxed); |
| while (!next_queue_to_add.compare_exchange_weak( |
| queue_to_add, next_task_id(queue_to_add, queues_.size()), |
| std::memory_order_relaxed)) { |
| // Retry with updated {queue_to_add}. |
| } |
| |
| { |
| auto* queue = queues_[queue_to_add].get(); |
| base::MutexGuard guard(&queue->mutex); |
| queue->top_tier_priority_units.emplace(priority, unit); |
| } |
| num_priority_units_.fetch_add(1, std::memory_order_relaxed); |
| num_units_[kTopTier].fetch_add(1, std::memory_order_relaxed); |
| } |
| |
| // Get the current total number of units in all queues. This is only a |
  // momentary snapshot; it's not guaranteed that {GetNextUnit} returns a unit
| // if this method returns non-zero. |
| size_t GetTotalSize() const { |
| size_t total = 0; |
| #if !defined(DISABLE_WASM_STARBOARD) |
| for (auto& atomic_counter : num_units_) { |
| total += atomic_counter.load(std::memory_order_relaxed); |
| } |
| #endif |
| return total; |
| } |
| |
| private: |
| // Store tier in int so we can easily loop over it: |
| static constexpr int kBaseline = 0; |
| static constexpr int kTopTier = 1; |
| static constexpr int kNumTiers = kTopTier + 1; |
| |
  // Functions bigger than {kBigUnitsLimit} bytes are compiled first, in
  // descending order of their function body size.
| static constexpr size_t kBigUnitsLimit = 4096; |
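  // For example, a function with a 10 KB body is routed to {big_units_queue_}
  // and picked up before regular units of the same tier (see
  // {GetNextUnitOfTier}).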
| |
| struct BigUnit { |
| BigUnit(size_t func_size, WasmCompilationUnit unit) |
| : func_size{func_size}, unit(unit) {} |
| |
| size_t func_size; |
| WasmCompilationUnit unit; |
| |
| bool operator<(const BigUnit& other) const { |
| return func_size < other.func_size; |
| } |
| }; |
| |
| struct TopTierPriorityUnit { |
    TopTierPriorityUnit(size_t priority, WasmCompilationUnit unit)
        : priority(priority), unit(unit) {}
| |
| size_t priority; |
| WasmCompilationUnit unit; |
| |
| bool operator<(const TopTierPriorityUnit& other) const { |
| return priority < other.priority; |
| } |
| }; |
| |
| struct BigUnitsQueue { |
| BigUnitsQueue() { |
| #if !defined(DISABLE_WASM_STARBOARD) |
| for (auto& atomic : has_units) std::atomic_init(&atomic, false); |
| #endif |
| } |
| |
| base::Mutex mutex; |
| |
| // Can be read concurrently to check whether any elements are in the queue. |
| std::atomic<bool> has_units[kNumTiers]; |
| |
| // Protected by {mutex}: |
| std::priority_queue<BigUnit> units[kNumTiers]; |
| }; |
| |
| struct QueueImpl : public Queue { |
| explicit QueueImpl(int next_steal_task_id) |
| : next_steal_task_id(next_steal_task_id) {} |
| |
| // Number of units after which the task processing this queue should publish |
| // compilation results. Updated (reduced, using relaxed ordering) when new |
| // queues are allocated. If there is only one thread running, we can delay |
| // publishing arbitrarily. |
| std::atomic<int> publish_limit{kMaxInt}; |
| |
| base::Mutex mutex; |
| |
| // All fields below are protected by {mutex}. |
| std::vector<WasmCompilationUnit> units[kNumTiers]; |
| std::priority_queue<TopTierPriorityUnit> top_tier_priority_units; |
| int next_steal_task_id; |
| }; |
| |
| int next_task_id(int task_id, size_t num_queues) const { |
| int next = task_id + 1; |
| return next == static_cast<int>(num_queues) ? 0 : next; |
| } |
| |
| int GetLowestTierWithUnits() const { |
| #if !defined(DISABLE_WASM_STARBOARD) |
| for (int tier = 0; tier < kNumTiers; ++tier) { |
| if (num_units_[tier].load(std::memory_order_relaxed) > 0) return tier; |
| } |
| #endif |
| return kNumTiers; |
| } |
| |
| base::Optional<WasmCompilationUnit> GetNextUnitOfTier(Queue* public_queue, |
| int tier) { |
| QueueImpl* queue = static_cast<QueueImpl*>(public_queue); |
| |
| // First check whether there is a priority unit. Execute that first. |
| if (tier == kTopTier) { |
| if (auto unit = GetTopTierPriorityUnit(queue)) { |
| return unit; |
| } |
| } |
| |
| // Then check whether there is a big unit of that tier. |
| if (auto unit = GetBigUnitOfTier(tier)) return unit; |
| |
| // Finally check whether our own queue has a unit of the wanted tier. If |
| // so, return it, otherwise get the task id to steal from. |
| int steal_task_id; |
| { |
| base::MutexGuard mutex_guard(&queue->mutex); |
| if (!queue->units[tier].empty()) { |
| auto unit = queue->units[tier].back(); |
| queue->units[tier].pop_back(); |
| return unit; |
| } |
| steal_task_id = queue->next_steal_task_id; |
| } |
| |
| // Try to steal from all other queues. If this succeeds, return one of the |
| // stolen units. |
| { |
| base::SharedMutexGuard<base::kShared> guard(&queues_mutex_); |
| for (size_t steal_trials = 0; steal_trials < queues_.size(); |
| ++steal_trials, ++steal_task_id) { |
| if (steal_task_id >= static_cast<int>(queues_.size())) { |
| steal_task_id = 0; |
| } |
| if (auto unit = StealUnitsAndGetFirst(queue, steal_task_id, tier)) { |
| return unit; |
| } |
| } |
| } |
| |
| // If we reach here, we didn't find any unit of the requested tier. |
| return {}; |
| } |
| |
| base::Optional<WasmCompilationUnit> GetBigUnitOfTier(int tier) { |
| #if !defined(DISABLE_WASM_STARBOARD) |
| // Fast path without locking. |
| if (!big_units_queue_.has_units[tier].load(std::memory_order_relaxed)) { |
| return {}; |
| } |
| #endif |
| base::MutexGuard guard(&big_units_queue_.mutex); |
| if (big_units_queue_.units[tier].empty()) return {}; |
| WasmCompilationUnit unit = big_units_queue_.units[tier].top().unit; |
| big_units_queue_.units[tier].pop(); |
| if (big_units_queue_.units[tier].empty()) { |
| big_units_queue_.has_units[tier].store(false, std::memory_order_relaxed); |
| } |
| return unit; |
| } |
| |
| base::Optional<WasmCompilationUnit> GetTopTierPriorityUnit(QueueImpl* queue) { |
| // Fast path without locking. |
| if (num_priority_units_.load(std::memory_order_relaxed) == 0) { |
| return {}; |
| } |
| |
| int steal_task_id; |
| { |
| base::MutexGuard mutex_guard(&queue->mutex); |
| while (!queue->top_tier_priority_units.empty()) { |
| auto unit = queue->top_tier_priority_units.top().unit; |
| queue->top_tier_priority_units.pop(); |
| num_priority_units_.fetch_sub(1, std::memory_order_relaxed); |
| |
| if (!top_tier_compiled_[unit.func_index()].exchange( |
| true, std::memory_order_relaxed)) { |
| return unit; |
| } |
| num_units_[kTopTier].fetch_sub(1, std::memory_order_relaxed); |
| } |
| steal_task_id = queue->next_steal_task_id; |
| } |
| |
| // Try to steal from all other queues. If this succeeds, return one of the |
| // stolen units. |
| { |
| base::SharedMutexGuard<base::kShared> guard(&queues_mutex_); |
| for (size_t steal_trials = 0; steal_trials < queues_.size(); |
| ++steal_trials, ++steal_task_id) { |
| if (steal_task_id >= static_cast<int>(queues_.size())) { |
| steal_task_id = 0; |
| } |
| if (auto unit = StealTopTierPriorityUnit(queue, steal_task_id)) { |
| return unit; |
| } |
| } |
| } |
| |
| return {}; |
| } |
| |
  // Steal units of {wanted_tier} from {steal_from_task_id} into {queue}.
  // Return the first stolen unit (the rest are put into {queue}), or
  // {nullopt} if {steal_from_task_id} had no units of {wanted_tier}.
| // Hold a shared lock on {queues_mutex_} when calling this method. |
| base::Optional<WasmCompilationUnit> StealUnitsAndGetFirst( |
| QueueImpl* queue, int steal_from_task_id, int wanted_tier) { |
| auto* steal_queue = queues_[steal_from_task_id].get(); |
| // Cannot steal from own queue. |
| if (steal_queue == queue) return {}; |
| std::vector<WasmCompilationUnit> stolen; |
| base::Optional<WasmCompilationUnit> returned_unit; |
| { |
| base::MutexGuard guard(&steal_queue->mutex); |
| auto* steal_from_vector = &steal_queue->units[wanted_tier]; |
| if (steal_from_vector->empty()) return {}; |
| size_t remaining = steal_from_vector->size() / 2; |
| auto steal_begin = steal_from_vector->begin() + remaining; |
| returned_unit = *steal_begin; |
| stolen.assign(steal_begin + 1, steal_from_vector->end()); |
| steal_from_vector->erase(steal_begin, steal_from_vector->end()); |
| } |
| base::MutexGuard guard(&queue->mutex); |
| auto* target_queue = &queue->units[wanted_tier]; |
| target_queue->insert(target_queue->end(), stolen.begin(), stolen.end()); |
| queue->next_steal_task_id = steal_from_task_id + 1; |
| return returned_unit; |
| } |
| |
  // Steal one priority unit from {steal_from_task_id} into {queue}. Return
  // the stolen unit, or {nullopt} if {steal_from_task_id} had no priority
  // units.
| // Hold a shared lock on {queues_mutex_} when calling this method. |
| base::Optional<WasmCompilationUnit> StealTopTierPriorityUnit( |
| QueueImpl* queue, int steal_from_task_id) { |
| auto* steal_queue = queues_[steal_from_task_id].get(); |
| // Cannot steal from own queue. |
| if (steal_queue == queue) return {}; |
| base::Optional<WasmCompilationUnit> returned_unit; |
| { |
| base::MutexGuard guard(&steal_queue->mutex); |
| while (true) { |
| if (steal_queue->top_tier_priority_units.empty()) return {}; |
| |
| auto unit = steal_queue->top_tier_priority_units.top().unit; |
| steal_queue->top_tier_priority_units.pop(); |
| num_priority_units_.fetch_sub(1, std::memory_order_relaxed); |
| |
| if (!top_tier_compiled_[unit.func_index()].exchange( |
| true, std::memory_order_relaxed)) { |
| returned_unit = unit; |
| break; |
| } |
| num_units_[kTopTier].fetch_sub(1, std::memory_order_relaxed); |
| } |
| } |
| base::MutexGuard guard(&queue->mutex); |
| queue->next_steal_task_id = steal_from_task_id + 1; |
| return returned_unit; |
| } |
| |
  // {queues_mutex_} protects {queues_}.
| base::SharedMutex queues_mutex_; |
| std::vector<std::unique_ptr<QueueImpl>> queues_; |
| |
| const int num_declared_functions_; |
| |
| BigUnitsQueue big_units_queue_; |
| |
| std::atomic<size_t> num_units_[kNumTiers]; |
| std::atomic<size_t> num_priority_units_{0}; |
| std::unique_ptr<std::atomic<bool>[]> top_tier_compiled_; |
| std::atomic<int> next_queue_to_add{0}; |
| }; |
| |
| bool CompilationUnitQueues::Queue::ShouldPublish( |
| int num_processed_units) const { |
| auto* queue = static_cast<const QueueImpl*>(this); |
| return num_processed_units >= |
| queue->publish_limit.load(std::memory_order_relaxed); |
| } |
| |
| // The {CompilationStateImpl} keeps track of the compilation state of the |
| // owning NativeModule, i.e. which functions are left to be compiled. |
| // It contains a task manager to allow parallel and asynchronous background |
| // compilation of functions. |
| // Its public interface {CompilationState} lives in compilation-environment.h. |
| class CompilationStateImpl { |
| public: |
| CompilationStateImpl(const std::shared_ptr<NativeModule>& native_module, |
| std::shared_ptr<Counters> async_counters); |
| |
| // Cancel all background compilation, without waiting for compile tasks to |
| // finish. |
| void CancelCompilation(); |
| bool cancelled() const; |
| |
  // Initialize compilation progress. Set the compilation tiers to expect for
  // baseline and top tier compilation. Must be called before
  // {AddCompilationUnits} is invoked, which triggers background compilation.
| void InitializeCompilationProgress(bool lazy_module, int num_import_wrappers, |
| int num_export_wrappers); |
| |
| // Initialize the compilation progress after deserialization. This is needed |
| // for recompilation (e.g. for tier down) to work later. |
| void InitializeCompilationProgressAfterDeserialization(); |
| |
  // Initialize recompilation of the whole module: Set up compilation progress
| // for recompilation and add the respective compilation units. The callback is |
| // called immediately if no recompilation is needed, or called later |
| // otherwise. |
| void InitializeRecompilation( |
| TieringState new_tiering_state, |
| CompilationState::callback_t recompilation_finished_callback); |
| |
| // Add the callback function to be called on compilation events. Needs to be |
| // set before {AddCompilationUnits} is run to ensure that it receives all |
| // events. The callback object must support being deleted from any thread. |
| void AddCallback(CompilationState::callback_t); |
| |
| // Inserts new functions to compile and kicks off compilation. |
| void AddCompilationUnits( |
| Vector<WasmCompilationUnit> baseline_units, |
| Vector<WasmCompilationUnit> top_tier_units, |
| Vector<std::shared_ptr<JSToWasmWrapperCompilationUnit>> |
| js_to_wasm_wrapper_units); |
| void AddTopTierCompilationUnit(WasmCompilationUnit); |
| void AddTopTierPriorityCompilationUnit(WasmCompilationUnit, size_t); |
| |
| CompilationUnitQueues::Queue* GetQueueForCompileTask(int task_id); |
| |
| base::Optional<WasmCompilationUnit> GetNextCompilationUnit( |
| CompilationUnitQueues::Queue*, CompileBaselineOnly); |
| |
| std::shared_ptr<JSToWasmWrapperCompilationUnit> |
| GetNextJSToWasmWrapperCompilationUnit(); |
| void FinalizeJSToWasmWrappers(Isolate* isolate, const WasmModule* module, |
| Handle<FixedArray>* export_wrappers_out); |
| |
| void OnFinishedUnits(Vector<WasmCode*>); |
| void OnFinishedJSToWasmWrapperUnits(int num); |
| |
| void OnCompilationStopped(const WasmFeatures& detected); |
| void PublishDetectedFeatures(Isolate*); |
| void SchedulePublishCompilationResults( |
| std::vector<std::unique_ptr<WasmCode>> unpublished_code); |
| // Ensure that a compilation job is running, and increase its concurrency if |
| // needed. |
| void ScheduleCompileJobForNewUnits(); |
| |
| size_t NumOutstandingCompilations() const; |
| |
| void SetError(); |
| |
| void WaitForCompilationEvent(CompilationEvent event); |
| |
| void SetHighPriority() { has_priority_ = true; } |
| |
| bool failed() const { |
| #if !defined(DISABLE_WASM_STARBOARD) |
| return compile_failed_.load(std::memory_order_relaxed); |
| #else |
| return false; |
| #endif |
| } |
| |
| bool baseline_compilation_finished() const { |
| base::MutexGuard guard(&callbacks_mutex_); |
| return outstanding_baseline_units_ == 0 && |
| outstanding_export_wrappers_ == 0; |
| } |
| |
| bool top_tier_compilation_finished() const { |
| base::MutexGuard guard(&callbacks_mutex_); |
| return outstanding_top_tier_functions_ == 0; |
| } |
| |
| bool recompilation_finished() const { |
| base::MutexGuard guard(&callbacks_mutex_); |
| return outstanding_recompilation_functions_ == 0; |
| } |
| |
| CompileMode compile_mode() const { return compile_mode_; } |
| Counters* counters() const { return async_counters_.get(); } |
| WasmFeatures* detected_features() { return &detected_features_; } |
| |
| void SetWireBytesStorage( |
| std::shared_ptr<WireBytesStorage> wire_bytes_storage) { |
| base::MutexGuard guard(&mutex_); |
| wire_bytes_storage_ = wire_bytes_storage; |
| } |
| |
| std::shared_ptr<WireBytesStorage> GetWireBytesStorage() const { |
| base::MutexGuard guard(&mutex_); |
| DCHECK_NOT_NULL(wire_bytes_storage_); |
| return wire_bytes_storage_; |
| } |
| |
| private: |
| // Trigger callbacks according to the internal counters below |
| // (outstanding_...), plus the given events. |
| // Hold the {callbacks_mutex_} when calling this method. |
| void TriggerCallbacks(base::EnumSet<CompilationEvent> additional_events = {}); |
| |
| void PublishCompilationResults( |
| std::vector<std::unique_ptr<WasmCode>> unpublished_code); |
| void PublishCode(Vector<std::unique_ptr<WasmCode>> codes); |
| |
| NativeModule* const native_module_; |
| std::weak_ptr<NativeModule> const native_module_weak_; |
| const CompileMode compile_mode_; |
| const std::shared_ptr<Counters> async_counters_; |
| |
| // Compilation error, atomically updated. This flag can be updated and read |
| // using relaxed semantics. |
| std::atomic<bool> compile_failed_{false}; |
| |
| // True if compilation was cancelled and worker threads should return. This |
| // flag can be updated and read using relaxed semantics. |
| std::atomic<bool> compile_cancelled_{false}; |
| |
| CompilationUnitQueues compilation_unit_queues_; |
| |
| // Index of the next wrapper to compile in {js_to_wasm_wrapper_units_}. |
| std::atomic<int> js_to_wasm_wrapper_id_{0}; |
| // Wrapper compilation units are stored in shared_ptrs so that they are kept |
| // alive by the tasks even if the NativeModule dies. |
| std::vector<std::shared_ptr<JSToWasmWrapperCompilationUnit>> |
| js_to_wasm_wrapper_units_; |
| |
| bool has_priority_ = false; |
| |
  // This mutex protects all information of this {CompilationStateImpl} that
  // is accessed concurrently.
| mutable base::Mutex mutex_; |
| |
| ////////////////////////////////////////////////////////////////////////////// |
| // Protected by {mutex_}: |
| |
| std::shared_ptr<JobHandle> current_compile_job_; |
| |
| // Features detected to be used in this module. Features can be detected |
| // as a module is being compiled. |
| WasmFeatures detected_features_ = WasmFeatures::None(); |
| |
| // Abstraction over the storage of the wire bytes. Held in a shared_ptr so |
| // that background compilation jobs can keep the storage alive while |
| // compiling. |
| std::shared_ptr<WireBytesStorage> wire_bytes_storage_; |
| |
| // End of fields protected by {mutex_}. |
| ////////////////////////////////////////////////////////////////////////////// |
| |
| // This mutex protects the callbacks vector, and the counters used to |
| // determine which callbacks to call. The counters plus the callbacks |
| // themselves need to be synchronized to ensure correct order of events. |
| mutable base::Mutex callbacks_mutex_; |
| |
| ////////////////////////////////////////////////////////////////////////////// |
| // Protected by {callbacks_mutex_}: |
| |
| // Callback functions to be called on compilation events. |
| std::vector<CompilationState::callback_t> callbacks_; |
| |
| // Events that already happened. |
| base::EnumSet<CompilationEvent> finished_events_; |
| |
| int outstanding_baseline_units_ = 0; |
| int outstanding_export_wrappers_ = 0; |
| int outstanding_top_tier_functions_ = 0; |
| std::vector<uint8_t> compilation_progress_; |
| |
| int outstanding_recompilation_functions_ = 0; |
| TieringState tiering_state_ = kTieredUp; |
| |
| // End of fields protected by {callbacks_mutex_}. |
| ////////////////////////////////////////////////////////////////////////////// |
| |
| // {publish_mutex_} protects {publish_queue_} and {publisher_running_}. |
| base::Mutex publish_mutex_; |
| std::vector<std::unique_ptr<WasmCode>> publish_queue_; |
| bool publisher_running_ = false; |
| |
| // Encoding of fields in the {compilation_progress_} vector. |
| using RequiredBaselineTierField = base::BitField8<ExecutionTier, 0, 2>; |
| using RequiredTopTierField = base::BitField8<ExecutionTier, 2, 2>; |
| using ReachedTierField = base::BitField8<ExecutionTier, 4, 2>; |
| using MissingRecompilationField = base::BitField8<bool, 6, 1>; |
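  // A {compilation_progress_} byte thus encodes, from the least significant
  // bit: required baseline tier (bits 0-1), required top tier (bits 2-3),
  // reached tier (bits 4-5), and a missing-recompilation flag (bit 6).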
| }; |
| |
| CompilationStateImpl* Impl(CompilationState* compilation_state) { |
| return reinterpret_cast<CompilationStateImpl*>(compilation_state); |
| } |
| const CompilationStateImpl* Impl(const CompilationState* compilation_state) { |
| return reinterpret_cast<const CompilationStateImpl*>(compilation_state); |
| } |
| |
| CompilationStateImpl* BackgroundCompileScope::compilation_state() const { |
| DCHECK(native_module_); |
| return Impl(native_module_->compilation_state()); |
| } |
| |
| bool BackgroundCompileScope::cancelled() const { |
| return native_module_ == nullptr || |
| Impl(native_module_->compilation_state())->cancelled(); |
| } |
| |
| void UpdateFeatureUseCounts(Isolate* isolate, const WasmFeatures& detected) { |
| using Feature = v8::Isolate::UseCounterFeature; |
| constexpr static std::pair<WasmFeature, Feature> kUseCounters[] = { |
| {kFeature_reftypes, Feature::kWasmRefTypes}, |
| {kFeature_bulk_memory, Feature::kWasmBulkMemory}, |
| {kFeature_mv, Feature::kWasmMultiValue}, |
| {kFeature_simd, Feature::kWasmSimdOpcodes}, |
| {kFeature_threads, Feature::kWasmThreadOpcodes}}; |
| |
| for (auto& feature : kUseCounters) { |
| if (detected.contains(feature.first)) isolate->CountUsage(feature.second); |
| } |
| } |
| |
| } // namespace |
| |
| // static |
| constexpr uint32_t CompilationEnv::kMaxMemoryPagesAtRuntime; |
| |
| ////////////////////////////////////////////////////// |
| // PIMPL implementation of {CompilationState}. |
| |
| CompilationState::~CompilationState() { Impl(this)->~CompilationStateImpl(); } |
| |
| void CompilationState::CancelCompilation() { Impl(this)->CancelCompilation(); } |
| |
| void CompilationState::SetError() { Impl(this)->SetError(); } |
| |
| void CompilationState::SetWireBytesStorage( |
| std::shared_ptr<WireBytesStorage> wire_bytes_storage) { |
| Impl(this)->SetWireBytesStorage(std::move(wire_bytes_storage)); |
| } |
| |
| std::shared_ptr<WireBytesStorage> CompilationState::GetWireBytesStorage() |
| const { |
| return Impl(this)->GetWireBytesStorage(); |
| } |
| |
| void CompilationState::AddCallback(CompilationState::callback_t callback) { |
| return Impl(this)->AddCallback(std::move(callback)); |
| } |
| |
| void CompilationState::WaitForTopTierFinished() { |
| // TODO(clemensb): Contribute to compilation while waiting. |
| auto top_tier_finished_semaphore = std::make_shared<base::Semaphore>(0); |
| AddCallback([top_tier_finished_semaphore](CompilationEvent event) { |
| if (event == CompilationEvent::kFailedCompilation || |
| event == CompilationEvent::kFinishedTopTierCompilation) { |
| top_tier_finished_semaphore->Signal(); |
| } |
| }); |
| top_tier_finished_semaphore->Wait(); |
| } |
| |
| void CompilationState::SetHighPriority() { Impl(this)->SetHighPriority(); } |
| |
| void CompilationState::InitializeAfterDeserialization() { |
| Impl(this)->InitializeCompilationProgressAfterDeserialization(); |
| } |
| |
| bool CompilationState::failed() const { return Impl(this)->failed(); } |
| |
| bool CompilationState::baseline_compilation_finished() const { |
| return Impl(this)->baseline_compilation_finished(); |
| } |
| |
| bool CompilationState::top_tier_compilation_finished() const { |
| return Impl(this)->top_tier_compilation_finished(); |
| } |
| |
| bool CompilationState::recompilation_finished() const { |
| return Impl(this)->recompilation_finished(); |
| } |
| |
| // static |
| std::unique_ptr<CompilationState> CompilationState::New( |
| const std::shared_ptr<NativeModule>& native_module, |
| std::shared_ptr<Counters> async_counters) { |
| return std::unique_ptr<CompilationState>( |
| reinterpret_cast<CompilationState*>(new CompilationStateImpl( |
| std::move(native_module), std::move(async_counters)))); |
| } |
| |
| // End of PIMPL implementation of {CompilationState}. |
| ////////////////////////////////////////////////////// |
| |
| namespace { |
| |
| ExecutionTier ApplyHintToExecutionTier(WasmCompilationHintTier hint, |
| ExecutionTier default_tier) { |
| switch (hint) { |
| case WasmCompilationHintTier::kDefault: |
| return default_tier; |
| case WasmCompilationHintTier::kBaseline: |
| return ExecutionTier::kLiftoff; |
| case WasmCompilationHintTier::kOptimized: |
| return ExecutionTier::kTurbofan; |
| } |
| UNREACHABLE(); |
| } |
| |
| const WasmCompilationHint* GetCompilationHint(const WasmModule* module, |
| uint32_t func_index) { |
| DCHECK_LE(module->num_imported_functions, func_index); |
| uint32_t hint_index = declared_function_index(module, func_index); |
| const std::vector<WasmCompilationHint>& compilation_hints = |
| module->compilation_hints; |
| if (hint_index < compilation_hints.size()) { |
| return &compilation_hints[hint_index]; |
| } |
| return nullptr; |
| } |
| |
| CompileStrategy GetCompileStrategy(const WasmModule* module, |
| const WasmFeatures& enabled_features, |
| uint32_t func_index, bool lazy_module) { |
| if (lazy_module) return CompileStrategy::kLazy; |
| if (!enabled_features.has_compilation_hints()) { |
| return CompileStrategy::kDefault; |
| } |
| auto* hint = GetCompilationHint(module, func_index); |
| if (hint == nullptr) return CompileStrategy::kDefault; |
| switch (hint->strategy) { |
| case WasmCompilationHintStrategy::kLazy: |
| return CompileStrategy::kLazy; |
| case WasmCompilationHintStrategy::kEager: |
| return CompileStrategy::kEager; |
| case WasmCompilationHintStrategy::kLazyBaselineEagerTopTier: |
| return CompileStrategy::kLazyBaselineEagerTopTier; |
| case WasmCompilationHintStrategy::kDefault: |
| return CompileStrategy::kDefault; |
| } |
| } |
| |
| struct ExecutionTierPair { |
| ExecutionTier baseline_tier; |
| ExecutionTier top_tier; |
| }; |
| |
| ExecutionTierPair GetRequestedExecutionTiers( |
| const WasmModule* module, CompileMode compile_mode, |
| const WasmFeatures& enabled_features, uint32_t func_index) { |
| ExecutionTierPair result; |
| |
| result.baseline_tier = WasmCompilationUnit::GetBaselineExecutionTier(module); |
| switch (compile_mode) { |
| case CompileMode::kRegular: |
| result.top_tier = result.baseline_tier; |
| return result; |
| |
| case CompileMode::kTiering: |
| |
| // Default tiering behaviour. |
| result.top_tier = ExecutionTier::kTurbofan; |
| |
| // Check if compilation hints override default tiering behaviour. |
| if (enabled_features.has_compilation_hints()) { |
| const WasmCompilationHint* hint = |
| GetCompilationHint(module, func_index); |
| if (hint != nullptr) { |
| result.baseline_tier = ApplyHintToExecutionTier(hint->baseline_tier, |
| result.baseline_tier); |
| result.top_tier = |
| ApplyHintToExecutionTier(hint->top_tier, result.top_tier); |
| } |
| } |
| |
| // Correct top tier if necessary. |
| static_assert(ExecutionTier::kLiftoff < ExecutionTier::kTurbofan, |
| "Assume an order on execution tiers"); |
| if (result.baseline_tier > result.top_tier) { |
| result.top_tier = result.baseline_tier; |
| } |
| return result; |
| } |
| UNREACHABLE(); |
| } |
| |
| // The {CompilationUnitBuilder} builds compilation units and stores them in an |
| // internal buffer. The buffer is moved into the working queue of the |
| // {CompilationStateImpl} when {Commit} is called. |
| class CompilationUnitBuilder { |
| public: |
| explicit CompilationUnitBuilder(NativeModule* native_module) |
| : native_module_(native_module) {} |
| |
| void AddUnits(uint32_t func_index) { |
| if (func_index < native_module_->module()->num_imported_functions) { |
| baseline_units_.emplace_back(func_index, ExecutionTier::kNone, |
| kNoDebugging); |
| return; |
| } |
| ExecutionTierPair tiers = GetRequestedExecutionTiers( |
| native_module_->module(), compilation_state()->compile_mode(), |
| native_module_->enabled_features(), func_index); |
| // Compile everything for non-debugging initially. If needed, we will tier |
| // down when the module is fully compiled. Synchronization would be pretty |
| // difficult otherwise. |
| baseline_units_.emplace_back(func_index, tiers.baseline_tier, kNoDebugging); |
| if (tiers.baseline_tier != tiers.top_tier) { |
| tiering_units_.emplace_back(func_index, tiers.top_tier, kNoDebugging); |
| } |
| } |
| |
| void AddJSToWasmWrapperUnit( |
| std::shared_ptr<JSToWasmWrapperCompilationUnit> unit) { |
| js_to_wasm_wrapper_units_.emplace_back(std::move(unit)); |
| } |
| |
| void AddTopTierUnit(int func_index) { |
| ExecutionTierPair tiers = GetRequestedExecutionTiers( |
| native_module_->module(), compilation_state()->compile_mode(), |
| native_module_->enabled_features(), func_index); |
| // In this case, the baseline is lazily compiled, if at all. The compilation |
| // unit is added even if the baseline tier is the same. |
| #ifdef DEBUG |
| auto* module = native_module_->module(); |
| DCHECK_EQ(kWasmOrigin, module->origin); |
| const bool lazy_module = false; |
| DCHECK_EQ(CompileStrategy::kLazyBaselineEagerTopTier, |
| GetCompileStrategy(module, native_module_->enabled_features(), |
| func_index, lazy_module)); |
| #endif |
| tiering_units_.emplace_back(func_index, tiers.top_tier, kNoDebugging); |
| } |
| |
| void AddRecompilationUnit(int func_index, ExecutionTier tier) { |
| // For recompilation, just treat all units like baseline units. |
| baseline_units_.emplace_back( |
| func_index, tier, |
| tier == ExecutionTier::kLiftoff ? kForDebugging : kNoDebugging); |
| } |
| |
| bool Commit() { |
| if (baseline_units_.empty() && tiering_units_.empty() && |
| js_to_wasm_wrapper_units_.empty()) { |
| return false; |
| } |
| compilation_state()->AddCompilationUnits( |
| VectorOf(baseline_units_), VectorOf(tiering_units_), |
| VectorOf(js_to_wasm_wrapper_units_)); |
| Clear(); |
| return true; |
| } |
| |
| void Clear() { |
| baseline_units_.clear(); |
| tiering_units_.clear(); |
| js_to_wasm_wrapper_units_.clear(); |
| } |
| |
| private: |
| CompilationStateImpl* compilation_state() const { |
| return Impl(native_module_->compilation_state()); |
| } |
| |
| NativeModule* const native_module_; |
| std::vector<WasmCompilationUnit> baseline_units_; |
| std::vector<WasmCompilationUnit> tiering_units_; |
| std::vector<std::shared_ptr<JSToWasmWrapperCompilationUnit>> |
| js_to_wasm_wrapper_units_; |
| }; |
| |
| void SetCompileError(ErrorThrower* thrower, ModuleWireBytes wire_bytes, |
| const WasmFunction* func, const WasmModule* module, |
| WasmError error) { |
| WasmName name = wire_bytes.GetNameOrNull(func, module); |
| if (name.begin() == nullptr) { |
| thrower->CompileError("Compiling function #%d failed: %s @+%u", |
| func->func_index, error.message().c_str(), |
| error.offset()); |
| } else { |
| TruncatedUserString<> truncated_name(name); |
| thrower->CompileError("Compiling function #%d:\"%.*s\" failed: %s @+%u", |
| func->func_index, truncated_name.length(), |
| truncated_name.start(), error.message().c_str(), |
| error.offset()); |
| } |
| } |
| |
| DecodeResult ValidateSingleFunction(const WasmModule* module, int func_index, |
| Vector<const uint8_t> code, |
| Counters* counters, |
| AccountingAllocator* allocator, |
| WasmFeatures enabled_features) { |
| const WasmFunction* func = &module->functions[func_index]; |
| FunctionBody body{func->sig, func->code.offset(), code.begin(), code.end()}; |
| |
| WasmFeatures detected; |
| return VerifyWasmCode(allocator, enabled_features, module, &detected, body); |
| } |
| |
| enum OnlyLazyFunctions : bool { |
| kAllFunctions = false, |
| kOnlyLazyFunctions = true, |
| }; |
| |
| void ValidateSequentially( |
| const WasmModule* module, NativeModule* native_module, Counters* counters, |
| AccountingAllocator* allocator, ErrorThrower* thrower, bool lazy_module, |
| OnlyLazyFunctions only_lazy_functions = kAllFunctions) { |
| DCHECK(!thrower->error()); |
| uint32_t start = module->num_imported_functions; |
| uint32_t end = start + module->num_declared_functions; |
| auto enabled_features = native_module->enabled_features(); |
| for (uint32_t func_index = start; func_index < end; func_index++) { |
| // Skip non-lazy functions if requested. |
| if (only_lazy_functions) { |
| CompileStrategy strategy = |
| GetCompileStrategy(module, enabled_features, func_index, lazy_module); |
| if (strategy != CompileStrategy::kLazy && |
| strategy != CompileStrategy::kLazyBaselineEagerTopTier) { |
| continue; |
| } |
| } |
| |
| ModuleWireBytes wire_bytes{native_module->wire_bytes()}; |
| const WasmFunction* func = &module->functions[func_index]; |
| Vector<const uint8_t> code = wire_bytes.GetFunctionBytes(func); |
| DecodeResult result = ValidateSingleFunction( |
| module, func_index, code, counters, allocator, enabled_features); |
| if (result.failed()) { |
| SetCompileError(thrower, wire_bytes, func, module, result.error()); |
| } |
| } |
| } |
| |
| bool IsLazyModule(const WasmModule* module) { |
| return FLAG_wasm_lazy_compilation || |
| (FLAG_asm_wasm_lazy_compilation && is_asmjs_module(module)); |
| } |
| |
| } // namespace |
| |
| bool CompileLazy(Isolate* isolate, NativeModule* native_module, |
| int func_index) { |
| const WasmModule* module = native_module->module(); |
| auto enabled_features = native_module->enabled_features(); |
| Counters* counters = isolate->counters(); |
| |
| DCHECK(!native_module->lazy_compile_frozen()); |
| NativeModuleModificationScope native_module_modification_scope(native_module); |
| |
| TRACE_LAZY("Compiling wasm-function#%d.\n", func_index); |
| |
| CompilationStateImpl* compilation_state = |
| Impl(native_module->compilation_state()); |
| ExecutionTierPair tiers = GetRequestedExecutionTiers( |
| module, compilation_state->compile_mode(), enabled_features, func_index); |
| |
| DCHECK_LE(native_module->num_imported_functions(), func_index); |
| DCHECK_LT(func_index, native_module->num_functions()); |
| WasmCompilationUnit baseline_unit{func_index, tiers.baseline_tier, |
| kNoDebugging}; |
| CompilationEnv env = native_module->CreateCompilationEnv(); |
| WasmCompilationResult result = baseline_unit.ExecuteCompilation( |
| isolate->wasm_engine(), &env, compilation_state->GetWireBytesStorage(), |
| counters, compilation_state->detected_features()); |
| |
| // During lazy compilation, we can only get compilation errors when |
| // {--wasm-lazy-validation} is enabled. Otherwise, the module was fully |
| // verified before starting its execution. |
| CHECK_IMPLIES(result.failed(), FLAG_wasm_lazy_validation); |
| const WasmFunction* func = &module->functions[func_index]; |
| if (result.failed()) { |
| ErrorThrower thrower(isolate, nullptr); |
| Vector<const uint8_t> code = |
| compilation_state->GetWireBytesStorage()->GetCode(func->code); |
| DecodeResult decode_result = ValidateSingleFunction( |
| module, func_index, code, counters, isolate->wasm_engine()->allocator(), |
| enabled_features); |
| CHECK(decode_result.failed()); |
| SetCompileError(&thrower, ModuleWireBytes(native_module->wire_bytes()), |
| func, module, decode_result.error()); |
| return false; |
| } |
| |
| WasmCodeRefScope code_ref_scope; |
| WasmCode* code = native_module->PublishCode( |
| native_module->AddCompiledCode(std::move(result))); |
| DCHECK_EQ(func_index, code->index()); |
| |
| if (WasmCode::ShouldBeLogged(isolate)) code->LogCode(isolate); |
| |
| counters->wasm_lazily_compiled_functions()->Increment(); |
| |
| const bool lazy_module = IsLazyModule(module); |
| if (GetCompileStrategy(module, enabled_features, func_index, lazy_module) == |
| CompileStrategy::kLazy && |
| tiers.baseline_tier < tiers.top_tier) { |
| WasmCompilationUnit tiering_unit{func_index, tiers.top_tier, kNoDebugging}; |
| compilation_state->AddTopTierCompilationUnit(tiering_unit); |
| } |
| |
| return true; |
| } |
| |
| void TriggerTierUp(Isolate* isolate, NativeModule* native_module, |
| int func_index) { |
| CompilationStateImpl* compilation_state = |
| Impl(native_module->compilation_state()); |
| WasmCompilationUnit tiering_unit{func_index, ExecutionTier::kTurbofan, |
| kNoDebugging}; |
| |
| uint32_t* call_array = native_module->num_liftoff_function_calls_array(); |
| int offset = |
| wasm::declared_function_index(native_module->module(), func_index); |
| |
| size_t priority = |
| base::Relaxed_Load(reinterpret_cast<int*>(&call_array[offset])); |
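  // {priority} is the number of recorded Liftoff calls to this function, so
  // hotter functions are tiered up first (see {TopTierPriorityUnit}).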
| compilation_state->AddTopTierPriorityCompilationUnit(tiering_unit, priority); |
| } |
| |
| namespace { |
| |
| void RecordStats(const Code code, Counters* counters) { |
| counters->wasm_generated_code_size()->Increment(code.raw_body_size()); |
| counters->wasm_reloc_size()->Increment(code.relocation_info().length()); |
| } |
| |
| enum CompilationExecutionResult : int8_t { kNoMoreUnits, kYield }; |
| |
| CompilationExecutionResult ExecuteJSToWasmWrapperCompilationUnits( |
| std::weak_ptr<NativeModule> native_module, JobDelegate* delegate) { |
| std::shared_ptr<JSToWasmWrapperCompilationUnit> wrapper_unit = nullptr; |
| int num_processed_wrappers = 0; |
| |
| { |
| BackgroundCompileScope compile_scope(native_module); |
| if (compile_scope.cancelled()) return kNoMoreUnits; |
| wrapper_unit = compile_scope.compilation_state() |
| ->GetNextJSToWasmWrapperCompilationUnit(); |
| if (!wrapper_unit) return kNoMoreUnits; |
| } |
| |
| TRACE_EVENT0("v8.wasm", "wasm.JSToWasmWrapperCompilation"); |
| while (true) { |
| wrapper_unit->Execute(); |
| ++num_processed_wrappers; |
| bool yield = delegate && delegate->ShouldYield(); |
| BackgroundCompileScope compile_scope(native_module); |
| if (compile_scope.cancelled()) return kNoMoreUnits; |
| if (yield || |
| !(wrapper_unit = compile_scope.compilation_state() |
| ->GetNextJSToWasmWrapperCompilationUnit())) { |
| compile_scope.compilation_state()->OnFinishedJSToWasmWrapperUnits( |
| num_processed_wrappers); |
| return yield ? kYield : kNoMoreUnits; |
| } |
| } |
| } |
| |
| namespace { |
| const char* GetCompilationEventName(const WasmCompilationUnit& unit, |
| const CompilationEnv& env) { |
| ExecutionTier tier = unit.tier(); |
| if (tier == ExecutionTier::kLiftoff) { |
| return "wasm.BaselineCompilation"; |
| } |
| if (tier == ExecutionTier::kTurbofan) { |
| return "wasm.TopTierCompilation"; |
| } |
| if (unit.func_index() < |
| static_cast<int>(env.module->num_imported_functions)) { |
| return "wasm.WasmToJSWrapperCompilation"; |
| } |
| return "wasm.OtherCompilation"; |
| } |
| } // namespace |
| |
| // Run by the {BackgroundCompileJob} (on any thread). |
| CompilationExecutionResult ExecuteCompilationUnits( |
| std::weak_ptr<NativeModule> native_module, Counters* counters, |
| JobDelegate* delegate, CompileBaselineOnly baseline_only) { |
| TRACE_EVENT0("v8.wasm", "wasm.ExecuteCompilationUnits"); |
| |
  // Execute JS to Wasm wrapper units first, so that they are ready to be
  // finalized by the main thread when the kFinishedExportWrappers event is
  // triggered.
| if (ExecuteJSToWasmWrapperCompilationUnits(native_module, delegate) == |
| kYield) { |
| return kYield; |
| } |
| |
| // These fields are initialized in a {BackgroundCompileScope} before |
| // starting compilation. |
| base::Optional<CompilationEnv> env; |
| std::shared_ptr<WireBytesStorage> wire_bytes; |
| std::shared_ptr<const WasmModule> module; |
| WasmEngine* wasm_engine; |
| // Task 0 is any main thread (there might be multiple from multiple isolates), |
| // worker threads start at 1 (thus the "+ 1"). |
| int task_id = delegate ? (int{delegate->GetTaskId()} + 1) : 0; |
| DCHECK_LE(0, task_id); |
| CompilationUnitQueues::Queue* queue; |
| base::Optional<WasmCompilationUnit> unit; |
| |
| WasmFeatures detected_features = WasmFeatures::None(); |
| |
| // Preparation (synchronized): Initialize the fields above and get the first |
| // compilation unit. |
| { |
| BackgroundCompileScope compile_scope(native_module); |
| if (compile_scope.cancelled()) return kNoMoreUnits; |
| auto* compilation_state = compile_scope.compilation_state(); |
| env.emplace(compile_scope.native_module()->CreateCompilationEnv()); |
| wire_bytes = compilation_state->GetWireBytesStorage(); |
| module = compile_scope.native_module()->shared_module(); |
| wasm_engine = compile_scope.native_module()->engine(); |
| queue = compilation_state->GetQueueForCompileTask(task_id); |
| unit = compilation_state->GetNextCompilationUnit(queue, baseline_only); |
| if (!unit) return kNoMoreUnits; |
| } |
| TRACE_COMPILE("ExecuteCompilationUnits (task id %d)\n", task_id); |
| |
| std::vector<WasmCompilationResult> results_to_publish; |
| while (true) { |
| ExecutionTier current_tier = unit->tier(); |
| const char* event_name = GetCompilationEventName(unit.value(), env.value()); |
| TRACE_EVENT0("v8.wasm", event_name); |
| while (unit->tier() == current_tier) { |
| // (asynchronous): Execute the compilation. |
| WasmCompilationResult result = unit->ExecuteCompilation( |
| wasm_engine, &env.value(), wire_bytes, counters, &detected_features); |
| results_to_publish.emplace_back(std::move(result)); |
| |
| bool yield = delegate && delegate->ShouldYield(); |
| |
| // (synchronized): Publish the compilation result and get the next unit. |
| BackgroundCompileScope compile_scope(native_module); |
| if (compile_scope.cancelled()) return kNoMoreUnits; |
| |
| if (!results_to_publish.back().succeeded()) { |
| compile_scope.compilation_state()->SetError(); |
| return kNoMoreUnits; |
| } |
| |
| // Yield or get next unit. |
| if (yield || |
| !(unit = compile_scope.compilation_state()->GetNextCompilationUnit( |
| queue, baseline_only))) { |
| std::vector<std::unique_ptr<WasmCode>> unpublished_code = |
| compile_scope.native_module()->AddCompiledCode( |
| VectorOf(std::move(results_to_publish))); |
| results_to_publish.clear(); |
| compile_scope.compilation_state()->SchedulePublishCompilationResults( |
| std::move(unpublished_code)); |
| compile_scope.compilation_state()->OnCompilationStopped( |
| detected_features); |
| return yield ? kYield : kNoMoreUnits; |
| } |
| |
| // Before executing a TurboFan unit, ensure to publish all previous |
| // units. If we compiled Liftoff before, we need to publish them anyway |
      // to ensure fast completion of baseline compilation; if we compiled
| // TurboFan before, we publish to reduce peak memory consumption. |
| // Also publish after finishing a certain amount of units, to avoid |
| // contention when all threads publish at the end. |
| if (unit->tier() == ExecutionTier::kTurbofan || |
| queue->ShouldPublish(static_cast<int>(results_to_publish.size()))) { |
| std::vector<std::unique_ptr<WasmCode>> unpublished_code = |
| compile_scope.native_module()->AddCompiledCode( |
| VectorOf(std::move(results_to_publish))); |
| results_to_publish.clear(); |
| compile_scope.compilation_state()->SchedulePublishCompilationResults( |
| std::move(unpublished_code)); |
| } |
| } |
| } |
| UNREACHABLE(); |
| } |
| |
| using JSToWasmWrapperKey = std::pair<bool, FunctionSig>; |
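// The {bool} component is {WasmFunction::imported}; export wrappers are
// shared across all exports with the same (imported, signature) pair (see
// {AddExportWrapperUnits} below).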
| |
| // Returns the number of units added. |
| int AddExportWrapperUnits(Isolate* isolate, WasmEngine* wasm_engine, |
| NativeModule* native_module, |
| CompilationUnitBuilder* builder, |
| const WasmFeatures& enabled_features) { |
| std::unordered_set<JSToWasmWrapperKey, base::hash<JSToWasmWrapperKey>> keys; |
| for (auto exp : native_module->module()->export_table) { |
| if (exp.kind != kExternalFunction) continue; |
| auto& function = native_module->module()->functions[exp.index]; |
| JSToWasmWrapperKey key(function.imported, *function.sig); |
| if (keys.insert(key).second) { |
| auto unit = std::make_shared<JSToWasmWrapperCompilationUnit>( |
| isolate, wasm_engine, function.sig, native_module->module(), |
| function.imported, enabled_features, |
| JSToWasmWrapperCompilationUnit::kAllowGeneric); |
| builder->AddJSToWasmWrapperUnit(std::move(unit)); |
| } |
| } |
| |
| return static_cast<int>(keys.size()); |
| } |
| |
| // Returns the number of units added. |
| int AddImportWrapperUnits(NativeModule* native_module, |
| CompilationUnitBuilder* builder) { |
| std::unordered_set<WasmImportWrapperCache::CacheKey, |
| WasmImportWrapperCache::CacheKeyHash> |
| keys; |
| int num_imported_functions = native_module->num_imported_functions(); |
| for (int func_index = 0; func_index < num_imported_functions; func_index++) { |
| const FunctionSig* sig = native_module->module()->functions[func_index].sig; |
| if (!IsJSCompatibleSignature(sig, native_module->module(), |
| native_module->enabled_features())) { |
| continue; |
| } |
| WasmImportWrapperCache::CacheKey key( |
| compiler::kDefaultImportCallKind, sig, |
| static_cast<int>(sig->parameter_count())); |
| auto it = keys.insert(key); |
| if (it.second) { |
| // Ensure that all keys exist in the cache, so that we can populate the |
| // cache later without locking. |
| (*native_module->import_wrapper_cache())[key] = nullptr; |
| builder->AddUnits(func_index); |
| } |
| } |
| return static_cast<int>(keys.size()); |
| } |
| |
| void InitializeCompilationUnits(Isolate* isolate, NativeModule* native_module) { |
| CompilationStateImpl* compilation_state = |
| Impl(native_module->compilation_state()); |
| const bool lazy_module = IsLazyModule(native_module->module()); |
| ModuleWireBytes wire_bytes(native_module->wire_bytes()); |
| CompilationUnitBuilder builder(native_module); |
| auto* module = native_module->module(); |
| const bool prefer_liftoff = native_module->IsTieredDown(); |
| |
| uint32_t start = module->num_imported_functions; |
| uint32_t end = start + module->num_declared_functions; |
| for (uint32_t func_index = start; func_index < end; func_index++) { |
| if (prefer_liftoff) { |
| builder.AddRecompilationUnit(func_index, ExecutionTier::kLiftoff); |
| continue; |
| } |
| CompileStrategy strategy = GetCompileStrategy( |
| module, native_module->enabled_features(), func_index, lazy_module); |
| if (strategy == CompileStrategy::kLazy) { |
| native_module->UseLazyStub(func_index); |
| } else if (strategy == CompileStrategy::kLazyBaselineEagerTopTier) { |
| builder.AddTopTierUnit(func_index); |
| native_module->UseLazyStub(func_index); |
| } else { |
| DCHECK_EQ(strategy, CompileStrategy::kEager); |
| builder.AddUnits(func_index); |
| } |
| } |
| int num_import_wrappers = AddImportWrapperUnits(native_module, &builder); |
| int num_export_wrappers = |
| AddExportWrapperUnits(isolate, isolate->wasm_engine(), native_module, |
| &builder, WasmFeatures::FromIsolate(isolate)); |
| compilation_state->InitializeCompilationProgress( |
| lazy_module, num_import_wrappers, num_export_wrappers); |
| builder.Commit(); |
| } |
| |
| bool MayCompriseLazyFunctions(const WasmModule* module, |
| const WasmFeatures& enabled_features, |
| bool lazy_module) { |
| if (lazy_module || enabled_features.has_compilation_hints()) return true; |
| #ifdef ENABLE_SLOW_DCHECKS |
| int start = module->num_imported_functions; |
| int end = start + module->num_declared_functions; |
| for (int func_index = start; func_index < end; func_index++) { |
| SLOW_DCHECK(GetCompileStrategy(module, enabled_features, func_index, |
| lazy_module) != CompileStrategy::kLazy); |
| } |
| #endif |
| return false; |
| } |
| |
| class CompilationTimeCallback { |
| public: |
| enum CompileMode { kSynchronous, kAsync, kStreaming }; |
| explicit CompilationTimeCallback( |
| std::shared_ptr<Counters> async_counters, |
| std::shared_ptr<metrics::Recorder> metrics_recorder, |
| v8::metrics::Recorder::ContextId context_id, |
| std::weak_ptr<NativeModule> native_module, CompileMode compile_mode) |
| : start_time_(base::TimeTicks::Now()), |
| async_counters_(std::move(async_counters)), |
| metrics_recorder_(std::move(metrics_recorder)), |
| context_id_(context_id), |
| native_module_(std::move(native_module)), |
| compile_mode_(compile_mode) {} |
| |
| void operator()(CompilationEvent event) { |
| DCHECK(base::TimeTicks::IsHighResolution()); |
| std::shared_ptr<NativeModule> native_module = native_module_.lock(); |
| if (!native_module) return; |
| auto now = base::TimeTicks::Now(); |
| auto duration = now - start_time_; |
| if (event == CompilationEvent::kFinishedBaselineCompilation) { |
| // Reset {start_time_} to measure tier-up time. |
| start_time_ = now; |
| if (compile_mode_ != kSynchronous) { |
| TimedHistogram* histogram = |
| compile_mode_ == kAsync |
| ? async_counters_->wasm_async_compile_wasm_module_time() |
| : async_counters_->wasm_streaming_compile_wasm_module_time(); |
| histogram->AddSample(static_cast<int>(duration.InMicroseconds())); |
| } |
| |
| // TODO(sartang@microsoft.com): Remove wall_clock_time_in_us field |
| v8::metrics::WasmModuleCompiled event{ |
| (compile_mode_ != kSynchronous), // async |
| (compile_mode_ == kStreaming), // streamed |
| false, // cached |
| false, // deserialized |
| FLAG_wasm_lazy_compilation, // lazy |
| true, // success |
| native_module->liftoff_code_size(), // code_size_in_bytes |
| native_module->liftoff_bailout_count(), // liftoff_bailout_count |
| duration.InMicroseconds(), // wall_clock_time_in_us |
| duration.InMicroseconds() // wall_clock_duration_in_us |
| }; |
| metrics_recorder_->DelayMainThreadEvent(event, context_id_); |
| } |
| if (event == CompilationEvent::kFinishedTopTierCompilation) { |
| TimedHistogram* histogram = async_counters_->wasm_tier_up_module_time(); |
| histogram->AddSample(static_cast<int>(duration.InMicroseconds())); |
| |
| v8::metrics::WasmModuleTieredUp event{ |
| FLAG_wasm_lazy_compilation, // lazy |
| native_module->turbofan_code_size(), // code_size_in_bytes |
| duration.InMicroseconds(), // wall_clock_time_in_us |
| duration.InMicroseconds() // wall_clock_duration_in_us |
| }; |
| metrics_recorder_->DelayMainThreadEvent(event, context_id_); |
| } |
| if (event == CompilationEvent::kFailedCompilation) { |
| v8::metrics::WasmModuleCompiled event{ |
| (compile_mode_ != kSynchronous), // async |
| (compile_mode_ == kStreaming), // streamed |
| false, // cached |
| false, // deserialized |
| FLAG_wasm_lazy_compilation, // lazy |
| false, // success |
| native_module->liftoff_code_size(), // code_size_in_bytes |
| native_module->liftoff_bailout_count(), // liftoff_bailout_count |
| duration.InMicroseconds(), // wall_clock_time_in_us |
| duration.InMicroseconds() // wall_clock_duration_in_us |
| }; |
| metrics_recorder_->DelayMainThreadEvent(event, context_id_); |
| } |
| } |
| |
| private: |
| base::TimeTicks start_time_; |
| const std::shared_ptr<Counters> async_counters_; |
| std::shared_ptr<metrics::Recorder> metrics_recorder_; |
| v8::metrics::Recorder::ContextId context_id_; |
| std::weak_ptr<NativeModule> native_module_; |
| const CompileMode compile_mode_; |
| }; |
| |
| void CompileNativeModule(Isolate* isolate, |
| v8::metrics::Recorder::ContextId context_id, |
| ErrorThrower* thrower, const WasmModule* wasm_module, |
| std::shared_ptr<NativeModule> native_module, |
| Handle<FixedArray>* export_wrappers_out) { |
| CHECK(!FLAG_jitless); |
| ModuleWireBytes wire_bytes(native_module->wire_bytes()); |
| const bool lazy_module = IsLazyModule(wasm_module); |
| if (!FLAG_wasm_lazy_validation && wasm_module->origin == kWasmOrigin && |
| MayCompriseLazyFunctions(wasm_module, native_module->enabled_features(), |
| lazy_module)) { |
| // Validate wasm modules for lazy compilation if requested. Never validate |
| // asm.js modules as these are valid by construction (additionally a CHECK |
| // will catch this during lazy compilation). |
| ValidateSequentially(wasm_module, native_module.get(), isolate->counters(), |
| isolate->allocator(), thrower, lazy_module, |
| kOnlyLazyFunctions); |
| // On error: Return and leave the module in an unexecutable state. |
| if (thrower->error()) return; |
| } |
| |
| DCHECK_GE(kMaxInt, native_module->module()->num_declared_functions); |
| |
// Install a {CompilationTimeCallback} to record compile times, if
// high-resolution timers are available.
| auto* compilation_state = Impl(native_module->compilation_state()); |
| if (base::TimeTicks::IsHighResolution()) { |
| compilation_state->AddCallback(CompilationTimeCallback{ |
| isolate->async_counters(), isolate->metrics_recorder(), context_id, |
| native_module, CompilationTimeCallback::kSynchronous}); |
| } |
| |
| // Initialize the compilation units and kick off background compile tasks. |
| InitializeCompilationUnits(isolate, native_module.get()); |
| |
| compilation_state->WaitForCompilationEvent( |
| CompilationEvent::kFinishedExportWrappers); |
| |
| if (compilation_state->failed()) { |
| DCHECK_IMPLIES(lazy_module, !FLAG_wasm_lazy_validation); |
| ValidateSequentially(wasm_module, native_module.get(), isolate->counters(), |
| isolate->allocator(), thrower, lazy_module); |
| CHECK(thrower->error()); |
| return; |
| } |
| |
| if (!FLAG_predictable) { |
| // For predictable mode, do not finalize wrappers yet to make sure we catch |
| // validation errors first. |
| compilation_state->FinalizeJSToWasmWrappers( |
| isolate, native_module->module(), export_wrappers_out); |
| } |
| |
| compilation_state->WaitForCompilationEvent( |
| CompilationEvent::kFinishedBaselineCompilation); |
| |
| compilation_state->PublishDetectedFeatures(isolate); |
| |
| if (compilation_state->failed()) { |
| DCHECK_IMPLIES(lazy_module, !FLAG_wasm_lazy_validation); |
| ValidateSequentially(wasm_module, native_module.get(), isolate->counters(), |
| isolate->allocator(), thrower, lazy_module); |
| CHECK(thrower->error()); |
| } else if (FLAG_predictable) { |
| compilation_state->FinalizeJSToWasmWrappers( |
| isolate, native_module->module(), export_wrappers_out); |
| } |
| } |
| |
| class BackgroundCompileJob final : public JobTask { |
| public: |
| explicit BackgroundCompileJob(std::weak_ptr<NativeModule> native_module, |
| std::shared_ptr<Counters> async_counters) |
| : native_module_(std::move(native_module)), |
| async_counters_(std::move(async_counters)) {} |
| |
| void Run(JobDelegate* delegate) override { |
| ExecuteCompilationUnits(native_module_, async_counters_.get(), delegate, |
| kBaselineOrTopTier); |
| } |
| |
| size_t GetMaxConcurrency(size_t worker_count) const override { |
| BackgroundCompileScope scope(native_module_); |
| if (scope.cancelled()) return 0; |
| // NumOutstandingCompilations() does not reflect the units that running |
| // workers are processing, thus add the current worker count to that number. |
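// Worked example: with --wasm-num-compilation-tasks=8, a worker_count of 3,
// and 2 outstanding compilations, this returns min(8, 3 + 2) = 5.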
| size_t flag_limit = |
| static_cast<size_t>(std::max(1, FLAG_wasm_num_compilation_tasks)); |
| return std::min( |
| flag_limit, |
| worker_count + scope.compilation_state()->NumOutstandingCompilations()); |
| } |
| |
| private: |
| const std::weak_ptr<NativeModule> native_module_; |
| const std::shared_ptr<Counters> async_counters_; |
| }; |
| |
| } // namespace |
| |
| std::shared_ptr<NativeModule> CompileToNativeModule( |
| Isolate* isolate, const WasmFeatures& enabled, ErrorThrower* thrower, |
| std::shared_ptr<const WasmModule> module, const ModuleWireBytes& wire_bytes, |
| Handle<FixedArray>* export_wrappers_out) { |
| const WasmModule* wasm_module = module.get(); |
| OwnedVector<uint8_t> wire_bytes_copy = |
| OwnedVector<uint8_t>::Of(wire_bytes.module_bytes()); |
| // Prefer {wire_bytes_copy} to {wire_bytes.module_bytes()} for the temporary |
| // cache key. When we eventually install the module in the cache, the wire |
| // bytes of the temporary key and the new key have the same base pointer and |
| // we can skip the full bytes comparison. |
| std::shared_ptr<NativeModule> native_module = |
| isolate->wasm_engine()->MaybeGetNativeModule( |
| wasm_module->origin, wire_bytes_copy.as_vector(), isolate); |
| if (native_module) { |
| // TODO(thibaudm): Look into sharing export wrappers. |
| CompileJsToWasmWrappers(isolate, wasm_module, export_wrappers_out); |
| return native_module; |
| } |
| |
| TimedHistogramScope wasm_compile_module_time_scope(SELECT_WASM_COUNTER( |
| isolate->counters(), wasm_module->origin, wasm_compile, module_time)); |
| |
| // Embedder usage count for declared shared memories. |
| if (wasm_module->has_shared_memory) { |
| isolate->CountUsage(v8::Isolate::UseCounterFeature::kWasmSharedMemory); |
| } |
| |
| // Create a new {NativeModule} first. |
| const bool uses_liftoff = module->origin == kWasmOrigin && FLAG_liftoff; |
| size_t code_size_estimate = |
| wasm::WasmCodeManager::EstimateNativeModuleCodeSize(module.get(), |
| uses_liftoff); |
| native_module = isolate->wasm_engine()->NewNativeModule( |
| isolate, enabled, module, code_size_estimate); |
| #if !defined(DISABLE_WASM_STARBOARD) |
// Note: guarded due to a std::move issue with the uint8_t[] wire-bytes
// buffer on Starboard builds (see the preprocessor condition above).
| native_module->SetWireBytes(std::move(wire_bytes_copy)); |
| #endif |
| // Sync compilation is user blocking, so we increase the priority. |
| native_module->compilation_state()->SetHighPriority(); |
| |
| v8::metrics::Recorder::ContextId context_id = |
| isolate->GetOrRegisterRecorderContextId(isolate->native_context()); |
| CompileNativeModule(isolate, context_id, thrower, wasm_module, native_module, |
| export_wrappers_out); |
| bool cache_hit = !isolate->wasm_engine()->UpdateNativeModuleCache( |
| thrower->error(), &native_module, isolate); |
| if (thrower->error()) return {}; |
| |
| if (cache_hit) { |
| CompileJsToWasmWrappers(isolate, wasm_module, export_wrappers_out); |
| return native_module; |
| } |
| |
| // Ensure that the code objects are logged before returning. |
| isolate->wasm_engine()->LogOutstandingCodesForIsolate(isolate); |
| |
| return native_module; |
| } |
| |
| void RecompileNativeModule(NativeModule* native_module, |
| TieringState tiering_state) { |
// Install a callback to notify us once background recompilation has finished.
| auto recompilation_finished_semaphore = std::make_shared<base::Semaphore>(0); |
| auto* compilation_state = Impl(native_module->compilation_state()); |
| |
| // The callback captures a shared ptr to the semaphore. |
| // Initialize the compilation units and kick off background compile tasks. |
| compilation_state->InitializeRecompilation( |
| tiering_state, |
| [recompilation_finished_semaphore](CompilationEvent event) { |
| if (event == CompilationEvent::kFinishedRecompilation) { |
| recompilation_finished_semaphore->Signal(); |
| } |
| }); |
| |
// Now wait until all compilation units have finished.
| // TODO(clemensb): Contribute to compilation while waiting. |
| recompilation_finished_semaphore->Wait(); |
| DCHECK(!compilation_state->failed()); |
| } |
| |
| AsyncCompileJob::AsyncCompileJob( |
| Isolate* isolate, const WasmFeatures& enabled, |
| std::unique_ptr<byte[]> bytes_copy, size_t length, Handle<Context> context, |
| Handle<Context> incumbent_context, const char* api_method_name, |
| std::shared_ptr<CompilationResultResolver> resolver) |
| : isolate_(isolate), |
| api_method_name_(api_method_name), |
| enabled_features_(enabled), |
| wasm_lazy_compilation_(FLAG_wasm_lazy_compilation), |
| start_time_(base::TimeTicks::Now()), |
| bytes_copy_(std::move(bytes_copy)), |
| wire_bytes_(bytes_copy_.get(), bytes_copy_.get() + length), |
| resolver_(std::move(resolver)) { |
| TRACE_EVENT0(TRACE_DISABLED_BY_DEFAULT("v8.wasm.detailed"), |
| "wasm.AsyncCompileJob"); |
| CHECK(FLAG_wasm_async_compilation); |
| CHECK(!FLAG_jitless); |
| v8::Isolate* v8_isolate = reinterpret_cast<v8::Isolate*>(isolate); |
| v8::Platform* platform = V8::GetCurrentPlatform(); |
| foreground_task_runner_ = platform->GetForegroundTaskRunner(v8_isolate); |
| native_context_ = |
| isolate->global_handles()->Create(context->native_context()); |
| incumbent_context_ = isolate->global_handles()->Create(*incumbent_context); |
| DCHECK(native_context_->IsNativeContext()); |
| context_id_ = isolate->GetOrRegisterRecorderContextId(native_context_); |
| metrics_event_.async = true; |
| } |
| |
| void AsyncCompileJob::Start() { |
| DoAsync<DecodeModule>(isolate_->counters(), |
| isolate_->metrics_recorder()); // -- |
| } |
| |
| void AsyncCompileJob::Abort() { |
| // Removing this job will trigger the destructor, which will cancel all |
| // compilation. |
| isolate_->wasm_engine()->RemoveCompileJob(this); |
| } |
| |
| class AsyncStreamingProcessor final : public StreamingProcessor { |
| public: |
| explicit AsyncStreamingProcessor(AsyncCompileJob* job, |
| std::shared_ptr<Counters> counters, |
| AccountingAllocator* allocator); |
| |
| ~AsyncStreamingProcessor() override; |
| |
| bool ProcessModuleHeader(Vector<const uint8_t> bytes, |
| uint32_t offset) override; |
| |
| bool ProcessSection(SectionCode section_code, Vector<const uint8_t> bytes, |
| uint32_t offset) override; |
| |
| bool ProcessCodeSectionHeader(int num_functions, uint32_t offset, |
| std::shared_ptr<WireBytesStorage>, |
| int code_section_length) override; |
| |
| bool ProcessFunctionBody(Vector<const uint8_t> bytes, |
| uint32_t offset) override; |
| |
| void OnFinishedChunk() override; |
| |
| void OnFinishedStream(OwnedVector<uint8_t> bytes) override; |
| |
| void OnError(const WasmError&) override; |
| |
| void OnAbort() override; |
| |
| bool Deserialize(Vector<const uint8_t> wire_bytes, |
| Vector<const uint8_t> module_bytes) override; |
| |
| private: |
| // Finishes the AsyncCompileJob with an error. |
| void FinishAsyncCompileJobWithError(const WasmError&); |
| |
| void CommitCompilationUnits(); |
| |
| ModuleDecoder decoder_; |
| AsyncCompileJob* job_; |
| WasmEngine* wasm_engine_; |
| std::unique_ptr<CompilationUnitBuilder> compilation_unit_builder_; |
| int num_functions_ = 0; |
| bool prefix_cache_hit_ = false; |
| bool before_code_section_ = true; |
| std::shared_ptr<Counters> async_counters_; |
| AccountingAllocator* allocator_; |
| |
// Running hash of the wire bytes up to the code section size, but excluding
// the code section itself. Used by the {NativeModuleCache} to detect
// potential duplicate modules.
| size_t prefix_hash_; |
| }; |
| |
| std::shared_ptr<StreamingDecoder> AsyncCompileJob::CreateStreamingDecoder() { |
| DCHECK_NULL(stream_); |
| stream_ = StreamingDecoder::CreateAsyncStreamingDecoder( |
| std::make_unique<AsyncStreamingProcessor>( |
| this, isolate_->async_counters(), isolate_->allocator())); |
| return stream_; |
| } |
| |
| AsyncCompileJob::~AsyncCompileJob() { |
| // Note: This destructor always runs on the foreground thread of the isolate. |
| background_task_manager_.CancelAndWait(); |
// If the runtime objects were not created yet, then initial compilation has
// not finished yet. In this case we can abort compilation.
| if (native_module_ && module_object_.is_null()) { |
| Impl(native_module_->compilation_state())->CancelCompilation(); |
| } |
| // Tell the streaming decoder that the AsyncCompileJob is not available |
| // anymore. |
| // TODO(ahaas): Is this notification really necessary? Check |
| // https://crbug.com/888170. |
| if (stream_) stream_->NotifyCompilationEnded(); |
| CancelPendingForegroundTask(); |
| isolate_->global_handles()->Destroy(native_context_.location()); |
| isolate_->global_handles()->Destroy(incumbent_context_.location()); |
| if (!module_object_.is_null()) { |
| isolate_->global_handles()->Destroy(module_object_.location()); |
| } |
| } |
| |
| void AsyncCompileJob::CreateNativeModule( |
| std::shared_ptr<const WasmModule> module, size_t code_size_estimate) { |
| #if !defined(DISABLE_WASM_COMPILER_ISSUE_STARBOARD) |
| // Embedder usage count for declared shared memories. |
| if (module->has_shared_memory) { |
| isolate_->CountUsage(v8::Isolate::UseCounterFeature::kWasmSharedMemory); |
| } |
| |
| // TODO(wasm): Improve efficiency of storing module wire bytes. Only store |
// relevant sections, not function bodies.
| |
| // Create the module object and populate with compiled functions and |
| // information needed at instantiation time. |
| |
| native_module_ = isolate_->wasm_engine()->NewNativeModule( |
| isolate_, enabled_features_, std::move(module), code_size_estimate); |
| native_module_->SetWireBytes({std::move(bytes_copy_), wire_bytes_.length()}); |
| #endif |
| } |
| |
| bool AsyncCompileJob::GetOrCreateNativeModule( |
| std::shared_ptr<const WasmModule> module, size_t code_size_estimate) { |
| native_module_ = isolate_->wasm_engine()->MaybeGetNativeModule( |
| module->origin, wire_bytes_.module_bytes(), isolate_); |
| if (native_module_ == nullptr) { |
| CreateNativeModule(std::move(module), code_size_estimate); |
| return false; |
| } |
| return true; |
| } |
| |
| void AsyncCompileJob::PrepareRuntimeObjects() { |
| // Create heap objects for script and module bytes to be stored in the |
| // module object. Asm.js is not compiled asynchronously. |
| DCHECK(module_object_.is_null()); |
| auto source_url = stream_ ? stream_->url() : Vector<const char>(); |
| auto script = isolate_->wasm_engine()->GetOrCreateScript( |
| isolate_, native_module_, source_url); |
| Handle<WasmModuleObject> module_object = |
| WasmModuleObject::New(isolate_, native_module_, script); |
| |
| module_object_ = isolate_->global_handles()->Create(*module_object); |
| } |
| |
| // This function assumes that it is executed in a HandleScope, and that a |
| // context is set on the isolate. |
| void AsyncCompileJob::FinishCompile(bool is_after_cache_hit) { |
| TRACE_EVENT0(TRACE_DISABLED_BY_DEFAULT("v8.wasm.detailed"), |
| "wasm.FinishAsyncCompile"); |
| bool is_after_deserialization = !module_object_.is_null(); |
| auto compilation_state = Impl(native_module_->compilation_state()); |
| if (!is_after_deserialization) { |
| if (stream_) { |
| stream_->NotifyNativeModuleCreated(native_module_); |
| } |
| PrepareRuntimeObjects(); |
| } |
| |
| // Measure duration of baseline compilation or deserialization from cache. |
| if (base::TimeTicks::IsHighResolution()) { |
| base::TimeDelta duration = base::TimeTicks::Now() - start_time_; |
| int duration_usecs = static_cast<int>(duration.InMicroseconds()); |
| isolate_->counters()->wasm_streaming_finish_wasm_module_time()->AddSample( |
| duration_usecs); |
| |
| if (is_after_cache_hit || is_after_deserialization) { |
| v8::metrics::WasmModuleCompiled event{ |
| true, // async |
| true, // streamed |
| is_after_cache_hit, // cached |
| is_after_deserialization, // deserialized |
| wasm_lazy_compilation_, // lazy |
| !compilation_state->failed(), // success |
| native_module_->liftoff_code_size(), // code_size_in_bytes |
| native_module_->liftoff_bailout_count(), // liftoff_bailout_count |
| duration.InMicroseconds(), // wall_clock_time_in_us |
| duration.InMicroseconds() // wall_clock_duration_in_us |
| }; |
| isolate_->metrics_recorder()->DelayMainThreadEvent(event, context_id_); |
| } |
| } |
| |
| DCHECK(!isolate_->context().is_null()); |
| // Finish the wasm script now and make it public to the debugger. |
| Handle<Script> script(module_object_->script(), isolate_); |
| const WasmModule* module = module_object_->module(); |
| if (script->type() == Script::TYPE_WASM && |
| module->debug_symbols.type == WasmDebugSymbols::Type::SourceMap && |
| !module->debug_symbols.external_url.is_empty()) { |
| ModuleWireBytes wire_bytes(module_object_->native_module()->wire_bytes()); |
| MaybeHandle<String> src_map_str = isolate_->factory()->NewStringFromUtf8( |
| wire_bytes.GetNameOrNull(module->debug_symbols.external_url), |
| AllocationType::kOld); |
| script->set_source_mapping_url(*src_map_str.ToHandleChecked()); |
| } |
| { |
| TRACE_EVENT0(TRACE_DISABLED_BY_DEFAULT("v8.wasm.detailed"), |
| "wasm.Debug.OnAfterCompile"); |
| isolate_->debug()->OnAfterCompile(script); |
| } |
| |
| // TODO(bbudge) Allow deserialization without wrapper compilation, so we can |
| // just compile wrappers here. |
| if (!is_after_deserialization) { |
| Handle<FixedArray> export_wrappers; |
| if (is_after_cache_hit) { |
| // TODO(thibaudm): Look into sharing wrappers. |
| CompileJsToWasmWrappers(isolate_, module, &export_wrappers); |
| } else { |
| compilation_state->FinalizeJSToWasmWrappers(isolate_, module, |
| &export_wrappers); |
| } |
| module_object_->set_export_wrappers(*export_wrappers); |
| } |
| // We can only update the feature counts once the entire compile is done. |
| compilation_state->PublishDetectedFeatures(isolate_); |
| |
| FinishModule(); |
| } |
| |
| void AsyncCompileJob::DecodeFailed(const WasmError& error) { |
| ErrorThrower thrower(isolate_, api_method_name_); |
| thrower.CompileFailed(error); |
| // {job} keeps the {this} pointer alive. |
| std::shared_ptr<AsyncCompileJob> job = |
| isolate_->wasm_engine()->RemoveCompileJob(this); |
| resolver_->OnCompilationFailed(thrower.Reify()); |
| } |
| |
| void AsyncCompileJob::AsyncCompileFailed() { |
| ErrorThrower thrower(isolate_, api_method_name_); |
| DCHECK_EQ(native_module_->module()->origin, kWasmOrigin); |
| const bool lazy_module = wasm_lazy_compilation_; |
| ValidateSequentially(native_module_->module(), native_module_.get(), |
| isolate_->counters(), isolate_->allocator(), &thrower, |
| lazy_module); |
| DCHECK(thrower.error()); |
| // {job} keeps the {this} pointer alive. |
| std::shared_ptr<AsyncCompileJob> job = |
| isolate_->wasm_engine()->RemoveCompileJob(this); |
| resolver_->OnCompilationFailed(thrower.Reify()); |
| } |
| |
| void AsyncCompileJob::AsyncCompileSucceeded(Handle<WasmModuleObject> result) { |
| TRACE_EVENT0(TRACE_DISABLED_BY_DEFAULT("v8.wasm.detailed"), |
| "wasm.OnCompilationSucceeded"); |
| // We have to make sure that an "incumbent context" is available in case |
| // the module's start function calls out to Blink. |
| Local<v8::Context> backup_incumbent_context = |
| Utils::ToLocal(incumbent_context_); |
| v8::Context::BackupIncumbentScope incumbent(backup_incumbent_context); |
| resolver_->OnCompilationSucceeded(result); |
| } |
| |
| class AsyncCompileJob::CompilationStateCallback { |
| public: |
| explicit CompilationStateCallback(AsyncCompileJob* job) : job_(job) {} |
| |
| void operator()(CompilationEvent event) { |
| // This callback is only being called from a foreground task. |
| switch (event) { |
| case CompilationEvent::kFinishedExportWrappers: |
// Even if baseline compilation units finish first, we trigger the
// {kFinishedExportWrappers} event first.
| DCHECK(!last_event_.has_value()); |
| break; |
| case CompilationEvent::kFinishedBaselineCompilation: |
| DCHECK_EQ(CompilationEvent::kFinishedExportWrappers, last_event_); |
| if (job_->DecrementAndCheckFinisherCount()) { |
| // Install the native module in the cache, or reuse a conflicting one. |
| // If we get a conflicting module, wait until we are back in the |
| // main thread to update {job_->native_module_} to avoid a data race. |
| std::shared_ptr<NativeModule> native_module = job_->native_module_; |
| bool cache_hit = |
| !job_->isolate_->wasm_engine()->UpdateNativeModuleCache( |
| false, &native_module, job_->isolate_); |
| DCHECK_EQ(cache_hit, native_module != job_->native_module_); |
| job_->DoSync<CompileFinished>(cache_hit ? std::move(native_module) |
| : nullptr); |
| } |
| break; |
| case CompilationEvent::kFinishedTopTierCompilation: |
| DCHECK_EQ(CompilationEvent::kFinishedBaselineCompilation, last_event_); |
| // At this point, the job will already be gone, thus do not access it |
| // here. |
| break; |
| case CompilationEvent::kFailedCompilation: |
| DCHECK(!last_event_.has_value() || |
| last_event_ == CompilationEvent::kFinishedExportWrappers); |
| if (job_->DecrementAndCheckFinisherCount()) { |
| // Don't update {job_->native_module_} to avoid data races with other |
| // compilation threads. Use a copy of the shared pointer instead. |
| std::shared_ptr<NativeModule> native_module = job_->native_module_; |
| job_->isolate_->wasm_engine()->UpdateNativeModuleCache( |
| true, &native_module, job_->isolate_); |
| job_->DoSync<CompileFailed>(); |
| } |
| break; |
| case CompilationEvent::kFinishedRecompilation: |
| // This event can happen either before or after |
| // {kFinishedTopTierCompilation}, hence don't remember this in |
| // {last_event_}. |
| return; |
| } |
| #ifdef DEBUG |
| last_event_ = event; |
| #endif |
| } |
| |
| private: |
| AsyncCompileJob* job_; |
| #ifdef DEBUG |
// This will be modified by different threads, but the accesses are
// externally synchronized, so no explicit synchronization is (currently)
// needed here.
| base::Optional<CompilationEvent> last_event_; |
| #endif |
| }; |
| |
| // A closure to run a compilation step (either as foreground or background |
| // task) and schedule the next step(s), if any. |
| class AsyncCompileJob::CompileStep { |
| public: |
| virtual ~CompileStep() = default; |
| |
| void Run(AsyncCompileJob* job, bool on_foreground) { |
| if (on_foreground) { |
| HandleScope scope(job->isolate_); |
| SaveAndSwitchContext saved_context(job->isolate_, *job->native_context_); |
| RunInForeground(job); |
| } else { |
| RunInBackground(job); |
| } |
| } |
| |
| virtual void RunInForeground(AsyncCompileJob*) { UNREACHABLE(); } |
| virtual void RunInBackground(AsyncCompileJob*) { UNREACHABLE(); } |
| }; |
| |
| class AsyncCompileJob::CompileTask : public CancelableTask { |
| public: |
| CompileTask(AsyncCompileJob* job, bool on_foreground) |
| // We only manage the background tasks with the {CancelableTaskManager} of |
| // the {AsyncCompileJob}. Foreground tasks are managed by the system's |
| // {CancelableTaskManager}. Background tasks cannot spawn tasks managed by |
| // their own task manager. |
| : CancelableTask(on_foreground ? job->isolate_->cancelable_task_manager() |
| : &job->background_task_manager_), |
| job_(job), |
| on_foreground_(on_foreground) {} |
| |
| ~CompileTask() override { |
| if (job_ != nullptr && on_foreground_) ResetPendingForegroundTask(); |
| } |
| |
| void RunInternal() final { |
| if (!job_) return; |
| if (on_foreground_) ResetPendingForegroundTask(); |
| job_->step_->Run(job_, on_foreground_); |
| // After execution, reset {job_} such that we don't try to reset the pending |
| // foreground task when the task is deleted. |
| job_ = nullptr; |
| } |
| |
| void Cancel() { |
| DCHECK_NOT_NULL(job_); |
| job_ = nullptr; |
| } |
| |
| private: |
| // {job_} will be cleared to cancel a pending task. |
| AsyncCompileJob* job_; |
| bool on_foreground_; |
| |
| void ResetPendingForegroundTask() const { |
| DCHECK_EQ(this, job_->pending_foreground_task_); |
| job_->pending_foreground_task_ = nullptr; |
| } |
| }; |
| |
| void AsyncCompileJob::StartForegroundTask() { |
| DCHECK_NULL(pending_foreground_task_); |
| |
| auto new_task = std::make_unique<CompileTask>(this, true); |
| pending_foreground_task_ = new_task.get(); |
| foreground_task_runner_->PostTask(std::move(new_task)); |
| } |
| |
| void AsyncCompileJob::ExecuteForegroundTaskImmediately() { |
| DCHECK_NULL(pending_foreground_task_); |
| |
| auto new_task = std::make_unique<CompileTask>(this, true); |
| pending_foreground_task_ = new_task.get(); |
| new_task->Run(); |
| } |
| |
| void AsyncCompileJob::CancelPendingForegroundTask() { |
| if (!pending_foreground_task_) return; |
| pending_foreground_task_->Cancel(); |
| pending_foreground_task_ = nullptr; |
| } |
| |
| void AsyncCompileJob::StartBackgroundTask() { |
| auto task = std::make_unique<CompileTask>(this, false); |
| |
// If --wasm-num-compilation-tasks=0 is passed, only spawn foreground tasks.
// This is used to make timing deterministic.
| if (FLAG_wasm_num_compilation_tasks > 0) { |
| V8::GetCurrentPlatform()->CallOnWorkerThread(std::move(task)); |
| } else { |
| foreground_task_runner_->PostTask(std::move(task)); |
| } |
| } |
| |
| template <typename Step, |
| AsyncCompileJob::UseExistingForegroundTask use_existing_fg_task, |
| typename... Args> |
| void AsyncCompileJob::DoSync(Args&&... args) { |
| NextStep<Step>(std::forward<Args>(args)...); |
| if (use_existing_fg_task && pending_foreground_task_ != nullptr) return; |
| StartForegroundTask(); |
| } |
| |
| template <typename Step, typename... Args> |
| void AsyncCompileJob::DoImmediately(Args&&... args) { |
| NextStep<Step>(std::forward<Args>(args)...); |
| ExecuteForegroundTaskImmediately(); |
| } |
| |
| template <typename Step, typename... Args> |
| void AsyncCompileJob::DoAsync(Args&&... args) { |
| NextStep<Step>(std::forward<Args>(args)...); |
| StartBackgroundTask(); |
| } |
| |
| template <typename Step, typename... Args> |
| void AsyncCompileJob::NextStep(Args&&... args) { |
| step_.reset(new Step(std::forward<Args>(args)...)); |
| } |
| |
| //========================================================================== |
| // Step 1: (async) Decode the module. |
| //========================================================================== |
| class AsyncCompileJob::DecodeModule : public AsyncCompileJob::CompileStep { |
| public: |
| explicit DecodeModule(Counters* counters, |
| std::shared_ptr<metrics::Recorder> metrics_recorder) |
| : counters_(counters), metrics_recorder_(std::move(metrics_recorder)) {} |
| |
| void RunInBackground(AsyncCompileJob* job) override { |
| ModuleResult result; |
| { |
| DisallowHandleAllocation no_handle; |
| DisallowHeapAllocation no_allocation; |
| // Decode the module bytes. |
| TRACE_COMPILE("(1) Decoding module...\n"); |
| TRACE_EVENT0(TRACE_DISABLED_BY_DEFAULT("v8.wasm.detailed"), |
| "wasm.DecodeModule"); |
| auto enabled_features = job->enabled_features_; |
| result = DecodeWasmModule( |
| enabled_features, job->wire_bytes_.start(), job->wire_bytes_.end(), |
| false, kWasmOrigin, counters_, metrics_recorder_, job->context_id(), |
| DecodingMethod::kAsync, job->isolate()->wasm_engine()->allocator()); |
| |
| // Validate lazy functions here if requested. |
| if (!FLAG_wasm_lazy_validation && result.ok()) { |
| const WasmModule* module = result.value().get(); |
| DCHECK_EQ(module->origin, kWasmOrigin); |
| const bool lazy_module = job->wasm_lazy_compilation_; |
| if (MayCompriseLazyFunctions(module, enabled_features, lazy_module)) { |
| auto allocator = job->isolate()->wasm_engine()->allocator(); |
| int start = module->num_imported_functions; |
| int end = start + module->num_declared_functions; |
| |
| for (int func_index = start; func_index < end; func_index++) { |
| const WasmFunction* func = &module->functions[func_index]; |
| Vector<const uint8_t> code = |
| job->wire_bytes_.GetFunctionBytes(func); |
| |
| CompileStrategy strategy = GetCompileStrategy( |
| module, enabled_features, func_index, lazy_module); |
| bool validate_lazily_compiled_function = |
| strategy == CompileStrategy::kLazy || |
| strategy == CompileStrategy::kLazyBaselineEagerTopTier; |
| if (validate_lazily_compiled_function) { |
| DecodeResult function_result = |
| ValidateSingleFunction(module, func_index, code, counters_, |
| allocator, enabled_features); |
| if (function_result.failed()) { |
| result = ModuleResult(function_result.error()); |
| break; |
| } |
| } |
| } |
| } |
| } |
| } |
| if (result.failed()) { |
| // Decoding failure; reject the promise and clean up. |
| job->DoSync<DecodeFail>(std::move(result).error()); |
| } else { |
| // Decode passed. |
| std::shared_ptr<WasmModule> module = std::move(result).value(); |
| const bool kUsesLiftoff = false; |
| size_t code_size_estimate = |
| wasm::WasmCodeManager::EstimateNativeModuleCodeSize(module.get(), |
| kUsesLiftoff); |
| job->DoSync<PrepareAndStartCompile>(std::move(module), true, |
| code_size_estimate); |
| } |
| } |
| |
| private: |
| Counters* const counters_; |
| std::shared_ptr<metrics::Recorder> metrics_recorder_; |
| }; |
| |
| //========================================================================== |
| // Step 1b: (sync) Fail decoding the module. |
| //========================================================================== |
| class AsyncCompileJob::DecodeFail : public CompileStep { |
| public: |
| explicit DecodeFail(WasmError error) : error_(std::move(error)) {} |
| |
| private: |
| WasmError error_; |
| |
| void RunInForeground(AsyncCompileJob* job) override { |
| TRACE_COMPILE("(1b) Decoding failed.\n"); |
| // {job_} is deleted in DecodeFailed, therefore the {return}. |
| return job->DecodeFailed(error_); |
| } |
| }; |
| |
| //========================================================================== |
| // Step 2 (sync): Create heap-allocated data and start compile. |
| //========================================================================== |
| class AsyncCompileJob::PrepareAndStartCompile : public CompileStep { |
| public: |
| PrepareAndStartCompile(std::shared_ptr<const WasmModule> module, |
| bool start_compilation, size_t code_size_estimate) |
| : module_(std::move(module)), |
| start_compilation_(start_compilation), |
| code_size_estimate_(code_size_estimate) {} |
| |
| private: |
| const std::shared_ptr<const WasmModule> module_; |
| const bool start_compilation_; |
| const size_t code_size_estimate_; |
| |
| void RunInForeground(AsyncCompileJob* job) override { |
| TRACE_COMPILE("(2) Prepare and start compile...\n"); |
| |
| const bool streaming = job->wire_bytes_.length() == 0; |
| if (streaming) { |
| // Streaming compilation already checked for cache hits. |
| job->CreateNativeModule(module_, code_size_estimate_); |
| } else if (job->GetOrCreateNativeModule(std::move(module_), |
| code_size_estimate_)) { |
| job->FinishCompile(true); |
| return; |
| } |
| |
// Make sure all compilation tasks have stopped running. Decoding (the async
// step) is done.
| job->background_task_manager_.CancelAndWait(); |
| |
| CompilationStateImpl* compilation_state = |
| Impl(job->native_module_->compilation_state()); |
| compilation_state->AddCallback(CompilationStateCallback{job}); |
| if (base::TimeTicks::IsHighResolution()) { |
| auto compile_mode = job->stream_ == nullptr |
| ? CompilationTimeCallback::kAsync |
| : CompilationTimeCallback::kStreaming; |
| compilation_state->AddCallback(CompilationTimeCallback{ |
| job->isolate_->async_counters(), job->isolate_->metrics_recorder(), |
| job->context_id_, job->native_module_, compile_mode}); |
| } |
| |
| if (start_compilation_) { |
| // TODO(ahaas): Try to remove the {start_compilation_} check when |
| // streaming decoding is done in the background. If |
| // InitializeCompilationUnits always returns 0 for streaming compilation, |
| // then DoAsync would do the same as NextStep already. |
| |
| // Add compilation units and kick off compilation. |
| InitializeCompilationUnits(job->isolate(), job->native_module_.get()); |
| } |
| } |
| }; |
| |
| //========================================================================== |
| // Step 3a (sync): Compilation failed. |
| //========================================================================== |
| class AsyncCompileJob::CompileFailed : public CompileStep { |
| private: |
| void RunInForeground(AsyncCompileJob* job) override { |
| TRACE_COMPILE("(3a) Compilation failed\n"); |
| DCHECK(job->native_module_->compilation_state()->failed()); |
| |
| // {job_} is deleted in AsyncCompileFailed, therefore the {return}. |
| return job->AsyncCompileFailed(); |
| } |
| }; |
| |
| namespace { |
| class SampleTopTierCodeSizeCallback { |
| public: |
| explicit SampleTopTierCodeSizeCallback( |
| std::weak_ptr<NativeModule> native_module) |
| : native_module_(std::move(native_module)) {} |
| |
| void operator()(CompilationEvent event) { |
| if (event != CompilationEvent::kFinishedTopTierCompilation) return; |
| if (std::shared_ptr<NativeModule> native_module = native_module_.lock()) { |
| native_module->engine()->SampleTopTierCodeSizeInAllIsolates( |
| native_module); |
| } |
| } |
| |
| private: |
| std::weak_ptr<NativeModule> native_module_; |
| }; |
| } // namespace |
| |
| //========================================================================== |
| // Step 3b (sync): Compilation finished. |
| //========================================================================== |
| class AsyncCompileJob::CompileFinished : public CompileStep { |
| public: |
| explicit CompileFinished(std::shared_ptr<NativeModule> cached_native_module) |
| : cached_native_module_(std::move(cached_native_module)) {} |
| |
| private: |
| void RunInForeground(AsyncCompileJob* job) override { |
| TRACE_COMPILE("(3b) Compilation finished\n"); |
| if (cached_native_module_) { |
| job->native_module_ = cached_native_module_; |
| } else { |
| DCHECK(!job->native_module_->compilation_state()->failed()); |
| // Sample the generated code size when baseline compilation finished. |
| job->native_module_->SampleCodeSize(job->isolate_->counters(), |
| NativeModule::kAfterBaseline); |
// Also, set a callback to sample the code size once top-tier compilation
// finishes. This callback will *not* keep the NativeModule alive.
| job->native_module_->compilation_state()->AddCallback( |
| SampleTopTierCodeSizeCallback{job->native_module_}); |
| } |
| // Then finalize and publish the generated module. |
| job->FinishCompile(cached_native_module_ != nullptr); |
| } |
| |
| std::shared_ptr<NativeModule> cached_native_module_; |
| }; |
| |
| void AsyncCompileJob::FinishModule() { |
| TRACE_COMPILE("(4) Finish module...\n"); |
| AsyncCompileSucceeded(module_object_); |
| isolate_->wasm_engine()->RemoveCompileJob(this); |
| } |
| |
| AsyncStreamingProcessor::AsyncStreamingProcessor( |
| AsyncCompileJob* job, std::shared_ptr<Counters> async_counters, |
| AccountingAllocator* allocator) |
| : decoder_(job->enabled_features_), |
| job_(job), |
| wasm_engine_(job_->isolate_->wasm_engine()), |
| compilation_unit_builder_(nullptr), |
| async_counters_(async_counters), |
| allocator_(allocator) {} |
| |
| AsyncStreamingProcessor::~AsyncStreamingProcessor() { |
| if (job_->native_module_ && job_->native_module_->wire_bytes().empty()) { |
| // Clean up the temporary cache entry. |
| job_->isolate_->wasm_engine()->StreamingCompilationFailed(prefix_hash_); |
| } |
| } |
| |
| void AsyncStreamingProcessor::FinishAsyncCompileJobWithError( |
| const WasmError& error) { |
| DCHECK(error.has_error()); |
// Make sure all background tasks have stopped executing before we change
// the state of the AsyncCompileJob to DecodeFail.
| job_->background_task_manager_.CancelAndWait(); |
| |
| // Record event metrics. |
| auto duration = base::TimeTicks::Now() - job_->start_time_; |
| job_->metrics_event_.success = false; |
| job_->metrics_event_.streamed = true; |
| job_->metrics_event_.module_size_in_bytes = job_->wire_bytes_.length(); |
| job_->metrics_event_.function_count = num_functions_; |
| job_->metrics_event_.wall_clock_time_in_us = duration.InMicroseconds(); |
| job_->metrics_event_.wall_clock_duration_in_us = duration.InMicroseconds(); |
| job_->isolate_->metrics_recorder()->DelayMainThreadEvent(job_->metrics_event_, |
| job_->context_id_); |
| |
| // Check if there is already a CompiledModule, in which case we have to clean |
| // up the CompilationStateImpl as well. |
| if (job_->native_module_) { |
| Impl(job_->native_module_->compilation_state())->CancelCompilation(); |
| |
| job_->DoSync<AsyncCompileJob::DecodeFail, |
| AsyncCompileJob::kUseExistingForegroundTask>(error); |
| |
| // Clear the {compilation_unit_builder_} if it exists. This is needed |
| // because there is a check in the destructor of the |
| // {CompilationUnitBuilder} that it is empty. |
| if (compilation_unit_builder_) compilation_unit_builder_->Clear(); |
| } else { |
| job_->DoSync<AsyncCompileJob::DecodeFail>(error); |
| } |
| } |
| |
| // Process the module header. |
| bool AsyncStreamingProcessor::ProcessModuleHeader(Vector<const uint8_t> bytes, |
| uint32_t offset) { |
| TRACE_STREAMING("Process module header...\n"); |
| decoder_.StartDecoding( |
| job_->isolate()->counters(), job_->isolate()->metrics_recorder(), |
| job_->context_id(), job_->isolate()->wasm_engine()->allocator()); |
| decoder_.DecodeModuleHeader(bytes, offset); |
| if (!decoder_.ok()) { |
| FinishAsyncCompileJobWithError(decoder_.FinishDecoding(false).error()); |
| return false; |
| } |
| prefix_hash_ = NativeModuleCache::WireBytesHash(bytes); |
| return true; |
| } |
| |
| // Process all sections except for the code section. |
| bool AsyncStreamingProcessor::ProcessSection(SectionCode section_code, |
| Vector<const uint8_t> bytes, |
| uint32_t offset) { |
| TRACE_STREAMING("Process section %d ...\n", section_code); |
| if (compilation_unit_builder_) { |
// We reached a section after the code section; we do not need the
// {compilation_unit_builder_} anymore.
| CommitCompilationUnits(); |
| compilation_unit_builder_.reset(); |
| } |
| if (before_code_section_) { |
// Combine section hashes until the code section.
| prefix_hash_ = base::hash_combine(prefix_hash_, |
| NativeModuleCache::WireBytesHash(bytes)); |
| } |
| if (section_code == SectionCode::kUnknownSectionCode) { |
| size_t bytes_consumed = ModuleDecoder::IdentifyUnknownSection( |
| &decoder_, bytes, offset, §ion_code); |
| if (!decoder_.ok()) { |
| FinishAsyncCompileJobWithError(decoder_.FinishDecoding(false).error()); |
| return false; |
| } |
| if (section_code == SectionCode::kUnknownSectionCode) { |
| // Skip unknown sections that we do not know how to handle. |
| return true; |
| } |
| // Remove the unknown section tag from the payload bytes. |
| offset += bytes_consumed; |
| bytes = bytes.SubVector(bytes_consumed, bytes.size()); |
| } |
| constexpr bool verify_functions = false; |
| decoder_.DecodeSection(section_code, bytes, offset, verify_functions); |
| if (!decoder_.ok()) { |
| FinishAsyncCompileJobWithError(decoder_.FinishDecoding(false).error()); |
| return false; |
| } |
| return true; |
| } |
| |
| // Start the code section. |
| bool AsyncStreamingProcessor::ProcessCodeSectionHeader( |
| int num_functions, uint32_t offset, |
| std::shared_ptr<WireBytesStorage> wire_bytes_storage, |
| int code_section_length) { |
| DCHECK_LE(0, code_section_length); |
| before_code_section_ = false; |
| TRACE_STREAMING("Start the code section with %d functions...\n", |
| num_functions); |
| if (!decoder_.CheckFunctionsCount(static_cast<uint32_t>(num_functions), |
| offset)) { |
| FinishAsyncCompileJobWithError(decoder_.FinishDecoding(false).error()); |
| return false; |
| } |
| |
| decoder_.set_code_section(offset, static_cast<uint32_t>(code_section_length)); |
| |
| prefix_hash_ = base::hash_combine(prefix_hash_, |
| static_cast<uint32_t>(code_section_length)); |
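// At this point {prefix_hash_} covers the module header, every section
// before the code section, and the declared code section length, but no
// function bodies: modules differing only in function bodies share a prefix
// hash and are disambiguated via the full cache key at the end of the stream.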
| if (!wasm_engine_->GetStreamingCompilationOwnership(prefix_hash_)) { |
// Known prefix; wait until the end of the stream and check the cache.
| prefix_cache_hit_ = true; |
| return true; |
| } |
| |
| // Execute the PrepareAndStartCompile step immediately and not in a separate |
| // task. |
| int num_imported_functions = |
| static_cast<int>(decoder_.module()->num_imported_functions); |
| DCHECK_EQ(kWasmOrigin, decoder_.module()->origin); |
| const bool uses_liftoff = FLAG_liftoff; |
| size_t code_size_estimate = |
| wasm::WasmCodeManager::EstimateNativeModuleCodeSize( |
| num_functions, num_imported_functions, code_section_length, |
| uses_liftoff); |
| job_->DoImmediately<AsyncCompileJob::PrepareAndStartCompile>( |
| decoder_.shared_module(), false, code_size_estimate); |
| |
| auto* compilation_state = Impl(job_->native_module_->compilation_state()); |
| compilation_state->SetWireBytesStorage(std::move(wire_bytes_storage)); |
| DCHECK_EQ(job_->native_module_->module()->origin, kWasmOrigin); |
| const bool lazy_module = job_->wasm_lazy_compilation_; |
| |
// Set {outstanding_finishers_} to 2, because both the AsyncCompileJob and the
| // AsyncStreamingProcessor have to finish. |
| job_->outstanding_finishers_.store(2); |
| compilation_unit_builder_.reset( |
| new CompilationUnitBuilder(job_->native_module_.get())); |
| |
| NativeModule* native_module = job_->native_module_.get(); |
| |
| int num_import_wrappers = |
| AddImportWrapperUnits(native_module, compilation_unit_builder_.get()); |
| int num_export_wrappers = AddExportWrapperUnits( |
| job_->isolate_, wasm_engine_, native_module, |
| compilation_unit_builder_.get(), job_->enabled_features_); |
| compilation_state->InitializeCompilationProgress( |
| lazy_module, num_import_wrappers, num_export_wrappers); |
| return true; |
| } |
| |
| // Process a function body. |
| bool AsyncStreamingProcessor::ProcessFunctionBody(Vector<const uint8_t> bytes, |
| uint32_t offset) { |
| TRACE_STREAMING("Process function body %d ...\n", num_functions_); |
| |
| decoder_.DecodeFunctionBody( |
| num_functions_, static_cast<uint32_t>(bytes.length()), offset, false); |
| |
| const WasmModule* module = decoder_.module(); |
| auto enabled_features = job_->enabled_features_; |
| uint32_t func_index = |
| num_functions_ + decoder_.module()->num_imported_functions; |
| DCHECK_EQ(module->origin, kWasmOrigin); |
| const bool lazy_module = job_->wasm_lazy_compilation_; |
| CompileStrategy strategy = |
| GetCompileStrategy(module, enabled_features, func_index, lazy_module); |
| bool validate_lazily_compiled_function = |
| !FLAG_wasm_lazy_validation && |
| (strategy == CompileStrategy::kLazy || |
| strategy == CompileStrategy::kLazyBaselineEagerTopTier); |
| if (validate_lazily_compiled_function) { |
| // The native module does not own the wire bytes until {SetWireBytes} is |
// called in {OnFinishedStream}. Validation must use the {bytes} parameter.
| DecodeResult result = |
| ValidateSingleFunction(module, func_index, bytes, async_counters_.get(), |
| allocator_, enabled_features); |
| |
| if (result.failed()) { |
| FinishAsyncCompileJobWithError(result.error()); |
| return false; |
| } |
| } |
| |
| // Don't compile yet if we might have a cache hit. |
| if (prefix_cache_hit_) { |
| num_functions_++; |
| return true; |
| } |
| |
| NativeModule* native_module = job_->native_module_.get(); |
| if (strategy == CompileStrategy::kLazy) { |
| native_module->UseLazyStub(func_index); |
| } else if (strategy == CompileStrategy::kLazyBaselineEagerTopTier) { |
| compilation_unit_builder_->AddTopTierUnit(func_index); |
| native_module->UseLazyStub(func_index); |
| } else { |
| DCHECK_EQ(strategy, CompileStrategy::kEager); |
| compilation_unit_builder_->AddUnits(func_index); |
| } |
| |
| ++num_functions_; |
| |
| return true; |
| } |
| |
| void AsyncStreamingProcessor::CommitCompilationUnits() { |
| DCHECK(compilation_unit_builder_); |
| compilation_unit_builder_->Commit(); |
| } |
| |
| void AsyncStreamingProcessor::OnFinishedChunk() { |
| TRACE_STREAMING("FinishChunk...\n"); |
| if (compilation_unit_builder_) CommitCompilationUnits(); |
| } |
| |
| // Finish the processing of the stream. |
| void AsyncStreamingProcessor::OnFinishedStream(OwnedVector<uint8_t> bytes) { |
| TRACE_STREAMING("Finish stream...\n"); |
| DCHECK_EQ(NativeModuleCache::PrefixHash(bytes.as_vector()), prefix_hash_); |
| ModuleResult result = decoder_.FinishDecoding(false); |
| if (result.failed()) { |
| FinishAsyncCompileJobWithError(result.error()); |
| return; |
| } |
| |
| job_->wire_bytes_ = ModuleWireBytes(bytes.as_vector()); |
| job_->bytes_copy_ = bytes.ReleaseData(); |
| |
| // Record event metrics. |
| auto duration = base::TimeTicks::Now() - job_->start_time_; |
| job_->metrics_event_.success = true; |
| job_->metrics_event_.streamed = true; |
| job_->metrics_event_.module_size_in_bytes = job_->wire_bytes_.length(); |
| job_->metrics_event_.function_count = num_functions_; |
| job_->metrics_event_.wall_clock_time_in_us = duration.InMicroseconds(); |
| job_->metrics_event_.wall_clock_duration_in_us = duration.InMicroseconds(); |
| job_->isolate_->metrics_recorder()->DelayMainThreadEvent(job_->metrics_event_, |
| job_->context_id_); |
| |
| if (prefix_cache_hit_) { |
| // Restart as an asynchronous, non-streaming compilation. Most likely |
| // {PrepareAndStartCompile} will get the native module from the cache. |
| size_t code_size_estimate = |
| wasm::WasmCodeManager::EstimateNativeModuleCodeSize( |
| result.value().get(), FLAG_liftoff); |
| job_->DoSync<AsyncCompileJob::PrepareAndStartCompile>( |
| std::move(result).value(), true, code_size_estimate); |
| return; |
| } |
| |
| // We have to open a HandleScope and prepare the Context for |
| // CreateNativeModule, PrepareRuntimeObjects and FinishCompile as this is a |
| // callback from the embedder. |
| HandleScope scope(job_->isolate_); |
| SaveAndSwitchContext saved_context(job_->isolate_, *job_->native_context_); |
| |
| // Record the size of the wire bytes. In synchronous and asynchronous |
| // (non-streaming) compilation, this happens in {DecodeWasmModule}. |
| auto* histogram = job_->isolate_->counters()->wasm_wasm_module_size_bytes(); |
| histogram->AddSample(job_->wire_bytes_.module_bytes().length()); |
| |
| const bool has_code_section = job_->native_module_ != nullptr; |
| bool cache_hit = false; |
| if (!has_code_section) { |
// We are processing a WebAssembly module without a code section. Create the
| // native module now (would otherwise happen in {PrepareAndStartCompile} or |
| // {ProcessCodeSectionHeader}). |
| constexpr size_t kCodeSizeEstimate = 0; |
| cache_hit = job_->GetOrCreateNativeModule(std::move(result).value(), |
| kCodeSizeEstimate); |
| } else { |
| #if !defined(DISABLE_WASM_COMPILER_ISSUE_STARBOARD) |
| job_->native_module_->SetWireBytes( |
| {std::move(job_->bytes_copy_), job_->wire_bytes_.length()}); |
| #endif |
| job_->native_module_->LogWasmCodes(job_->isolate_); |
| } |
| const bool needs_finish = job_->DecrementAndCheckFinisherCount(); |
| DCHECK_IMPLIES(!has_code_section, needs_finish); |
| // We might need to recompile the module for debugging, if the debugger was |
| // enabled while streaming compilation was running. Since handling this while |
| // compiling via streaming is tricky, we just tier down now, before publishing |
| // the module. |
| if (job_->native_module_->IsTieredDown()) { |
| job_->native_module_->RecompileForTiering(); |
| } |
| if (needs_finish) { |
| const bool failed = job_->native_module_->compilation_state()->failed(); |
| if (!cache_hit) { |
| cache_hit = !job_->isolate_->wasm_engine()->UpdateNativeModuleCache( |
| failed, &job_->native_module_, job_->isolate_); |
| } |
| if (failed) { |
| job_->AsyncCompileFailed(); |
| } else { |
| job_->FinishCompile(cache_hit); |
| } |
| } |
| } |
| |
| // Report an error detected in the StreamingDecoder. |
| void AsyncStreamingProcessor::OnError(const WasmError& error) { |
| TRACE_STREAMING("Stream error...\n"); |
| FinishAsyncCompileJobWithError(error); |
| } |
| |
| void AsyncStreamingProcessor::OnAbort() { |
| TRACE_STREAMING("Abort stream...\n"); |
| job_->Abort(); |
| } |
| |
| bool AsyncStreamingProcessor::Deserialize(Vector<const uint8_t> module_bytes, |
| Vector<const uint8_t> wire_bytes) { |
| TRACE_EVENT0("v8.wasm", "wasm.Deserialize"); |
| // DeserializeNativeModule and FinishCompile assume that they are executed in |
| // a HandleScope, and that a context is set on the isolate. |
| HandleScope scope(job_->isolate_); |
| SaveAndSwitchContext saved_context(job_->isolate_, *job_->native_context_); |
| |
| MaybeHandle<WasmModuleObject> result = DeserializeNativeModule( |
| job_->isolate_, module_bytes, wire_bytes, job_->stream_->url()); |
| |
| if (result.is_null()) return false; |
| |
| job_->module_object_ = |
| job_->isolate_->global_handles()->Create(*result.ToHandleChecked()); |
| job_->native_module_ = job_->module_object_->shared_native_module(); |
| job_->wire_bytes_ = ModuleWireBytes(job_->native_module_->wire_bytes()); |
| job_->FinishCompile(false); |
| return true; |
| } |
| |
| CompilationStateImpl::CompilationStateImpl( |
| const std::shared_ptr<NativeModule>& native_module, |
| std::shared_ptr<Counters> async_counters) |
| : native_module_(native_module.get()), |
| native_module_weak_(std::move(native_module)), |
| compile_mode_(FLAG_wasm_tier_up && |
| native_module->module()->origin == kWasmOrigin |
| ? CompileMode::kTiering |
| : CompileMode::kRegular), |
| async_counters_(std::move(async_counters)), |
| compilation_unit_queues_(native_module->num_functions()) {} |
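
// Example of the {compile_mode_} decision above: with --wasm-tier-up enabled,
// a wasm (non-asm.js) module uses {CompileMode::kTiering}; asm.js modules and
// configurations without tier-up use {CompileMode::kRegular}.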
| |
| void CompilationStateImpl::CancelCompilation() { |
| // No more callbacks after abort. |
| base::MutexGuard callbacks_guard(&callbacks_mutex_); |
// std::memory_order_relaxed is sufficient because no other state is
// synchronized with {compile_cancelled_}.
| compile_cancelled_.store(true, std::memory_order_relaxed); |
| callbacks_.clear(); |
| } |
| |
| bool CompilationStateImpl::cancelled() const { |
| return compile_cancelled_.load(std::memory_order_relaxed); |
| } |
| |
| void CompilationStateImpl::InitializeCompilationProgress( |
| bool lazy_module, int num_import_wrappers, int num_export_wrappers) { |
| DCHECK(!failed()); |
| auto enabled_features = native_module_->enabled_features(); |
| auto* module = native_module_->module(); |
| |
| base::MutexGuard guard(&callbacks_mutex_); |
| DCHECK_EQ(0, outstanding_baseline_units_); |
| DCHECK_EQ(0, outstanding_export_wrappers_); |
| DCHECK_EQ(0, outstanding_top_tier_functions_); |
| compilation_progress_.reserve(module->num_declared_functions); |
| int start = module->num_imported_functions; |
| int end = start + module->num_declared_functions; |
| |
| const bool prefer_liftoff = native_module_->IsTieredDown(); |
| for (int func_index = start; func_index < end; func_index++) { |
| if (prefer_liftoff) { |
| constexpr uint8_t kLiftoffOnlyFunctionProgress = |
| RequiredTopTierField::encode(ExecutionTier::kLiftoff) | |
| RequiredBaselineTierField::encode(ExecutionTier::kLiftoff) | |
| ReachedTierField::encode(ExecutionTier::kNone); |
| compilation_progress_.push_back(kLiftoffOnlyFunctionProgress); |
| outstanding_baseline_units_++; |
| outstanding_top_tier_functions_++; |
| continue; |
| } |
| ExecutionTierPair requested_tiers = GetRequestedExecutionTiers( |
| module, compile_mode(), enabled_features, func_index); |
| CompileStrategy strategy = |
| GetCompileStrategy(module, enabled_features, func_index, lazy_module); |
| |
| bool required_for_baseline = strategy == CompileStrategy::kEager; |
| bool required_for_top_tier = strategy != CompileStrategy::kLazy; |
| DCHECK_EQ(required_for_top_tier, |
| strategy == CompileStrategy::kEager || |
| strategy == CompileStrategy::kLazyBaselineEagerTopTier); |
| |
| // Count functions to complete baseline and top tier compilation. |
| if (required_for_baseline) outstanding_baseline_units_++; |
| if (required_for_top_tier) outstanding_top_tier_functions_++; |
| |
// Initialize the function's compilation progress.
| ExecutionTier required_baseline_tier = required_for_baseline |
| ? requested_tiers.baseline_tier |
| : ExecutionTier::kNone; |
| ExecutionTier required_top_tier = |
| required_for_top_tier ? requested_tiers.top_tier : ExecutionTier::kNone; |
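// The progress byte packs three tier fields; e.g. an eagerly compiled
// function requesting Liftoff as baseline and TurboFan as top tier starts as
//   RequiredBaselineTierField::encode(ExecutionTier::kLiftoff) |
//       RequiredTopTierField::encode(ExecutionTier::kTurbofan) |
//       ReachedTierField::encode(ExecutionTier::kNone).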
| uint8_t function_progress = ReachedTierField::encode(ExecutionTier::kNone); |
| function_progress = RequiredBaselineTierField::update( |
| function_progress, required_baseline_tier); |
| function_progress = |
| RequiredTopTierField::update(function_progress, required_top_tier); |
| compilation_progress_.push_back(function_progress); |
| } |
| DCHECK_IMPLIES(lazy_module, outstanding_baseline_units_ == 0); |
| DCHECK_IMPLIES(lazy_module, outstanding_top_tier_functions_ == 0); |
| DCHECK_LE(0, outstanding_baseline_units_); |
| DCHECK_LE(outstanding_baseline_units_, outstanding_top_tier_functions_); |
| outstanding_baseline_units_ += num_import_wrappers; |
| outstanding_export_wrappers_ = num_export_wrappers; |
| |
// Trigger callbacks if the module needs no baseline or top tier compilation.
// This can be the case for an empty or fully lazy module.
| TriggerCallbacks(); |
|