| // Copyright 2017 the V8 project authors. All rights reserved. |
| // Use of this source code is governed by a BSD-style license that can be |
| // found in the LICENSE file. |
| |
| #include "src/wasm/module-compiler.h" |
| |
| #include <algorithm> |
| #include <queue> |
| |
| #include "src/api/api-inl.h" |
| #include "src/asmjs/asm-js.h" |
| #include "src/base/enum-set.h" |
| #include "src/base/optional.h" |
| #include "src/base/platform/mutex.h" |
| #include "src/base/platform/semaphore.h" |
| #include "src/base/platform/time.h" |
| #include "src/base/utils/random-number-generator.h" |
| #include "src/compiler/wasm-compiler.h" |
| #include "src/heap/heap-inl.h" // For CodeSpaceMemoryModificationScope. |
| #include "src/logging/counters.h" |
| #include "src/logging/metrics.h" |
| #include "src/objects/property-descriptor.h" |
| #include "src/tasks/task-utils.h" |
| #include "src/tracing/trace-event.h" |
| #include "src/trap-handler/trap-handler.h" |
| #include "src/utils/identity-map.h" |
| #include "src/wasm/module-decoder.h" |
| #include "src/wasm/streaming-decoder.h" |
| #include "src/wasm/wasm-code-manager.h" |
| #include "src/wasm/wasm-engine.h" |
| #include "src/wasm/wasm-import-wrapper-cache.h" |
| #include "src/wasm/wasm-js.h" |
| #include "src/wasm/wasm-limits.h" |
| #include "src/wasm/wasm-objects-inl.h" |
| #include "src/wasm/wasm-opcodes.h" |
| #include "src/wasm/wasm-result.h" |
| #include "src/wasm/wasm-serialization.h" |
| |
| #define TRACE_COMPILE(...) \ |
| do { \ |
| if (FLAG_trace_wasm_compiler) PrintF(__VA_ARGS__); \ |
| } while (false) |
| |
| #define TRACE_STREAMING(...) \ |
| do { \ |
| if (FLAG_trace_wasm_streaming) PrintF(__VA_ARGS__); \ |
| } while (false) |
| |
| #define TRACE_LAZY(...) \ |
| do { \ |
| if (FLAG_trace_wasm_lazy_compilation) PrintF(__VA_ARGS__); \ |
| } while (false) |
| |
| namespace v8 { |
| namespace internal { |
| namespace wasm { |
| |
| namespace { |
| |
| enum class CompileMode : uint8_t { kRegular, kTiering }; |
| |
| enum class CompileStrategy : uint8_t { |
| // Compiles functions on first use. In this case, execution will block until |
| // the function's baseline is reached and top tier compilation starts in |
| // background (if applicable). |
| // Lazy compilation can help to reduce startup time and code size at the risk |
| // of blocking execution. |
| kLazy, |
| // Compiles baseline ahead of execution and starts top tier compilation in |
| // background (if applicable). |
| kEager, |
| // Triggers baseline compilation on first use (just like {kLazy}) with the |
| // difference that top tier compilation is started eagerly. |
| // This strategy can help to reduce startup time at the risk of blocking |
| // execution, but only in its early phase (until top tier compilation |
| // finishes). |
| kLazyBaselineEagerTopTier, |
| // Marker for default strategy. |
| kDefault = kEager, |
| }; |
| |
| class CompilationStateImpl; |
| |
| class BackgroundCompileScope { |
| public: |
| explicit BackgroundCompileScope(std::weak_ptr<NativeModule> native_module) |
| : native_module_(native_module.lock()) {} |
| |
| NativeModule* native_module() const { |
| DCHECK(native_module_); |
| return native_module_.get(); |
| } |
| inline CompilationStateImpl* compilation_state() const; |
| |
| bool cancelled() const; |
| |
| private: |
| // Keep the native module alive while in this scope. |
| std::shared_ptr<NativeModule> native_module_; |
| }; |
| |
| enum CompileBaselineOnly : bool { |
| kBaselineOnly = true, |
| kBaselineOrTopTier = false |
| }; |
| |
| // A set of work-stealing queues (vectors of units). Each background compile |
| // task owns one of the queues and steals from all others once its own queue |
| // runs empty. |
| class CompilationUnitQueues { |
| public: |
| // Public API for QueueImpl. |
| struct Queue { |
| bool ShouldPublish(int num_processed_units) const; |
| }; |
| |
| explicit CompilationUnitQueues(int num_declared_functions) |
| : num_declared_functions_(num_declared_functions) { |
| // Add one initial queue so that units can be added right away. |
| queues_.emplace_back(std::make_unique<QueueImpl>(0)); |
| |
| for (auto& atomic_counter : num_units_) { |
| std::atomic_init(&atomic_counter, size_t{0}); |
| } |
| |
| top_tier_compiled_ = |
| std::make_unique<std::atomic<bool>[]>(num_declared_functions); |
| |
| for (int i = 0; i < num_declared_functions; i++) { |
| std::atomic_init(&top_tier_compiled_.get()[i], false); |
| } |
| } |
| |
| Queue* GetQueueForTask(int task_id) { |
| int required_queues = task_id + 1; |
| { |
| base::SharedMutexGuard<base::kShared> queues_guard(&queues_mutex_); |
| if (V8_LIKELY(static_cast<int>(queues_.size()) >= required_queues)) { |
| return queues_[task_id].get(); |
| } |
| } |
| |
| // Otherwise increase the number of queues. |
| base::SharedMutexGuard<base::kExclusive> queues_guard(&queues_mutex_); |
| int num_queues = static_cast<int>(queues_.size()); |
| while (num_queues < required_queues) { |
| int steal_from = num_queues + 1; |
| queues_.emplace_back(std::make_unique<QueueImpl>(steal_from)); |
| ++num_queues; |
| } |
| |
| // Update the {publish_limit}s of all queues. |
| |
| // We want background threads to publish regularly (to avoid contention when |
| // they are all publishing at the end). On the other hand, each publishing |
| // has some overhead (part of it for synchronizing between threads), so it |
| // should not happen *too* often. Thus aim for 4-8 publishes per thread, but |
| // distribute it such that publishing is likely to happen at different |
| // times. |
| int units_per_thread = num_declared_functions_ / num_queues; |
| int min = std::max(10, units_per_thread / 8); |
| int queue_id = 0; |
| for (auto& queue : queues_) { |
| // Set a limit between {min} and {2*min}, but not smaller than {10}. |
| int limit = min + (min * queue_id / num_queues); |
| queue->publish_limit.store(limit, std::memory_order_relaxed); |
| ++queue_id; |
| } |
| |
| return queues_[task_id].get(); |
| } |
| |
| base::Optional<WasmCompilationUnit> GetNextUnit( |
| Queue* queue, CompileBaselineOnly baseline_only) { |
| // As long as any lower-tier units are outstanding we need to steal them |
| // before executing our own higher-tier units. |
| int max_tier = baseline_only ? kBaseline : kTopTier; |
| for (int tier = GetLowestTierWithUnits(); tier <= max_tier; ++tier) { |
| if (auto unit = GetNextUnitOfTier(queue, tier)) { |
| size_t old_units_count = |
| num_units_[tier].fetch_sub(1, std::memory_order_relaxed); |
| DCHECK_LE(1, old_units_count); |
| USE(old_units_count); |
| return unit; |
| } |
| } |
| return {}; |
| } |
| |
| void AddUnits(Vector<WasmCompilationUnit> baseline_units, |
| Vector<WasmCompilationUnit> top_tier_units, |
| const WasmModule* module) { |
| DCHECK_LT(0, baseline_units.size() + top_tier_units.size()); |
| // Add to the individual queues in a round-robin fashion. No special care is |
| // taken to balance them; they will be balanced by work stealing. |
| QueueImpl* queue; |
| { |
| int queue_to_add = next_queue_to_add.load(std::memory_order_relaxed); |
| base::SharedMutexGuard<base::kShared> queues_guard(&queues_mutex_); |
| while (!next_queue_to_add.compare_exchange_weak( |
| queue_to_add, next_task_id(queue_to_add, queues_.size()), |
| std::memory_order_relaxed)) { |
| // Retry with updated {queue_to_add}. |
| } |
| queue = queues_[queue_to_add].get(); |
| } |
| |
| base::MutexGuard guard(&queue->mutex); |
| base::Optional<base::MutexGuard> big_units_guard; |
| for (auto pair : {std::make_pair(int{kBaseline}, baseline_units), |
| std::make_pair(int{kTopTier}, top_tier_units)}) { |
| int tier = pair.first; |
| Vector<WasmCompilationUnit> units = pair.second; |
| if (units.empty()) continue; |
| num_units_[tier].fetch_add(units.size(), std::memory_order_relaxed); |
| for (WasmCompilationUnit unit : units) { |
| size_t func_size = module->functions[unit.func_index()].code.length(); |
| if (func_size <= kBigUnitsLimit) { |
| queue->units[tier].push_back(unit); |
| } else { |
| if (!big_units_guard) { |
| big_units_guard.emplace(&big_units_queue_.mutex); |
| } |
| big_units_queue_.has_units[tier].store(true, |
| std::memory_order_relaxed); |
| big_units_queue_.units[tier].emplace(func_size, unit); |
| } |
| } |
| } |
| } |
| |
| void AddTopTierPriorityUnit(WasmCompilationUnit unit, size_t priority) { |
| base::SharedMutexGuard<base::kShared> queues_guard(&queues_mutex_); |
| // Add to the individual queues in a round-robin fashion. No special care is |
| // taken to balance them; they will be balanced by work stealing. We use |
| // the same counter for this reason. |
| int queue_to_add = next_queue_to_add.load(std::memory_order_relaxed); |
| while (!next_queue_to_add.compare_exchange_weak( |
| queue_to_add, next_task_id(queue_to_add, queues_.size()), |
| std::memory_order_relaxed)) { |
| // Retry with updated {queue_to_add}. |
| } |
| |
| { |
| auto* queue = queues_[queue_to_add].get(); |
| base::MutexGuard guard(&queue->mutex); |
| queue->top_tier_priority_units.emplace(priority, unit); |
| } |
| num_priority_units_.fetch_add(1, std::memory_order_relaxed); |
| num_units_[kTopTier].fetch_add(1, std::memory_order_relaxed); |
| } |
| |
| // Get the current total number of units in all queues. This is only a |
| // momentary snapshot, it's not guaranteed that {GetNextUnit} returns a unit |
| // if this method returns non-zero. |
| size_t GetTotalSize() const { |
| size_t total = 0; |
| for (auto& atomic_counter : num_units_) { |
| total += atomic_counter.load(std::memory_order_relaxed); |
| } |
| return total; |
| } |
| |
| private: |
| // Store tier in int so we can easily loop over it: |
| static constexpr int kBaseline = 0; |
| static constexpr int kTopTier = 1; |
| static constexpr int kNumTiers = kTopTier + 1; |
| |
| // Functions bigger than {kBigUnitsLimit} will be compiled first, in descending |
| // order of their function body size. |
| static constexpr size_t kBigUnitsLimit = 4096; |
| |
| struct BigUnit { |
| BigUnit(size_t func_size, WasmCompilationUnit unit) |
| : func_size{func_size}, unit(unit) {} |
| |
| size_t func_size; |
| WasmCompilationUnit unit; |
| |
| bool operator<(const BigUnit& other) const { |
| return func_size < other.func_size; |
| } |
| }; |
| |
| struct TopTierPriorityUnit { |
| TopTierPriorityUnit(size_t priority, WasmCompilationUnit unit) |
| : priority(priority), unit(unit) {} |
| |
| size_t priority; |
| WasmCompilationUnit unit; |
| |
| bool operator<(const TopTierPriorityUnit& other) const { |
| return priority < other.priority; |
| } |
| }; |
| |
| struct BigUnitsQueue { |
| BigUnitsQueue() { |
| for (auto& atomic : has_units) std::atomic_init(&atomic, false); |
| } |
| |
| base::Mutex mutex; |
| |
| // Can be read concurrently to check whether any elements are in the queue. |
| std::atomic<bool> has_units[kNumTiers]; |
| |
| // Protected by {mutex}: |
| std::priority_queue<BigUnit> units[kNumTiers]; |
| }; |
| |
| struct QueueImpl : public Queue { |
| explicit QueueImpl(int next_steal_task_id) |
| : next_steal_task_id(next_steal_task_id) {} |
| |
| // Number of units after which the task processing this queue should publish |
| // compilation results. Updated (reduced, using relaxed ordering) when new |
| // queues are allocated. If there is only one thread running, we can delay |
| // publishing arbitrarily. |
| std::atomic<int> publish_limit{kMaxInt}; |
| |
| base::Mutex mutex; |
| |
| // All fields below are protected by {mutex}. |
| std::vector<WasmCompilationUnit> units[kNumTiers]; |
| std::priority_queue<TopTierPriorityUnit> top_tier_priority_units; |
| int next_steal_task_id; |
| }; |
| |
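| // Compute the id of the queue following {task_id}, wrapping around to 0 after |
| // the last queue. |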
| int next_task_id(int task_id, size_t num_queues) const { |
| int next = task_id + 1; |
| return next == static_cast<int>(num_queues) ? 0 : next; |
| } |
| |
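| // Return the lowest tier which still has outstanding units, or {kNumTiers} if |
| // all per-tier counters are zero. |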
| int GetLowestTierWithUnits() const { |
| for (int tier = 0; tier < kNumTiers; ++tier) { |
| if (num_units_[tier].load(std::memory_order_relaxed) > 0) return tier; |
| } |
| return kNumTiers; |
| } |
| |
| base::Optional<WasmCompilationUnit> GetNextUnitOfTier(Queue* public_queue, |
| int tier) { |
| QueueImpl* queue = static_cast<QueueImpl*>(public_queue); |
| |
| // First check whether there is a priority unit. Execute that first. |
| if (tier == kTopTier) { |
| if (auto unit = GetTopTierPriorityUnit(queue)) { |
| return unit; |
| } |
| } |
| |
| // Then check whether there is a big unit of that tier. |
| if (auto unit = GetBigUnitOfTier(tier)) return unit; |
| |
| // Finally check whether our own queue has a unit of the wanted tier. If |
| // so, return it, otherwise get the task id to steal from. |
| int steal_task_id; |
| { |
| base::MutexGuard mutex_guard(&queue->mutex); |
| if (!queue->units[tier].empty()) { |
| auto unit = queue->units[tier].back(); |
| queue->units[tier].pop_back(); |
| return unit; |
| } |
| steal_task_id = queue->next_steal_task_id; |
| } |
| |
| // Try to steal from all other queues. If this succeeds, return one of the |
| // stolen units. |
| { |
| base::SharedMutexGuard<base::kShared> guard(&queues_mutex_); |
| for (size_t steal_trials = 0; steal_trials < queues_.size(); |
| ++steal_trials, ++steal_task_id) { |
| if (steal_task_id >= static_cast<int>(queues_.size())) { |
| steal_task_id = 0; |
| } |
| if (auto unit = StealUnitsAndGetFirst(queue, steal_task_id, tier)) { |
| return unit; |
| } |
| } |
| } |
| |
| // If we reach here, we didn't find any unit of the requested tier. |
| return {}; |
| } |
| |
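| // Pop the biggest outstanding unit of {tier} from the shared big-units queue, |
| // or return {nullopt} if that queue is empty. |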
| base::Optional<WasmCompilationUnit> GetBigUnitOfTier(int tier) { |
| // Fast path without locking. |
| if (!big_units_queue_.has_units[tier].load(std::memory_order_relaxed)) { |
| return {}; |
| } |
| base::MutexGuard guard(&big_units_queue_.mutex); |
| if (big_units_queue_.units[tier].empty()) return {}; |
| WasmCompilationUnit unit = big_units_queue_.units[tier].top().unit; |
| big_units_queue_.units[tier].pop(); |
| if (big_units_queue_.units[tier].empty()) { |
| big_units_queue_.has_units[tier].store(false, std::memory_order_relaxed); |
| } |
| return unit; |
| } |
| |
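| // Get the next top-tier priority unit, first from {queue}, then by stealing |
| // from other queues. Units whose function already reached the top tier are |
| // skipped. |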
| base::Optional<WasmCompilationUnit> GetTopTierPriorityUnit(QueueImpl* queue) { |
| // Fast path without locking. |
| if (num_priority_units_.load(std::memory_order_relaxed) == 0) { |
| return {}; |
| } |
| |
| int steal_task_id; |
| { |
| base::MutexGuard mutex_guard(&queue->mutex); |
| while (!queue->top_tier_priority_units.empty()) { |
| auto unit = queue->top_tier_priority_units.top().unit; |
| queue->top_tier_priority_units.pop(); |
| num_priority_units_.fetch_sub(1, std::memory_order_relaxed); |
| |
| if (!top_tier_compiled_[unit.func_index()].exchange( |
| true, std::memory_order_relaxed)) { |
| return unit; |
| } |
| num_units_[kTopTier].fetch_sub(1, std::memory_order_relaxed); |
| } |
| steal_task_id = queue->next_steal_task_id; |
| } |
| |
| // Try to steal from all other queues. If this succeeds, return one of the |
| // stolen units. |
| { |
| base::SharedMutexGuard<base::kShared> guard(&queues_mutex_); |
| for (size_t steal_trials = 0; steal_trials < queues_.size(); |
| ++steal_trials, ++steal_task_id) { |
| if (steal_task_id >= static_cast<int>(queues_.size())) { |
| steal_task_id = 0; |
| } |
| if (auto unit = StealTopTierPriorityUnit(queue, steal_task_id)) { |
| return unit; |
| } |
| } |
| } |
| |
| return {}; |
| } |
| |
| // Steal units of {wanted_tier} from {steal_from_task_id} to {queue}. Return |
| // first stolen unit (the rest is put into {queue}), or {nullopt} if |
| // {steal_from_task_id} had no units of {wanted_tier}. |
| // Hold a shared lock on {queues_mutex_} when calling this method. |
| base::Optional<WasmCompilationUnit> StealUnitsAndGetFirst( |
| QueueImpl* queue, int steal_from_task_id, int wanted_tier) { |
| auto* steal_queue = queues_[steal_from_task_id].get(); |
| // Cannot steal from own queue. |
| if (steal_queue == queue) return {}; |
| std::vector<WasmCompilationUnit> stolen; |
| base::Optional<WasmCompilationUnit> returned_unit; |
| { |
| base::MutexGuard guard(&steal_queue->mutex); |
| auto* steal_from_vector = &steal_queue->units[wanted_tier]; |
| if (steal_from_vector->empty()) return {}; |
| size_t remaining = steal_from_vector->size() / 2; |
| auto steal_begin = steal_from_vector->begin() + remaining; |
| returned_unit = *steal_begin; |
| stolen.assign(steal_begin + 1, steal_from_vector->end()); |
| steal_from_vector->erase(steal_begin, steal_from_vector->end()); |
| } |
| base::MutexGuard guard(&queue->mutex); |
| auto* target_queue = &queue->units[wanted_tier]; |
| target_queue->insert(target_queue->end(), stolen.begin(), stolen.end()); |
| queue->next_steal_task_id = steal_from_task_id + 1; |
| return returned_unit; |
| } |
| |
| // Steal one priority unit from {steal_from_task_id} into {queue}. Return the |
| // stolen unit, or {nullopt} if {steal_from_task_id} had no priority units. |
| // Hold a shared lock on {queues_mutex_} when calling this method. |
| base::Optional<WasmCompilationUnit> StealTopTierPriorityUnit( |
| QueueImpl* queue, int steal_from_task_id) { |
| auto* steal_queue = queues_[steal_from_task_id].get(); |
| // Cannot steal from own queue. |
| if (steal_queue == queue) return {}; |
| base::Optional<WasmCompilationUnit> returned_unit; |
| { |
| base::MutexGuard guard(&steal_queue->mutex); |
| while (true) { |
| if (steal_queue->top_tier_priority_units.empty()) return {}; |
| |
| auto unit = steal_queue->top_tier_priority_units.top().unit; |
| steal_queue->top_tier_priority_units.pop(); |
| num_priority_units_.fetch_sub(1, std::memory_order_relaxed); |
| |
| if (!top_tier_compiled_[unit.func_index()].exchange( |
| true, std::memory_order_relaxed)) { |
| returned_unit = unit; |
| break; |
| } |
| num_units_[kTopTier].fetch_sub(1, std::memory_order_relaxed); |
| } |
| } |
| base::MutexGuard guard(&queue->mutex); |
| queue->next_steal_task_id = steal_from_task_id + 1; |
| return returned_unit; |
| } |
| |
| // {queues_mutex_} protects {queues_}. |
| base::SharedMutex queues_mutex_; |
| std::vector<std::unique_ptr<QueueImpl>> queues_; |
| |
| const int num_declared_functions_; |
| |
| BigUnitsQueue big_units_queue_; |
| |
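| // Number of queued units per tier, summed over all queues (including big and |
| // priority units). |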
| std::atomic<size_t> num_units_[kNumTiers]; |
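| // Number of outstanding top-tier priority units, summed over all queues. |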
| std::atomic<size_t> num_priority_units_{0}; |
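| // One flag per declared function, set when a top-tier priority unit for that |
| // function is picked up; used to drop duplicate priority units. |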
| std::unique_ptr<std::atomic<bool>[]> top_tier_compiled_; |
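| // Round-robin counter selecting the queue that receives newly added units. |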
| std::atomic<int> next_queue_to_add{0}; |
| }; |
| |
| bool CompilationUnitQueues::Queue::ShouldPublish( |
| int num_processed_units) const { |
| auto* queue = static_cast<const QueueImpl*>(this); |
| return num_processed_units >= |
| queue->publish_limit.load(std::memory_order_relaxed); |
| } |
| |
| // The {CompilationStateImpl} keeps track of the compilation state of the |
| // owning NativeModule, i.e. which functions are left to be compiled. |
| // It contains a task manager to allow parallel and asynchronous background |
| // compilation of functions. |
| // Its public interface {CompilationState} lives in compilation-environment.h. |
| class CompilationStateImpl { |
| public: |
| CompilationStateImpl(const std::shared_ptr<NativeModule>& native_module, |
| std::shared_ptr<Counters> async_counters); |
| |
| // Cancel all background compilation, without waiting for compile tasks to |
| // finish. |
| void CancelCompilation(); |
| bool cancelled() const; |
| |
| // Initialize compilation progress. Set compilation tiers to expect for |
| // baseline and top tier compilation. Must be set before {AddCompilationUnits} |
| // is invoked which triggers background compilation. |
| void InitializeCompilationProgress(bool lazy_module, int num_import_wrappers, |
| int num_export_wrappers); |
| |
| // Initialize the compilation progress after deserialization. This is needed |
| // for recompilation (e.g. for tier down) to work later. |
| void InitializeCompilationProgressAfterDeserialization(); |
| |
| // Initialize recompilation of the whole module: Setup compilation progress |
| // for recompilation and add the respective compilation units. The callback is |
| // called immediately if no recompilation is needed, or called later |
| // otherwise. |
| void InitializeRecompilation( |
| TieringState new_tiering_state, |
| CompilationState::callback_t recompilation_finished_callback); |
| |
| // Add the callback function to be called on compilation events. Needs to be |
| // set before {AddCompilationUnits} is run to ensure that it receives all |
| // events. The callback object must support being deleted from any thread. |
| void AddCallback(CompilationState::callback_t); |
| |
| // Inserts new functions to compile and kicks off compilation. |
| void AddCompilationUnits( |
| Vector<WasmCompilationUnit> baseline_units, |
| Vector<WasmCompilationUnit> top_tier_units, |
| Vector<std::shared_ptr<JSToWasmWrapperCompilationUnit>> |
| js_to_wasm_wrapper_units); |
| void AddTopTierCompilationUnit(WasmCompilationUnit); |
| void AddTopTierPriorityCompilationUnit(WasmCompilationUnit, size_t); |
| |
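| // Get the compilation unit queue assigned to compile task {task_id}, creating |
| // new queues if needed. |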
| CompilationUnitQueues::Queue* GetQueueForCompileTask(int task_id); |
| |
| base::Optional<WasmCompilationUnit> GetNextCompilationUnit( |
| CompilationUnitQueues::Queue*, CompileBaselineOnly); |
| |
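| // Hand out the next JS-to-Wasm wrapper compilation unit, or a null shared_ptr |
| // once all wrapper units have been handed out. |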
| std::shared_ptr<JSToWasmWrapperCompilationUnit> |
| GetNextJSToWasmWrapperCompilationUnit(); |
| void FinalizeJSToWasmWrappers(Isolate* isolate, const WasmModule* module, |
| Handle<FixedArray>* export_wrappers_out); |
| |
| void OnFinishedUnits(Vector<WasmCode*>); |
| void OnFinishedJSToWasmWrapperUnits(int num); |
| |
| void OnCompilationStopped(const WasmFeatures& detected); |
| void PublishDetectedFeatures(Isolate*); |
| void SchedulePublishCompilationResults( |
| std::vector<std::unique_ptr<WasmCode>> unpublished_code); |
| // Ensure that a compilation job is running, and increase its concurrency if |
| // needed. |
| void ScheduleCompileJobForNewUnits(); |
| |
| size_t NumOutstandingCompilations() const; |
| |
| void SetError(); |
| |
| void WaitForCompilationEvent(CompilationEvent event); |
| |
| void SetHighPriority() { has_priority_ = true; } |
| |
| bool failed() const { |
| return compile_failed_.load(std::memory_order_relaxed); |
| } |
| |
| bool baseline_compilation_finished() const { |
| base::MutexGuard guard(&callbacks_mutex_); |
| return outstanding_baseline_units_ == 0 && |
| outstanding_export_wrappers_ == 0; |
| } |
| |
| bool top_tier_compilation_finished() const { |
| base::MutexGuard guard(&callbacks_mutex_); |
| return outstanding_top_tier_functions_ == 0; |
| } |
| |
| bool recompilation_finished() const { |
| base::MutexGuard guard(&callbacks_mutex_); |
| return outstanding_recompilation_functions_ == 0; |
| } |
| |
| CompileMode compile_mode() const { return compile_mode_; } |
| Counters* counters() const { return async_counters_.get(); } |
| WasmFeatures* detected_features() { return &detected_features_; } |
| |
| void SetWireBytesStorage( |
| std::shared_ptr<WireBytesStorage> wire_bytes_storage) { |
| base::MutexGuard guard(&mutex_); |
| wire_bytes_storage_ = wire_bytes_storage; |
| } |
| |
| std::shared_ptr<WireBytesStorage> GetWireBytesStorage() const { |
| base::MutexGuard guard(&mutex_); |
| DCHECK_NOT_NULL(wire_bytes_storage_); |
| return wire_bytes_storage_; |
| } |
| |
| private: |
| // Trigger callbacks according to the internal counters below |
| // (outstanding_...), plus the given events. |
| // Hold the {callbacks_mutex_} when calling this method. |
| void TriggerCallbacks(base::EnumSet<CompilationEvent> additional_events = {}); |
| |
| void PublishCompilationResults( |
| std::vector<std::unique_ptr<WasmCode>> unpublished_code); |
| void PublishCode(Vector<std::unique_ptr<WasmCode>> codes); |
| |
| NativeModule* const native_module_; |
| std::weak_ptr<NativeModule> const native_module_weak_; |
| const CompileMode compile_mode_; |
| const std::shared_ptr<Counters> async_counters_; |
| |
| // Compilation error, atomically updated. This flag can be updated and read |
| // using relaxed semantics. |
| std::atomic<bool> compile_failed_{false}; |
| |
| // True if compilation was cancelled and worker threads should return. This |
| // flag can be updated and read using relaxed semantics. |
| std::atomic<bool> compile_cancelled_{false}; |
| |
| CompilationUnitQueues compilation_unit_queues_; |
| |
| // Index of the next wrapper to compile in {js_to_wasm_wrapper_units_}. |
| std::atomic<int> js_to_wasm_wrapper_id_{0}; |
| // Wrapper compilation units are stored in shared_ptrs so that they are kept |
| // alive by the tasks even if the NativeModule dies. |
| std::vector<std::shared_ptr<JSToWasmWrapperCompilationUnit>> |
| js_to_wasm_wrapper_units_; |
| |
| bool has_priority_ = false; |
| |
| // This mutex protects all information of this {CompilationStateImpl} which is |
| // being accessed concurrently. |
| mutable base::Mutex mutex_; |
| |
| ////////////////////////////////////////////////////////////////////////////// |
| // Protected by {mutex_}: |
| |
| std::shared_ptr<JobHandle> current_compile_job_; |
| |
| // Features detected to be used in this module. Features can be detected |
| // as a module is being compiled. |
| WasmFeatures detected_features_ = WasmFeatures::None(); |
| |
| // Abstraction over the storage of the wire bytes. Held in a shared_ptr so |
| // that background compilation jobs can keep the storage alive while |
| // compiling. |
| std::shared_ptr<WireBytesStorage> wire_bytes_storage_; |
| |
| // End of fields protected by {mutex_}. |
| ////////////////////////////////////////////////////////////////////////////// |
| |
| // This mutex protects the callbacks vector, and the counters used to |
| // determine which callbacks to call. The counters plus the callbacks |
| // themselves need to be synchronized to ensure correct order of events. |
| mutable base::Mutex callbacks_mutex_; |
| |
| ////////////////////////////////////////////////////////////////////////////// |
| // Protected by {callbacks_mutex_}: |
| |
| // Callback functions to be called on compilation events. |
| std::vector<CompilationState::callback_t> callbacks_; |
| |
| // Events that already happened. |
| base::EnumSet<CompilationEvent> finished_events_; |
| |
| int outstanding_baseline_units_ = 0; |
| int outstanding_export_wrappers_ = 0; |
| int outstanding_top_tier_functions_ = 0; |
| std::vector<uint8_t> compilation_progress_; |
| |
| int outstanding_recompilation_functions_ = 0; |
| TieringState tiering_state_ = kTieredUp; |
| |
| // End of fields protected by {callbacks_mutex_}. |
| ////////////////////////////////////////////////////////////////////////////// |
| |
| // {publish_mutex_} protects {publish_queue_} and {publisher_running_}. |
| base::Mutex publish_mutex_; |
| std::vector<std::unique_ptr<WasmCode>> publish_queue_; |
| bool publisher_running_ = false; |
| |
| // Encoding of fields in the {compilation_progress_} vector. |
| using RequiredBaselineTierField = base::BitField8<ExecutionTier, 0, 2>; |
| using RequiredTopTierField = base::BitField8<ExecutionTier, 2, 2>; |
| using ReachedTierField = base::BitField8<ExecutionTier, 4, 2>; |
| using MissingRecompilationField = base::BitField8<bool, 6, 1>; |
| }; |
| |
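| // Cast between the public {CompilationState} interface and its private |
| // implementation {CompilationStateImpl} (PIMPL). |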
| CompilationStateImpl* Impl(CompilationState* compilation_state) { |
| return reinterpret_cast<CompilationStateImpl*>(compilation_state); |
| } |
| const CompilationStateImpl* Impl(const CompilationState* compilation_state) { |
| return reinterpret_cast<const CompilationStateImpl*>(compilation_state); |
| } |
| |
| CompilationStateImpl* BackgroundCompileScope::compilation_state() const { |
| DCHECK(native_module_); |
| return Impl(native_module_->compilation_state()); |
| } |
| |
| bool BackgroundCompileScope::cancelled() const { |
| return native_module_ == nullptr || |
| Impl(native_module_->compilation_state())->cancelled(); |
| } |
| |
| void UpdateFeatureUseCounts(Isolate* isolate, const WasmFeatures& detected) { |
| using Feature = v8::Isolate::UseCounterFeature; |
| constexpr static std::pair<WasmFeature, Feature> kUseCounters[] = { |
| {kFeature_reftypes, Feature::kWasmRefTypes}, |
| {kFeature_bulk_memory, Feature::kWasmBulkMemory}, |
| {kFeature_mv, Feature::kWasmMultiValue}, |
| {kFeature_simd, Feature::kWasmSimdOpcodes}, |
| {kFeature_threads, Feature::kWasmThreadOpcodes}}; |
| |
| for (auto& feature : kUseCounters) { |
| if (detected.contains(feature.first)) isolate->CountUsage(feature.second); |
| } |
| } |
| |
| } // namespace |
| |
| // static |
| constexpr uint32_t CompilationEnv::kMaxMemoryPagesAtRuntime; |
| |
| ////////////////////////////////////////////////////// |
| // PIMPL implementation of {CompilationState}. |
| |
| CompilationState::~CompilationState() { Impl(this)->~CompilationStateImpl(); } |
| |
| void CompilationState::CancelCompilation() { Impl(this)->CancelCompilation(); } |
| |
| void CompilationState::SetError() { Impl(this)->SetError(); } |
| |
| void CompilationState::SetWireBytesStorage( |
| std::shared_ptr<WireBytesStorage> wire_bytes_storage) { |
| Impl(this)->SetWireBytesStorage(std::move(wire_bytes_storage)); |
| } |
| |
| std::shared_ptr<WireBytesStorage> CompilationState::GetWireBytesStorage() |
| const { |
| return Impl(this)->GetWireBytesStorage(); |
| } |
| |
| void CompilationState::AddCallback(CompilationState::callback_t callback) { |
| return Impl(this)->AddCallback(std::move(callback)); |
| } |
| |
| void CompilationState::WaitForTopTierFinished() { |
| // TODO(clemensb): Contribute to compilation while waiting. |
| auto top_tier_finished_semaphore = std::make_shared<base::Semaphore>(0); |
| AddCallback([top_tier_finished_semaphore](CompilationEvent event) { |
| if (event == CompilationEvent::kFailedCompilation || |
| event == CompilationEvent::kFinishedTopTierCompilation) { |
| top_tier_finished_semaphore->Signal(); |
| } |
| }); |
| top_tier_finished_semaphore->Wait(); |
| } |
| |
| void CompilationState::SetHighPriority() { Impl(this)->SetHighPriority(); } |
| |
| void CompilationState::InitializeAfterDeserialization() { |
| Impl(this)->InitializeCompilationProgressAfterDeserialization(); |
| } |
| |
| bool CompilationState::failed() const { return Impl(this)->failed(); } |
| |
| bool CompilationState::baseline_compilation_finished() const { |
| return Impl(this)->baseline_compilation_finished(); |
| } |
| |
| bool CompilationState::top_tier_compilation_finished() const { |
| return Impl(this)->top_tier_compilation_finished(); |
| } |
| |
| bool CompilationState::recompilation_finished() const { |
| return Impl(this)->recompilation_finished(); |
| } |
| |
| // static |
| std::unique_ptr<CompilationState> CompilationState::New( |
| const std::shared_ptr<NativeModule>& native_module, |
| std::shared_ptr<Counters> async_counters) { |
| return std::unique_ptr<CompilationState>( |
| reinterpret_cast<CompilationState*>(new CompilationStateImpl( |
| std::move(native_module), std::move(async_counters)))); |
| } |
| |
| // End of PIMPL implementation of {CompilationState}. |
| ////////////////////////////////////////////////////// |
| |
| namespace { |
| |
| ExecutionTier ApplyHintToExecutionTier(WasmCompilationHintTier hint, |
| ExecutionTier default_tier) { |
| switch (hint) { |
| case WasmCompilationHintTier::kDefault: |
| return default_tier; |
| case WasmCompilationHintTier::kBaseline: |
| return ExecutionTier::kLiftoff; |
| case WasmCompilationHintTier::kOptimized: |
| return ExecutionTier::kTurbofan; |
| } |
| UNREACHABLE(); |
| } |
| |
| const WasmCompilationHint* GetCompilationHint(const WasmModule* module, |
| uint32_t func_index) { |
| DCHECK_LE(module->num_imported_functions, func_index); |
| uint32_t hint_index = declared_function_index(module, func_index); |
| const std::vector<WasmCompilationHint>& compilation_hints = |
| module->compilation_hints; |
| if (hint_index < compilation_hints.size()) { |
| return &compilation_hints[hint_index]; |
| } |
| return nullptr; |
| } |
| |
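| // Determine how a function should be compiled: the whole module being lazy |
| // takes precedence, then per-function compilation hints (if enabled). |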
| CompileStrategy GetCompileStrategy(const WasmModule* module, |
| const WasmFeatures& enabled_features, |
| uint32_t func_index, bool lazy_module) { |
| if (lazy_module) return CompileStrategy::kLazy; |
| if (!enabled_features.has_compilation_hints()) { |
| return CompileStrategy::kDefault; |
| } |
| auto* hint = GetCompilationHint(module, func_index); |
| if (hint == nullptr) return CompileStrategy::kDefault; |
| switch (hint->strategy) { |
| case WasmCompilationHintStrategy::kLazy: |
| return CompileStrategy::kLazy; |
| case WasmCompilationHintStrategy::kEager: |
| return CompileStrategy::kEager; |
| case WasmCompilationHintStrategy::kLazyBaselineEagerTopTier: |
| return CompileStrategy::kLazyBaselineEagerTopTier; |
| case WasmCompilationHintStrategy::kDefault: |
| return CompileStrategy::kDefault; |
| } |
| } |
| |
| struct ExecutionTierPair { |
| ExecutionTier baseline_tier; |
| ExecutionTier top_tier; |
| }; |
| |
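| // Determine the baseline and top tier requested for a function, taking the |
| // compile mode and (if enabled) per-function compilation hints into account. |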
| ExecutionTierPair GetRequestedExecutionTiers( |
| const WasmModule* module, CompileMode compile_mode, |
| const WasmFeatures& enabled_features, uint32_t func_index) { |
| ExecutionTierPair result; |
| |
| result.baseline_tier = WasmCompilationUnit::GetBaselineExecutionTier(module); |
| switch (compile_mode) { |
| case CompileMode::kRegular: |
| result.top_tier = result.baseline_tier; |
| return result; |
| |
| case CompileMode::kTiering: |
| |
| // Default tiering behaviour. |
| result.top_tier = ExecutionTier::kTurbofan; |
| |
| // Check if compilation hints override default tiering behaviour. |
| if (enabled_features.has_compilation_hints()) { |
| const WasmCompilationHint* hint = |
| GetCompilationHint(module, func_index); |
| if (hint != nullptr) { |
| result.baseline_tier = ApplyHintToExecutionTier(hint->baseline_tier, |
| result.baseline_tier); |
| result.top_tier = |
| ApplyHintToExecutionTier(hint->top_tier, result.top_tier); |
| } |
| } |
| |
| // Correct top tier if necessary. |
| static_assert(ExecutionTier::kLiftoff < ExecutionTier::kTurbofan, |
| "Assume an order on execution tiers"); |
| if (result.baseline_tier > result.top_tier) { |
| result.top_tier = result.baseline_tier; |
| } |
| return result; |
| } |
| UNREACHABLE(); |
| } |
| |
| // The {CompilationUnitBuilder} builds compilation units and stores them in an |
| // internal buffer. The buffer is moved into the working queue of the |
| // {CompilationStateImpl} when {Commit} is called. |
| class CompilationUnitBuilder { |
| public: |
| explicit CompilationUnitBuilder(NativeModule* native_module) |
| : native_module_(native_module) {} |
| |
| void AddUnits(uint32_t func_index) { |
| if (func_index < native_module_->module()->num_imported_functions) { |
| baseline_units_.emplace_back(func_index, ExecutionTier::kNone, |
| kNoDebugging); |
| return; |
| } |
| ExecutionTierPair tiers = GetRequestedExecutionTiers( |
| native_module_->module(), compilation_state()->compile_mode(), |
| native_module_->enabled_features(), func_index); |
| // Compile everything for non-debugging initially. If needed, we will tier |
| // down when the module is fully compiled. Synchronization would be pretty |
| // difficult otherwise. |
| baseline_units_.emplace_back(func_index, tiers.baseline_tier, kNoDebugging); |
| if (tiers.baseline_tier != tiers.top_tier) { |
| tiering_units_.emplace_back(func_index, tiers.top_tier, kNoDebugging); |
| } |
| } |
| |
| void AddJSToWasmWrapperUnit( |
| std::shared_ptr<JSToWasmWrapperCompilationUnit> unit) { |
| js_to_wasm_wrapper_units_.emplace_back(std::move(unit)); |
| } |
| |
| void AddTopTierUnit(int func_index) { |
| ExecutionTierPair tiers = GetRequestedExecutionTiers( |
| native_module_->module(), compilation_state()->compile_mode(), |
| native_module_->enabled_features(), func_index); |
| // In this case, the baseline is lazily compiled, if at all. The compilation |
| // unit is added even if the baseline tier is the same. |
| #ifdef DEBUG |
| auto* module = native_module_->module(); |
| DCHECK_EQ(kWasmOrigin, module->origin); |
| const bool lazy_module = false; |
| DCHECK_EQ(CompileStrategy::kLazyBaselineEagerTopTier, |
| GetCompileStrategy(module, native_module_->enabled_features(), |
| func_index, lazy_module)); |
| #endif |
| tiering_units_.emplace_back(func_index, tiers.top_tier, kNoDebugging); |
| } |
| |
| void AddRecompilationUnit(int func_index, ExecutionTier tier) { |
| // For recompilation, just treat all units like baseline units. |
| baseline_units_.emplace_back( |
| func_index, tier, |
| tier == ExecutionTier::kLiftoff ? kForDebugging : kNoDebugging); |
| } |
| |
| bool Commit() { |
| if (baseline_units_.empty() && tiering_units_.empty() && |
| js_to_wasm_wrapper_units_.empty()) { |
| return false; |
| } |
| compilation_state()->AddCompilationUnits( |
| VectorOf(baseline_units_), VectorOf(tiering_units_), |
| VectorOf(js_to_wasm_wrapper_units_)); |
| Clear(); |
| return true; |
| } |
| |
| void Clear() { |
| baseline_units_.clear(); |
| tiering_units_.clear(); |
| js_to_wasm_wrapper_units_.clear(); |
| } |
| |
| private: |
| CompilationStateImpl* compilation_state() const { |
| return Impl(native_module_->compilation_state()); |
| } |
| |
| NativeModule* const native_module_; |
| std::vector<WasmCompilationUnit> baseline_units_; |
| std::vector<WasmCompilationUnit> tiering_units_; |
| std::vector<std::shared_ptr<JSToWasmWrapperCompilationUnit>> |
| js_to_wasm_wrapper_units_; |
| }; |
| |
| void SetCompileError(ErrorThrower* thrower, ModuleWireBytes wire_bytes, |
| const WasmFunction* func, const WasmModule* module, |
| WasmError error) { |
| WasmName name = wire_bytes.GetNameOrNull(func, module); |
| if (name.begin() == nullptr) { |
| thrower->CompileError("Compiling function #%d failed: %s @+%u", |
| func->func_index, error.message().c_str(), |
| error.offset()); |
| } else { |
| TruncatedUserString<> truncated_name(name); |
| thrower->CompileError("Compiling function #%d:\"%.*s\" failed: %s @+%u", |
| func->func_index, truncated_name.length(), |
| truncated_name.start(), error.message().c_str(), |
| error.offset()); |
| } |
| } |
| |
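| // Validate the body of a single function. Returns a failing {DecodeResult} |
| // carrying the error message and offset if the code is invalid. |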
| DecodeResult ValidateSingleFunction(const WasmModule* module, int func_index, |
| Vector<const uint8_t> code, |
| Counters* counters, |
| AccountingAllocator* allocator, |
| WasmFeatures enabled_features) { |
| const WasmFunction* func = &module->functions[func_index]; |
| FunctionBody body{func->sig, func->code.offset(), code.begin(), code.end()}; |
| |
| WasmFeatures detected; |
| return VerifyWasmCode(allocator, enabled_features, module, &detected, body); |
| } |
| |
| enum OnlyLazyFunctions : bool { |
| kAllFunctions = false, |
| kOnlyLazyFunctions = true, |
| }; |
| |
| void ValidateSequentially( |
| const WasmModule* module, NativeModule* native_module, Counters* counters, |
| AccountingAllocator* allocator, ErrorThrower* thrower, bool lazy_module, |
| OnlyLazyFunctions only_lazy_functions = kAllFunctions) { |
| DCHECK(!thrower->error()); |
| uint32_t start = module->num_imported_functions; |
| uint32_t end = start + module->num_declared_functions; |
| auto enabled_features = native_module->enabled_features(); |
| for (uint32_t func_index = start; func_index < end; func_index++) { |
| // Skip non-lazy functions if requested. |
| if (only_lazy_functions) { |
| CompileStrategy strategy = |
| GetCompileStrategy(module, enabled_features, func_index, lazy_module); |
| if (strategy != CompileStrategy::kLazy && |
| strategy != CompileStrategy::kLazyBaselineEagerTopTier) { |
| continue; |
| } |
| } |
| |
| ModuleWireBytes wire_bytes{native_module->wire_bytes()}; |
| const WasmFunction* func = &module->functions[func_index]; |
| Vector<const uint8_t> code = wire_bytes.GetFunctionBytes(func); |
| DecodeResult result = ValidateSingleFunction( |
| module, func_index, code, counters, allocator, enabled_features); |
| if (result.failed()) { |
| SetCompileError(thrower, wire_bytes, func, module, result.error()); |
| } |
| } |
| } |
| |
| bool IsLazyModule(const WasmModule* module) { |
| return FLAG_wasm_lazy_compilation || |
| (FLAG_asm_wasm_lazy_compilation && is_asmjs_module(module)); |
| } |
| |
| } // namespace |
| |
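| // Compile the function at {func_index} on its first call. Returns true on |
| // success; returns false and sets a compile error if validation of the lazily |
| // compiled function fails (only possible with --wasm-lazy-validation). |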
| bool CompileLazy(Isolate* isolate, NativeModule* native_module, |
| int func_index) { |
| const WasmModule* module = native_module->module(); |
| auto enabled_features = native_module->enabled_features(); |
| Counters* counters = isolate->counters(); |
| |
| DCHECK(!native_module->lazy_compile_frozen()); |
| NativeModuleModificationScope native_module_modification_scope(native_module); |
| |
| TRACE_LAZY("Compiling wasm-function#%d.\n", func_index); |
| |
| CompilationStateImpl* compilation_state = |
| Impl(native_module->compilation_state()); |
| ExecutionTierPair tiers = GetRequestedExecutionTiers( |
| module, compilation_state->compile_mode(), enabled_features, func_index); |
| |
| DCHECK_LE(native_module->num_imported_functions(), func_index); |
| DCHECK_LT(func_index, native_module->num_functions()); |
| WasmCompilationUnit baseline_unit{func_index, tiers.baseline_tier, |
| kNoDebugging}; |
| CompilationEnv env = native_module->CreateCompilationEnv(); |
| WasmCompilationResult result = baseline_unit.ExecuteCompilation( |
| isolate->wasm_engine(), &env, compilation_state->GetWireBytesStorage(), |
| counters, compilation_state->detected_features()); |
| |
| // During lazy compilation, we can only get compilation errors when |
| // {--wasm-lazy-validation} is enabled. Otherwise, the module was fully |
| // verified before starting its execution. |
| CHECK_IMPLIES(result.failed(), FLAG_wasm_lazy_validation); |
| const WasmFunction* func = &module->functions[func_index]; |
| if (result.failed()) { |
| ErrorThrower thrower(isolate, nullptr); |
| Vector<const uint8_t> code = |
| compilation_state->GetWireBytesStorage()->GetCode(func->code); |
| DecodeResult decode_result = ValidateSingleFunction( |
| module, func_index, code, counters, isolate->wasm_engine()->allocator(), |
| enabled_features); |
| CHECK(decode_result.failed()); |
| SetCompileError(&thrower, ModuleWireBytes(native_module->wire_bytes()), |
| func, module, decode_result.error()); |
| return false; |
| } |
| |
| WasmCodeRefScope code_ref_scope; |
| WasmCode* code = native_module->PublishCode( |
| native_module->AddCompiledCode(std::move(result))); |
| DCHECK_EQ(func_index, code->index()); |
| |
| if (WasmCode::ShouldBeLogged(isolate)) code->LogCode(isolate); |
| |
| counters->wasm_lazily_compiled_functions()->Increment(); |
| |
| const bool lazy_module = IsLazyModule(module); |
| if (GetCompileStrategy(module, enabled_features, func_index, lazy_module) == |
| CompileStrategy::kLazy && |
| tiers.baseline_tier < tiers.top_tier) { |
| WasmCompilationUnit tiering_unit{func_index, tiers.top_tier, kNoDebugging}; |
| compilation_state->AddTopTierCompilationUnit(tiering_unit); |
| } |
| |
| return true; |
| } |
| |
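| // Queue a top-tier (TurboFan) compilation unit for {func_index}, using the |
| // function's Liftoff call count as its priority. |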
| void TriggerTierUp(Isolate* isolate, NativeModule* native_module, |
| int func_index) { |
| CompilationStateImpl* compilation_state = |
| Impl(native_module->compilation_state()); |
| WasmCompilationUnit tiering_unit{func_index, ExecutionTier::kTurbofan, |
| kNoDebugging}; |
| |
| uint32_t* call_array = native_module->num_liftoff_function_calls_array(); |
| int offset = |
| wasm::declared_function_index(native_module->module(), func_index); |
| |
| size_t priority = |
| base::Relaxed_Load(reinterpret_cast<int*>(&call_array[offset])); |
| compilation_state->AddTopTierPriorityCompilationUnit(tiering_unit, priority); |
| } |
| |
| namespace { |
| |
| void RecordStats(const Code code, Counters* counters) { |
| counters->wasm_generated_code_size()->Increment(code.raw_body_size()); |
| counters->wasm_reloc_size()->Increment(code.relocation_info().length()); |
| } |
| |
| enum CompilationExecutionResult : int8_t { kNoMoreUnits, kYield }; |
| |
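| // Run JS-to-Wasm wrapper compilation units until either no units are left or |
| // the job delegate asks us to yield. |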
| CompilationExecutionResult ExecuteJSToWasmWrapperCompilationUnits( |
| std::weak_ptr<NativeModule> native_module, JobDelegate* delegate) { |
| std::shared_ptr<JSToWasmWrapperCompilationUnit> wrapper_unit = nullptr; |
| int num_processed_wrappers = 0; |
| |
| { |
| BackgroundCompileScope compile_scope(native_module); |
| if (compile_scope.cancelled()) return kNoMoreUnits; |
| wrapper_unit = compile_scope.compilation_state() |
| ->GetNextJSToWasmWrapperCompilationUnit(); |
| if (!wrapper_unit) return kNoMoreUnits; |
| } |
| |
| TRACE_EVENT0("v8.wasm", "wasm.JSToWasmWrapperCompilation"); |
| while (true) { |
| wrapper_unit->Execute(); |
| ++num_processed_wrappers; |
| bool yield = delegate && delegate->ShouldYield(); |
| BackgroundCompileScope compile_scope(native_module); |
| if (compile_scope.cancelled()) return kNoMoreUnits; |
| if (yield || |
| !(wrapper_unit = compile_scope.compilation_state() |
| ->GetNextJSToWasmWrapperCompilationUnit())) { |
| compile_scope.compilation_state()->OnFinishedJSToWasmWrapperUnits( |
| num_processed_wrappers); |
| return yield ? kYield : kNoMoreUnits; |
| } |
| } |
| } |
| |
| namespace { |
| const char* GetCompilationEventName(const WasmCompilationUnit& unit, |
| const CompilationEnv& env) { |
| ExecutionTier tier = unit.tier(); |
| if (tier == ExecutionTier::kLiftoff) { |
| return "wasm.BaselineCompilation"; |
| } |
| if (tier == ExecutionTier::kTurbofan) { |
| return "wasm.TopTierCompilation"; |
| } |
| if (unit.func_index() < |
| static_cast<int>(env.module->num_imported_functions)) { |
| return "wasm.WasmToJSWrapperCompilation"; |
| } |
| return "wasm.OtherCompilation"; |
| } |
| } // namespace |
| |
| // Run by the {BackgroundCompileJob} (on any thread). |
| CompilationExecutionResult ExecuteCompilationUnits( |
| std::weak_ptr<NativeModule> native_module, Counters* counters, |
| JobDelegate* delegate, CompileBaselineOnly baseline_only) { |
| TRACE_EVENT0("v8.wasm", "wasm.ExecuteCompilationUnits"); |
| |
| // Execute JS to Wasm wrapper units first, so that they are ready to be |
| // finalized by the main thread when the kFinishedBaselineCompilation event is |
| // triggered. |
| if (ExecuteJSToWasmWrapperCompilationUnits(native_module, delegate) == |
| kYield) { |
| return kYield; |
| } |
| |
| // These fields are initialized in a {BackgroundCompileScope} before |
| // starting compilation. |
| base::Optional<CompilationEnv> env; |
| std::shared_ptr<WireBytesStorage> wire_bytes; |
| std::shared_ptr<const WasmModule> module; |
| WasmEngine* wasm_engine; |
| // Task 0 is any main thread (there might be multiple from multiple isolates), |
| // worker threads start at 1 (thus the "+ 1"). |
| int task_id = delegate ? (int{delegate->GetTaskId()} + 1) : 0; |
| DCHECK_LE(0, task_id); |
| CompilationUnitQueues::Queue* queue; |
| base::Optional<WasmCompilationUnit> unit; |
| |
| WasmFeatures detected_features = WasmFeatures::None(); |
| |
| // Preparation (synchronized): Initialize the fields above and get the first |
| // compilation unit. |
| { |
| BackgroundCompileScope compile_scope(native_module); |
| if (compile_scope.cancelled()) return kNoMoreUnits; |
| auto* compilation_state = compile_scope.compilation_state(); |
| env.emplace(compile_scope.native_module()->CreateCompilationEnv()); |
| wire_bytes = compilation_state->GetWireBytesStorage(); |
| module = compile_scope.native_module()->shared_module(); |
| wasm_engine = compile_scope.native_module()->engine(); |
| queue = compilation_state->GetQueueForCompileTask(task_id); |
| unit = compilation_state->GetNextCompilationUnit(queue, baseline_only); |
| if (!unit) return kNoMoreUnits; |
| } |
| TRACE_COMPILE("ExecuteCompilationUnits (task id %d)\n", task_id); |
| |
| std::vector<WasmCompilationResult> results_to_publish; |
| while (true) { |
| ExecutionTier current_tier = unit->tier(); |
| const char* event_name = GetCompilationEventName(unit.value(), env.value()); |
| TRACE_EVENT0("v8.wasm", event_name); |
| while (unit->tier() == current_tier) { |
| // (asynchronous): Execute the compilation. |
| WasmCompilationResult result = unit->ExecuteCompilation( |
| wasm_engine, &env.value(), wire_bytes, counters, &detected_features); |
| results_to_publish.emplace_back(std::move(result)); |
| |
| bool yield = delegate && delegate->ShouldYield(); |
| |
| // (synchronized): Publish the compilation result and get the next unit. |
| BackgroundCompileScope compile_scope(native_module); |
| if (compile_scope.cancelled()) return kNoMoreUnits; |
| |
| if (!results_to_publish.back().succeeded()) { |
| compile_scope.compilation_state()->SetError(); |
| return kNoMoreUnits; |
| } |
| |
| // Yield or get next unit. |
| if (yield || |
| !(unit = compile_scope.compilation_state()->GetNextCompilationUnit( |
| queue, baseline_only))) { |
| std::vector<std::unique_ptr<WasmCode>> unpublished_code = |
| compile_scope.native_module()->AddCompiledCode( |
| VectorOf(std::move(results_to_publish))); |
| results_to_publish.clear(); |
| compile_scope.compilation_state()->SchedulePublishCompilationResults( |
| std::move(unpublished_code)); |
| compile_scope.compilation_state()->OnCompilationStopped( |
| detected_features); |
| return yield ? kYield : kNoMoreUnits; |
| } |
| |
| // Before executing a TurboFan unit, ensure to publish all previous |
| // units. If we compiled Liftoff before, we need to publish them anyway |
| // to ensure fast completion of baseline compilation, if we compiled |
| // TurboFan before, we publish to reduce peak memory consumption. |
| // Also publish after finishing a certain amount of units, to avoid |
| // contention when all threads publish at the end. |
| if (unit->tier() == ExecutionTier::kTurbofan || |
| queue->ShouldPublish(static_cast<int>(results_to_publish.size()))) { |
| std::vector<std::unique_ptr<WasmCode>> unpublished_code = |
| compile_scope.native_module()->AddCompiledCode( |
| VectorOf(std::move(results_to_publish))); |
| results_to_publish.clear(); |
| compile_scope.compilation_state()->SchedulePublishCompilationResults( |
| std::move(unpublished_code)); |
| } |
| } |
| } |
| UNREACHABLE(); |
| } |
| |
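| // Deduplication key for export wrappers: the {imported} flag of the exported |
| // function plus its signature. |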
| using JSToWasmWrapperKey = std::pair<bool, FunctionSig>; |
| |
| // Returns the number of units added. |
| int AddExportWrapperUnits(Isolate* isolate, WasmEngine* wasm_engine, |
| NativeModule* native_module, |
| CompilationUnitBuilder* builder, |
| const WasmFeatures& enabled_features) { |
| std::unordered_set<JSToWasmWrapperKey, base::hash<JSToWasmWrapperKey>> keys; |
| for (auto exp : native_module->module()->export_table) { |
| if (exp.kind != kExternalFunction) continue; |
| auto& function = native_module->module()->functions[exp.index]; |
| JSToWasmWrapperKey key(function.imported, *function.sig); |
| if (keys.insert(key).second) { |
| auto unit = std::make_shared<JSToWasmWrapperCompilationUnit>( |
| isolate, wasm_engine, function.sig, native_module->module(), |
| function.imported, enabled_features, |
| JSToWasmWrapperCompilationUnit::kAllowGeneric); |
| builder->AddJSToWasmWrapperUnit(std::move(unit)); |
| } |
| } |
| |
| return static_cast<int>(keys.size()); |
| } |
| |
| // Returns the number of units added. |
| int AddImportWrapperUnits(NativeModule* native_module, |
| CompilationUnitBuilder* builder) { |
| std::unordered_set<WasmImportWrapperCache::CacheKey, |
| WasmImportWrapperCache::CacheKeyHash> |
| keys; |
| int num_imported_functions = native_module->num_imported_functions(); |
| for (int func_index = 0; func_index < num_imported_functions; func_index++) { |
| const FunctionSig* sig = native_module->module()->functions[func_index].sig; |
| if (!IsJSCompatibleSignature(sig, native_module->module(), |
| native_module->enabled_features())) { |
| continue; |
| } |
| WasmImportWrapperCache::CacheKey key( |
| compiler::kDefaultImportCallKind, sig, |
| static_cast<int>(sig->parameter_count())); |
| auto it = keys.insert(key); |
| if (it.second) { |
| // Ensure that all keys exist in the cache, so that we can populate the |
| // cache later without locking. |
| (*native_module->import_wrapper_cache())[key] = nullptr; |
| builder->AddUnits(func_index); |
| } |
| } |
| return static_cast<int>(keys.size()); |
| } |
| |
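| // Set up the compilation progress and add all initial compilation units |
| // (functions, import wrappers, export wrappers), then commit them to kick off |
| // background compilation. |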
| void InitializeCompilationUnits(Isolate* isolate, NativeModule* native_module) { |
| CompilationStateImpl* compilation_state = |
| Impl(native_module->compilation_state()); |
| const bool lazy_module = IsLazyModule(native_module->module()); |
| ModuleWireBytes wire_bytes(native_module->wire_bytes()); |
| CompilationUnitBuilder builder(native_module); |
| auto* module = native_module->module(); |
| const bool prefer_liftoff = native_module->IsTieredDown(); |
| |
| uint32_t start = module->num_imported_functions; |
| uint32_t end = start + module->num_declared_functions; |
| for (uint32_t func_index = start; func_index < end; func_index++) { |
| if (prefer_liftoff) { |
| builder.AddRecompilationUnit(func_index, ExecutionTier::kLiftoff); |
| continue; |
| } |
| CompileStrategy strategy = GetCompileStrategy( |
| module, native_module->enabled_features(), func_index, lazy_module); |
| if (strategy == CompileStrategy::kLazy) { |
| native_module->UseLazyStub(func_index); |
| } else if (strategy == CompileStrategy::kLazyBaselineEagerTopTier) { |
| builder.AddTopTierUnit(func_index); |
| native_module->UseLazyStub(func_index); |
| } else { |
| DCHECK_EQ(strategy, CompileStrategy::kEager); |
| builder.AddUnits(func_index); |
| } |
| } |
| int num_import_wrappers = AddImportWrapperUnits(native_module, &builder); |
| int num_export_wrappers = |
| AddExportWrapperUnits(isolate, isolate->wasm_engine(), native_module, |
| &builder, WasmFeatures::FromIsolate(isolate)); |
| compilation_state->InitializeCompilationProgress( |
| lazy_module, num_import_wrappers, num_export_wrappers); |
| builder.Commit(); |
| } |
| |
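| // Returns whether the module may contain lazily compiled functions, i.e. if |
| // the whole module is compiled lazily or compilation hints can request lazy |
| // compilation for individual functions. |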
| bool MayCompriseLazyFunctions(const WasmModule* module, |
| const WasmFeatures& enabled_features, |
| bool lazy_module) { |
| if (lazy_module || enabled_features.has_compilation_hints()) return true; |
| #ifdef ENABLE_SLOW_DCHECKS |
| int start = module->num_imported_functions; |
| int end = start + module->num_declared_functions; |
| for (int func_index = start; func_index < end; func_index++) { |
| SLOW_DCHECK(GetCompileStrategy(module, enabled_features, func_index, |
| lazy_module) != CompileStrategy::kLazy); |
| } |
| #endif |
| return false; |
| } |
| |
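| // Callback that records compilation-time histograms and metrics events on |
| // finished baseline compilation, finished tier-up, and failed compilation. |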
| class CompilationTimeCallback { |
| public: |
| enum CompileMode { kSynchronous, kAsync, kStreaming }; |
| explicit CompilationTimeCallback( |
| std::shared_ptr<Counters> async_counters, |
| std::shared_ptr<metrics::Recorder> metrics_recorder, |
| v8::metrics::Recorder::ContextId context_id, |
| std::weak_ptr<NativeModule> native_module, CompileMode compile_mode) |
| : start_time_(base::TimeTicks::Now()), |
| async_counters_(std::move(async_counters)), |
| metrics_recorder_(std::move(metrics_recorder)), |
| context_id_(context_id), |
| native_module_(std::move(native_module)), |
| compile_mode_(compile_mode) {} |
| |
| void operator()(CompilationEvent event) { |
| DCHECK(base::TimeTicks::IsHighResolution()); |
| std::shared_ptr<NativeModule> native_module = native_module_.lock(); |
| if (!native_module) return; |
| auto now = base::TimeTicks::Now(); |
| auto duration = now - start_time_; |
| if (event == CompilationEvent::kFinishedBaselineCompilation) { |
| // Reset {start_time_} to measure tier-up time. |
| start_time_ = now; |
| if (compile_mode_ != kSynchronous) { |
| TimedHistogram* histogram = |
| compile_mode_ == kAsync |
| ? async_counters_->wasm_async_compile_wasm_module_time() |
| : async_counters_->wasm_streaming_compile_wasm_module_time(); |
| histogram->AddSample(static_cast<int>(duration.InMicroseconds())); |
| } |
| |
| // TODO(sartang@microsoft.com): Remove wall_clock_time_in_us field |
| v8::metrics::WasmModuleCompiled event{ |
| (compile_mode_ != kSynchronous), // async |
| (compile_mode_ == kStreaming), // streamed |
| false, // cached |
| false, // deserialized |
| FLAG_wasm_lazy_compilation, // lazy |
| true, // success |
| native_module->liftoff_code_size(), // code_size_in_bytes |
| native_module->liftoff_bailout_count(), // liftoff_bailout_count |
| duration.InMicroseconds(), // wall_clock_time_in_us |
| duration.InMicroseconds() // wall_clock_duration_in_us |
| }; |
| metrics_recorder_->DelayMainThreadEvent(event, context_id_); |
| } |
| if (event == CompilationEvent::kFinishedTopTierCompilation) { |
| TimedHistogram* histogram = async_counters_->wasm_tier_up_module_time(); |
| histogram->AddSample(static_cast<int>(duration.InMicroseconds())); |
| |
| v8::metrics::WasmModuleTieredUp event{ |
| FLAG_wasm_lazy_compilation, // lazy |
| native_module->turbofan_code_size(), // code_size_in_bytes |
| duration.InMicroseconds(), // wall_clock_time_in_us |
| duration.InMicroseconds() // wall_clock_duration_in_us |
| }; |
| metrics_recorder_->DelayMainThreadEvent(event, context_id_); |
| } |
| if (event == CompilationEvent::kFailedCompilation) { |
| v8::metrics::WasmModuleCompiled event{ |
| (compile_mode_ != kSynchronous), // async |
| (compile_mode_ == kStreaming), // streamed |
| false, // cached |
| false, // deserialized |
| FLAG_wasm_lazy_compilation, // lazy |
| false, // success |
| native_module->liftoff_code_size(), // code_size_in_bytes |
| native_module->liftoff_bailout_count(), // liftoff_bailout_count |
| duration.InMicroseconds(), // wall_clock_time_in_us |
| duration.InMicroseconds() // wall_clock_duration_in_us |
| }; |
| metrics_recorder_->DelayMainThreadEvent(event, context_id_); |
| } |
| } |
| |
| private: |
| base::TimeTicks start_time_; |
| const std::shared_ptr<Counters> async_counters_; |
| std::shared_ptr<metrics::Recorder> metrics_recorder_; |
| v8::metrics::Recorder::ContextId context_id_; |
| std::weak_ptr<NativeModule> native_module_; |
| const CompileMode compile_mode_; |
| }; |
| |
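| // Compiles the given native module synchronously: validates lazily-compiled |
| // functions up front if needed, initializes the compilation units, and then |
| // blocks until export wrappers and baseline compilation have finished. |
| // Errors are reported through {thrower}. |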
| void CompileNativeModule(Isolate* isolate, |
| v8::metrics::Recorder::ContextId context_id, |
| ErrorThrower* thrower, const WasmModule* wasm_module, |
| std::shared_ptr<NativeModule> native_module, |
| Handle<FixedArray>* export_wrappers_out) { |
| CHECK(!FLAG_jitless); |
| ModuleWireBytes wire_bytes(native_module->wire_bytes()); |
| const bool lazy_module = IsLazyModule(wasm_module); |
| if (!FLAG_wasm_lazy_validation && wasm_module->origin == kWasmOrigin && |
| MayCompriseLazyFunctions(wasm_module, native_module->enabled_features(), |
| lazy_module)) { |
|     // Validate lazily-compiled functions up front, unless lazy validation is |
|     // requested. Never validate asm.js modules, as these are valid by |
|     // construction (additionally, a CHECK will catch any violation during |
|     // lazy compilation). |
| ValidateSequentially(wasm_module, native_module.get(), isolate->counters(), |
| isolate->allocator(), thrower, lazy_module, |
| kOnlyLazyFunctions); |
| // On error: Return and leave the module in an unexecutable state. |
| if (thrower->error()) return; |
| } |
| |
| DCHECK_GE(kMaxInt, native_module->module()->num_declared_functions); |
| |
|   // If high-resolution timing is available, install a callback that records |
|   // compilation-time metrics for this module. |
| auto* compilation_state = Impl(native_module->compilation_state()); |
| if (base::TimeTicks::IsHighResolution()) { |
| compilation_state->AddCallback(CompilationTimeCallback{ |
| isolate->async_counters(), isolate->metrics_recorder(), context_id, |
| native_module, CompilationTimeCallback::kSynchronous}); |
| } |
| |
| // Initialize the compilation units and kick off background compile tasks. |
| InitializeCompilationUnits(isolate, native_module.get()); |
| |
| compilation_state->WaitForCompilationEvent( |
| CompilationEvent::kFinishedExportWrappers); |
| |
| if (compilation_state->failed()) { |
| DCHECK_IMPLIES(lazy_module, !FLAG_wasm_lazy_validation); |
| ValidateSequentially(wasm_module, native_module.get(), isolate->counters(), |
| isolate->allocator(), thrower, lazy_module); |
| CHECK(thrower->error()); |
| return; |
| } |
| |
| if (!FLAG_predictable) { |
|     // In predictable mode, finalizing the wrappers is deferred until after |
|     // baseline compilation (see below), so that validation errors are caught |
|     // first. |
| compilation_state->FinalizeJSToWasmWrappers( |
| isolate, native_module->module(), export_wrappers_out); |
| } |
| |
| compilation_state->WaitForCompilationEvent( |
| CompilationEvent::kFinishedBaselineCompilation); |
| |
| compilation_state->PublishDetectedFeatures(isolate); |
| |
| if (compilation_state->failed()) { |
| DCHECK_IMPLIES(lazy_module, !FLAG_wasm_lazy_validation); |
| ValidateSequentially(wasm_module, native_module.get(), isolate->counters(), |
| isolate->allocator(), thrower, lazy_module); |
| CHECK(thrower->error()); |
| } else if (FLAG_predictable) { |
| compilation_state->FinalizeJSToWasmWrappers( |
| isolate, native_module->module(), export_wrappers_out); |
| } |
| } |
| |
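| // Background job which runs {ExecuteCompilationUnits} on worker threads. |
| // {GetMaxConcurrency} bounds the number of workers by the |
| // --wasm-num-compilation-tasks flag and the number of outstanding |
| // compilation units. |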
| class BackgroundCompileJob final : public JobTask { |
| public: |
| explicit BackgroundCompileJob(std::weak_ptr<NativeModule> native_module, |
| std::shared_ptr<Counters> async_counters) |
| : native_module_(std::move(native_module)), |
| async_counters_(std::move(async_counters)) {} |
| |
| void Run(JobDelegate* delegate) override { |
| ExecuteCompilationUnits(native_module_, async_counters_.get(), delegate, |
| kBaselineOrTopTier); |
| } |
| |
| size_t GetMaxConcurrency(size_t worker_count) const override { |
| BackgroundCompileScope scope(native_module_); |
| if (scope.cancelled()) return 0; |
| // NumOutstandingCompilations() does not reflect the units that running |
| // workers are processing, thus add the current worker count to that number. |
| size_t flag_limit = |
| static_cast<size_t>(std::max(1, FLAG_wasm_num_compilation_tasks)); |
| return std::min( |
| flag_limit, |
| worker_count + scope.compilation_state()->NumOutstandingCompilations()); |
| } |
| |
| private: |
| const std::weak_ptr<NativeModule> native_module_; |
| const std::shared_ptr<Counters> async_counters_; |
| }; |
| |
| } // namespace |
| |
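| // Compiles a new module, or returns a matching {NativeModule} from the |
| // engine's module cache. In both cases the JS-to-wasm export wrappers are |
| // made available via {export_wrappers_out}. |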
| std::shared_ptr<NativeModule> CompileToNativeModule( |
| Isolate* isolate, const WasmFeatures& enabled, ErrorThrower* thrower, |
| std::shared_ptr<const WasmModule> module, const ModuleWireBytes& wire_bytes, |
| Handle<FixedArray>* export_wrappers_out) { |
| const WasmModule* wasm_module = module.get(); |
| OwnedVector<uint8_t> wire_bytes_copy = |
| OwnedVector<uint8_t>::Of(wire_bytes.module_bytes()); |
| // Prefer {wire_bytes_copy} to {wire_bytes.module_bytes()} for the temporary |
| // cache key. When we eventually install the module in the cache, the wire |
| // bytes of the temporary key and the new key have the same base pointer and |
| // we can skip the full bytes comparison. |
| std::shared_ptr<NativeModule> native_module = |
| isolate->wasm_engine()->MaybeGetNativeModule( |
| wasm_module->origin, wire_bytes_copy.as_vector(), isolate); |
| if (native_module) { |
| // TODO(thibaudm): Look into sharing export wrappers. |
| CompileJsToWasmWrappers(isolate, wasm_module, export_wrappers_out); |
| return native_module; |
| } |
| |
| TimedHistogramScope wasm_compile_module_time_scope(SELECT_WASM_COUNTER( |
| isolate->counters(), wasm_module->origin, wasm_compile, module_time)); |
| |
| // Embedder usage count for declared shared memories. |
| if (wasm_module->has_shared_memory) { |
| isolate->CountUsage(v8::Isolate::UseCounterFeature::kWasmSharedMemory); |
| } |
| |
| // Create a new {NativeModule} first. |
| const bool uses_liftoff = module->origin == kWasmOrigin && FLAG_liftoff; |
| size_t code_size_estimate = |
| wasm::WasmCodeManager::EstimateNativeModuleCodeSize(module.get(), |
| uses_liftoff); |
| native_module = isolate->wasm_engine()->NewNativeModule( |
| isolate, enabled, module, code_size_estimate); |
| native_module->SetWireBytes(std::move(wire_bytes_copy)); |
| // Sync compilation is user blocking, so we increase the priority. |
| native_module->compilation_state()->SetHighPriority(); |
| |
| v8::metrics::Recorder::ContextId context_id = |
| isolate->GetOrRegisterRecorderContextId(isolate->native_context()); |
| CompileNativeModule(isolate, context_id, thrower, wasm_module, native_module, |
| export_wrappers_out); |
| bool cache_hit = !isolate->wasm_engine()->UpdateNativeModuleCache( |
| thrower->error(), &native_module, isolate); |
| if (thrower->error()) return {}; |
| |
| if (cache_hit) { |
| CompileJsToWasmWrappers(isolate, wasm_module, export_wrappers_out); |
| return native_module; |
| } |
| |
| // Ensure that the code objects are logged before returning. |
| isolate->wasm_engine()->LogOutstandingCodesForIsolate(isolate); |
| |
| return native_module; |
| } |
| |
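| // Recompiles a module to the given tiering state and blocks (on a semaphore) |
| // until background recompilation has finished. |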
| void RecompileNativeModule(NativeModule* native_module, |
| TieringState tiering_state) { |
|   // Install a callback to notify us once background recompilation finishes. |
| auto recompilation_finished_semaphore = std::make_shared<base::Semaphore>(0); |
| auto* compilation_state = Impl(native_module->compilation_state()); |
| |
| // The callback captures a shared ptr to the semaphore. |
|   // Initialize the recompilation units and kick off background compile tasks. |
| compilation_state->InitializeRecompilation( |
| tiering_state, |
| [recompilation_finished_semaphore](CompilationEvent event) { |
| if (event == CompilationEvent::kFinishedRecompilation) { |
| recompilation_finished_semaphore->Signal(); |
| } |
| }); |
| |
| // Now wait until all compilation units finished. |
| // TODO(clemensb): Contribute to compilation while waiting. |
| recompilation_finished_semaphore->Wait(); |
| DCHECK(!compilation_state->failed()); |
| } |
| |
| AsyncCompileJob::AsyncCompileJob( |
| Isolate* isolate, const WasmFeatures& enabled, |
| std::unique_ptr<byte[]> bytes_copy, size_t length, Handle<Context> context, |
| Handle<Context> incumbent_context, const char* api_method_name, |
| std::shared_ptr<CompilationResultResolver> resolver) |
| : isolate_(isolate), |
| api_method_name_(api_method_name), |
| enabled_features_(enabled), |
| wasm_lazy_compilation_(FLAG_wasm_lazy_compilation), |
| start_time_(base::TimeTicks::Now()), |
| bytes_copy_(std::move(bytes_copy)), |
| wire_bytes_(bytes_copy_.get(), bytes_copy_.get() + length), |
| resolver_(std::move(resolver)) { |
| TRACE_EVENT0(TRACE_DISABLED_BY_DEFAULT("v8.wasm.detailed"), |
| "wasm.AsyncCompileJob"); |
| CHECK(FLAG_wasm_async_compilation); |
| CHECK(!FLAG_jitless); |
| v8::Isolate* v8_isolate = reinterpret_cast<v8::Isolate*>(isolate); |
| v8::Platform* platform = V8::GetCurrentPlatform(); |
| foreground_task_runner_ = platform->GetForegroundTaskRunner(v8_isolate); |
| native_context_ = |
| isolate->global_handles()->Create(context->native_context()); |
| incumbent_context_ = isolate->global_handles()->Create(*incumbent_context); |
| DCHECK(native_context_->IsNativeContext()); |
| context_id_ = isolate->GetOrRegisterRecorderContextId(native_context_); |
| metrics_event_.async = true; |
| } |
| |
| void AsyncCompileJob::Start() { |
| DoAsync<DecodeModule>(isolate_->counters(), |
| isolate_->metrics_recorder()); // -- |
| } |
| |
| void AsyncCompileJob::Abort() { |
| // Removing this job will trigger the destructor, which will cancel all |
| // compilation. |
| isolate_->wasm_engine()->RemoveCompileJob(this); |
| } |
| |
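| // Streaming processor which feeds incoming wire bytes into the module |
| // decoder section by section, validates or schedules function bodies as they |
| // arrive, and notifies the owning {AsyncCompileJob} when the stream |
| // finishes, fails, or is aborted. |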
| class AsyncStreamingProcessor final : public StreamingProcessor { |
| public: |
| explicit AsyncStreamingProcessor(AsyncCompileJob* job, |
| std::shared_ptr<Counters> counters, |
| AccountingAllocator* allocator); |
| |
| ~AsyncStreamingProcessor() override; |
| |
| bool ProcessModuleHeader(Vector<const uint8_t> bytes, |
| uint32_t offset) override; |
| |
| bool ProcessSection(SectionCode section_code, Vector<const uint8_t> bytes, |
| uint32_t offset) override; |
| |
| bool ProcessCodeSectionHeader(int num_functions, uint32_t offset, |
| std::shared_ptr<WireBytesStorage>, |
| int code_section_length) override; |
| |
| bool ProcessFunctionBody(Vector<const uint8_t> bytes, |
| uint32_t offset) override; |
| |
| void OnFinishedChunk() override; |
| |
| void OnFinishedStream(OwnedVector<uint8_t> bytes) override; |
| |
| void OnError(const WasmError&) override; |
| |
| void OnAbort() override; |
| |
| bool Deserialize(Vector<const uint8_t> wire_bytes, |
| Vector<const uint8_t> module_bytes) override; |
| |
| private: |
| // Finishes the AsyncCompileJob with an error. |
| void FinishAsyncCompileJobWithError(const WasmError&); |
| |
| void CommitCompilationUnits(); |
| |
| ModuleDecoder decoder_; |
| AsyncCompileJob* job_; |
| WasmEngine* wasm_engine_; |
| std::unique_ptr<CompilationUnitBuilder> compilation_unit_builder_; |
| int num_functions_ = 0; |
| bool prefix_cache_hit_ = false; |
| bool before_code_section_ = true; |
| std::shared_ptr<Counters> async_counters_; |
| AccountingAllocator* allocator_; |
| |
| // Running hash of the wire bytes up to code section size, but excluding the |
| // code section itself. Used by the {NativeModuleCache} to detect potential |
| // duplicate modules. |
| size_t prefix_hash_; |
| }; |
| |
| std::shared_ptr<StreamingDecoder> AsyncCompileJob::CreateStreamingDecoder() { |
| DCHECK_NULL(stream_); |
| stream_ = StreamingDecoder::CreateAsyncStreamingDecoder( |
| std::make_unique<AsyncStreamingProcessor>( |
| this, isolate_->async_counters(), isolate_->allocator())); |
| return stream_; |
| } |
| |
| AsyncCompileJob::~AsyncCompileJob() { |
| // Note: This destructor always runs on the foreground thread of the isolate. |
| background_task_manager_.CancelAndWait(); |
| // If the runtime objects were not created yet, then initial compilation did |
| // not finish yet. In this case we can abort compilation. |
| if (native_module_ && module_object_.is_null()) { |
| Impl(native_module_->compilation_state())->CancelCompilation(); |
| } |
| // Tell the streaming decoder that the AsyncCompileJob is not available |
| // anymore. |
| // TODO(ahaas): Is this notification really necessary? Check |
| // https://crbug.com/888170. |
| if (stream_) stream_->NotifyCompilationEnded(); |
| CancelPendingForegroundTask(); |
| isolate_->global_handles()->Destroy(native_context_.location()); |
| isolate_->global_handles()->Destroy(incumbent_context_.location()); |
| if (!module_object_.is_null()) { |
| isolate_->global_handles()->Destroy(module_object_.location()); |
| } |
| } |
| |
| void AsyncCompileJob::CreateNativeModule( |
| std::shared_ptr<const WasmModule> module, size_t code_size_estimate) { |
| #if !defined(DISABLE_WASM_COMPILER_ISSUE_STARBOARD) |
| // Embedder usage count for declared shared memories. |
| if (module->has_shared_memory) { |
| isolate_->CountUsage(v8::Isolate::UseCounterFeature::kWasmSharedMemory); |
| } |
| |
|   // TODO(wasm): Improve efficiency of storing module wire bytes. Only store |
|   // relevant sections, not function bodies. |
| |
| // Create the module object and populate with compiled functions and |
| // information needed at instantiation time. |
| |
| native_module_ = isolate_->wasm_engine()->NewNativeModule( |
| isolate_, enabled_features_, std::move(module), code_size_estimate); |
| native_module_->SetWireBytes({std::move(bytes_copy_), wire_bytes_.length()}); |
| #endif |
| } |
| |
| bool AsyncCompileJob::GetOrCreateNativeModule( |
| std::shared_ptr<const WasmModule> module, size_t code_size_estimate) { |
| native_module_ = isolate_->wasm_engine()->MaybeGetNativeModule( |
| module->origin, wire_bytes_.module_bytes(), isolate_); |
| if (native_module_ == nullptr) { |
| CreateNativeModule(std::move(module), code_size_estimate); |
| return false; |
| } |
| return true; |
| } |
| |
| void AsyncCompileJob::PrepareRuntimeObjects() { |
| // Create heap objects for script and module bytes to be stored in the |
| // module object. Asm.js is not compiled asynchronously. |
| DCHECK(module_object_.is_null()); |
| auto source_url = stream_ ? stream_->url() : Vector<const char>(); |
| auto script = isolate_->wasm_engine()->GetOrCreateScript( |
| isolate_, native_module_, source_url); |
| Handle<WasmModuleObject> module_object = |
| WasmModuleObject::New(isolate_, native_module_, script); |
| |
| module_object_ = isolate_->global_handles()->Create(*module_object); |
| } |
| |
| // This function assumes that it is executed in a HandleScope, and that a |
| // context is set on the isolate. |
| void AsyncCompileJob::FinishCompile(bool is_after_cache_hit) { |
| TRACE_EVENT0(TRACE_DISABLED_BY_DEFAULT("v8.wasm.detailed"), |
| "wasm.FinishAsyncCompile"); |
| bool is_after_deserialization = !module_object_.is_null(); |
| auto compilation_state = Impl(native_module_->compilation_state()); |
| if (!is_after_deserialization) { |
| if (stream_) { |
| stream_->NotifyNativeModuleCreated(native_module_); |
| } |
| PrepareRuntimeObjects(); |
| } |
| |
| // Measure duration of baseline compilation or deserialization from cache. |
| if (base::TimeTicks::IsHighResolution()) { |
| base::TimeDelta duration = base::TimeTicks::Now() - start_time_; |
| int duration_usecs = static_cast<int>(duration.InMicroseconds()); |
| isolate_->counters()->wasm_streaming_finish_wasm_module_time()->AddSample( |
| duration_usecs); |
| |
| if (is_after_cache_hit || is_after_deserialization) { |
| v8::metrics::WasmModuleCompiled event{ |
| true, // async |
| true, // streamed |
| is_after_cache_hit, // cached |
| is_after_deserialization, // deserialized |
| wasm_lazy_compilation_, // lazy |
| !compilation_state->failed(), // success |
| native_module_->liftoff_code_size(), // code_size_in_bytes |
| native_module_->liftoff_bailout_count(), // liftoff_bailout_count |
| duration.InMicroseconds(), // wall_clock_time_in_us |
| duration.InMicroseconds() // wall_clock_duration_in_us |
| }; |
| isolate_->metrics_recorder()->DelayMainThreadEvent(event, context_id_); |
| } |
| } |
| |
| DCHECK(!isolate_->context().is_null()); |
| // Finish the wasm script now and make it public to the debugger. |
| Handle<Script> script(module_object_->script(), isolate_); |
| const WasmModule* module = module_object_->module(); |
| if (script->type() == Script::TYPE_WASM && |
| module->debug_symbols.type == WasmDebugSymbols::Type::SourceMap && |
| !module->debug_symbols.external_url.is_empty()) { |
| ModuleWireBytes wire_bytes(module_object_->native_module()->wire_bytes()); |
| MaybeHandle<String> src_map_str = isolate_->factory()->NewStringFromUtf8( |
| wire_bytes.GetNameOrNull(module->debug_symbols.external_url), |
| AllocationType::kOld); |
| script->set_source_mapping_url(*src_map_str.ToHandleChecked()); |
| } |
| { |
| TRACE_EVENT0(TRACE_DISABLED_BY_DEFAULT("v8.wasm.detailed"), |
| "wasm.Debug.OnAfterCompile"); |
| isolate_->debug()->OnAfterCompile(script); |
| } |
| |
| // TODO(bbudge) Allow deserialization without wrapper compilation, so we can |
| // just compile wrappers here. |
| if (!is_after_deserialization) { |
| Handle<FixedArray> export_wrappers; |
| if (is_after_cache_hit) { |
| // TODO(thibaudm): Look into sharing wrappers. |
| CompileJsToWasmWrappers(isolate_, module, &export_wrappers); |
| } else { |
| compilation_state->FinalizeJSToWasmWrappers(isolate_, module, |
| &export_wrappers); |
| } |
| module_object_->set_export_wrappers(*export_wrappers); |
| } |
| // We can only update the feature counts once the entire compile is done. |
| compilation_state->PublishDetectedFeatures(isolate_); |
| |
| FinishModule(); |
| } |
| |
| void AsyncCompileJob::DecodeFailed(const WasmError& error) { |
| ErrorThrower thrower(isolate_, api_method_name_); |
| thrower.CompileFailed(error); |
| // {job} keeps the {this} pointer alive. |
| std::shared_ptr<AsyncCompileJob> job = |
| isolate_->wasm_engine()->RemoveCompileJob(this); |
| resolver_->OnCompilationFailed(thrower.Reify()); |
| } |
| |
| void AsyncCompileJob::AsyncCompileFailed() { |
| ErrorThrower thrower(isolate_, api_method_name_); |
| DCHECK_EQ(native_module_->module()->origin, kWasmOrigin); |
| const bool lazy_module = wasm_lazy_compilation_; |
| ValidateSequentially(native_module_->module(), native_module_.get(), |
| isolate_->counters(), isolate_->allocator(), &thrower, |
| lazy_module); |
| DCHECK(thrower.error()); |
| // {job} keeps the {this} pointer alive. |
| std::shared_ptr<AsyncCompileJob> job = |
| isolate_->wasm_engine()->RemoveCompileJob(this); |
| resolver_->OnCompilationFailed(thrower.Reify()); |
| } |
| |
| void AsyncCompileJob::AsyncCompileSucceeded(Handle<WasmModuleObject> result) { |
| TRACE_EVENT0(TRACE_DISABLED_BY_DEFAULT("v8.wasm.detailed"), |
| "wasm.OnCompilationSucceeded"); |
| // We have to make sure that an "incumbent context" is available in case |
| // the module's start function calls out to Blink. |
| Local<v8::Context> backup_incumbent_context = |
| Utils::ToLocal(incumbent_context_); |
| v8::Context::BackupIncumbentScope incumbent(backup_incumbent_context); |
| resolver_->OnCompilationSucceeded(result); |
| } |
| |
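| // Callback registered on the compilation state of an {AsyncCompileJob}. It |
| // reacts to compilation events by updating the native module cache and |
| // scheduling the matching foreground step ({CompileFinished} or |
| // {CompileFailed}). |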
| class AsyncCompileJob::CompilationStateCallback { |
| public: |
| explicit CompilationStateCallback(AsyncCompileJob* job) : job_(job) {} |
| |
| void operator()(CompilationEvent event) { |
| // This callback is only being called from a foreground task. |
| switch (event) { |
| case CompilationEvent::kFinishedExportWrappers: |
| // Even if baseline compilation units finish first, we trigger the |
| // "kFinishedExportWrappers" event first. |
| DCHECK(!last_event_.has_value()); |
| break; |
| case CompilationEvent::kFinishedBaselineCompilation: |
| DCHECK_EQ(CompilationEvent::kFinishedExportWrappers, last_event_); |
| if (job_->DecrementAndCheckFinisherCount()) { |
| // Install the native module in the cache, or reuse a conflicting one. |
| // If we get a conflicting module, wait until we are back in the |
| // main thread to update {job_->native_module_} to avoid a data race. |
| std::shared_ptr<NativeModule> native_module = job_->native_module_; |
| bool cache_hit = |
| !job_->isolate_->wasm_engine()->UpdateNativeModuleCache( |
| false, &native_module, job_->isolate_); |
| DCHECK_EQ(cache_hit, native_module != job_->native_module_); |
| job_->DoSync<CompileFinished>(cache_hit ? std::move(native_module) |
| : nullptr); |
| } |
| break; |
| case CompilationEvent::kFinishedTopTierCompilation: |
| DCHECK_EQ(CompilationEvent::kFinishedBaselineCompilation, last_event_); |
| // At this point, the job will already be gone, thus do not access it |
| // here. |
| break; |
| case CompilationEvent::kFailedCompilation: |
| DCHECK(!last_event_.has_value() || |
| last_event_ == CompilationEvent::kFinishedExportWrappers); |
| if (job_->DecrementAndCheckFinisherCount()) { |
| // Don't update {job_->native_module_} to avoid data races with other |
| // compilation threads. Use a copy of the shared pointer instead. |
| std::shared_ptr<NativeModule> native_module = job_->native_module_; |
| job_->isolate_->wasm_engine()->UpdateNativeModuleCache( |
| true, &native_module, job_->isolate_); |
| job_->DoSync<CompileFailed>(); |
| } |
| break; |
| case CompilationEvent::kFinishedRecompilation: |
| // This event can happen either before or after |
| // {kFinishedTopTierCompilation}, hence don't remember this in |
| // {last_event_}. |
| return; |
| } |
| #ifdef DEBUG |
| last_event_ = event; |
| #endif |
| } |
| |
| private: |
| AsyncCompileJob* job_; |
| #ifdef DEBUG |
|   // This will be modified by different threads, but they are externally |
|   // synchronized, so no explicit synchronization is (currently) needed here. |
| base::Optional<CompilationEvent> last_event_; |
| #endif |
| }; |
| |
| // A closure to run a compilation step (either as foreground or background |
| // task) and schedule the next step(s), if any. |
| class AsyncCompileJob::CompileStep { |
| public: |
| virtual ~CompileStep() = default; |
| |
| void Run(AsyncCompileJob* job, bool on_foreground) { |
| if (on_foreground) { |
| HandleScope scope(job->isolate_); |
| SaveAndSwitchContext saved_context(job->isolate_, *job->native_context_); |
| RunInForeground(job); |
| } else { |
| RunInBackground(job); |
| } |
| } |
| |
| virtual void RunInForeground(AsyncCompileJob*) { UNREACHABLE(); } |
| virtual void RunInBackground(AsyncCompileJob*) { UNREACHABLE(); } |
| }; |
| |
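| // A cancelable task which runs the job's current {CompileStep}, either on |
| // the foreground or on a background thread. |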
| class AsyncCompileJob::CompileTask : public CancelableTask { |
| public: |
| CompileTask(AsyncCompileJob* job, bool on_foreground) |
| // We only manage the background tasks with the {CancelableTaskManager} of |
|       // the {AsyncCompileJob}. Foreground tasks are managed by the isolate's |
| // {CancelableTaskManager}. Background tasks cannot spawn tasks managed by |
| // their own task manager. |
| : CancelableTask(on_foreground ? job->isolate_->cancelable_task_manager() |
| : &job->background_task_manager_), |
| job_(job), |
| on_foreground_(on_foreground) {} |
| |
| ~CompileTask() override { |
| if (job_ != nullptr && on_foreground_) ResetPendingForegroundTask(); |
| } |
| |
| void RunInternal() final { |
| if (!job_) return; |
| if (on_foreground_) ResetPendingForegroundTask(); |
| job_->step_->Run(job_, on_foreground_); |
| // After execution, reset {job_} such that we don't try to reset the pending |
| // foreground task when the task is deleted. |
| job_ = nullptr; |
| } |
| |
| void Cancel() { |
| DCHECK_NOT_NULL(job_); |
| job_ = nullptr; |
| } |
| |
| private: |
| // {job_} will be cleared to cancel a pending task. |
| AsyncCompileJob* job_; |
| bool on_foreground_; |
| |
| void ResetPendingForegroundTask() const { |
| DCHECK_EQ(this, job_->pending_foreground_task_); |
| job_->pending_foreground_task_ = nullptr; |
| } |
| }; |
| |
| void AsyncCompileJob::StartForegroundTask() { |
| DCHECK_NULL(pending_foreground_task_); |
| |
| auto new_task = std::make_unique<CompileTask>(this, true); |
| pending_foreground_task_ = new_task.get(); |
| foreground_task_runner_->PostTask(std::move(new_task)); |
| } |
| |
| void AsyncCompileJob::ExecuteForegroundTaskImmediately() { |
| DCHECK_NULL(pending_foreground_task_); |
| |
| auto new_task = std::make_unique<CompileTask>(this, true); |
| pending_foreground_task_ = new_task.get(); |
| new_task->Run(); |
| } |
| |
| void AsyncCompileJob::CancelPendingForegroundTask() { |
| if (!pending_foreground_task_) return; |
| pending_foreground_task_->Cancel(); |
| pending_foreground_task_ = nullptr; |
| } |
| |
| void AsyncCompileJob::StartBackgroundTask() { |
| auto task = std::make_unique<CompileTask>(this, false); |
| |
|   // If --wasm-num-compilation-tasks=0 is passed, only spawn foreground tasks. |
|   // This is used to make timing deterministic. |
| if (FLAG_wasm_num_compilation_tasks > 0) { |
| V8::GetCurrentPlatform()->CallOnWorkerThread(std::move(task)); |
| } else { |
| foreground_task_runner_->PostTask(std::move(task)); |
| } |
| } |
| |
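| // Schedules the given step to run on the foreground thread. If |
| // {use_existing_fg_task} is set and a foreground task is already pending, |
| // that pending task will run the new step instead of posting another task. |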
| template <typename Step, |
| AsyncCompileJob::UseExistingForegroundTask use_existing_fg_task, |
| typename... Args> |
| void AsyncCompileJob::DoSync(Args&&... args) { |
| NextStep<Step>(std::forward<Args>(args)...); |
| if (use_existing_fg_task && pending_foreground_task_ != nullptr) return; |
| StartForegroundTask(); |
| } |
| |
| template <typename Step, typename... Args> |
| void AsyncCompileJob::DoImmediately(Args&&... args) { |
| NextStep<Step>(std::forward<Args>(args)...); |
| ExecuteForegroundTaskImmediately(); |
| } |
| |
| template <typename Step, typename... Args> |
| void AsyncCompileJob::DoAsync(Args&&... args) { |
| NextStep<Step>(std::forward<Args>(args)...); |
| StartBackgroundTask(); |
| } |
| |
| template <typename Step, typename... Args> |
| void AsyncCompileJob::NextStep(Args&&... args) { |
| step_.reset(new Step(std::forward<Args>(args)...)); |
| } |
| |
| //========================================================================== |
| // Step 1: (async) Decode the module. |
| //========================================================================== |
| class AsyncCompileJob::DecodeModule : public AsyncCompileJob::CompileStep { |
| public: |
| explicit DecodeModule(Counters* counters, |
| std::shared_ptr<metrics::Recorder> metrics_recorder) |
| : counters_(counters), metrics_recorder_(std::move(metrics_recorder)) {} |
| |
| void RunInBackground(AsyncCompileJob* job) override { |
| ModuleResult result; |
| { |
| DisallowHandleAllocation no_handle; |
| DisallowHeapAllocation no_allocation; |
| // Decode the module bytes. |
| TRACE_COMPILE("(1) Decoding module...\n"); |
| TRACE_EVENT0(TRACE_DISABLED_BY_DEFAULT("v8.wasm.detailed"), |
| "wasm.DecodeModule"); |
| auto enabled_features = job->enabled_features_; |
| result = DecodeWasmModule( |
| enabled_features, job->wire_bytes_.start(), job->wire_bytes_.end(), |
| false, kWasmOrigin, counters_, metrics_recorder_, job->context_id(), |
| DecodingMethod::kAsync, job->isolate()->wasm_engine()->allocator()); |
| |
| // Validate lazy functions here if requested. |
| if (!FLAG_wasm_lazy_validation && result.ok()) { |
| const WasmModule* module = result.value().get(); |
| DCHECK_EQ(module->origin, kWasmOrigin); |
| const bool lazy_module = job->wasm_lazy_compilation_; |
| if (MayCompriseLazyFunctions(module, enabled_features, lazy_module)) { |
| auto allocator = job->isolate()->wasm_engine()->allocator(); |
| int start = module->num_imported_functions; |
| int end = start + module->num_declared_functions; |
| |
| for (int func_index = start; func_index < end; func_index++) { |
| const WasmFunction* func = &module->functions[func_index]; |
| Vector<const uint8_t> code = |
| job->wire_bytes_.GetFunctionBytes(func); |
| |
| CompileStrategy strategy = GetCompileStrategy( |
| module, enabled_features, func_index, lazy_module); |
| bool validate_lazily_compiled_function = |
| strategy == CompileStrategy::kLazy || |
| strategy == CompileStrategy::kLazyBaselineEagerTopTier; |
| if (validate_lazily_compiled_function) { |
| DecodeResult function_result = |
| ValidateSingleFunction(module, func_index, code, counters_, |
| allocator, enabled_features); |
| if (function_result.failed()) { |
| result = ModuleResult(function_result.error()); |
| break; |
| } |
| } |
| } |
| } |
| } |
| } |
| if (result.failed()) { |
| // Decoding failure; reject the promise and clean up. |
| job->DoSync<DecodeFail>(std::move(result).error()); |
| } else { |
|       // Decoding succeeded. |
| std::shared_ptr<WasmModule> module = std::move(result).value(); |
| const bool kUsesLiftoff = false; |
| size_t code_size_estimate = |
| wasm::WasmCodeManager::EstimateNativeModuleCodeSize(module.get(), |
| kUsesLiftoff); |
| job->DoSync<PrepareAndStartCompile>(std::move(module), true, |
| code_size_estimate); |
| } |
| } |
| |
| private: |
| Counters* const counters_; |
| std::shared_ptr<metrics::Recorder> metrics_recorder_; |
| }; |
| |
| //========================================================================== |
| // Step 1b: (sync) Fail decoding the module. |
| //========================================================================== |
| class AsyncCompileJob::DecodeFail : public CompileStep { |
| public: |
| explicit DecodeFail(WasmError error) : error_(std::move(error)) {} |
| |
| private: |
| WasmError error_; |
| |
| void RunInForeground(AsyncCompileJob* job) override { |
| TRACE_COMPILE("(1b) Decoding failed.\n"); |
| // {job_} is deleted in DecodeFailed, therefore the {return}. |
| return job->DecodeFailed(error_); |
| } |
| }; |
| |
| //========================================================================== |
| // Step 2 (sync): Create heap-allocated data and start compile. |
| //========================================================================== |
| class AsyncCompileJob::PrepareAndStartCompile : public CompileStep { |
| public: |
| PrepareAndStartCompile(std::shared_ptr<const WasmModule> module, |
| bool start_compilation, size_t code_size_estimate) |
| : module_(std::move(module)), |
| start_compilation_(start_compilation), |
| code_size_estimate_(code_size_estimate) {} |
| |
| private: |
| const std::shared_ptr<const WasmModule> module_; |
| const bool start_compilation_; |
| const size_t code_size_estimate_; |
| |
| void RunInForeground(AsyncCompileJob* job) override { |
| TRACE_COMPILE("(2) Prepare and start compile...\n"); |
| |
| const bool streaming = job->wire_bytes_.length() == 0; |
| if (streaming) { |
| // Streaming compilation already checked for cache hits. |
| job->CreateNativeModule(module_, code_size_estimate_); |
| } else if (job->GetOrCreateNativeModule(std::move(module_), |
| code_size_estimate_)) { |
| job->FinishCompile(true); |
| return; |
| } |
| |
| // Make sure all compilation tasks stopped running. Decoding (async step) |
| // is done. |
| job->background_task_manager_.CancelAndWait(); |
| |
| CompilationStateImpl* compilation_state = |
| Impl(job->native_module_->compilation_state()); |
| compilation_state->AddCallback(CompilationStateCallback{job}); |
| if (base::TimeTicks::IsHighResolution()) { |
| auto compile_mode = job->stream_ == nullptr |
| ? CompilationTimeCallback::kAsync |
| : CompilationTimeCallback::kStreaming; |
| compilation_state->AddCallback(CompilationTimeCallback{ |
| job->isolate_->async_counters(), job->isolate_->metrics_recorder(), |
| job->context_id_, job->native_module_, compile_mode}); |
| } |
| |
| if (start_compilation_) { |
| // TODO(ahaas): Try to remove the {start_compilation_} check when |
| // streaming decoding is done in the background. If |
| // InitializeCompilationUnits always returns 0 for streaming compilation, |
| // then DoAsync would do the same as NextStep already. |
| |
| // Add compilation units and kick off compilation. |
| InitializeCompilationUnits(job->isolate(), job->native_module_.get()); |
| } |
| } |
| }; |
| |
| //========================================================================== |
| // Step 3a (sync): Compilation failed. |
| //========================================================================== |
| class AsyncCompileJob::CompileFailed : public CompileStep { |
| private: |
| void RunInForeground(AsyncCompileJob* job) override { |
| TRACE_COMPILE("(3a) Compilation failed\n"); |
| DCHECK(job->native_module_->compilation_state()->failed()); |
| |
| // {job_} is deleted in AsyncCompileFailed, therefore the {return}. |
| return job->AsyncCompileFailed(); |
| } |
| }; |
| |
| namespace { |
| class SampleTopTierCodeSizeCallback { |
| public: |
| explicit SampleTopTierCodeSizeCallback( |
| std::weak_ptr<NativeModule> native_module) |
| : native_module_(std::move(native_module)) {} |
| |
| void operator()(CompilationEvent event) { |
| if (event != CompilationEvent::kFinishedTopTierCompilation) return; |
| if (std::shared_ptr<NativeModule> native_module = native_module_.lock()) { |
| native_module->engine()->SampleTopTierCodeSizeInAllIsolates( |
| native_module); |
| } |
| } |
| |
| private: |
| std::weak_ptr<NativeModule> native_module_; |
| }; |
| } // namespace |
| |
| //========================================================================== |
| // Step 3b (sync): Compilation finished. |
| //========================================================================== |
| class AsyncCompileJob::CompileFinished : public CompileStep { |
| public: |
| explicit CompileFinished(std::shared_ptr<NativeModule> cached_native_module) |
| : cached_native_module_(std::move(cached_native_module)) {} |
| |
| private: |
| void RunInForeground(AsyncCompileJob* job) override { |
| TRACE_COMPILE("(3b) Compilation finished\n"); |
| if (cached_native_module_) { |
| job->native_module_ = cached_native_module_; |
| } else { |
| DCHECK(!job->native_module_->compilation_state()->failed()); |
| // Sample the generated code size when baseline compilation finished. |
| job->native_module_->SampleCodeSize(job->isolate_->counters(), |
| NativeModule::kAfterBaseline); |
| // Also, set a callback to sample the code size after top-tier compilation |
| // finished. This callback will *not* keep the NativeModule alive. |
| job->native_module_->compilation_state()->AddCallback( |
| SampleTopTierCodeSizeCallback{job->native_module_}); |
| } |
| // Then finalize and publish the generated module. |
| job->FinishCompile(cached_native_module_ != nullptr); |
| } |
| |
| std::shared_ptr<NativeModule> cached_native_module_; |
| }; |
| |
| void AsyncCompileJob::FinishModule() { |
| TRACE_COMPILE("(4) Finish module...\n"); |
| AsyncCompileSucceeded(module_object_); |
| isolate_->wasm_engine()->RemoveCompileJob(this); |
| } |
| |
| AsyncStreamingProcessor::AsyncStreamingProcessor( |
| AsyncCompileJob* job, std::shared_ptr<Counters> async_counters, |
| AccountingAllocator* allocator) |
| : decoder_(job->enabled_features_), |
| job_(job), |
| wasm_engine_(job_->isolate_->wasm_engine()), |
| compilation_unit_builder_(nullptr), |
| async_counters_(async_counters), |
| allocator_(allocator) {} |
| |
| AsyncStreamingProcessor::~AsyncStreamingProcessor() { |
| if (job_->native_module_ && job_->native_module_->wire_bytes().empty()) { |
| // Clean up the temporary cache entry. |
| job_->isolate_->wasm_engine()->StreamingCompilationFailed(prefix_hash_); |
| } |
| } |
| |
| void AsyncStreamingProcessor::FinishAsyncCompileJobWithError( |
| const WasmError& error) { |
| DCHECK(error.has_error()); |
|   // Make sure all background tasks have stopped executing before we change |
|   // the state of the AsyncCompileJob to DecodeFail. |
| job_->background_task_manager_.CancelAndWait(); |
| |
| // Record event metrics. |
| auto duration = base::TimeTicks::Now() - job_->start_time_; |
| job_->metrics_event_.success = false; |
| job_->metrics_event_.streamed = true; |
| job_->metrics_event_.module_size_in_bytes = job_->wire_bytes_.length(); |
| job_->metrics_event_.function_count = num_functions_; |
| job_->metrics_event_.wall_clock_time_in_us = duration.InMicroseconds(); |
| job_->metrics_event_.wall_clock_duration_in_us = duration.InMicroseconds(); |
| job_->isolate_->metrics_recorder()->DelayMainThreadEvent(job_->metrics_event_, |
| job_->context_id_); |
| |
| // Check if there is already a CompiledModule, in which case we have to clean |
| // up the CompilationStateImpl as well. |
| if (job_->native_module_) { |
| Impl(job_->native_module_->compilation_state())->CancelCompilation(); |
| |
| job_->DoSync<AsyncCompileJob::DecodeFail, |
| AsyncCompileJob::kUseExistingForegroundTask>(error); |
| |
| // Clear the {compilation_unit_builder_} if it exists. This is needed |
| // because there is a check in the destructor of the |
| // {CompilationUnitBuilder} that it is empty. |
| if (compilation_unit_builder_) compilation_unit_builder_->Clear(); |
| } else { |
| job_->DoSync<AsyncCompileJob::DecodeFail>(error); |
| } |
| } |
| |
| // Process the module header. |
| bool AsyncStreamingProcessor::ProcessModuleHeader(Vector<const uint8_t> bytes, |
| uint32_t offset) { |
| TRACE_STREAMING("Process module header...\n"); |
| decoder_.StartDecoding( |
| job_->isolate()->counters(), job_->isolate()->metrics_recorder(), |
| job_->context_id(), job_->isolate()->wasm_engine()->allocator()); |
| decoder_.DecodeModuleHeader(bytes, offset); |
| if (!decoder_.ok()) { |
| FinishAsyncCompileJobWithError(decoder_.FinishDecoding(false).error()); |
| return false; |
| } |
| prefix_hash_ = NativeModuleCache::WireBytesHash(bytes); |
| return true; |
| } |
| |
| // Process all sections except for the code section. |
| bool AsyncStreamingProcessor::ProcessSection(SectionCode section_code, |
| Vector<const uint8_t> bytes, |
| uint32_t offset) { |
| TRACE_STREAMING("Process section %d ...\n", section_code); |
| if (compilation_unit_builder_) { |
|     // We reached a section after the code section, so we no longer need the |
|     // {compilation_unit_builder_}. |
| CommitCompilationUnits(); |
| compilation_unit_builder_.reset(); |
| } |
| if (before_code_section_) { |
| // Combine section hashes until code section. |
| prefix_hash_ = base::hash_combine(prefix_hash_, |
| NativeModuleCache::WireBytesHash(bytes)); |
| } |
| if (section_code == SectionCode::kUnknownSectionCode) { |
| size_t bytes_consumed = ModuleDecoder::IdentifyUnknownSection( |
| &decoder_, bytes, offset, §ion_code); |
| if (!decoder_.ok()) { |
| FinishAsyncCompileJobWithError(decoder_.FinishDecoding(false).error()); |
| return false; |
| } |
| if (section_code == SectionCode::kUnknownSectionCode) { |
| // Skip unknown sections that we do not know how to handle. |
| return true; |
| } |
| // Remove the unknown section tag from the payload bytes. |
| offset += bytes_consumed; |
| bytes = bytes.SubVector(bytes_consumed, bytes.size()); |
| } |
| constexpr bool verify_functions = false; |
| decoder_.DecodeSection(section_code, bytes, offset, verify_functions); |
| if (!decoder_.ok()) { |
| FinishAsyncCompileJobWithError(decoder_.FinishDecoding(false).error()); |
| return false; |
| } |
| return true; |
| } |
| |
| // Start the code section. |
| bool AsyncStreamingProcessor::ProcessCodeSectionHeader( |
| int num_functions, uint32_t offset, |
| std::shared_ptr<WireBytesStorage> wire_bytes_storage, |
| int code_section_length) { |
| DCHECK_LE(0, code_section_length); |
| before_code_section_ = false; |
| TRACE_STREAMING("Start the code section with %d functions...\n", |
| num_functions); |
| if (!decoder_.CheckFunctionsCount(static_cast<uint32_t>(num_functions), |
| offset)) { |
| FinishAsyncCompileJobWithError(decoder_.FinishDecoding(false).error()); |
| return false; |
| } |
| |
| decoder_.set_code_section(offset, static_cast<uint32_t>(code_section_length)); |
| |
| prefix_hash_ = base::hash_combine(prefix_hash_, |
| static_cast<uint32_t>(code_section_length)); |
| if (!wasm_engine_->GetStreamingCompilationOwnership(prefix_hash_)) { |
| // Known prefix, wait until the end of the stream and check the cache. |
| prefix_cache_hit_ = true; |
| return true; |
| } |
| |
| // Execute the PrepareAndStartCompile step immediately and not in a separate |
| // task. |
| int num_imported_functions = |
| static_cast<int>(decoder_.module()->num_imported_functions); |
| DCHECK_EQ(kWasmOrigin, decoder_.module()->origin); |
| const bool uses_liftoff = FLAG_liftoff; |
| size_t code_size_estimate = |
| wasm::WasmCodeManager::EstimateNativeModuleCodeSize( |
| num_functions, num_imported_functions, code_section_length, |
| uses_liftoff); |
| job_->DoImmediately<AsyncCompileJob::PrepareAndStartCompile>( |
| decoder_.shared_module(), false, code_size_estimate); |
| |
| auto* compilation_state = Impl(job_->native_module_->compilation_state()); |
| compilation_state->SetWireBytesStorage(std::move(wire_bytes_storage)); |
| DCHECK_EQ(job_->native_module_->module()->origin, kWasmOrigin); |
| const bool lazy_module = job_->wasm_lazy_compilation_; |
| |
| // Set outstanding_finishers_ to 2, because both the AsyncCompileJob and the |
| // AsyncStreamingProcessor have to finish. |
| job_->outstanding_finishers_.store(2); |
| compilation_unit_builder_.reset( |
| new CompilationUnitBuilder(job_->native_module_.get())); |
| |
| NativeModule* native_module = job_->native_module_.get(); |
| |
| int num_import_wrappers = |
| AddImportWrapperUnits(native_module, compilation_unit_builder_.get()); |
| int num_export_wrappers = AddExportWrapperUnits( |
| job_->isolate_, wasm_engine_, native_module, |
| compilation_unit_builder_.get(), job_->enabled_features_); |
| compilation_state->InitializeCompilationProgress( |
| lazy_module, num_import_wrappers, num_export_wrappers); |
| return true; |
| } |
| |
| // Process a function body. |
| bool AsyncStreamingProcessor::ProcessFunctionBody(Vector<const uint8_t> bytes, |
| uint32_t offset) { |
| TRACE_STREAMING("Process function body %d ...\n", num_functions_); |
| |
| decoder_.DecodeFunctionBody( |
| num_functions_, static_cast<uint32_t>(bytes.length()), offset, false); |
| |
| const WasmModule* module = decoder_.module(); |
| auto enabled_features = job_->enabled_features_; |
| uint32_t func_index = |
| num_functions_ + decoder_.module()->num_imported_functions; |
| DCHECK_EQ(module->origin, kWasmOrigin); |
| const bool lazy_module = job_->wasm_lazy_compilation_; |
| CompileStrategy strategy = |
| GetCompileStrategy(module, enabled_features, func_index, lazy_module); |
| bool validate_lazily_compiled_function = |
| !FLAG_wasm_lazy_validation && |
| (strategy == CompileStrategy::kLazy || |
| strategy == CompileStrategy::kLazyBaselineEagerTopTier); |
| if (validate_lazily_compiled_function) { |
| // The native module does not own the wire bytes until {SetWireBytes} is |
|     // called in {OnFinishedStream}. Validation must use the {bytes} parameter. |
| DecodeResult result = |
| ValidateSingleFunction(module, func_index, bytes, async_counters_.get(), |
| allocator_, enabled_features); |
| |
| if (result.failed()) { |
| FinishAsyncCompileJobWithError(result.error()); |
| return false; |
| } |
| } |
| |
| // Don't compile yet if we might have a cache hit. |
| if (prefix_cache_hit_) { |
| num_functions_++; |
| return true; |
| } |
| |
| NativeModule* native_module = job_->native_module_.get(); |
| if (strategy == CompileStrategy::kLazy) { |
| native_module->UseLazyStub(func_index); |
| } else if (strategy == CompileStrategy::kLazyBaselineEagerTopTier) { |
| compilation_unit_builder_->AddTopTierUnit(func_index); |
| native_module->UseLazyStub(func_index); |
| } else { |
| DCHECK_EQ(strategy, CompileStrategy::kEager); |
| compilation_unit_builder_->AddUnits(func_index); |
| } |
| |
| ++num_functions_; |
| |
| return true; |
| } |
| |
| void AsyncStreamingProcessor::CommitCompilationUnits() { |
| DCHECK(compilation_unit_builder_); |
| compilation_unit_builder_->Commit(); |
| } |
| |
| void AsyncStreamingProcessor::OnFinishedChunk() { |
| TRACE_STREAMING("FinishChunk...\n"); |
| if (compilation_unit_builder_) CommitCompilationUnits(); |
| } |
| |
| // Finish the processing of the stream. |
| void AsyncStreamingProcessor::OnFinishedStream(OwnedVector<uint8_t> bytes) { |
| TRACE_STREAMING("Finish stream...\n"); |
| DCHECK_EQ(NativeModuleCache::PrefixHash(bytes.as_vector()), prefix_hash_); |
| ModuleResult result = decoder_.FinishDecoding(false); |
| if (result.failed()) { |
| FinishAsyncCompileJobWithError(result.error()); |
| return; |
| } |
| |
| job_->wire_bytes_ = ModuleWireBytes(bytes.as_vector()); |
| job_->bytes_copy_ = bytes.ReleaseData(); |
| |
| // Record event metrics. |
| auto duration = base::TimeTicks::Now() - job_->start_time_; |
| job_->metrics_event_.success = true; |
| job_->metrics_event_.streamed = true; |
| job_->metrics_event_.module_size_in_bytes = job_->wire_bytes_.length(); |
| job_->metrics_event_.function_count = num_functions_; |
| job_->metrics_event_.wall_clock_time_in_us = duration.InMicroseconds(); |
| job_->metrics_event_.wall_clock_duration_in_us = duration.InMicroseconds(); |
| job_->isolate_->metrics_recorder()->DelayMainThreadEvent(job_->metrics_event_, |
| job_->context_id_); |
| |
| if (prefix_cache_hit_) { |
| // Restart as an asynchronous, non-streaming compilation. Most likely |
| // {PrepareAndStartCompile} will get the native module from the cache. |
| size_t code_size_estimate = |
| wasm::WasmCodeManager::EstimateNativeModuleCodeSize( |
| result.value().get(), FLAG_liftoff); |
| job_->DoSync<AsyncCompileJob::PrepareAndStartCompile>( |
| std::move(result).value(), true, code_size_estimate); |
| return; |
| } |
| |
| // We have to open a HandleScope and prepare the Context for |
| // CreateNativeModule, PrepareRuntimeObjects and FinishCompile as this is a |
| // callback from the embedder. |
| HandleScope scope(job_->isolate_); |
| SaveAndSwitchContext saved_context(job_->isolate_, *job_->native_context_); |
| |
| // Record the size of the wire bytes. In synchronous and asynchronous |
| // (non-streaming) compilation, this happens in {DecodeWasmModule}. |
| auto* histogram = job_->isolate_->counters()->wasm_wasm_module_size_bytes(); |
| histogram->AddSample(job_->wire_bytes_.module_bytes().length()); |
| |
| const bool has_code_section = job_->native_module_ != nullptr; |
| bool cache_hit = false; |
| if (!has_code_section) { |
| // We are processing a WebAssembly module without code section. Create the |
| // native module now (would otherwise happen in {PrepareAndStartCompile} or |
| // {ProcessCodeSectionHeader}). |
| constexpr size_t kCodeSizeEstimate = 0; |
| cache_hit = job_->GetOrCreateNativeModule(std::move(result).value(), |
| kCodeSizeEstimate); |
| } else { |
| #if !defined(DISABLE_WASM_COMPILER_ISSUE_STARBOARD) |
| job_->native_module_->SetWireBytes( |
| {std::move(job_->bytes_copy_), job_->wire_bytes_.length()}); |
| #endif |
| job_->native_module_->LogWasmCodes(job_->isolate_); |
| } |
| const bool needs_finish = job_->DecrementAndCheckFinisherCount(); |
| DCHECK_IMPLIES(!has_code_section, needs_finish); |
| // We might need to recompile the module for debugging, if the debugger was |
| // enabled while streaming compilation was running. Since handling this while |
| // compiling via streaming is tricky, we just tier down now, before publishing |
| // the module. |
| if (job_->native_module_->IsTieredDown()) { |
| job_->native_module_->RecompileForTiering(); |
| } |
| if (needs_finish) { |
| const bool failed = job_->native_module_->compilation_state()->failed(); |
| if (!cache_hit) { |
| cache_hit = !job_->isolate_->wasm_engine()->UpdateNativeModuleCache( |
| failed, &job_->native_module_, job_->isolate_); |
| } |
| if (failed) { |
| job_->AsyncCompileFailed(); |
| } else { |
| job_->FinishCompile(cache_hit); |
| } |
| } |
| } |
| |
| // Report an error detected in the StreamingDecoder. |
| void AsyncStreamingProcessor::OnError(const WasmError& error) { |
| TRACE_STREAMING("Stream error...\n"); |
| FinishAsyncCompileJobWithError(error); |
| } |
| |
| void AsyncStreamingProcessor::OnAbort() { |
| TRACE_STREAMING("Abort stream...\n"); |
| job_->Abort(); |
| } |
| |
| bool AsyncStreamingProcessor::Deserialize(Vector<const uint8_t> module_bytes, |
| Vector<const uint8_t> wire_bytes) { |
| TRACE_EVENT0("v8.wasm", "wasm.Deserialize"); |
| // DeserializeNativeModule and FinishCompile assume that they are executed in |
| // a HandleScope, and that a context is set on the isolate. |
| HandleScope scope(job_->isolate_); |
| SaveAndSwitchContext saved_context(job_->isolate_, *job_->native_context_); |
| |
| MaybeHandle<WasmModuleObject> result = DeserializeNativeModule( |
| job_->isolate_, module_bytes, wire_bytes, job_->stream_->url()); |
| |
| if (result.is_null()) return false; |
| |
| job_->module_object_ = |
| job_->isolate_->global_handles()->Create(*result.ToHandleChecked()); |
| job_->native_module_ = job_->module_object_->shared_native_module(); |
| job_->wire_bytes_ = ModuleWireBytes(job_->native_module_->wire_bytes()); |
| job_->FinishCompile(false); |
| return true; |
| } |
| |
| CompilationStateImpl::CompilationStateImpl( |
| const std::shared_ptr<NativeModule>& native_module, |
| std::shared_ptr<Counters> async_counters) |
| : native_module_(native_module.get()), |
| native_module_weak_(std::move(native_module)), |
| compile_mode_(FLAG_wasm_tier_up && |
| native_module->module()->origin == kWasmOrigin |
| ? CompileMode::kTiering |
| : CompileMode::kRegular), |
| async_counters_(std::move(async_counters)), |
| compilation_unit_queues_(native_module->num_functions()) {} |
| |
| void CompilationStateImpl::CancelCompilation() { |
| // No more callbacks after abort. |
| base::MutexGuard callbacks_guard(&callbacks_mutex_); |
| // std::memory_order_relaxed is sufficient because no other state is |
| // synchronized with |compile_cancelled_|. |
| compile_cancelled_.store(true, std::memory_order_relaxed); |
| callbacks_.clear(); |
| } |
| |
| bool CompilationStateImpl::cancelled() const { |
| return compile_cancelled_.load(std::memory_order_relaxed); |
| } |
| |
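| // Sets up the per-function compilation progress and the outstanding-unit |
| // counters, based on each function's compile strategy (eager, lazy, or lazy |
| // baseline with eager top tier). |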
| void CompilationStateImpl::InitializeCompilationProgress( |
| bool lazy_module, int num_import_wrappers, int num_export_wrappers) { |
| DCHECK(!failed()); |
| auto enabled_features = native_module_->enabled_features(); |
| auto* module = native_module_->module(); |
| |
| base::MutexGuard guard(&callbacks_mutex_); |
| DCHECK_EQ(0, outstanding_baseline_units_); |
| DCHECK_EQ(0, outstanding_export_wrappers_); |
| DCHECK_EQ(0, outstanding_top_tier_functions_); |
| compilation_progress_.reserve(module->num_declared_functions); |
| int start = module->num_imported_functions; |
| int end = start + module->num_declared_functions; |
| |
| const bool prefer_liftoff = native_module_->IsTieredDown(); |
| for (int func_index = start; func_index < end; func_index++) { |
| if (prefer_liftoff) { |
| constexpr uint8_t kLiftoffOnlyFunctionProgress = |
| RequiredTopTierField::encode(ExecutionTier::kLiftoff) | |
| RequiredBaselineTierField::encode(ExecutionTier::kLiftoff) | |
| ReachedTierField::encode(ExecutionTier::kNone); |
| compilation_progress_.push_back(kLiftoffOnlyFunctionProgress); |
| outstanding_baseline_units_++; |
| outstanding_top_tier_functions_++; |
| continue; |
| } |
| ExecutionTierPair requested_tiers = GetRequestedExecutionTiers( |
| module, compile_mode(), enabled_features, func_index); |
| CompileStrategy strategy = |
| GetCompileStrategy(module, enabled_features, func_index, lazy_module); |
| |
| bool required_for_baseline = strategy == CompileStrategy::kEager; |
| bool required_for_top_tier = strategy != CompileStrategy::kLazy; |
| DCHECK_EQ(required_for_top_tier, |
| strategy == CompileStrategy::kEager || |
| strategy == CompileStrategy::kLazyBaselineEagerTopTier); |
| |
| // Count functions to complete baseline and top tier compilation. |
| if (required_for_baseline) outstanding_baseline_units_++; |
| if (required_for_top_tier) outstanding_top_tier_functions_++; |
| |
| // Initialize function's compilation progress. |
| ExecutionTier required_baseline_tier = required_for_baseline |
| ? requested_tiers.baseline_tier |
| : ExecutionTier::kNone; |
| ExecutionTier required_top_tier = |
| required_for_top_tier ? requested_tiers.top_tier : ExecutionTier::kNone; |
| uint8_t function_progress = ReachedTierField::encode(ExecutionTier::kNone); |
| function_progress = RequiredBaselineTierField::update( |
| function_progress, required_baseline_tier); |
| function_progress = |
| RequiredTopTierField::update(function_progress, required_top_tier); |
| compilation_progress_.push_back(function_progress); |
| } |
| DCHECK_IMPLIES(lazy_module, outstanding_baseline_units_ == 0); |
| DCHECK_IMPLIES(lazy_module, outstanding_top_tier_functions_ == 0); |
| DCHECK_LE(0, outstanding_baseline_units_); |
| DCHECK_LE(outstanding_baseline_units_, outstanding_top_tier_functions_); |
| outstanding_baseline_units_ += num_import_wrappers; |
| outstanding_export_wrappers_ = num_export_wrappers; |
| |
|   // Trigger callbacks if the module needs no baseline or top tier |
|   // compilation. This can be the case for an empty or fully lazy module. |
| TriggerCallbacks(); |
| } |
| |
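| // After deserialization all functions are already available as top tier |
| // code, so mark all compilation events as finished and initialize the |
| // per-function progress accordingly. |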
| void CompilationStateImpl::InitializeCompilationProgressAfterDeserialization() { |
| auto* module = native_module_->module(); |
| base::MutexGuard guard(&callbacks_mutex_); |
| DCHECK(compilation_progress_.empty()); |
| constexpr uint8_t kProgressAfterDeserialization = |
| RequiredBaselineTierField::encode(ExecutionTier::kTurbofan) | |
| RequiredTopTierField::encode(ExecutionTier::kTurbofan) | |
| ReachedTierField::encode(ExecutionTier::kTurbofan); |
| finished_events_.Add(CompilationEvent::kFinishedExportWrappers); |
| finished_events_.Add(CompilationEvent::kFinishedBaselineCompilation); |
| finished_events_.Add(CompilationEvent::kFinishedTopTierCompilation); |
| compilation_progress_.assign(module->num_declared_functions, |
| kProgressAfterDeserialization); |
| } |
| |
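| // Switches the module to the new tiering state and schedules recompilation |
| // units for all functions that still need it. If another recompilation is |
| // still in flight, wait for it to finish first. |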
| void CompilationStateImpl::InitializeRecompilation( |
| TieringState new_tiering_state, |
| CompilationState::callback_t recompilation_finished_callback) { |
| DCHECK(!failed()); |
| |
| // Hold the mutex as long as possible, to synchronize between multiple |
| // recompilations that are triggered at the same time (e.g. when the profiler |
| // is disabled). |
| base::Optional<base::MutexGuard> guard(&callbacks_mutex_); |
| |
| // For now, we cannot contribute to compilation here, because this would bump |
| // the number of workers above the expected maximum concurrency. This can be |
| // fixed once we grow the number of compilation unit queues dynamically. |
| // TODO(clemensb): Contribute to compilation once the queues grow dynamically. |
| while (outstanding_recompilation_functions_ > 0) { |
| auto semaphore = std::make_shared<base::Semaphore>(0); |
| callbacks_.emplace_back([semaphore](CompilationEvent event) { |
| if (event == CompilationEvent::kFinishedRecompilation) { |
| semaphore->Signal(); |
| } |
| }); |
| guard.reset(); |
| semaphore->Wait(); |
| guard.emplace(&callbacks_mutex_); |
| } |
| |
| // Information about compilation progress is shared between this class and the |
| // NativeModule. Before updating information here, consult the NativeModule to |
| // find all functions that need recompilation. |
| // Since the current tiering state is updated on the NativeModule before |
| // triggering recompilation, it's OK if the information is slightly outdated. |
| // If we compile functions twice, the NativeModule will ignore all redundant |
| // code (or code compiled for the wrong tier). |
| std::vector<int> recompile_function_indexes = |
| native_module_->FindFunctionsToRecompile(new_tiering_state); |
| |
| callbacks_.emplace_back(std::move(recompilation_finished_callback)); |
| tiering_state_ = new_tiering_state; |
| |
| // If compilation progress is not initialized yet, then compilation didn't |
| // start yet, and new code will be kept tiered-down from the start. For |
| // streaming compilation, there is a special path to tier down later, when |
| // the module is complete. In any case, we don't need to recompile here. |
| base::Optional<CompilationUnitBuilder> builder; |
| if (compilation_progress_.size() > 0) { |
| builder.emplace(native_module_); |
| const WasmModule* module = native_module_->module(); |
| DCHECK_EQ(module->num_declared_functions, compilation_progress_.size()); |
| DCHECK_GE(module->num_declared_functions, |
| recompile_function_indexes.size()); |
| outstanding_recompilation_functions_ = |
| static_cast<int>(recompile_function_indexes.size()); |
| // Restart recompilation if another recompilation is already happening. |
| for (auto& progress : compilation_progress_) { |
| progress = MissingRecompilationField::update(progress, false); |
| } |
| auto new_tier = new_tiering_state == kTieredDown ? ExecutionTier::kLiftoff |
| : ExecutionTier::kTurbofan; |
| int imported = module->num_imported_functions; |
| // Generate necessary compilation units on the fly. |
| for (int function_index : recompile_function_indexes) { |
| DCHECK_LE(imported, function_index); |
| int slot_index = function_index - imported; |
| auto& progress = compilation_progress_[slot_index]; |
| progress = MissingRecompilationField::update(progress, true); |
| builder->AddRecompilationUnit(function_index, new_tier); |
| } |
| } |
| |
| // Trigger the callbacks immediately if the module needs no recompilation. |
| if (outstanding_recompilation_functions_ == 0) { |
| TriggerCallbacks(base::EnumSet<CompilationEvent>( |
| {CompilationEvent::kFinishedRecompilation})); |
| } |
| |
| if (builder.has_value()) { |
| // Avoid holding the lock while scheduling a compile job. |
| guard.reset(); |
| builder->Commit(); |
| } |
| } |
| |
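| // A hypothetical example for {AddCallback} below: a callback registered after |
| // baseline compilation already finished is still invoked immediately with |
| // {kFinishedBaselineCompilation} (and any other past events), and it is only |
| // kept for future events if no final event has been reached yet: |
| // |
| //   compilation_state->AddCallback([](CompilationEvent event) { |
| //     if (event == CompilationEvent::kFinishedBaselineCompilation) { |
| //       // Baseline code is available; e.g. resolve a promise here. |
| //     } |
| //   }); |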
| void CompilationStateImpl::AddCallback(CompilationState::callback_t callback) { |
| base::MutexGuard callbacks_guard(&callbacks_mutex_); |
| // Immediately trigger events that already happened. |
| for (auto event : {CompilationEvent::kFinishedExportWrappers, |
| CompilationEvent::kFinishedBaselineCompilation, |
| CompilationEvent::kFinishedTopTierCompilation, |
| CompilationEvent::kFailedCompilation}) { |
| if (finished_events_.contains(event)) { |
| callback(event); |
| } |
| } |
| constexpr base::EnumSet<CompilationEvent> kFinalEvents{ |
| CompilationEvent::kFinishedTopTierCompilation, |
| CompilationEvent::kFailedCompilation}; |
| if (!finished_events_.contains_any(kFinalEvents)) { |
| callbacks_.emplace_back(std::move(callback)); |
| } |
| } |
| |
| void CompilationStateImpl::AddCompilationUnits( |
| Vector<WasmCompilationUnit> baseline_units, |
| Vector<WasmCompilationUnit> top_tier_units, |
| Vector<std::shared_ptr<JSToWasmWrapperCompilationUnit>> |
| js_to_wasm_wrapper_units) { |
| if (!baseline_units.empty() || !top_tier_units.empty()) { |
| compilation_unit_queues_.AddUnits(baseline_units, top_tier_units, |
| native_module_->module()); |
| } |
| if (!js_to_wasm_wrapper_units.empty()) { |
| // |js_to_wasm_wrapper_units_| can only be modified before background |
| // compilation has started. |
| DCHECK(!current_compile_job_ || !current_compile_job_->IsRunning()); |
| js_to_wasm_wrapper_units_.insert(js_to_wasm_wrapper_units_.end(), |
| js_to_wasm_wrapper_units.begin(), |
| js_to_wasm_wrapper_units.end()); |
| } |
| ScheduleCompileJobForNewUnits(); |
| } |
| |
| void CompilationStateImpl::AddTopTierCompilationUnit(WasmCompilationUnit unit) { |
| AddCompilationUnits({}, {&unit, 1}, {}); |
| } |
| |
| void CompilationStateImpl::AddTopTierPriorityCompilationUnit( |
| WasmCompilationUnit unit, size_t priority) { |
| compilation_unit_queues_.AddTopTierPriorityUnit(unit, priority); |
| ScheduleCompileJobForNewUnits(); |
| } |
| |
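| // {GetNextJSToWasmWrapperCompilationUnit} below hands out wrapper units via a |
| // relaxed atomic counter, so concurrent workers each claim a distinct unit |
| // without locking. A simplified sketch of a worker loop (assuming access to |
| // the compilation state; the finished-unit bookkeeping is omitted): |
| // |
| //   while (auto unit = |
| //              compilation_state->GetNextJSToWasmWrapperCompilationUnit()) { |
| //     unit->Execute(); |
| //   } |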
| std::shared_ptr<JSToWasmWrapperCompilationUnit> |
| CompilationStateImpl::GetNextJSToWasmWrapperCompilationUnit() { |
| int wrapper_id = |
| js_to_wasm_wrapper_id_.fetch_add(1, std::memory_order_relaxed); |
| if (wrapper_id < static_cast<int>(js_to_wasm_wrapper_units_.size())) { |
| return js_to_wasm_wrapper_units_[wrapper_id]; |
| } |
| return nullptr; |
| } |
| |
| void CompilationStateImpl::FinalizeJSToWasmWrappers( |
| Isolate* isolate, const WasmModule* module, |
| Handle<FixedArray>* export_wrappers_out) { |
| *export_wrappers_out = isolate->factory()->NewFixedArray( |
| MaxNumExportWrappers(module), AllocationType::kOld); |
| // TODO(6792): Wrappers below are allocated with {Factory::NewCode}. As an |
| // optimization we keep the code space unlocked to avoid repeated unlocking |
| // because many such wrappers are allocated in sequence below. |
| TRACE_EVENT1(TRACE_DISABLED_BY_DEFAULT("v8.wasm.detailed"), |
| "wasm.FinalizeJSToWasmWrappers", "wrappers", |
| js_to_wasm_wrapper_units_.size()); |
| CodeSpaceMemoryModificationScope modification_scope(isolate->heap()); |
| for (auto& unit : js_to_wasm_wrapper_units_) { |
| Handle<Code> code = unit->Finalize(isolate); |
| int wrapper_index = |
| GetExportWrapperIndex(module, unit->sig(), unit->is_import()); |
| (*export_wrappers_out)->set(wrapper_index, *code); |
| RecordStats(*code, isolate->counters()); |
| } |
| } |
| |
| CompilationUnitQueues::Queue* CompilationStateImpl::GetQueueForCompileTask( |
| int task_id) { |
| return compilation_unit_queues_.GetQueueForTask(task_id); |
| } |
| |
| base::Optional<WasmCompilationUnit> |
| CompilationStateImpl::GetNextCompilationUnit( |
| CompilationUnitQueues::Queue* queue, CompileBaselineOnly baseline_only) { |
| return compilation_unit_queues_.GetNextUnit(queue, baseline_only); |
| } |
| |
| void CompilationStateImpl::OnFinishedUnits(Vector<WasmCode*> code_vector) { |
| TRACE_EVENT1(TRACE_DISABLED_BY_DEFAULT("v8.wasm.detailed"), |
| "wasm.OnFinishedUnits", "units", code_vector.size()); |
| |
| base::MutexGuard guard(&callbacks_mutex_); |
| |
| // If there are no outstanding compilation units, we can return early. |
| // This is especially important for lazy modules that were deserialized, |
| // since compilation progress was not set up for them. |
| if (outstanding_baseline_units_ == 0 && outstanding_export_wrappers_ == 0 && |
| outstanding_top_tier_functions_ == 0 && |
| outstanding_recompilation_functions_ == 0) { |
| return; |
| } |
| |
| // Assume an order of execution tiers that represents the quality of their |
| // generated code. |
| static_assert(ExecutionTier::kNone < ExecutionTier::kLiftoff && |
| ExecutionTier::kLiftoff < ExecutionTier::kTurbofan, |
| "Assume an order on execution tiers"); |
| |
| DCHECK_EQ(compilation_progress_.size(), |
| native_module_->module()->num_declared_functions); |
| |
| base::EnumSet<CompilationEvent> triggered_events; |
| |
| for (size_t i = 0; i < code_vector.size(); i++) { |
| WasmCode* code = code_vector[i]; |
| DCHECK_NOT_NULL(code); |
| DCHECK_LT(code->index(), native_module_->num_functions()); |
| |
| if (code->index() < native_module_->num_imported_functions()) { |
| // Import wrapper. |
| DCHECK_EQ(code->tier(), ExecutionTier::kTurbofan); |
| outstanding_baseline_units_--; |
| } else { |
| // Function. |
| DCHECK_NE(code->tier(), ExecutionTier::kNone); |
| |
| // Read the function's compilation progress. |
| // This view of the compilation progress may differ from the code that was |
| // actually compiled: a lazily compiled function does not contribute to the |
| // compilation progress, but may still publish code to the code manager. |
| int slot_index = |
| declared_function_index(native_module_->module(), code->index()); |
| uint8_t function_progress = compilation_progress_[slot_index]; |
| ExecutionTier required_baseline_tier = |
| RequiredBaselineTierField::decode(function_progress); |
| ExecutionTier required_top_tier = |
| RequiredTopTierField::decode(function_progress); |
| ExecutionTier reached_tier = ReachedTierField::decode(function_progress); |
| |
| // Check whether the required baseline or top tier has been reached. |
| if (reached_tier < required_baseline_tier && |
| required_baseline_tier <= code->tier()) { |
| DCHECK_GT(outstanding_baseline_units_, 0); |
| outstanding_baseline_units_--; |
| } |
| if (reached_tier < required_top_tier && |
| required_top_tier <= code->tier()) { |
| DCHECK_GT(outstanding_top_tier_functions_, 0); |
| outstanding_top_tier_functions_--; |
| } |
| |
| if (V8_UNLIKELY(MissingRecompilationField::decode(function_progress))) { |
| DCHECK_LT(0, outstanding_recompilation_functions_); |
| // If tiering up, accept any TurboFan code. For tiering down, look at |
| // the {for_debugging} flag. The tier can be Liftoff or TurboFan and is |
| // irrelevant here. In particular, we want to ignore any outstanding |
| // non-debugging units. |
| bool matches = tiering_state_ == kTieredDown |
| ? code->for_debugging() |
| : code->tier() == ExecutionTier::kTurbofan; |
| if (matches) { |
| outstanding_recompilation_functions_--; |
| compilation_progress_[slot_index] = MissingRecompilationField::update( |
| compilation_progress_[slot_index], false); |
| if (outstanding_recompilation_functions_ == 0) { |
| triggered_events.Add(CompilationEvent::kFinishedRecompilation); |
| } |
| } |
| } |
| |
| // Update the function's compilation progress. |
| if (code->tier() > reached_tier) { |
| compilation_progress_[slot_index] = ReachedTierField::update( |
| compilation_progress_[slot_index], code->tier()); |
| } |
| DCHECK_LE(0, outstanding_baseline_units_); |
| } |
| } |
| |
| TriggerCallbacks(triggered_events); |
| } |
| |
| void CompilationStateImpl::OnFinishedJSToWasmWrapperUnits(int num) { |
| if (num == 0) return; |
| base::MutexGuard guard(&callbacks_mutex_); |
| DCHECK_GE(outstanding_export_wrappers_, num); |
| outstanding_export_wrappers_ -= num; |
| TriggerCallbacks(); |
| } |
| |
| void CompilationStateImpl::TriggerCallbacks( |
| base::EnumSet<CompilationEvent> triggered_events) { |
| DCHECK(!callbacks_mutex_.TryLock()); |
| |
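| // Example with hypothetical counts: if the last export wrapper just finished |
| // while {outstanding_baseline_units_} is already 0 but some top tier |
| // functions are still outstanding, the cascade below adds both |
| // {kFinishedExportWrappers} and {kFinishedBaselineCompilation}; |
| // {kFinishedTopTierCompilation} follows in a later call. Events already in |
| // {finished_events_} are filtered out further down, so nothing fires twice. |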
| if (outstanding_export_wrappers_ == 0) { |
| triggered_events.Add(CompilationEvent::kFinishedExportWrappers); |
| if (outstanding_baseline_units_ == 0) { |
| triggered_events.Add(CompilationEvent::kFinishedBaselineCompilation); |
| if (outstanding_top_tier_functions_ == 0) { |
| triggered_events.Add(CompilationEvent::kFinishedTopTierCompilation); |
| } |
| } |
| } |
| |
| if (compile_failed_.load(std::memory_order_relaxed)) { |
| // *Only* trigger the "failed" event. |
| triggered_events = |
| base::EnumSet<CompilationEvent>({CompilationEvent::kFailedCompilation}); |
| } |
| |
| if (triggered_events.empty()) return; |
| |
| // Don't trigger past events again. |
| triggered_events -= finished_events_; |
| // Recompilation can happen multiple times, thus do not store this. |
| finished_events_ |= |
| triggered_events - CompilationEvent::kFinishedRecompilation; |
| |
| for (auto event : |
| {std::make_pair(CompilationEvent::kFailedCompilation, |
| "wasm.CompilationFailed"), |
| std::make_pair(CompilationEvent::kFinishedExportWrappers, |
| "wasm.ExportWrappersFinished"), |
| std::make_pair(CompilationEvent::kFinishedBaselineCompilation, |
| "wasm.BaselineFinished"), |
| std::make_pair(CompilationEvent::kFinishedTopTierCompilation, |
| "wasm.TopTierFinished"), |
| std::make_pair(CompilationEvent::kFinishedRecompilation, |
| "wasm.RecompilationFinished")}) { |
| if (!triggered_events.contains(event.first)) continue; |
| TRACE_EVENT0("v8.wasm", event.second); |
| for (auto& callback : callbacks_) { |
| callback(event.first); |
| } |
| } |
| |
| if (outstanding_baseline_units_ == 0 && outstanding_export_wrappers_ == 0 && |
| outstanding_top_tier_functions_ == 0 && |
| outstanding_recompilation_functions_ == 0) { |
| // Clear the callbacks because no more events will be delivered. |
| callbacks_.clear(); |
| } |
| } |
| |
| void CompilationStateImpl::OnCompilationStopped(const WasmFeatures& detected) { |
| base::MutexGuard guard(&mutex_); |
| detected_features_.Add(detected); |
| } |
| |
| void CompilationStateImpl::PublishDetectedFeatures(Isolate* isolate) { |
| // Notifying the isolate of the feature counts must take place under |
| // the mutex, because even if we have finished baseline compilation, |
| // tiering compilations may still occur in the background. |
| base::MutexGuard guard(&mutex_); |
| UpdateFeatureUseCounts(isolate, detected_features_); |
| } |
| |
| void CompilationStateImpl::PublishCompilationResults( |
| std::vector<std::unique_ptr<WasmCode>> unpublished_code) { |
| if (unpublished_code.empty()) return; |
| |
| // For import wrapper compilation units, add the result to the cache. |
| int num_imported_functions = native_module_->num_imported_functions(); |
| WasmImportWrapperCache* cache = native_module_->import_wrapper_cache(); |
| for (const auto& code : unpublished_code) { |
| int func_index = code->index(); |
| DCHECK_LE(0, func_index); |
| DCHECK_LT(func_index, native_module_->num_functions()); |
| if (func_index < num_imported_functions) { |
| const FunctionSig* sig = |
| native_module_->module()->functions[func_index].sig; |
| WasmImportWrapperCache::CacheKey key( |
| compiler::kDefaultImportCallKind, sig, |
| static_cast<int>(sig->parameter_count())); |
| // If two imported functions have the same key, only one of them should |
| // have been added as a compilation unit, so this is always the first time |
| // a wrapper for this key is compiled here. |
| DCHECK_NULL((*cache)[key]); |
| (*cache)[key] = code.get(); |
| code->IncRef(); |
| } |
| } |
| PublishCode(VectorOf(unpublished_code)); |
| } |
| |
| void CompilationStateImpl::PublishCode(Vector<std::unique_ptr<WasmCode>> code) { |
| WasmCodeRefScope code_ref_scope; |
| std::vector<WasmCode*> published_code = |
| native_module_->PublishCode(std::move(code)); |
| // Defer logging code in case wire bytes were not fully received yet. |
| if (native_module_->HasWireBytes()) { |
| native_module_->engine()->LogCode(VectorOf(published_code)); |
| } |
| |
| OnFinishedUnits(VectorOf(std::move(published_code))); |
| } |
| |
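| // {SchedulePublishCompilationResults} below uses a "single publisher" idiom: |
| // the first thread to arrive becomes the publisher and keeps draining the |
| // shared queue, while later threads only enqueue and return. A minimal |
| // stand-alone sketch of the idiom with hypothetical names (not the actual |
| // fields used below): |
| // |
| //   { |
| //     base::MutexGuard guard(&mutex); |
| //     if (publisher_running) {  // Someone else will publish our work. |
| //       std::move(work.begin(), work.end(), std::back_inserter(queue)); |
| //       return; |
| //     } |
| //     publisher_running = true; |
| //   } |
| //   while (true) { |
| //     Publish(std::move(work));  // Expensive part, done without the lock. |
| //     base::MutexGuard guard(&mutex); |
| //     if (queue.empty()) { publisher_running = false; return; } |
| //     work = std::move(queue); |
| //     queue.clear(); |
| //   } |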
| void CompilationStateImpl::SchedulePublishCompilationResults( |
| std::vector<std::unique_ptr<WasmCode>> unpublished_code) { |
| { |
| base::MutexGuard guard(&publish_mutex_); |
| if (publisher_running_) { |
| // Add new code to the queue and return. |
| publish_queue_.reserve(publish_queue_.size() + unpublished_code.size()); |
| for (auto& c : unpublished_code) { |
| publish_queue_.emplace_back(std::move(c)); |
| } |
| return; |
| } |
| publisher_running_ = true; |
| } |
| while (true) { |
| PublishCompilationResults(std::move(unpublished_code)); |
| unpublished_code.clear(); |
| |
| // Keep publishing new code that came in. |
| base::MutexGuard guard(&publish_mutex_); |
| DCHECK(publisher_running_); |
| if (publish_queue_.empty()) { |
| publisher_running_ = false; |
| return; |
| } |
| unpublished_code.swap(publish_queue_); |
| } |
| } |
| |
| void CompilationStateImpl::ScheduleCompileJobForNewUnits() { |
| if (failed()) return; |
| |
| std::shared_ptr<JobHandle> new_job_handle; |
| { |
| base::MutexGuard guard(&mutex_); |
| if (current_compile_job_ && current_compile_job_->IsValid()) { |
| current_compile_job_->NotifyConcurrencyIncrease(); |
| return; |
| } |
| |
| std::unique_ptr<JobTask> new_compile_job = |
| std::make_unique<BackgroundCompileJob>(native_module_weak_, |
| async_counters_); |
| // TODO(wasm): Lower priority for TurboFan-only jobs. |
| new_job_handle = V8::GetCurrentPlatform()->PostJob( |
| has_priority_ ? TaskPriority::kUserBlocking |
| : TaskPriority::kUserVisible, |
| std::move(new_compile_job)); |
| current_compile_job_ = new_job_handle; |
| // Reset the priority. Later uses of the compilation state, e.g. for |
| // debugging, should compile with the default priority again. |
| has_priority_ = false; |
| } |
| |
| if (new_job_handle) { |
| native_module_->engine()->ShepherdCompileJobHandle( |
| std::move(new_job_handle)); |
| } |
| } |
| |
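| // Worked example for {NumOutstandingCompilations} below (hypothetical |
| // numbers): with 10 wrapper units and a next wrapper id of 7, three wrappers |
| // are outstanding. The id can also overshoot the unit count, because workers |
| // keep incrementing it after the last unit was handed out; the comparison |
| // below clamps that case to zero. |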
| size_t CompilationStateImpl::NumOutstandingCompilations() const { |
| size_t next_wrapper = js_to_wasm_wrapper_id_.load(std::memory_order_relaxed); |
| size_t outstanding_wrappers = |
| next_wrapper >= js_to_wasm_wrapper_units_.size() |
| ? 0 |
| : js_to_wasm_wrapper_units_.size() - next_wrapper; |
| size_t outstanding_functions = compilation_unit_queues_.GetTotalSize(); |
| return outstanding_wrappers + outstanding_functions; |
| } |
| |
| void CompilationStateImpl::SetError() { |
| compile_cancelled_.store(true, std::memory_order_relaxed); |
| if (compile_failed_.exchange(true, std::memory_order_relaxed)) { |
| return; // Already failed before. |
| } |
| |
| base::MutexGuard callbacks_guard(&callbacks_mutex_); |
| TriggerCallbacks(); |
| callbacks_.clear(); |
| } |
| |
| void CompilationStateImpl::WaitForCompilationEvent( |
| CompilationEvent expect_event) { |
| auto compilation_event_semaphore = std::make_shared<base::Semaphore>(0); |
| base::EnumSet<CompilationEvent> events{expect_event, |
| CompilationEvent::kFailedCompilation}; |
| { |
| base::MutexGuard callbacks_guard(&callbacks_mutex_); |
| if (finished_events_.contains_any(events)) return; |
| callbacks_.emplace_back( |
| [compilation_event_semaphore, events](CompilationEvent event) { |
| if (events.contains(event)) compilation_event_semaphore->Signal(); |
| }); |
| } |
| |
| constexpr JobDelegate* kNoDelegate = nullptr; |
| ExecuteCompilationUnits(native_module_weak_, async_counters_.get(), |
| kNoDelegate, kBaselineOnly); |
| compilation_event_semaphore->Wait(); |
| } |
| |
| namespace { |
| using JSToWasmWrapperQueue = |
| WrapperQueue<JSToWasmWrapperKey, base::hash<JSToWasmWrapperKey>>; |
| using JSToWasmWrapperUnitMap = |
| std::unordered_map<JSToWasmWrapperKey, |
| std::unique_ptr<JSToWasmWrapperCompilationUnit>, |
| base::hash<JSToWasmWrapperKey>>; |
| |
| class CompileJSToWasmWrapperJob final : public JobTask { |
| public: |
| CompileJSToWasmWrapperJob(JSToWasmWrapperQueue* queue, |
| JSToWasmWrapperUnitMap* compilation_units, |
| size_t max_concurrency) |
| : queue_(queue), |
| compilation_units_(compilation_units), |
| outstanding_units_(queue->size()) {} |
| |
| void Run(JobDelegate* delegate) override { |
| while (base::Optional<JSToWasmWrapperKey> key = queue_->pop()) { |
| JSToWasmWrapperCompilationUnit* unit = (*compilation_units_)[*key].get(); |
| unit->Execute(); |
| outstanding_units_.fetch_sub(1, std::memory_order_relaxed); |
| if (delegate->ShouldYield()) return; |
| } |
| } |
| |
| size_t GetMaxConcurrency(size_t /* worker_count */) const override { |
| // {outstanding_units_} includes the units that other workers are currently |
| // working on, so we can safely ignore the {worker_count} and just return |
| // the current number of outstanding units. |
| size_t flag_limit = |
| static_cast<size_t>(std::max(1, FLAG_wasm_num_compilation_tasks)); |
| return std::min(flag_limit, |
| outstanding_units_.load(std::memory_order_relaxed)); |
| } |
| |
| private: |
| JSToWasmWrapperQueue* const queue_; |
| JSToWasmWrapperUnitMap* const compilation_units_; |
| std::atomic<size_t> outstanding_units_; |
| }; |
| } // namespace |
| |
| void CompileJsToWasmWrappers(Isolate* isolate, const WasmModule* module, |
| Handle<FixedArray>* export_wrappers_out) { |
| *export_wrappers_out = isolate->factory()->NewFixedArray( |
| MaxNumExportWrappers(module), AllocationType::kOld); |
| |
| JSToWasmWrapperQueue queue; |
| JSToWasmWrapperUnitMap compilation_units; |
| WasmFeatures enabled_features = WasmFeatures::FromIsolate(isolate); |
| |
| // Prepare compilation units in the main thread. |
| for (auto exp : module->export_table) { |
| if (exp.kind != kExternalFunction) continue; |
| auto& function = module->functions[exp.index]; |
| JSToWasmWrapperKey key(function.imported, *function.sig); |
| if (queue.insert(key)) { |
| auto unit = std::make_unique<JSToWasmWrapperCompilationUnit>( |
| isolate, isolate->wasm_engine(), function.sig, module, |
| function.imported, enabled_features, |
| JSToWasmWrapperCompilationUnit::kAllowGeneric); |
| compilation_units.emplace(key, std::move(unit)); |
| } |
| } |
| |
| // Execute wrapper compilation in the background. |
| int flag_value = FLAG_wasm_num_compilation_tasks; |
| size_t max_concurrency = flag_value < 1 ? std::numeric_limits<size_t>::max() |
| : static_cast<size_t>(flag_value); |
| auto job = std::make_unique<CompileJSToWasmWrapperJob>( |
| &queue, &compilation_units, max_concurrency); |
| auto job_handle = V8::GetCurrentPlatform()->PostJob( |
| TaskPriority::kUserVisible, std::move(job)); |
| |
| // Wait for completion, while contributing to the work. |
| job_handle->Join(); |
| |
| // Finalize compilation jobs in the main thread. |
| // TODO(6792): Wrappers below are allocated with {Factory::NewCode}. As an |
| // optimization we keep the code space unlocked to avoid repeated unlocking |
| // because many such wrappers are allocated in sequence below. |
| CodeSpaceMemoryModificationScope modification_scope(isolate->heap()); |
| for (auto& pair : compilation_units) { |
| JSToWasmWrapperKey key = pair.first; |
| JSToWasmWrapperCompilationUnit* unit = pair.second.get(); |
| Handle<Code> code = unit->Finalize(isolate); |
| int wrapper_index = GetExportWrapperIndex(module, &key.second, key.first); |
| (*export_wrappers_out)->set(wrapper_index, *code); |
| RecordStats(*code, isolate->counters()); |
| } |
| } |
| |
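| // A minimal sketch of how {CompileImportWrapper} below is meant to be called |
| // (hypothetical call site; the surrounding instantiation logic is assumed): |
| // the caller holds a {ModificationScope} on the import wrapper cache, checks |
| // that no code exists for the key yet, and only then compiles: |
| // |
| //   WasmImportWrapperCache::ModificationScope cache_scope( |
| //       native_module->import_wrapper_cache()); |
| //   WasmImportWrapperCache::CacheKey key(kind, sig, expected_arity); |
| //   WasmCode* wrapper = cache_scope[key]; |
| //   if (wrapper == nullptr) { |
| //     wrapper = CompileImportWrapper(wasm_engine, native_module, counters, |
| //                                    kind, sig, expected_arity, &cache_scope); |
| //   } |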
| WasmCode* CompileImportWrapper( |
| WasmEngine* wasm_engine, NativeModule* native_module, Counters* counters, |
| compiler::WasmImportCallKind kind, const FunctionSig* sig, |
| int expected_arity, |
| WasmImportWrapperCache::ModificationScope* cache_scope) { |
| // The cache entry should already exist (so that we don't insert a new one |
| // and invalidate other threads' iterators/references), but it should not |
| // have been compiled yet. |
| WasmImportWrapperCache::CacheKey key(kind, sig, expected_arity); |
| DCHECK_NULL((*cache_scope)[key]); |
| bool source_positions = is_asmjs_module(native_module->module()); |
| // Keep the {WasmCode} alive until we explicitly call {IncRef}. |
| WasmCodeRefScope code_ref_scope; |
| CompilationEnv env = native_module->CreateCompilationEnv(); |
| WasmCompilationResult result = compiler::CompileWasmImportCallWrapper( |
| wasm_engine, &env, kind, sig, source_positions, expected_arity); |
| std::unique_ptr<WasmCode> wasm_code = native_module->AddCode( |
| result.func_index, result.code_desc, result.frame_slot_count, |
| result.tagged_parameter_slots, |
| result.protected_instructions_data.as_vector(), |
| result.source_positions.as_vector(), GetCodeKind(result), |
| ExecutionTier::kNone, kNoDebugging); |
| WasmCode* published_code = native_module->PublishCode(std::move(wasm_code)); |
| (*cache_scope)[key] = published_code; |
| published_code->IncRef(); |
| counters->wasm_generated_code_size()->Increment( |
| published_code->instructions().length()); |
| counters->wasm_reloc_size()->Increment(published_code->reloc_info().length()); |
| return published_code; |
| } |
| |
| } // namespace wasm |
| } // namespace internal |
| } // namespace v8 |
| |
| #undef TRACE_COMPILE |
| #undef TRACE_STREAMING |
| #undef TRACE_LAZY |