/*
* Copyright 2016 WebAssembly Community Group participants
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
//
// Removes module elements that are not needed: functions, globals, tags, etc.
// Basically "global dead code elimination" but not just for code.
//
// To do this optimally, we need to consider that an element may be in one of
// three states:
//
// * No references at all. We can simply remove it.
// * References, but no uses. We can't remove it, but we can change it (see
// below).
// * Uses (which imply references). We must keep it as it is, because it is
// fully used (e.g. for a function, it is called and may execute).
//
// An example of something with a reference but *not* a use is a RefFunc to a
// function that has no corresponding CallRef of its type. We cannot just
// remove the function, since the RefFunc must refer to an actual entity in the
// IR, but we know it isn't actually used/called, so we can change it - we can
// empty out the body and put an unreachable there, for example. That is, a
// reference forces us to keep something in the IR to be referred to, but only
// a use actually makes us keep its contents as well.
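//
// A minimal sketch in wat (names are hypothetical) of a reference that is not
// a use:
//
//   (func $foo (result i32)
//     (i32.const 42) ;; no use exists: the body can become (unreachable)
//   )
//   (func $main
//     (drop (ref.func $foo)) ;; a reference, but no call_ref of $foo's type
//   )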
//
#include <memory>
#include <optional>
#include <vector>
#include "ir/element-utils.h"
#include "ir/find_all.h"
#include "ir/intrinsics.h"
#include "ir/module-utils.h"
#include "ir/struct-utils.h"
#include "ir/subtypes.h"
#include "ir/utils.h"
#include "pass.h"
#include "support/insert_ordered.h"
#include "support/stdckdint.h"
#include "support/utilities.h"
#include "wasm-builder.h"
#include "wasm-traversal.h"
#include "wasm.h"
namespace wasm {
// TODO: remove this alias
using ModuleElementKind = ModuleItemKind;
// An element in the module that we track: a kind (function, global, etc.) + the
// name of the particular element.
using ModuleElement = std::pair<ModuleElementKind, Name>;
// Information from an indirect call: the name of the table, and the heap type.
using IndirectCall = std::pair<Name, HeapType>;
// Visit or walk an expression to find important things. We note them on data
// structures that the caller can then process.
//
// We could in theory merge this class into Analyzer, allowing us to apply
// our findings directly - that is, rather than adding to a data structure
// that the caller then iterates over, calling a method on each item, we
// could call that method as we go. However, separating the classes is
// simpler, as we need
// different handling in different cases (when scanning for references vs when
// scanning normally, see below).
//
// In theory we could parallelize this class, processing all functions in
// advance, rather than as we go (single-threaded). However, this turns out not
// to be faster in practice (perhaps because the single-threaded approach uses
// less memory).
struct Noter : public PostWalker<Noter, UnifiedExpressionVisitor<Noter>> {
// We mark both uses and references, and also note specific things that
// require special handling, like refFuncs.
std::vector<ModuleElement> used, referenced;
std::vector<HeapType> callRefTypes;
std::vector<Name> refFuncs;
std::vector<StructField> structFields;
std::vector<IndirectCall> indirectCalls;
// Note an item on our output data structures.
void use(ModuleElement element) { used.push_back(element); }
void reference(ModuleElement element) { referenced.push_back(element); }
void noteCallRef(HeapType type) { callRefTypes.push_back(type); }
void noteRefFunc(Name refFunc) { refFuncs.push_back(refFunc); }
void noteStructField(StructField structField) {
structFields.push_back(structField);
}
void noteIndirectCall(Name table, HeapType type) {
indirectCalls.push_back({table, type});
}
// Generic visitor: Use all the things referenced. This handles e.g. using the
// table of a table.get. When we do not want such unconditional use, we
// override (e.g. for call_indirect, we don't want to mark the entire table as
// used; see below).
void visitExpression(Expression* curr) {
#define DELEGATE_ID curr->_id
#define DELEGATE_START(id) [[maybe_unused]] auto* cast = curr->cast<id>();
#define DELEGATE_GET_FIELD(id, field) cast->field
#define DELEGATE_FIELD_TYPE(id, field)
#define DELEGATE_FIELD_HEAPTYPE(id, field)
#define DELEGATE_FIELD_CHILD(id, field)
#define DELEGATE_FIELD_OPTIONAL_CHILD(id, field)
#define DELEGATE_FIELD_INT(id, field)
#define DELEGATE_FIELD_LITERAL(id, field)
#define DELEGATE_FIELD_NAME(id, field)
#define DELEGATE_FIELD_SCOPE_NAME_DEF(id, field)
#define DELEGATE_FIELD_SCOPE_NAME_USE(id, field)
#define DELEGATE_FIELD_ADDRESS(id, field)
#define DELEGATE_FIELD_NAME_KIND(id, field, kind) \
if (cast->field.is()) { \
use({kind, cast->field}); \
}
#include "wasm-delegations-fields.def"
}
// Specific visitors
void visitCall(Call* curr) {
use({ModuleElementKind::Function, curr->target});
if (Intrinsics(*getModule()).isCallWithoutEffects(curr)) {
// A call-without-effects receives a function reference and calls it, the
// same as a CallRef. When we have a flag for non-closed-world, we should
// handle this automatically by the reference flowing out to an import,
// which is what binaryen intrinsics look like. For now, to support use
// cases that assume a closed world but also use this intrinsic, handle the
// intrinsic specifically here. (Without that, the closed world assumption
// makes us ignore the function ref that flows to an import, so we are not
// aware that it is actually called.)
auto* target = curr->operands.back();
if (auto* refFunc = target->dynCast<RefFunc>()) {
// We can see exactly where this goes.
Call call(getModule()->allocator);
call.target = refFunc->func;
visitCall(&call);
} else {
// All we can see is the type, so do a CallRef of that.
CallRef callRef(getModule()->allocator);
callRef.target = target;
visitCallRef(&callRef);
}
}
}
void visitCallIndirect(CallIndirect* curr) {
// We refer to the table, but may not use all parts of it; that depends on
// the heap type we call with.
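// For example (illustrative wat), a call_indirect such as
//
//   (call_indirect $table (type $sig) ..args.. (..index..))
//
// references $table but only uses the functions in it whose type can match
// $sig.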
reference({ModuleElementKind::Table, curr->table});
noteIndirectCall(curr->table, curr->heapType);
// Note a possible call of a function reference as well, as something might
// be written into the table during runtime. With precise tracking of what
// is written into the table we could do better here; we could also see
// which tables are immutable. TODO
noteCallRef(curr->heapType);
}
void visitCallRef(CallRef* curr) {
// Ignore unreachable code.
if (!curr->target->type.isRef()) {
return;
}
noteCallRef(curr->target->type.getHeapType());
}
void visitRefFunc(RefFunc* curr) { noteRefFunc(curr->func); }
void visitStructGet(StructGet* curr) {
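// Ignore unreachable code, and references of null type (reading from a
// definite null traps and reads no field).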
if (curr->ref->type == Type::unreachable || curr->ref->type.isNull()) {
return;
}
auto type = curr->ref->type.getHeapType();
noteStructField(StructField{type, curr->index});
}
void visitContNew(ContNew* curr) {
// The function reference that is passed in here will be called, just as with
// a call_ref, except at a potentially later time.
if (!curr->func->type.isRef()) {
return;
}
noteCallRef(curr->func->type.getHeapType());
}
};
// Analyze a module to find what things are referenced and what things are used.
struct Analyzer {
Module* module;
const PassOptions& options;
// The set of all things we've seen used so far.
std::unordered_set<ModuleElement> used;
// Things for which there is a reference, but which may be unused. It is ok
// for a thing to appear both in |used| and here; we will check |used| first
// anyhow.
// (That is, we don't need to be careful to remove things from here if they
// begin as referenced and later become used; and we don't need to add things
// to here if they are both used and referenced.)
std::unordered_set<ModuleElement> referenced;
// A queue of used module elements that we need to process. These appear in
// |used|, and the work we do when we pop them from the queue is to look at
// the things they reach that might become referenced or used.
std::vector<ModuleElement> moduleQueue;
// A stack of used expressions to walk. We do *not* use the normal
// walking mechanism because we need more control. Specifically, we may defer
// certain walks, such as this:
//
// (struct.new $Foo
// (global.get $bar)
// )
//
// If we walked the child immediately then we would make $bar used. But that
// global is only used if we actually read that field from the struct. We
// perform that analysis using readStructFields and unreadStructFieldExprMap,
// below.
std::vector<Expression*> expressionQueue;
// The signatures that we have seen a call_ref for. When we see a RefFunc of a
// signature in here, we know it is used; otherwise it may only be referred
// to.
std::unordered_set<HeapType> calledSignatures;
// All the RefFuncs we've seen, grouped by heap type. When we see a CallRef of
// one of the types here, we know all the RefFuncs corresponding to it are
// potentially used (and also those of subtypes). This is the reverse side of
// calledSignatures: for a function to be used via a reference, we need the
// combination of a RefFunc of it as well as a CallRef of that, and we may see
// them in any order. (Or, if the RefFunc is in a table, we need a
// CallIndirect, which is handled in the table logic.)
//
// After we see a call for a type, we can clear out the entry here for it, as
// we'll have that type in calledSignatures, and so this contains only
// RefFuncs that we have not seen a call for yet, hence "uncalledRefFuncMap."
//
// We can only do this when assuming a closed world. TODO: In an open world we
// could carefully track which types actually escape out to exports or
// imports.
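//
// A small sketch in wat (names hypothetical) of the two orderings we must
// handle:
//
//   (global $g (ref $sig) (ref.func $f)) ;; RefFunc: may be seen first
//   (func $caller (param $r (ref $sig))
//     (call_ref $sig (local.get $r)) ;; CallRef: when seen, makes $f used
//   )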
std::unordered_map<HeapType, std::unordered_set<Name>> uncalledRefFuncMap;
// Similar to calledSignatures/uncalledRefFuncMap, we store the StructFields
// we've seen reads from, and also expressions stored in such fields that
// could be read if ever we see a read of that field in the future. That is,
// for an expression stored into a struct field to be read, we need to both
// see that expression written to the field, and see some other place read
// that field (similar to with functions that we need to see the RefFunc and
// also a CallRef that can actually call it).
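//
// A minimal sketch in wat (names hypothetical): the write alone does not make
// $f used; a read of the same field somewhere else does.
//
//   (struct.new $T
//     (ref.func $f) ;; stays unread unless...
//   )
//   (struct.get $T 0 (..)) ;; ...a read of $T's field 0 appears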
std::unordered_set<StructField> readStructFields;
std::unordered_map<StructField, std::vector<Expression*>>
unreadStructFieldExprMap;
Analyzer(Module* module,
const PassOptions& options,
const std::vector<ModuleElement>& roots)
: module(module), options(options) {
// All roots are used.
for (auto& element : roots) {
use(element);
}
// Main loop on both the module and the expression queues.
while (processExpressions() || processModule()) {
}
}
// Process expressions in the expression queue while we have any, visiting
// them (using their contents) and adding children. Returns whether we did any
// work.
bool processExpressions() {
bool worked = false;
while (expressionQueue.size()) {
worked = true;
auto* curr = expressionQueue.back();
expressionQueue.pop_back();
// Find what this expression uses and references, and apply those findings
// below.
Noter noter;
noter.setModule(module);
noter.visit(curr);
for (auto element : noter.used) {
use(element);
}
for (auto element : noter.referenced) {
reference(element);
}
for (auto type : noter.callRefTypes) {
useCallRefType(type);
}
for (auto func : noter.refFuncs) {
useRefFunc(func);
}
for (auto structField : noter.structFields) {
useStructField(structField);
}
for (auto call : noter.indirectCalls) {
useIndirectCall(call);
}
// Scan the children to continue our work.
scanChildren(curr);
}
return worked;
}
// We'll compute SubTypes if we need them.
std::optional<SubTypes> subTypes;
void useCallRefType(HeapType type) {
if (type.isBasic()) {
// Nothing to do for something like a bottom type; attempts to call such a
// type will trap at runtime.
return;
}
if (!subTypes) {
subTypes = SubTypes(*module);
}
// Call all the functions of that signature, and subtypes. We can then
// forget about them, as those signatures will be marked as called.
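// For example, if $sub is a subtype of $sig, then a ref.func of type $sub
// can flow into a call_ref of $sig, so functions of type $sub become used
// here as well.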
for (auto subType : subTypes->getSubTypes(type)) {
auto iter = uncalledRefFuncMap.find(subType);
if (iter != uncalledRefFuncMap.end()) {
// We must not have a type in both calledSignatures and
// uncalledRefFuncMap: once it is called, we do not track RefFuncs for
// it any more.
assert(calledSignatures.count(subType) == 0);
for (Name target : iter->second) {
use({ModuleElementKind::Function, target});
}
uncalledRefFuncMap.erase(iter);
}
calledSignatures.insert(subType);
}
}
std::unordered_set<IndirectCall> usedIndirectCalls;
void useIndirectCall(IndirectCall call) {
auto [_, inserted] = usedIndirectCalls.insert(call);
if (!inserted) {
return;
}
// TODO: Use structured bindings here once we have C++20, which allows
// capturing them in the lambda below.
auto table = call.first;
auto type = call.second;
// Any function in the table with a matching signature may be called.
ModuleUtils::iterTableSegments(
*module, table, [&](ElementSegment* segment) {
auto segmentReferenced = false;
for (auto* item : segment->data) {
if (auto* refFunc = item->dynCast<RefFunc>()) {
auto* func = module->getFunction(refFunc->func);
if (HeapType::isSubType(func->type.getHeapType(), type)) {
use({ModuleElementKind::Function, refFunc->func});
segmentReferenced = true;
}
}
}
if (segmentReferenced) {
reference({ModuleElementKind::ElementSegment, segment->name});
}
});
}
void useRefFunc(Name func) {
if (!options.closedWorld) {
// The world is open, so assume the worst and something (inside or outside
// of the module) can call this.
use({ModuleElementKind::Function, func});
return;
}
// Otherwise, we are in a closed world, and so we can try to optimize the
// case where the target function is referenced but not used.
auto element = ModuleElement{ModuleElementKind::Function, func};
auto type = module->getFunction(func)->type.getHeapType();
if (calledSignatures.count(type)) {
// We must not have a type in both calledSignatures and
// uncalledRefFuncMap: once it is called, we do not track RefFuncs for it
// any more.
assert(uncalledRefFuncMap.count(type) == 0);
// We've seen a RefFunc for this, so it is used.
use(element);
} else {
// We've never seen a CallRef for this, but might see one later.
uncalledRefFuncMap[type].insert(func);
reference(element);
}
}
void useStructField(StructField structField) {
if (!readStructFields.count(structField)) {
// Avoid structured bindings, as the C++ spec does not allow capturing them
// in lambdas, which we need below.
auto type = structField.first;
auto index = structField.second;
// This is the first time we see a read of this field. Note that it is
// read, and do the same for all subtypes, since we might be reading from
// them as well.
if (!subTypes) {
subTypes = SubTypes(*module);
}
subTypes->iterSubTypes(type, [&](HeapType subType, Index depth) {
auto subStructField = StructField{subType, index};
readStructFields.insert(subStructField);
// Walk all the unread data we've queued: we queued it for the
// possibility of it ever being read, which just happened.
auto iter = unreadStructFieldExprMap.find(subStructField);
if (iter != unreadStructFieldExprMap.end()) {
for (auto* expr : iter->second) {
use(expr);
}
}
unreadStructFieldExprMap.erase(subStructField);
});
}
}
// As processExpressions, but for module elements.
bool processModule() {
bool worked = false;
while (moduleQueue.size()) {
worked = true;
auto curr = moduleQueue.back();
moduleQueue.pop_back();
assert(used.count(curr));
auto& [kind, value] = curr;
switch (kind) {
case ModuleElementKind::Function: {
// if not an import, walk it
auto* func = module->getFunction(value);
if (!func->imported()) {
use(func->body);
}
break;
}
case ModuleElementKind::Global: {
// if not imported, it has an init expression we can walk
auto* global = module->getGlobal(value);
if (!global->imported()) {
use(global->init);
}
break;
}
case ModuleElementKind::Tag:
break;
case ModuleElementKind::Memory:
ModuleUtils::iterMemorySegments(
*module, value, [&](DataSegment* segment) {
if (!segment->data.empty()) {
use({ModuleElementKind::DataSegment, segment->name});
}
});
break;
case ModuleElementKind::Table:
ModuleUtils::iterTableSegments(
*module, value, [&](ElementSegment* segment) {
if (!segment->data.empty()) {
use({ModuleElementKind::ElementSegment, segment->name});
}
});
break;
case ModuleElementKind::DataSegment: {
auto* segment = module->getDataSegment(value);
if (segment->offset) {
use(segment->offset);
use({ModuleElementKind::Memory, segment->memory});
}
break;
}
case ModuleElementKind::ElementSegment: {
auto* segment = module->getElementSegment(value);
if (segment->offset) {
use(segment->offset);
use({ModuleElementKind::Table, segment->table});
}
for (auto* expr : segment->data) {
use(expr);
}
break;
}
default: {
WASM_UNREACHABLE("invalid kind");
}
}
}
return worked;
}
// Mark something as used, if it hasn't already been, and if so add it to the
// queue so we can process the things it can reach.
void use(ModuleElement element) {
auto [_, inserted] = used.emplace(element);
if (inserted) {
moduleQueue.emplace_back(element);
}
}
void use(ModuleElementKind kind, Name value) {
use(ModuleElement(kind, value));
}
void use(Expression* curr) {
// For expressions we do not need to check if they have already been seen:
// the tree structure guarantees that traversing children, recursively, will
// only visit each expression once, since each expression has a single
// parent.
expressionQueue.emplace_back(curr);
}
// Add the children of a used expression to be walked, if we should do so.
void scanChildren(Expression* curr) {
// For now, the only special handling we have is for the fields of
// struct.new, whose walking we defer until we know there is a read that can
// actually read them; see the comments above on |expressionQueue|. We can
// only do that optimization in a closed world (as otherwise the field might
// be read outside of the code we can see), and when the struct.new is
// reachable (if it is unreachable then we don't know the type, and we can
// leave it to DCE to remove).
if (!options.closedWorld || curr->type == Type::unreachable ||
!curr->is<StructNew>()) {
for (auto* child : ChildIterator(curr)) {
use(child);
}
return;
}
auto* new_ = curr->cast<StructNew>();
// Use the descriptor right now, in the normal way. We only have a special
// optimization for struct.new operands, below, because it is not needed
// for descriptors: a descriptor must be a struct, and our "lazy reading"
// optimization operates on it (if it could be a function, then we'd need to
// do more here). In other words, descriptor reads always have a struct "in
// the middle", that we can optimize, like here:
//
// (struct.new $A
// (ref.func $c)
// (struct.new $A.desc
// (ref.func $d)
// )
// )
//
// The struct has a ref.func in it, and the descriptor does as well. If we
// never read field 0 from $A then we can avoid marking $c as reached; this
// is the usual struct optimization we do, below. And if we never read the
// descriptor, then we also never read field 0 from $A.desc; that is, the
// usual struct optimization on the descriptor class is enough for us to
// avoid marking $d as reached.
if (new_->desc) {
use(new_->desc);
}
auto type = new_->type.getHeapType();
for (Index i = 0; i < new_->operands.size(); i++) {
auto* operand = new_->operands[i];
auto structField = StructField{type, i};
// If this struct field has already been read, then we should use the
// contents there now.
auto useOperandNow = readStructFields.count(structField);
// Side effects are tricky to reason about - the side effects must happen
// even if we never read the struct field - so give up and consider it
// used.
if (!useOperandNow) {
useOperandNow =
EffectAnalyzer(options, *module, operand).hasSideEffects();
}
// We must handle the call.without.effects intrinsic here in a special
// manner. That intrinsic is reported as having no side effects in
// EffectAnalyzer, but even though for optimization purposes we can ignore
// effects, the called code *is* actually reached, and it might have side
// effects. In other words, the point of the intrinsic is to temporarily
// ignore those effects during one phase of optimization. Or, put another
// way, the intrinsic lets us ignore the effects of computing some value,
// but we do still need to compute that value if it is received and used
// (if it is not received and used, other passes will remove it).
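// A sketch of the pattern (illustrative wat; the import is the
// "binaryen-intrinsics" "call.without.effects" intrinsic):
//
//   (struct.new $T
//     ;; reported as effect-free, but $f may really be called
//     (call $call.without.effects .. (ref.func $f))
//   )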
if (!useOperandNow) {
// To detect this, look for any call. A non-intrinsic call would have
// already been detected when we looked for side effects, so this will
// only notice intrinsic calls.
useOperandNow = !FindAll<Call>(operand).list.empty();
}
if (useOperandNow) {
use(operand);
} else {
// This data does not need to be read now, but might be read later. Note
// it as unread.
unreadStructFieldExprMap[structField].push_back(operand);
// We also must note that anything in this operand is referenced, even
// if it never ends up used, so the IR remains valid.
addReferences(operand);
}
}
}
// Add references to all things appearing in an expression. This is called
// when we know an expression will appear in the output, which means it must
// remain valid IR and not refer to nonexistent things.
//
// This is only called on things without side effects (if there are such
// effects then we would have had to assume the worst earlier, and not get
// here).
void addReferences(Expression* curr) {
// Find references anywhere in this expression so we can apply them.
Noter noter;
noter.setModule(module);
noter.walk(curr);
for (auto element : noter.used) {
reference(element);
}
for (auto element : noter.referenced) {
reference(element);
}
for (auto func : noter.refFuncs) {
// If a function ends up referenced but not used then later down we will
// empty it out by replacing its body with an unreachable, which always
// validates. For that reason all we need to do here is mark the function
// as referenced - we don't need to do anything with the body.
//
// Note that it is crucial that we do not call useRefFunc() here: we are
// just adding a reference to the function, and not actually using the
// RefFunc. (Only useRefFunc() + a CallRef of the proper type are enough
// to make a function itself used.)
reference({ModuleElementKind::Function, func});
}
// Note: nothing to do with |callRefTypes| and |structFields|, which only
// involve types. This function only cares about references to module
// elements like functions, globals, and tables. (References to types are
// handled in an entirely different way in Binaryen IR, and we don't need to
// worry about it.)
}
void reference(ModuleElement element) {
// Avoid repeated work. Note that globals with multiple references to
// previous globals can lead to exponential work, so this is important.
// (If C refers twice to B, and B refers twice to A, then when we process
// C we would, naively, scan B twice and A four times.)
auto [_, inserted] = referenced.insert(element);
if (!inserted) {
return;
}
// Some references force references to their internals, just by being
// referenced and present in the output.
auto& [kind, value] = element;
if (kind == ModuleElementKind::Global) {
// Like functions, (non-imported) globals have contents. For functions,
// things are simple: if a function ends up with references but no uses
// then we can simply empty out the function (by setting its body to an
// unreachable). We don't have a simple way to do the same for globals,
// unfortunately. For now, scan the global's contents and add references
// as needed.
// TODO: We could try to empty the global out, for example, replace it
// with a null if it is nullable, or replace all gets of it with
// something else, but that is not trivial.
auto* global = module->getGlobal(value);
if (!global->imported()) {
// Note that infinite recursion is not a danger here since a global
// can only refer to previous globals.
addReferences(global->init);
}
} else if (kind == ModuleElementKind::ElementSegment) {
// TODO: We could empty out parts of the segment we don't need.
auto* segment = module->getElementSegment(value);
for (auto* item : segment->data) {
addReferences(item);
}
}
}
};
struct RemoveUnusedModuleElements : public Pass {
// This pass only removes module elements; it never modifies function
// contents (except to replace an entire body with unreachable, which does not
// cause any need for local fixups).
bool requiresNonNullableLocalFixups() override { return false; }
bool rootAllFunctions;
RemoveUnusedModuleElements(bool rootAllFunctions)
: rootAllFunctions(rootAllFunctions) {}
void run(Module* module) override {
prepare(module);
std::vector<ModuleElement> roots;
// Module start is a root.
if (module->start.is()) {
auto startFunction = module->getFunction(module->start);
// Can be skipped if the start function is empty.
if (!startFunction->imported() && startFunction->body->is<Nop>()) {
module->start = Name{};
} else {
roots.emplace_back(ModuleElementKind::Function, module->start);
}
}
// If told to, root all the functions.
if (rootAllFunctions) {
ModuleUtils::iterDefinedFunctions(*module, [&](Function* func) {
roots.emplace_back(ModuleElementKind::Function, func->name);
});
}
// Exports are roots.
for (auto& curr : module->exports) {
if (curr->kind == ExternalKind::Function) {
roots.emplace_back(ModuleElementKind::Function,
*curr->getInternalName());
} else if (curr->kind == ExternalKind::Global) {
roots.emplace_back(ModuleElementKind::Global, *curr->getInternalName());
} else if (curr->kind == ExternalKind::Tag) {
roots.emplace_back(ModuleElementKind::Tag, *curr->getInternalName());
} else if (curr->kind == ExternalKind::Table) {
roots.emplace_back(ModuleElementKind::Table, *curr->getInternalName());
} else if (curr->kind == ExternalKind::Memory) {
roots.emplace_back(ModuleElementKind::Memory, *curr->getInternalName());
}
}
// Active segments that write to imported tables and memories are roots
// because those writes are externally observable even if the module does
// not otherwise use the tables or memories.
//
// Likewise, if traps are possible during startup then just trapping is an
// effect (which can happen if the offset is out of bounds).
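//
// For example (hypothetical numbers), a 10-byte data segment at constant
// offset 65530 in a 1-page (65536-byte) memory writes up to offset 65540,
// which is out of bounds, so instantiation may trap and the segment must
// remain a root.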
auto maybeRootSegment = [&](ModuleElementKind kind,
Name segmentName,
Index segmentSize,
Expression* offset,
Importable* parent,
Index parentSize) {
auto writesToVisible = parent->imported() && segmentSize;
auto mayTrap = false;
if (!getPassOptions().trapsNeverHappen) {
// Check if this might trap. If it is obviously in bounds then it
// cannot.
auto* c = offset->dynCast<Const>();
// Check for overflow in the largest possible space of addresses.
using AddressType = Address::address64_t;
AddressType maxWritten;
// If there is no constant offset, or if there is one and the addition
// overflows or leads to a too-large value, then we may trap.
mayTrap = !c ||
std::ckd_add(&maxWritten,
(AddressType)segmentSize,
(AddressType)c->value.getInteger()) ||
maxWritten > parentSize;
}
if (writesToVisible || mayTrap) {
roots.emplace_back(kind, segmentName);
}
};
ModuleUtils::iterActiveDataSegments(*module, [&](DataSegment* segment) {
if (segment->memory.is()) {
auto* memory = module->getMemory(segment->memory);
maybeRootSegment(ModuleElementKind::DataSegment,
segment->name,
segment->data.size(),
segment->offset,
memory,
memory->initial * Memory::kPageSize);
}
});
ModuleUtils::iterActiveElementSegments(
*module, [&](ElementSegment* segment) {
if (segment->table.is()) {
auto* table = module->getTable(segment->table);
maybeRootSegment(ModuleElementKind::ElementSegment,
segment->name,
segment->data.size(),
segment->offset,
table,
table->initial * Table::kPageSize);
}
});
// Just as out-of-bounds segments may cause observable traps at instantiation
// time, so can struct.new instructions with null descriptors cause traps in
// global or element segment initializers.
if (!getPassOptions().trapsNeverHappen) {
for (auto& segment : module->elementSegments) {
for (auto* init : segment->data) {
if (isMaybeTrappingInit(*module, init)) {
roots.emplace_back(ModuleElementKind::ElementSegment,
segment->name);
break;
}
}
}
for (auto& global : module->globals) {
if (auto* init = global->init;
init && isMaybeTrappingInit(*module, init)) {
roots.emplace_back(ModuleElementKind::Global, global->name);
}
}
}
// Analyze the module.
auto& options = getPassOptions();
Analyzer analyzer(module, options, roots);
// Remove unneeded elements.
auto needed = [&](ModuleElement element) {
// We need to emit something in the output if it has either a reference or
// a use. Situations where we can do better (for the case of a reference
// without any use) are handled separately below.
return analyzer.used.count(element) || analyzer.referenced.count(element);
};
module->removeFunctions([&](Function* curr) {
auto element = ModuleElement{ModuleElementKind::Function, curr->name};
if (analyzer.used.count(element)) {
// This is used.
return false;
}
if (analyzer.referenced.count(element)) {
// This is not used, but has a reference. See the comment above on
// uncalledRefFuncMap.
if (!curr->imported()) {
curr->body = Builder(*module).makeUnreachable();
}
return false;
}
// The function is not used or referenced; remove it entirely.
return true;
});
module->removeGlobals([&](Global* curr) {
// See TODO in addReferences - we may be able to do better here.
return !needed({ModuleElementKind::Global, curr->name});
});
module->removeTags([&](Tag* curr) {
return !needed({ModuleElementKind::Tag, curr->name});
});
module->removeMemories([&](Memory* curr) {
return !needed(ModuleElement(ModuleElementKind::Memory, curr->name));
});
module->removeTables([&](Table* curr) {
return !needed(ModuleElement(ModuleElementKind::Table, curr->name));
});
module->removeDataSegments([&](DataSegment* curr) {
return !needed(ModuleElement(ModuleElementKind::DataSegment, curr->name));
});
module->removeElementSegments([&](ElementSegment* curr) {
return !needed({ModuleElementKind::ElementSegment, curr->name});
});
// TODO: After removing elements, we may be able to remove more things, and
// should continue to work. (For example, after removing a reference
// to a function from an element segment, we may be able to remove
// that function, etc.)
}
// Do simple work that prepares the module to be efficiently optimized.
void prepare(Module* module) {
// FIXME Disable these optimizations for now, as they uncovered bugs in
// both LLVM and Binaryen,
// https://github.com/WebAssembly/binaryen/pull/6026#issuecomment-1775674882
return;
// If a function export is a function that just calls another function, we
// can export that one directly. Doing so might make the function in the
// middle unused:
//
// (export "export" (func $middle))
// (func $middle
// (call $real)
// )
//
// =>
//
// (export "export" (func $real)) ;; this changed
// (func $middle
// (call $real)
// )
//
// (Normally this is not needed, as inlining will end up removing such
// silly trampoline functions, but the case of an import being exported does
// not have any code for inlining to work with, so we need to handle it
// directly.)
for (auto& exp : module->exports) {
if (exp->kind != ExternalKind::Function) {
continue;
}
auto* name = exp->getInternalName();
auto* func = module->getFunction(*name);
if (!func->body) {
continue;
}
auto* call = func->body->dynCast<Call>();
if (!call) {
continue;
}
// Don't do this if the type is different, as then we might be
// changing the external interface to the module.
auto* calledFunc = module->getFunction(call->target);
if (calledFunc->type != func->type) {
continue;
}
// Finally, all the params must simply be forwarded.
auto ok = true;
for (Index i = 0; i < call->operands.size(); i++) {
auto* get = call->operands[i]->dynCast<LocalGet>();
if (!get || get->index != i) {
ok = false;
break;
}
}
if (ok) {
*name = calledFunc->name;
}
}
}
bool isMaybeTrappingInit(Module& wasm, Expression* root) {
// Traverse the expression, looking for nullable descriptors passed to
// struct.new. The descriptors might be null, which is the only situation
// (beyond exceeding implementation limits, which we don't model) that can
// lead a constant expression to trap. We depend on other optimizations to
// make the descriptors non-nullable if we can determine that they are not
// null.
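// A sketch in wat (names hypothetical) of an init that may trap:
//
//   (global $g (ref $T)
//     (struct.new $T (global.get $desc)) ;; traps if $desc is null
//   )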
struct NullDescFinder : PostWalker<NullDescFinder> {
bool mayTrap = false;
void visitStructNew(StructNew* curr) {
if (curr->desc && curr->desc->type.isNullable()) {
mayTrap = true;
}
}
};
NullDescFinder finder;
finder.walk(root);
return finder.mayTrap;
}
};
Pass* createRemoveUnusedModuleElementsPass() {
return new RemoveUnusedModuleElements(false);
}
Pass* createRemoveUnusedNonFunctionModuleElementsPass() {
return new RemoveUnusedModuleElements(true);
}
} // namespace wasm