| /* |
| * Copyright 2016 WebAssembly Community Group participants |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| // |
| // Removes module elements that are not needed: functions, globals, tags, etc. |
| // Basically "global dead code elimination" but not just for code. |
| // |
| // To do this optimally, we need to consider that an element may be in one of |
| // three states: |
| // |
| // * No references at all. We can simply remove it. |
| // * References, but no uses. We can't remove it, but we can change it (see |
| // below). |
| // * Uses (which imply references). We must keep it as it is. |
| // |
| // An example of something with a reference but *not* a use is a RefFunc to a |
| // function that has no corresponding CallRef to that type. We cannot just |
| // remove the function, since the RefFunc must refer to an actual entity in the |
| // IR, but we know it isn't actually used/called, so we can change it - we can |
| // empty out the body and put an unreachable there, for example. That is, a |
| // reference forces us to keep something in the IR to be referred to, but only |
| // a use actually makes us keep its contents as well. |
| // |
| |
| #include <memory> |
| |
| #include "ir/element-utils.h" |
| #include "ir/find_all.h" |
| #include "ir/intrinsics.h" |
| #include "ir/module-utils.h" |
| #include "ir/struct-utils.h" |
| #include "ir/subtypes.h" |
| #include "ir/utils.h" |
| #include "pass.h" |
| #include "support/stdckdint.h" |
| #include "wasm-builder.h" |
| #include "wasm.h" |
| |
| namespace wasm { |
| |
| // TODO: remove this alias |
| using ModuleElementKind = ModuleItemKind; |
| |
| // An element in the module that we track: a kind (function, global, etc.) + the |
| // name of the particular element. |
| using ModuleElement = std::pair<ModuleElementKind, Name>; |
| |
| // Visit or walk an expression to find what things are referenced. |
| struct ReferenceFinder |
| : public PostWalker<ReferenceFinder, |
| UnifiedExpressionVisitor<ReferenceFinder>> { |
| // Our findings are placed in these data structures, which the user of this |
| // code can then process. |
| std::vector<ModuleElement> elements; |
| std::vector<HeapType> callRefTypes; |
| std::vector<Name> refFuncs; |
| std::vector<StructField> structFields; |
| |
| // Add an item to the output data structures. |
| void note(ModuleElement element) { elements.push_back(element); } |
| void noteCallRef(HeapType type) { callRefTypes.push_back(type); } |
| void noteRefFunc(Name refFunc) { refFuncs.push_back(refFunc); } |
| void note(StructField structField) { structFields.push_back(structField); } |
| |
| // Generic visitor |
| |
| void visitExpression(Expression* curr) { |
| #define DELEGATE_ID curr->_id |
| |
| #define DELEGATE_START(id) [[maybe_unused]] auto* cast = curr->cast<id>(); |
| |
| #define DELEGATE_GET_FIELD(id, field) cast->field |
| |
| #define DELEGATE_FIELD_TYPE(id, field) |
| #define DELEGATE_FIELD_HEAPTYPE(id, field) |
| #define DELEGATE_FIELD_CHILD(id, field) |
| #define DELEGATE_FIELD_OPTIONAL_CHILD(id, field) |
| #define DELEGATE_FIELD_INT(id, field) |
| #define DELEGATE_FIELD_LITERAL(id, field) |
| #define DELEGATE_FIELD_NAME(id, field) |
| #define DELEGATE_FIELD_SCOPE_NAME_DEF(id, field) |
| #define DELEGATE_FIELD_SCOPE_NAME_USE(id, field) |
| #define DELEGATE_FIELD_ADDRESS(id, field) |
| |
| #define DELEGATE_FIELD_NAME_KIND(id, field, kind) \ |
| if (cast->field.is()) { \ |
| note({kind, cast->field}); \ |
| } |
| |
| #include "wasm-delegations-fields.def" |
| } |
| |
| // Specific visitors |
| |
| void visitCall(Call* curr) { |
| note({ModuleElementKind::Function, curr->target}); |
| |
| if (Intrinsics(*getModule()).isCallWithoutEffects(curr)) { |
| // A call-without-effects receives a function reference and calls it, the |
| // same as a CallRef. When we have a flag for non-closed-world, we should |
| // handle this automatically by the reference flowing out to an import, |
| // which is what binaryen intrinsics look like. For now, to support use |
| // cases of a closed world but that also use this intrinsic, handle the |
| // intrinsic specifically here. (Without that, the closed world assumption |
| // makes us ignore the function ref that flows to an import, so we are not |
| // aware that it is actually called.) |
| auto* target = curr->operands.back(); |
| if (auto* refFunc = target->dynCast<RefFunc>()) { |
| // We can see exactly where this goes. |
| Call call(getModule()->allocator); |
| call.target = refFunc->func; |
| visitCall(&call); |
| } else { |
| // All we can see is the type, so do a CallRef of that. |
| CallRef callRef(getModule()->allocator); |
| callRef.target = target; |
| visitCallRef(&callRef); |
| } |
| } |
| } |
| |
| void visitCallIndirect(CallIndirect* curr) { |
| note({ModuleElementKind::Table, curr->table}); |
| // Note a possible call of a function reference as well, as something might |
| // be written into the table during runtime. With precise tracking of what |
| // is written into the table we could do better here; we could also see |
| // which tables are immutable. TODO |
| noteCallRef(curr->heapType); |
| } |
| |
| void visitCallRef(CallRef* curr) { |
| // Ignore unreachable code. |
| if (!curr->target->type.isRef()) { |
| return; |
| } |
| |
| noteCallRef(curr->target->type.getHeapType()); |
| } |
| |
| void visitRefFunc(RefFunc* curr) { noteRefFunc(curr->func); } |
| |
| void visitStructGet(StructGet* curr) { |
| if (curr->ref->type == Type::unreachable || curr->ref->type.isNull()) { |
| return; |
| } |
| auto type = curr->ref->type.getHeapType(); |
| note(StructField{type, curr->index}); |
| } |
| }; |
| |
| // Analyze a module to find what things are referenced and what things are used. |
| struct Analyzer { |
| Module* module; |
| const PassOptions& options; |
| |
| // The set of all used things we've seen used so far. |
| std::unordered_set<ModuleElement> used; |
| |
| // Things for whom there is a reference, but may be unused. It is ok for a |
| // thing to appear both in |used| and here; we will check |used| first anyhow. |
| // (That is, we don't need to be careful to remove things from here if they |
| // begin as referenced and later become used; and we don't need to add things |
| // to here if they are both used and referenced.) |
| std::unordered_set<ModuleElement> referenced; |
| |
| // A queue of used module elements that we need to process. These appear in |
| // |used|, and the work we do when we pop them from the queue is to look at |
| // the things they reach that might become referenced or used. |
| std::vector<ModuleElement> moduleQueue; |
| |
| // A stack of used expressions to walk. We do *not* use the normal |
| // walking mechanism because we need more control. Specifically, we may defer |
| // certain walks, such as this: |
| // |
| // (struct.new $Foo |
| // (global.get $bar) |
| // ) |
| // |
| // If we walked the child immediately then we would make $bar used. But that |
| // global is only used if we actually read that field from the struct. We |
| // perform that analysis in readStructFields unreadStructFieldExprMap, below. |
| std::vector<Expression*> expressionQueue; |
| |
| // The signatures that we have seen a call_ref for. When we see a RefFunc of a |
| // signature in here, we know it is used; otherwise it may only be referred |
| // to. |
| std::unordered_set<HeapType> calledSignatures; |
| |
| // All the RefFuncs we've seen, grouped by heap type. When we see a CallRef of |
| // one of the types here, we know all the RefFuncs corresponding to it are |
| // potentially used (and also those of subtypes). This is the reverse side of |
| // calledSignatures: for a function to be used via a reference, we need the |
| // combination of a RefFunc of it as well as a CallRef of that, and we may see |
| // them in any order. (Or, if the RefFunc is in a table, we need a |
| // CallIndirect, which is handled in the table logic.) |
| // |
| // After we see a call for a type, we can clear out the entry here for it, as |
| // we'll have that type in calledSignatures, and so this contains only |
| // RefFuncs that we have not seen a call for yet, hence "uncalledRefFuncMap." |
| // |
| // We can only do this when assuming a closed world. TODO: In an open world we |
| // could carefully track which types actually escape out to exports or |
| // imports. |
| std::unordered_map<HeapType, std::unordered_set<Name>> uncalledRefFuncMap; |
| |
| // Similar to calledSignatures/uncalledRefFuncMap, we store the StructFields |
| // we've seen reads from, and also expressions stored in such fields that |
| // could be read if ever we see a read of that field in the future. That is, |
| // for an expression stored into a struct field to be read, we need to both |
| // see that expression written to the field, and see some other place read |
| // that field (similar to with functions that we need to see the RefFunc and |
| // also a CallRef that can actually call it). |
| std::unordered_set<StructField> readStructFields; |
| std::unordered_map<StructField, std::vector<Expression*>> |
| unreadStructFieldExprMap; |
| |
| Analyzer(Module* module, |
| const PassOptions& options, |
| const std::vector<ModuleElement>& roots) |
| : module(module), options(options) { |
| |
| // All roots are used. |
| for (auto& element : roots) { |
| use(element); |
| } |
| |
| // Main loop on both the module and the expression queues. |
| while (processExpressions() || processModule()) { |
| } |
| } |
| |
| // Process expressions in the expression queue while we have any, visiting |
| // them (using their contents) and adding children. Returns whether we did any |
| // work. |
| bool processExpressions() { |
| bool worked = false; |
| while (expressionQueue.size()) { |
| worked = true; |
| |
| auto* curr = expressionQueue.back(); |
| expressionQueue.pop_back(); |
| |
| // Find references in this expression, and apply them. Anything found here |
| // is used. |
| ReferenceFinder finder; |
| finder.setModule(module); |
| finder.visit(curr); |
| for (auto element : finder.elements) { |
| use(element); |
| } |
| for (auto type : finder.callRefTypes) { |
| useCallRefType(type); |
| } |
| for (auto func : finder.refFuncs) { |
| useRefFunc(func); |
| } |
| for (auto structField : finder.structFields) { |
| useStructField(structField); |
| } |
| |
| // Scan the children to continue our work. |
| scanChildren(curr); |
| } |
| return worked; |
| } |
| |
| // We'll compute SubTypes if we need them. |
| std::optional<SubTypes> subTypes; |
| |
| void useCallRefType(HeapType type) { |
| if (type.isBasic()) { |
| // Nothing to do for something like a bottom type; attempts to call such a |
| // type will trap at runtime. |
| return; |
| } |
| |
| if (!subTypes) { |
| subTypes = SubTypes(*module); |
| } |
| |
| // Call all the functions of that signature, and subtypes. We can then |
| // forget about them, as those signatures will be marked as called. |
| for (auto subType : subTypes->getSubTypes(type)) { |
| auto iter = uncalledRefFuncMap.find(subType); |
| if (iter != uncalledRefFuncMap.end()) { |
| // We must not have a type in both calledSignatures and |
| // uncalledRefFuncMap: once it is called, we do not track RefFuncs for |
| // it any more. |
| assert(calledSignatures.count(subType) == 0); |
| |
| for (Name target : iter->second) { |
| use({ModuleElementKind::Function, target}); |
| } |
| |
| uncalledRefFuncMap.erase(iter); |
| } |
| |
| calledSignatures.insert(subType); |
| } |
| } |
| |
| void useRefFunc(Name func) { |
| if (!options.closedWorld) { |
| // The world is open, so assume the worst and something (inside or outside |
| // of the module) can call this. |
| use({ModuleElementKind::Function, func}); |
| return; |
| } |
| |
| // Otherwise, we are in a closed world, and so we can try to optimize the |
| // case where the target function is referenced but not used. |
| auto element = ModuleElement{ModuleElementKind::Function, func}; |
| |
| auto type = module->getFunction(func)->type; |
| if (calledSignatures.count(type)) { |
| // We must not have a type in both calledSignatures and |
| // uncalledRefFuncMap: once it is called, we do not track RefFuncs for it |
| // any more. |
| assert(uncalledRefFuncMap.count(type) == 0); |
| |
| // We've seen a RefFunc for this, so it is used. |
| use(element); |
| } else { |
| // We've never seen a CallRef for this, but might see one later. |
| uncalledRefFuncMap[type].insert(func); |
| |
| referenced.insert(element); |
| } |
| } |
| |
| void useStructField(StructField structField) { |
| if (!readStructFields.count(structField)) { |
| // Avoid a structured binding as the C++ spec does not allow capturing |
| // them in lambdas, which we need below. |
| auto type = structField.first; |
| auto index = structField.second; |
| |
| // This is the first time we see a read of this data. Note that it is |
| // read, and also all subtypes since we might be reading from them as |
| // well. |
| if (!subTypes) { |
| subTypes = SubTypes(*module); |
| } |
| subTypes->iterSubTypes(type, [&](HeapType subType, Index depth) { |
| auto subStructField = StructField{subType, index}; |
| readStructFields.insert(subStructField); |
| |
| // Walk all the unread data we've queued: we queued it for the |
| // possibility of it ever being read, which just happened. |
| auto iter = unreadStructFieldExprMap.find(subStructField); |
| if (iter != unreadStructFieldExprMap.end()) { |
| for (auto* expr : iter->second) { |
| use(expr); |
| } |
| } |
| unreadStructFieldExprMap.erase(subStructField); |
| }); |
| } |
| } |
| |
| // As processExpressions, but for module elements. |
| bool processModule() { |
| bool worked = false; |
| while (moduleQueue.size()) { |
| worked = true; |
| |
| auto curr = moduleQueue.back(); |
| moduleQueue.pop_back(); |
| |
| assert(used.count(curr)); |
| auto& [kind, value] = curr; |
| switch (kind) { |
| case ModuleElementKind::Function: { |
| // if not an import, walk it |
| auto* func = module->getFunction(value); |
| if (!func->imported()) { |
| use(func->body); |
| } |
| break; |
| } |
| case ModuleElementKind::Global: { |
| // if not imported, it has an init expression we can walk |
| auto* global = module->getGlobal(value); |
| if (!global->imported()) { |
| use(global->init); |
| } |
| break; |
| } |
| case ModuleElementKind::Tag: |
| break; |
| case ModuleElementKind::Memory: |
| ModuleUtils::iterMemorySegments( |
| *module, value, [&](DataSegment* segment) { |
| if (!segment->data.empty()) { |
| use({ModuleElementKind::DataSegment, segment->name}); |
| } |
| }); |
| break; |
| case ModuleElementKind::Table: |
| ModuleUtils::iterTableSegments( |
| *module, value, [&](ElementSegment* segment) { |
| if (!segment->data.empty()) { |
| use({ModuleElementKind::ElementSegment, segment->name}); |
| } |
| }); |
| break; |
| case ModuleElementKind::DataSegment: { |
| auto* segment = module->getDataSegment(value); |
| if (segment->offset) { |
| use(segment->offset); |
| use({ModuleElementKind::Memory, segment->memory}); |
| } |
| break; |
| } |
| case ModuleElementKind::ElementSegment: { |
| auto* segment = module->getElementSegment(value); |
| if (segment->offset) { |
| use(segment->offset); |
| use({ModuleElementKind::Table, segment->table}); |
| } |
| for (auto* expr : segment->data) { |
| use(expr); |
| } |
| break; |
| } |
| default: { |
| WASM_UNREACHABLE("invalid kind"); |
| } |
| } |
| } |
| return worked; |
| } |
| |
| // Mark something as used, if it hasn't already been, and if so add it to the |
| // queue so we can process the things it can reach. |
| void use(ModuleElement element) { |
| auto [_, inserted] = used.emplace(element); |
| if (inserted) { |
| moduleQueue.emplace_back(element); |
| } |
| } |
| void use(ModuleElementKind kind, Name value) { |
| use(ModuleElement(kind, value)); |
| } |
| |
| void use(Expression* curr) { |
| // For expressions we do not need to check if they have already been seen: |
| // the tree structure guarantees that traversing children, recursively, will |
| // only visit each expression once, since each expression has a single |
| // parent. |
| expressionQueue.emplace_back(curr); |
| } |
| |
| // Add the children of a used expression to be walked, if we should do so. |
| void scanChildren(Expression* curr) { |
| // For now, the only special handling we have is fields of struct.new, which |
| // we defer walking of to when we know there is a read that can actually |
| // read them, see comments above on |expressionQueue|. We can only do that |
| // optimization in closed world (as otherwise the field might be read |
| // outside of the code we can see), and when it is reached (if it's |
| // unreachable then we don't know the type, and can defer that to DCE to |
| // remove). |
| if (!options.closedWorld || curr->type == Type::unreachable || |
| !curr->is<StructNew>()) { |
| for (auto* child : ChildIterator(curr)) { |
| use(child); |
| } |
| return; |
| } |
| |
| auto* new_ = curr->cast<StructNew>(); |
| auto type = new_->type.getHeapType(); |
| |
| for (Index i = 0; i < new_->operands.size(); i++) { |
| auto* operand = new_->operands[i]; |
| auto structField = StructField{type, i}; |
| |
| // If this struct field has already been read, then we should use the |
| // contents there now. |
| auto useOperandNow = readStructFields.count(structField); |
| |
| // Side effects are tricky to reason about - the side effects must happen |
| // even if we never read the struct field - so give up and consider it |
| // used. |
| if (!useOperandNow) { |
| useOperandNow = |
| EffectAnalyzer(options, *module, operand).hasSideEffects(); |
| } |
| |
| // We must handle the call.without.effects intrinsic here in a special |
| // manner. That intrinsic is reported as having no side effects in |
| // EffectAnalyzer, but even though for optimization purposes we can ignore |
| // effects, the called code *is* actually reached, and it might have side |
| // effects. In other words, the point of the intrinsic is to temporarily |
| // ignore those effects during one phase of optimization. Or, put another |
| // way, the intrinsic lets us ignore the effects of computing some value, |
| // but we do still need to compute that value if it is received and used |
| // (if it is not received and used, other passes will remove it). |
| if (!useOperandNow) { |
| // To detect this, look for any call. A non-intrinsic call would have |
| // already been detected when we looked for side effects, so this will |
| // only notice intrinsic calls. |
| useOperandNow = !FindAll<Call>(operand).list.empty(); |
| } |
| |
| if (useOperandNow) { |
| use(operand); |
| } else { |
| // This data does not need to be read now, but might be read later. Note |
| // it as unread. |
| unreadStructFieldExprMap[structField].push_back(operand); |
| |
| // We also must note that anything in this operand is referenced, even |
| // if it never ends up used, so the IR remains valid. |
| addReferences(operand); |
| } |
| } |
| } |
| |
| // Add references to all things appearing in an expression. This is called |
| // when we know an expression will appear in the output, which means it must |
| // remain valid IR and not refer to nonexistent things. |
| // |
| // This is only called on things without side effects (if there are such |
| // effects then we would have had to assume the worst earlier, and not get |
| // here). |
| void addReferences(Expression* curr) { |
| // Find references anywhere in this expression so we can apply them. |
| ReferenceFinder finder; |
| finder.setModule(module); |
| finder.walk(curr); |
| |
| for (auto element : finder.elements) { |
| referenced.insert(element); |
| |
| auto& [kind, value] = element; |
| if (kind == ModuleElementKind::Global) { |
| // Like functions, (non-imported) globals have contents. For functions, |
| // things are simple: if a function ends up with references but no uses |
| // then we can simply empty out the function (by setting its body to an |
| // unreachable). We don't have a simple way to do the same for globals, |
| // unfortunately. For now, scan the global's contents and add references |
| // as needed. |
| // TODO: We could try to empty the global out, for example, replace it |
| // with a null if it is nullable, or replace all gets of it with |
| // something else, but that is not trivial. |
| auto* global = module->getGlobal(value); |
| if (!global->imported()) { |
| // Note that infinite recursion is not a danger here since a global |
| // can only refer to previous globals. |
| addReferences(global->init); |
| } |
| } |
| } |
| |
| for (auto func : finder.refFuncs) { |
| // If a function ends up referenced but not used then later down we will |
| // empty it out by replacing its body with an unreachable, which always |
| // validates. For that reason all we need to do here is mark the function |
| // as referenced - we don't need to do anything with the body. |
| // |
| // Note that it is crucial that we do not call useRefFunc() here: we are |
| // just adding a reference to the function, and not actually using the |
| // RefFunc. (Only useRefFunc() + a CallRef of the proper type are enough |
| // to make a function itself used.) |
| referenced.insert({ModuleElementKind::Function, func}); |
| } |
| |
| // Note: nothing to do with |callRefTypes| and |structFields|, which only |
| // involve types. This function only cares about references to module |
| // elements like functions, globals, and tables. (References to types are |
| // handled in an entirely different way in Binaryen IR, and we don't need to |
| // worry about it.) |
| } |
| }; |
| |
| struct RemoveUnusedModuleElements : public Pass { |
| // This pass only removes module elements, it never modifies function |
| // contents (except to replace an entire body with unreachable, which does not |
| // cause any need for local fixups). |
| bool requiresNonNullableLocalFixups() override { return false; } |
| |
| bool rootAllFunctions; |
| |
| RemoveUnusedModuleElements(bool rootAllFunctions) |
| : rootAllFunctions(rootAllFunctions) {} |
| |
| void run(Module* module) override { |
| prepare(module); |
| |
| std::vector<ModuleElement> roots; |
| // Module start is a root. |
| if (module->start.is()) { |
| auto startFunction = module->getFunction(module->start); |
| // Can be skipped if the start function is empty. |
| if (!startFunction->imported() && startFunction->body->is<Nop>()) { |
| module->start = Name{}; |
| } else { |
| roots.emplace_back(ModuleElementKind::Function, module->start); |
| } |
| } |
| // If told to, root all the functions. |
| if (rootAllFunctions) { |
| ModuleUtils::iterDefinedFunctions(*module, [&](Function* func) { |
| roots.emplace_back(ModuleElementKind::Function, func->name); |
| }); |
| } |
| // Exports are roots. |
| for (auto& curr : module->exports) { |
| if (curr->kind == ExternalKind::Function) { |
| roots.emplace_back(ModuleElementKind::Function, curr->value); |
| } else if (curr->kind == ExternalKind::Global) { |
| roots.emplace_back(ModuleElementKind::Global, curr->value); |
| } else if (curr->kind == ExternalKind::Tag) { |
| roots.emplace_back(ModuleElementKind::Tag, curr->value); |
| } else if (curr->kind == ExternalKind::Table) { |
| roots.emplace_back(ModuleElementKind::Table, curr->value); |
| } else if (curr->kind == ExternalKind::Memory) { |
| roots.emplace_back(ModuleElementKind::Memory, curr->value); |
| } |
| } |
| |
| // Active segments that write to imported tables and memories are roots |
| // because those writes are externally observable even if the module does |
| // not otherwise use the tables or memories. |
| // |
| // Likewise, if traps are possible during startup then just trapping is an |
| // effect (which can happen if the offset is out of bounds). |
| auto maybeRootSegment = [&](ModuleElementKind kind, |
| Name segmentName, |
| Index segmentSize, |
| Expression* offset, |
| Importable* parent, |
| Index parentSize) { |
| auto writesToVisible = parent->imported() && segmentSize; |
| auto mayTrap = false; |
| if (!getPassOptions().trapsNeverHappen) { |
| // Check if this might trap. If it is obviously in bounds then it |
| // cannot. |
| auto* c = offset->dynCast<Const>(); |
| // Check for overflow in the largest possible space of addresses. |
| using AddressType = Address::address64_t; |
| AddressType maxWritten; |
| // If there is no integer, or if there is and the addition overflows, or |
| // if the addition leads to a too-large value, then we may trap. |
| mayTrap = !c || |
| std::ckd_add(&maxWritten, |
| (AddressType)segmentSize, |
| (AddressType)c->value.getInteger()) || |
| maxWritten > parentSize; |
| } |
| if (writesToVisible || mayTrap) { |
| roots.emplace_back(kind, segmentName); |
| } |
| }; |
| ModuleUtils::iterActiveDataSegments(*module, [&](DataSegment* segment) { |
| if (segment->memory.is()) { |
| auto* memory = module->getMemory(segment->memory); |
| maybeRootSegment(ModuleElementKind::DataSegment, |
| segment->name, |
| segment->data.size(), |
| segment->offset, |
| memory, |
| memory->initial * Memory::kPageSize); |
| } |
| }); |
| ModuleUtils::iterActiveElementSegments( |
| *module, [&](ElementSegment* segment) { |
| if (segment->table.is()) { |
| auto* table = module->getTable(segment->table); |
| maybeRootSegment(ModuleElementKind::ElementSegment, |
| segment->name, |
| segment->data.size(), |
| segment->offset, |
| table, |
| table->initial * Table::kPageSize); |
| } |
| }); |
| |
| // For now, all functions that can be called indirectly are marked as roots. |
| // TODO: Compute this based on which ElementSegments are actually used, |
| // and which functions have a call_indirect of the proper type. |
| ElementUtils::iterAllElementFunctionNames(module, [&](Name& name) { |
| roots.emplace_back(ModuleElementKind::Function, name); |
| }); |
| |
| // Analyze the module. |
| auto& options = getPassOptions(); |
| Analyzer analyzer(module, options, roots); |
| |
| // Remove unneeded elements. |
| auto needed = [&](ModuleElement element) { |
| // We need to emit something in the output if it has either a reference or |
| // a use. Situations where we can do better (for the case of a reference |
| // without any use) are handled separately below. |
| return analyzer.used.count(element) || analyzer.referenced.count(element); |
| }; |
| |
| module->removeFunctions([&](Function* curr) { |
| auto element = ModuleElement{ModuleElementKind::Function, curr->name}; |
| if (analyzer.used.count(element)) { |
| // This is used. |
| return false; |
| } |
| |
| if (analyzer.referenced.count(element)) { |
| // This is not used, but has a reference. See comment above on |
| // uncalledRefFuncs. |
| if (!curr->imported()) { |
| curr->body = Builder(*module).makeUnreachable(); |
| } |
| return false; |
| } |
| |
| // The function is not used or referenced; remove it entirely. |
| return true; |
| }); |
| module->removeGlobals([&](Global* curr) { |
| // See TODO in addReferences - we may be able to do better here. |
| return !needed({ModuleElementKind::Global, curr->name}); |
| }); |
| module->removeTags([&](Tag* curr) { |
| return !needed({ModuleElementKind::Tag, curr->name}); |
| }); |
| module->removeMemories([&](Memory* curr) { |
| return !needed(ModuleElement(ModuleElementKind::Memory, curr->name)); |
| }); |
| module->removeTables([&](Table* curr) { |
| return !needed(ModuleElement(ModuleElementKind::Table, curr->name)); |
| }); |
| module->removeDataSegments([&](DataSegment* curr) { |
| return !needed(ModuleElement(ModuleElementKind::DataSegment, curr->name)); |
| }); |
| module->removeElementSegments([&](ElementSegment* curr) { |
| return !needed({ModuleElementKind::ElementSegment, curr->name}); |
| }); |
| // TODO: After removing elements, we may be able to remove more things, and |
| // should continue to work. (For example, after removing a reference |
| // to a function from an element segment, we may be able to remove |
| // that function, etc.) |
| } |
| |
| // Do simple work that prepares the module to be efficiently optimized. |
| void prepare(Module* module) { |
| // FIXME Disable these optimizations for now, as they uncovered bugs in |
| // both LLVM and Binaryen, |
| // https://github.com/WebAssembly/binaryen/pull/6026#issuecomment-1775674882 |
| return; |
| |
| // If a function export is a function that just calls another function, we |
| // can export that one directly. Doing so might make the function in the |
| // middle unused: |
| // |
| // (export "export" (func $middle)) |
| // (func $middle |
| // (call $real) |
| // ) |
| // |
| // => |
| // |
| // (export "export" (func $real)) ;; this changed |
| // (func $middle |
| // (call $real) |
| // ) |
| // |
| // (Normally this is not needed, as inlining will end up removing such |
| // silly trampoline functions, but the case of an import being exported does |
| // not have any code for inlining to work with, so we need to handle it |
| // directly.) |
| for (auto& exp : module->exports) { |
| if (exp->kind != ExternalKind::Function) { |
| continue; |
| } |
| |
| auto* func = module->getFunction(exp->value); |
| if (!func->body) { |
| continue; |
| } |
| |
| auto* call = func->body->dynCast<Call>(); |
| if (!call) { |
| continue; |
| } |
| |
| // Don't do this if the type is different, as then we might be |
| // changing the external interface to the module. |
| auto* calledFunc = module->getFunction(call->target); |
| if (calledFunc->type != func->type) { |
| continue; |
| } |
| |
| // Finally, all the params must simply be forwarded. |
| auto ok = true; |
| for (Index i = 0; i < call->operands.size(); i++) { |
| auto* get = call->operands[i]->dynCast<LocalGet>(); |
| if (!get || get->index != i) { |
| ok = false; |
| break; |
| } |
| } |
| if (ok) { |
| exp->value = calledFunc->name; |
| } |
| } |
| } |
| }; |
| |
| Pass* createRemoveUnusedModuleElementsPass() { |
| return new RemoveUnusedModuleElements(false); |
| } |
| |
| Pass* createRemoveUnusedNonFunctionModuleElementsPass() { |
| return new RemoveUnusedModuleElements(true); |
| } |
| |
| } // namespace wasm |