blob: f299d7a3554e73e611f962ee4b042825e28e2130 [file] [log] [blame] [edit]
/*
* Copyright 2020 WebAssembly Community Group participants
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
// The process of module splitting involves these steps:
//
// 1. Create the new secondary module.
//
// 2. Export globals, tags, tables, and memories from the primary module and
// import them in the secondary module.
//
// 3. Move the deferred functions from the primary to the secondary module.
//
// 4. For any secondary function exported from the primary module, export in
// its place a trampoline function that makes an indirect call to its
// placeholder function (and eventually to the original secondary
// function), allocating a new table slot for the placeholder if necessary.
//
// 5. Rewrite direct calls from primary functions to secondary functions to be
// indirect calls to their placeholder functions (and eventually to their
// original secondary functions), allocating new table slots for the
// placeholders if necessary.
//
// 6. For each primary function directly called from a secondary function,
// export the primary function if it is not already exported and import it
// into the secondary module.
//
// 7. Replace all references to secondary functions in the primary module's
// table segments with references to imported placeholder functions.
//
// 8. Create new active table segments in the secondary module that will
// replace all the placeholder function references in the table with
// references to their corresponding secondary functions upon
// instantiation.
//
// Functions can be used or referenced three ways in a WebAssembly module: they
// can be exported, called, or placed in a table. The above procedure introduces
// a layer of indirection to each of those mechanisms that removes all
// references to secondary functions from the primary module but restores the
// original program's semantics once the secondary module is instantiated. As
// more mechanisms that reference functions are added in the future, such as
// ref.func instructions, they will have to be modified to use a similar layer
// of indirection.
//
// The code as currently written makes a couple assumptions about the module
// that is being split:
//
// 1. It assumes that mutable-globals is allowed. This could be worked around
// by introducing wrapper functions for globals and rewriting secondary
// code that accesses them, but now that mutable-globals is shipped on all
// browsers, hopefully that extra complexity won't be necessary.
//
// 2. It assumes that either all table segment offsets are constants or there
// is exactly one segment that may have a non-constant offset. It also
// assumes that all segments are active segments (although Binaryen does
// not yet support passive table segments anyway).
#include "ir/module-splitting.h"
#include "asmjs/shared-constants.h"
#include "ir/element-utils.h"
#include "ir/export-utils.h"
#include "ir/manipulation.h"
#include "ir/module-utils.h"
#include "ir/names.h"
#include "pass.h"
#include "support/insert_ordered.h"
#include "wasm-builder.h"
#include "wasm.h"
namespace wasm::ModuleSplitting {
namespace {
static const Name LOAD_SECONDARY_STATUS = "load_secondary_module_status";
template<class F> void forEachElement(Module& module, F f) {
ModuleUtils::iterActiveElementSegments(module, [&](ElementSegment* segment) {
Name base = "";
Index offset = 0;
if (auto* c = segment->offset->dynCast<Const>()) {
offset = c->value.geti32();
} else if (auto* g = segment->offset->dynCast<GlobalGet>()) {
base = g->name;
}
for (Index i = 0; i < segment->data.size(); ++i) {
f(segment->table, base, offset + i, segment->data[i]);
}
});
}
struct TableSlotManager {
struct Slot {
Name tableName;
// If `global` is empty, then this slot is at a statically known index.
Name global;
Index index = 0;
// Generate code to compute the index of this table slot
Expression* makeExpr(Module& module);
};
Module& module;
Table* activeTable = nullptr;
ElementSegment* activeSegment = nullptr;
Slot activeBase;
std::map<Name, Slot> funcIndices;
std::vector<ElementSegment*> activeTableSegments;
TableSlotManager(Module& module);
Table* makeTable();
ElementSegment* makeElementSegment();
// Returns the table index for `func`, allocating a new index if necessary.
Slot getSlot(Name func, HeapType type);
void addSlot(Name func, Slot slot);
};
Expression* TableSlotManager::Slot::makeExpr(Module& module) {
Builder builder(module);
auto makeIndex = [&]() { return builder.makeConst(int32_t(index)); };
if (global.size()) {
Expression* getBase = builder.makeGlobalGet(global, Type::i32);
return index == 0 ? getBase
: builder.makeBinary(AddInt32, getBase, makeIndex());
} else {
return makeIndex();
}
}
void TableSlotManager::addSlot(Name func, Slot slot) {
// Ignore functions that already have slots.
funcIndices.insert({func, slot});
}
TableSlotManager::TableSlotManager(Module& module) : module(module) {
if (module.features.hasReferenceTypes()) {
// Just create a new table to manage all primary-to-secondary calls lazily.
// Do not re-use slots for functions that will already be in existing
// tables, since that is not correct in the face of table mutations.
// TODO: Reduce overhead by creating a separate table for each function type
// if WasmGC is enabled.
return;
}
// TODO: Reject or handle passive element segments
auto funcref = Type(HeapType::func, Nullable);
auto it = std::find_if(
module.tables.begin(),
module.tables.end(),
[&](std::unique_ptr<Table>& table) { return table->type == funcref; });
if (it == module.tables.end()) {
// There is no indirect function table, so we will create one lazily.
return;
}
activeTable = it->get();
ModuleUtils::iterTableSegments(
module, activeTable->name, [&](ElementSegment* segment) {
activeTableSegments.push_back(segment);
});
if (activeTableSegments.empty()) {
// There are no active segments, so we will lazily create one and start
// filling it at index 0.
activeBase = {activeTable->name, "", 0};
} else if (activeTableSegments.size() == 1 &&
activeTableSegments[0]->type == funcref &&
!activeTableSegments[0]->offset->is<Const>()) {
// If there is exactly one table segment and that segment has a non-constant
// offset, append new items to the end of that segment. In all other cases,
// append new items at constant offsets after all existing items at constant
// offsets.
assert(activeTableSegments[0]->offset->is<GlobalGet>() &&
"Unexpected initializer instruction");
activeSegment = activeTableSegments[0];
activeBase = {activeTable->name,
activeTableSegments[0]->offset->cast<GlobalGet>()->name,
0};
} else {
// Finds the segment with the highest occupied table slot so that new items
// can be inserted contiguously at the end of it without accidentally
// overwriting any other items. TODO: be more clever about filling gaps in
// the table, if that is ever useful.
Index maxIndex = 0;
for (auto& segment : activeTableSegments) {
assert(segment->offset->is<Const>() &&
"Unexpected non-const segment offset with multiple segments");
Index segmentBase = segment->offset->cast<Const>()->value.geti32();
if (segmentBase + segment->data.size() >= maxIndex) {
maxIndex = segmentBase + segment->data.size();
activeSegment = segment;
activeBase = {activeTable->name, "", segmentBase};
}
}
}
// Initialize funcIndices with the functions already in the table.
forEachElement(module,
[&](Name table, Name base, Index offset, Expression* elem) {
if (auto* func = elem->dynCast<RefFunc>()) {
addSlot(func->func, {table, base, offset});
}
});
}
Table* TableSlotManager::makeTable() {
return module.addTable(
Builder::makeTable(Names::getValidTableName(module, Name::fromInt(0))));
}
ElementSegment* TableSlotManager::makeElementSegment() {
return module.addElementSegment(Builder::makeElementSegment(
Names::getValidElementSegmentName(module, Name::fromInt(0)),
activeTable->name,
Builder(module).makeConst(int32_t(0))));
}
TableSlotManager::Slot TableSlotManager::getSlot(Name func, HeapType type) {
auto slotIt = funcIndices.find(func);
if (slotIt != funcIndices.end()) {
return slotIt->second;
}
// If there are no segments yet, allocate one.
if (activeSegment == nullptr) {
if (activeTable == nullptr) {
activeTable = makeTable();
activeBase = {activeTable->name, "", 0};
}
// None of the existing segments should refer to the active table
assert(std::all_of(module.elementSegments.begin(),
module.elementSegments.end(),
[&](std::unique_ptr<ElementSegment>& segment) {
return segment->table != activeTable->name;
}));
activeSegment = makeElementSegment();
}
Slot newSlot = {activeBase.tableName,
activeBase.global,
activeBase.index + Index(activeSegment->data.size())};
Builder builder(module);
activeSegment->data.push_back(builder.makeRefFunc(func, type));
addSlot(func, newSlot);
if (activeTable->initial <= newSlot.index) {
activeTable->initial = newSlot.index + 1;
// TODO: handle the active table not being the dylink table (#3823)
if (module.dylinkSection) {
module.dylinkSection->tableSize = activeTable->initial;
}
}
if (activeTable->max <= newSlot.index) {
activeTable->max = newSlot.index + 1;
}
return newSlot;
}
struct ModuleSplitter {
const Config& config;
std::unique_ptr<Module> secondaryPtr;
Module& primary;
Module& secondary;
const std::pair<std::set<Name>, std::set<Name>> classifiedFuncs;
const std::set<Name>& primaryFuncs;
const std::set<Name>& secondaryFuncs;
TableSlotManager tableManager;
Names::MinifiedNameGenerator minified;
// Map from internal function names to (one of) their corresponding export
// names.
std::map<Name, Name> exportedPrimaryFuncs;
// Map placeholder indices to the names of the functions they replace.
std::map<size_t, Name> placeholderMap;
// Internal name of the LOAD_SECONDARY_MODULE function.
Name internalLoadSecondaryModule;
// Initialization helpers
static std::unique_ptr<Module> initSecondary(const Module& primary);
static std::pair<std::set<Name>, std::set<Name>>
classifyFunctions(Module& primary, const Config& config);
static std::map<Name, Name> initExportedPrimaryFuncs(const Module& primary);
// Other helpers
void exportImportFunction(Name func);
Expression* maybeLoadSecondary(Builder& builder, Expression* callIndirect);
// Main splitting steps
void setupJSPI();
void moveSecondaryFunctions();
void thunkExportedSecondaryFunctions();
void indirectCallsToSecondaryFunctions();
void indirectReferencesToSecondaryFunctions();
void exportImportCalledPrimaryFunctions();
void setupTablePatching();
void shareImportableItems();
void removeUnusedSecondaryElements();
ModuleSplitter(Module& primary, const Config& config)
: config(config), secondaryPtr(initSecondary(primary)), primary(primary),
secondary(*secondaryPtr),
classifiedFuncs(classifyFunctions(primary, config)),
primaryFuncs(classifiedFuncs.first),
secondaryFuncs(classifiedFuncs.second), tableManager(primary),
exportedPrimaryFuncs(initExportedPrimaryFuncs(primary)) {
if (config.jspi) {
setupJSPI();
}
moveSecondaryFunctions();
thunkExportedSecondaryFunctions();
indirectReferencesToSecondaryFunctions();
indirectCallsToSecondaryFunctions();
exportImportCalledPrimaryFunctions();
setupTablePatching();
shareImportableItems();
removeUnusedSecondaryElements();
}
};
void ModuleSplitter::setupJSPI() {
// Support the first version of JSPI, where the JSPI pass added the load
// secondary module export.
// TODO: remove this when the new JSPI API is only supported.
if (primary.getExportOrNull(LOAD_SECONDARY_MODULE)) {
internalLoadSecondaryModule =
primary.getExport(LOAD_SECONDARY_MODULE)->value;
// Remove the exported LOAD_SECONDARY_MODULE function since it's only needed
// internally.
primary.removeExport(LOAD_SECONDARY_MODULE);
} else {
// Add an imported function to load the secondary module.
auto import = Builder::makeFunction(ModuleSplitting::LOAD_SECONDARY_MODULE,
Signature(Type::none, Type::none),
{});
import->module = ENV;
import->base = ModuleSplitting::LOAD_SECONDARY_MODULE;
primary.addFunction(std::move(import));
internalLoadSecondaryModule = ModuleSplitting::LOAD_SECONDARY_MODULE;
}
Builder builder(primary);
// Add a global to track whether the secondary module has been loaded yet.
primary.addGlobal(builder.makeGlobal(LOAD_SECONDARY_STATUS,
Type::i32,
builder.makeConst(int32_t(0)),
Builder::Mutable));
primary.addExport(builder.makeExport(
LOAD_SECONDARY_STATUS, LOAD_SECONDARY_STATUS, ExternalKind::Global));
}
std::unique_ptr<Module> ModuleSplitter::initSecondary(const Module& primary) {
// Create the secondary module and copy trivial properties.
auto secondary = std::make_unique<Module>();
secondary->features = primary.features;
secondary->hasFeaturesSection = primary.hasFeaturesSection;
return secondary;
}
std::pair<std::set<Name>, std::set<Name>>
ModuleSplitter::classifyFunctions(Module& primary, const Config& config) {
// Find functions that refer to data or element segments. These functions must
// remain in the primary module because segments cannot be exported to be
// accessed from the secondary module.
//
// TODO: Investigate other options, such as moving the segments to the
// secondary module or replacing the segment-using instructions in the
// secondary module with calls to imports.
ModuleUtils::ParallelFunctionAnalysis<std::vector<Name>>
segmentReferrerCollector(
primary, [&](Function* func, std::vector<Name>& segmentReferrers) {
if (func->imported()) {
return;
}
struct SegmentReferrerCollector
: PostWalker<SegmentReferrerCollector,
UnifiedExpressionVisitor<SegmentReferrerCollector>> {
bool hasSegmentReference = false;
void visitExpression(Expression* curr) {
#define DELEGATE_ID curr->_id
#define DELEGATE_START(id) [[maybe_unused]] auto* cast = curr->cast<id>();
#define DELEGATE_GET_FIELD(id, field) cast->field
#define DELEGATE_FIELD_TYPE(id, field)
#define DELEGATE_FIELD_HEAPTYPE(id, field)
#define DELEGATE_FIELD_CHILD(id, field)
#define DELEGATE_FIELD_OPTIONAL_CHILD(id, field)
#define DELEGATE_FIELD_INT(id, field)
#define DELEGATE_FIELD_LITERAL(id, field)
#define DELEGATE_FIELD_NAME(id, field)
#define DELEGATE_FIELD_SCOPE_NAME_DEF(id, field)
#define DELEGATE_FIELD_SCOPE_NAME_USE(id, field)
#define DELEGATE_FIELD_ADDRESS(id, field)
#define DELEGATE_FIELD_NAME_KIND(id, field, kind) \
if (kind == ModuleItemKind::DataSegment || \
kind == ModuleItemKind::ElementSegment) { \
hasSegmentReference = true; \
}
#include "wasm-delegations-fields.def"
}
};
SegmentReferrerCollector collector;
collector.walkFunction(func);
if (collector.hasSegmentReference) {
segmentReferrers.push_back(func->name);
}
});
std::unordered_set<Name> segmentReferrers;
for (auto& [_, referrers] : segmentReferrerCollector.map) {
segmentReferrers.insert(referrers.begin(), referrers.end());
}
std::set<Name> primaryFuncs, secondaryFuncs;
for (auto& func : primary.functions) {
// In JSPI mode exported functions cannot be moved to the secondary
// module since that would make them async when they may not have the JSPI
// wrapper. Exported JSPI functions can still benefit from splitting though
// since only the JSPI wrapper stub will remain in the primary module.
if (func->imported() || !config.secondaryFuncs.count(func->name) ||
(config.jspi && ExportUtils::isExported(primary, *func)) ||
segmentReferrers.count(func->name)) {
primaryFuncs.insert(func->name);
} else {
assert(func->name != primary.start && "The start function must be kept");
secondaryFuncs.insert(func->name);
}
}
return std::make_pair(std::move(primaryFuncs), std::move(secondaryFuncs));
}
std::map<Name, Name>
ModuleSplitter::initExportedPrimaryFuncs(const Module& primary) {
std::map<Name, Name> functionExportNames;
for (auto& ex : primary.exports) {
if (ex->kind == ExternalKind::Function) {
functionExportNames[ex->value] = ex->name;
}
}
return functionExportNames;
}
void ModuleSplitter::exportImportFunction(Name funcName) {
Name exportName;
// If the function is already exported, use the existing export name.
// Otherwise, create a new export for it.
auto exportIt = exportedPrimaryFuncs.find(funcName);
if (exportIt != exportedPrimaryFuncs.end()) {
exportName = exportIt->second;
} else {
if (config.minimizeNewExportNames) {
do {
exportName = config.newExportPrefix + minified.getName();
} while (primary.getExportOrNull(exportName) != nullptr);
} else {
exportName = Names::getValidExportName(
primary, config.newExportPrefix + funcName.toString());
}
primary.addExport(
Builder::makeExport(exportName, funcName, ExternalKind::Function));
exportedPrimaryFuncs[funcName] = exportName;
}
// Import the function if it is not already imported into the secondary
// module.
if (secondary.getFunctionOrNull(funcName) == nullptr) {
auto primaryFunc = primary.getFunction(funcName);
auto func = Builder::makeFunction(funcName, primaryFunc->type, {});
func->hasExplicitName = primaryFunc->hasExplicitName;
func->module = config.importNamespace;
func->base = exportName;
secondary.addFunction(std::move(func));
}
}
void ModuleSplitter::moveSecondaryFunctions() {
// Move the specified functions from the primary to the secondary module.
for (auto funcName : secondaryFuncs) {
auto* func = primary.getFunction(funcName);
ModuleUtils::copyFunction(func, secondary);
primary.removeFunction(funcName);
}
}
void ModuleSplitter::thunkExportedSecondaryFunctions() {
// Update exports of secondary functions in the primary module to export
// wrapper functions that indirectly call the secondary functions. We are
// adding secondary function names to the primary table here, but they will be
// replaced with placeholder functions later along with any references to
// secondary functions that were already in the table.
Builder builder(primary);
for (auto& ex : primary.exports) {
if (ex->kind != ExternalKind::Function ||
!secondaryFuncs.count(ex->value)) {
continue;
}
Name secondaryFunc = ex->value;
if (primary.getFunctionOrNull(secondaryFunc)) {
// We've already created a thunk for this function
continue;
}
auto* func = primary.addFunction(Builder::makeFunction(
secondaryFunc, secondary.getFunction(secondaryFunc)->type, {}));
std::vector<Expression*> args;
Type params = func->getParams();
for (size_t i = 0, size = params.size(); i < size; ++i) {
args.push_back(builder.makeLocalGet(i, params[i]));
}
auto tableSlot = tableManager.getSlot(secondaryFunc, func->type);
func->body = builder.makeCallIndirect(
tableSlot.tableName, tableSlot.makeExpr(primary), args, func->type);
}
}
Expression* ModuleSplitter::maybeLoadSecondary(Builder& builder,
Expression* callIndirect) {
if (!config.jspi) {
return callIndirect;
}
// Check if the secondary module is loaded and if it isn't, call the
// function to load it.
auto* loadSecondary = builder.makeIf(
builder.makeUnary(EqZInt32,
builder.makeGlobalGet(LOAD_SECONDARY_STATUS, Type::i32)),
builder.makeCall(internalLoadSecondaryModule, {}, Type::none));
return builder.makeSequence(loadSecondary, callIndirect);
}
void ModuleSplitter::indirectReferencesToSecondaryFunctions() {
// Turn references to secondary functions into references to thunks that
// perform a direct call to the original referent. The direct calls in the
// thunks will be handled like all other cross-module calls later, in
// |indirectCallsToSecondaryFunctions|.
struct Gatherer : public PostWalker<Gatherer> {
ModuleSplitter& parent;
Gatherer(ModuleSplitter& parent) : parent(parent) {}
// Collect RefFuncs in a map from the function name to all RefFuncs that
// refer to it. We only collect this for secondary funcs.
InsertOrderedMap<Name, std::vector<RefFunc*>> map;
void visitRefFunc(RefFunc* curr) {
if (parent.secondaryFuncs.count(curr->func)) {
map[curr->func].push_back(curr);
}
}
} gatherer(*this);
gatherer.walkModule(&primary);
// Ignore references to secondary functions that occur in the active segment
// that will contain the imported placeholders. Indirect calls to table slots
// initialized by that segment will already go to the right place once the
// secondary module has been loaded and the table has been patched.
std::unordered_set<RefFunc*> ignore;
if (tableManager.activeSegment) {
for (auto* expr : tableManager.activeSegment->data) {
if (auto* ref = expr->dynCast<RefFunc>()) {
ignore.insert(ref);
}
}
}
// Fix up what we found: Generate trampolines as described earlier, and apply
// them.
Builder builder(primary);
// Generate the new trampoline function and add it to the module.
for (auto& [name, refFuncs] : gatherer.map) {
// Find the relevant (non-ignored) RefFuncs. If there are none, we can skip
// creating a thunk entirely.
std::vector<RefFunc*> relevantRefFuncs;
for (auto* refFunc : refFuncs) {
assert(refFunc->func == name);
if (!ignore.count(refFunc)) {
relevantRefFuncs.push_back(refFunc);
}
}
if (relevantRefFuncs.empty()) {
continue;
}
auto* oldFunc = secondary.getFunction(name);
auto newName = Names::getValidFunctionName(
primary, std::string("trampoline_") + name.toString());
// Generate the call and the function.
std::vector<Expression*> args;
for (Index i = 0; i < oldFunc->getNumParams(); i++) {
args.push_back(builder.makeLocalGet(i, oldFunc->getLocalType(i)));
}
auto* call = builder.makeCall(name, args, oldFunc->getResults());
primary.addFunction(builder.makeFunction(newName, oldFunc->type, {}, call));
// Update RefFuncs to refer to it.
for (auto* refFunc : relevantRefFuncs) {
refFunc->func = newName;
}
}
}
void ModuleSplitter::indirectCallsToSecondaryFunctions() {
// Update direct calls of secondary functions to be indirect calls of their
// corresponding table indices instead.
struct CallIndirector : public PostWalker<CallIndirector> {
ModuleSplitter& parent;
Builder builder;
CallIndirector(ModuleSplitter& parent)
: parent(parent), builder(parent.primary) {}
// Avoid visitRefFunc on element segment data
void walkElementSegment(ElementSegment* segment) {}
void visitCall(Call* curr) {
if (!parent.secondaryFuncs.count(curr->target)) {
return;
}
auto* func = parent.secondary.getFunction(curr->target);
auto tableSlot = parent.tableManager.getSlot(curr->target, func->type);
replaceCurrent(parent.maybeLoadSecondary(
builder,
builder.makeCallIndirect(tableSlot.tableName,
tableSlot.makeExpr(parent.primary),
curr->operands,
func->type,
curr->isReturn)));
}
};
CallIndirector(*this).walkModule(&primary);
}
void ModuleSplitter::exportImportCalledPrimaryFunctions() {
// Find primary functions called/referred in the secondary module.
ModuleUtils::ParallelFunctionAnalysis<std::vector<Name>> callCollector(
secondary, [&](Function* func, std::vector<Name>& calledPrimaryFuncs) {
struct CallCollector : PostWalker<CallCollector> {
const std::set<Name>& primaryFuncs;
std::vector<Name>& calledPrimaryFuncs;
CallCollector(const std::set<Name>& primaryFuncs,
std::vector<Name>& calledPrimaryFuncs)
: primaryFuncs(primaryFuncs), calledPrimaryFuncs(calledPrimaryFuncs) {
}
void visitCall(Call* curr) {
if (primaryFuncs.count(curr->target)) {
calledPrimaryFuncs.push_back(curr->target);
}
}
void visitRefFunc(RefFunc* curr) {
if (primaryFuncs.count(curr->func)) {
calledPrimaryFuncs.push_back(curr->func);
}
}
};
CallCollector(primaryFuncs, calledPrimaryFuncs).walkFunction(func);
});
std::set<Name> calledPrimaryFuncs;
for (auto& entry : callCollector.map) {
auto& calledFuncs = entry.second;
calledPrimaryFuncs.insert(calledFuncs.begin(), calledFuncs.end());
}
// Ensure each called primary function is exported and imported
for (auto func : calledPrimaryFuncs) {
exportImportFunction(func);
}
}
void ModuleSplitter::setupTablePatching() {
if (!tableManager.activeTable) {
return;
}
std::map<Index, Function*> replacedElems;
// Replace table references to secondary functions with an imported
// placeholder that encodes the table index in its name:
// `importNamespace`.`index`.
forEachElement(primary, [&](Name, Name, Index index, Expression*& elem) {
auto* ref = elem->dynCast<RefFunc>();
if (!ref) {
return;
}
if (!secondaryFuncs.count(ref->func)) {
return;
}
placeholderMap[index] = ref->func;
auto* secondaryFunc = secondary.getFunction(ref->func);
replacedElems[index] = secondaryFunc;
if (!config.usePlaceholders) {
// TODO: This can create active element segments with lots of nulls. We
// should optimize them like we do data segments with zeros.
elem = Builder(primary).makeRefNull(HeapType::nofunc);
return;
}
auto placeholder = std::make_unique<Function>();
placeholder->module = config.placeholderNamespace;
placeholder->base = std::to_string(index);
placeholder->name = Names::getValidFunctionName(
primary, std::string("placeholder_") + placeholder->base.toString());
placeholder->hasExplicitName = true;
placeholder->type = secondaryFunc->type;
elem = Builder(primary).makeRefFunc(placeholder->name, placeholder->type);
primary.addFunction(std::move(placeholder));
});
if (replacedElems.size() == 0) {
// No placeholders to patch out of the table
return;
}
auto secondaryTable =
ModuleUtils::copyTable(tableManager.activeTable, secondary);
if (tableManager.activeBase.global.size()) {
assert(tableManager.activeTableSegments.size() == 1 &&
"Unexpected number of segments with non-const base");
assert(secondary.tables.size() == 1 && secondary.elementSegments.empty());
// Since addition is not currently allowed in initializer expressions, we
// need to start the new secondary segment where the primary segment starts.
// The secondary segment will contain the same primary functions as the
// primary module except in positions where it needs to overwrite a
// placeholder function. All primary functions in the table therefore need
// to be imported into the second module. TODO: use better strategies here,
// such as using ref.func in the start function or standardizing addition in
// initializer expressions.
ElementSegment* primarySeg = tableManager.activeTableSegments.front();
std::vector<Expression*> secondaryElems;
secondaryElems.reserve(primarySeg->data.size());
// Copy functions from the primary segment to the secondary segment,
// replacing placeholders and creating new exports and imports as necessary.
auto replacement = replacedElems.begin();
for (Index i = 0;
i < primarySeg->data.size() && replacement != replacedElems.end();
++i) {
if (replacement->first == i) {
// primarySeg->data[i] is a placeholder, so use the secondary function.
auto* func = replacement->second;
auto* ref = Builder(secondary).makeRefFunc(func->name, func->type);
secondaryElems.push_back(ref);
++replacement;
} else if (auto* get = primarySeg->data[i]->dynCast<RefFunc>()) {
exportImportFunction(get->func);
auto* copied =
ExpressionManipulator::copy(primarySeg->data[i], secondary);
secondaryElems.push_back(copied);
}
}
auto offset = ExpressionManipulator::copy(primarySeg->offset, secondary);
auto secondarySeg = std::make_unique<ElementSegment>(
secondaryTable->name, offset, secondaryTable->type, secondaryElems);
secondarySeg->setName(primarySeg->name, primarySeg->hasExplicitName);
secondary.addElementSegment(std::move(secondarySeg));
return;
}
// Create active table segments in the secondary module to patch in the
// original functions when it is instantiated.
Index currBase = replacedElems.begin()->first;
std::vector<Expression*> currData;
auto finishSegment = [&]() {
auto* offset = Builder(secondary).makeConst(int32_t(currBase));
auto secondarySeg = std::make_unique<ElementSegment>(
secondaryTable->name, offset, secondaryTable->type, currData);
Name name = Names::getValidElementSegmentName(
secondary, Name::fromInt(secondary.elementSegments.size()));
secondarySeg->setName(name, false);
secondary.addElementSegment(std::move(secondarySeg));
};
for (auto curr = replacedElems.begin(); curr != replacedElems.end(); ++curr) {
if (curr->first != currBase + currData.size()) {
finishSegment();
currBase = curr->first;
currData.clear();
}
auto* func = curr->second;
currData.push_back(Builder(secondary).makeRefFunc(func->name, func->type));
}
if (currData.size()) {
finishSegment();
}
}
void ModuleSplitter::shareImportableItems() {
// Map internal names to (one of) their corresponding export names. Don't
// consider functions because they have already been imported and exported as
// necessary.
std::unordered_map<std::pair<ExternalKind, Name>, Name> exports;
for (auto& ex : primary.exports) {
if (ex->kind != ExternalKind::Function) {
exports[std::make_pair(ex->kind, ex->value)] = ex->name;
}
}
auto makeImportExport = [&](Importable& primaryItem,
Importable& secondaryItem,
const std::string& genericExportName,
ExternalKind kind) {
secondaryItem.name = primaryItem.name;
secondaryItem.hasExplicitName = primaryItem.hasExplicitName;
secondaryItem.module = config.importNamespace;
auto exportIt = exports.find(std::make_pair(kind, primaryItem.name));
if (exportIt != exports.end()) {
secondaryItem.base = exportIt->second;
} else {
std::string baseName =
config.newExportPrefix + (config.minimizeNewExportNames
? minified.getName()
: genericExportName);
Name exportName = Names::getValidExportName(primary, baseName);
primary.addExport(new Export{exportName, primaryItem.name, kind});
secondaryItem.base = exportName;
}
};
// TODO: Be more selective by only sharing global items that are actually used
// in the secondary module, just like we do for functions.
for (auto& memory : primary.memories) {
auto secondaryMemory = ModuleUtils::copyMemory(memory.get(), secondary);
makeImportExport(*memory, *secondaryMemory, "memory", ExternalKind::Memory);
}
for (auto& table : primary.tables) {
auto secondaryTable = secondary.getTableOrNull(table->name);
if (!secondaryTable) {
secondaryTable = ModuleUtils::copyTable(table.get(), secondary);
}
makeImportExport(*table, *secondaryTable, "table", ExternalKind::Table);
}
for (auto& global : primary.globals) {
if (global->mutable_) {
assert(primary.features.hasMutableGlobals() &&
"TODO: add wrapper functions for disallowed mutable globals");
}
auto secondaryGlobal = std::make_unique<Global>();
secondaryGlobal->type = global->type;
secondaryGlobal->mutable_ = global->mutable_;
secondaryGlobal->init =
global->init == nullptr
? nullptr
: ExpressionManipulator::copy(global->init, secondary);
makeImportExport(*global, *secondaryGlobal, "global", ExternalKind::Global);
secondary.addGlobal(std::move(secondaryGlobal));
}
for (auto& tag : primary.tags) {
auto secondaryTag = std::make_unique<Tag>();
secondaryTag->sig = tag->sig;
makeImportExport(*tag, *secondaryTag, "tag", ExternalKind::Tag);
secondary.addTag(std::move(secondaryTag));
}
}
void ModuleSplitter::removeUnusedSecondaryElements() {
// TODO: It would be better to be more selective about only exporting and
// importing those items that the secondary module needs. This would reduce
// code size in the primary module as well.
PassRunner runner(&secondary);
runner.add("remove-unused-module-elements");
runner.run();
}
} // anonymous namespace
Results splitFunctions(Module& primary, const Config& config) {
ModuleSplitter split(primary, config);
return {std::move(split.secondaryPtr), std::move(split.placeholderMap)};
}
} // namespace wasm::ModuleSplitting