Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
212 changes: 166 additions & 46 deletions src/ir/module-splitting.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -47,9 +47,6 @@
// 8. Export globals, tags, tables, and memories from the primary module and
// import them in the secondary modules.
//
// 9. Run RemoveUnusedModuleElements pass on the secondary modules in order to
// remove unused imports.
//
// Functions can be used or referenced three ways in a WebAssembly module: they
// can be exported, called, or referenced with ref.func. The above procedure
// introduces a layer of indirection to each of those mechanisms that removes
Expand Down Expand Up @@ -77,10 +74,9 @@
#include "ir/module-splitting.h"
#include "asmjs/shared-constants.h"
#include "ir/export-utils.h"
#include "ir/find_all.h"
#include "ir/module-utils.h"
#include "ir/names.h"
#include "ir/utils.h"
#include "pass.h"
#include "support/insert_ordered.h"
#include "wasm-builder.h"
#include "wasm.h"
Expand Down Expand Up @@ -963,13 +959,11 @@ void ModuleSplitter::shareImportableItems() {
}
};

for (auto& secondaryPtr : secondaries) {
Module& secondary = *secondaryPtr;

// Collect names used in the secondary module
// Given a module, collect names used in the module
auto getUsedNames = [&](Module& module) {
UsedNames used;
ModuleUtils::ParallelFunctionAnalysis<UsedNames> nameCollector(
secondary, [&](Function* func, UsedNames& used) {
module, [&](Function* func, UsedNames& used) {
if (!func->imported()) {
NameCollector(used).walk(func->body);
}
Expand All @@ -983,65 +977,191 @@ void ModuleSplitter::shareImportableItems() {
}

NameCollector collector(used);
collector.walkModuleCode(&secondary);
for (auto& segment : secondary.dataSegments) {
collector.walkModuleCode(&module);
for (auto& segment : module.dataSegments) {
if (segment->memory.is()) {
used.memories.insert(segment->memory);
}
}
for (auto& segment : secondary.elementSegments) {
for (auto& segment : module.elementSegments) {
if (segment->table.is()) {
used.tables.insert(segment->table);
}
}
// If primary module has exports, they are "used" in it
for (auto& ex : module.exports) {
Comment on lines +991 to +992
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Do the secondary modules not have imports yet at this point, so we know these exports are all primary module exports? That would be helpful to mention in the comment if so.

if (ex->kind == ExternalKind::Global) {
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Let's use a switch (ex->kind) so the compiler will force us to handle new kinds of exports in the future.

used.globals.insert(*ex->getInternalName());
} else if (ex->kind == ExternalKind::Memory) {
used.memories.insert(*ex->getInternalName());
} else if (ex->kind == ExternalKind::Table) {
used.tables.insert(*ex->getInternalName());
} else if (ex->kind == ExternalKind::Tag) {
used.tags.insert(*ex->getInternalName());
}
}
return used;
};

UsedNames primaryUsed = getUsedNames(primary);
std::vector<UsedNames> secondaryUsed;
for (auto& secondaryPtr : secondaries) {
secondaryUsed.push_back(getUsedNames(*secondaryPtr));
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I wonder if using emplace_back would have a noticeable performance difference here.

}

// Compute globals referenced in other globals' initializers. Since globals
// can reference other globals, we must ensure that if a global is used in a
// module, all its dependencies are also marked as used.
auto computeDependentItems = [&](UsedNames& used) {
std::vector<Name> worklist(used.globals.begin(), used.globals.end());
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

In principle globals could also appear in segment offsets, element segment elements, and soon table default values. Is there a way we can generalize this to handle arbitrary module-level code?

for (auto name : worklist) {
// At this point all globals are still in the primary module, so this
// exists
auto* global = primary.getGlobal(name);
if (!global->imported() && global->init) {
for (auto* get : FindAll<GlobalGet>(global->init).list) {
used.globals.insert(get->name);
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Do we also need to add the newly found used global back to the worklist?

}
}
}
};

for (auto& used : secondaryUsed) {
computeDependentItems(used);
}

// Export module items that are used in the secondary module
for (auto& memory : primary.memories) {
if (!used.memories.count(memory->name)) {
continue;
// Given a name and module item kind, returns the list of secondary modules
// using that name
auto getUsingSecondaries = [&](const Name& name, auto UsedNames::* field) {
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Whoah, I've never seen this member pointer syntax before. Neat!

std::vector<Module*> usingModules;
for (size_t i = 0; i < secondaries.size(); ++i) {
if ((secondaryUsed[i].*field).count(name)) {
usingModules.push_back(secondaries[i].get());
}
auto secondaryMemory = ModuleUtils::copyMemory(memory.get(), secondary);
makeImportExport(
*memory, *secondaryMemory, "memory", ExternalKind::Memory);
}
return usingModules;
};

for (auto& table : primary.tables) {
// 1. In case we copied this table to this secondary module in
// setupTablePatching(), secondary.getTableOrNull(table->name) is not
// null, and we need to export it.
// 2. As in the case with other module elements, if the table is used in
// the secondary module's instructions, we need to export it.
auto secondaryTable = secondary.getTableOrNull(table->name);
if (!secondaryTable && !used.tables.count(table->name)) {
continue;
// Share module items with secondary modules.
// 1. Only share an item with the modules that use it
// 2. If an item is used by only a single secondary module, move the item to
// that secondary module. If an item is used by multiple modules (including
// the primary and secondary modules), export the item from the primary and
// import it from the using secondary modules.

std::vector<Name> memoriesToRemove;
for (auto& memory : primary.memories) {
auto usingSecondaries =
getUsingSecondaries(memory->name, &UsedNames::memories);
bool inPrimary = primaryUsed.memories.count(memory->name);
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Suggested change
bool inPrimary = primaryUsed.memories.count(memory->name);
bool usedInPrimary = primaryUsed.memories.count(memory->name);

Otherwise it sounds like this says whether it's defined in the primary module, but that's always true IIUC.


if (!inPrimary && usingSecondaries.size() == 1) {
auto* secondary = usingSecondaries[0];
ModuleUtils::copyMemory(memory.get(), *secondary);
memoriesToRemove.push_back(memory->name);
} else {
for (auto* secondary : usingSecondaries) {
auto* secondaryMemory =
ModuleUtils::copyMemory(memory.get(), *secondary);
makeImportExport(
*memory, *secondaryMemory, "memory", ExternalKind::Memory);
}
if (!secondaryTable) {
secondaryTable = ModuleUtils::copyTable(table.get(), secondary);
}
}
for (auto& name : memoriesToRemove) {
primary.removeMemory(name);
}

std::vector<Name> tablesToRemove;
for (auto& table : primary.tables) {
auto usingSecondaries =
getUsingSecondaries(table->name, &UsedNames::tables);
bool inPrimary = primaryUsed.tables.count(table->name);

if (!inPrimary && usingSecondaries.size() == 1) {
auto* secondary = usingSecondaries[0];
// In case we copied this table to this secondary module in
// setupTablePatching(), !inPrimary can't be satisfied, because the
// primary module should have an element segment that refers to this
// table.
assert(!secondary->getTableOrNull(table->name));
ModuleUtils::copyTable(table.get(), *secondary);
tablesToRemove.push_back(table->name);
} else {
for (auto* secondary : usingSecondaries) {
// 1. In case we copied this table to this secondary module in
// setupTablePatching(), secondary.getTableOrNull(table->name) is not
// null, and we need to export it.
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Suggested change
// null, and we need to export it.
// null, and we need to import it.

Is this right?

// 2. As in the case with other module elements, if the table is used in
// the secondary module's instructions, we need to export it.
auto secondaryTable = secondary->getTableOrNull(table->name);
if (!secondaryTable) {
secondaryTable = ModuleUtils::copyTable(table.get(), *secondary);
}
makeImportExport(*table, *secondaryTable, "table", ExternalKind::Table);
}
makeImportExport(*table, *secondaryTable, "table", ExternalKind::Table);
}
}
for (auto& name : tablesToRemove) {
primary.removeTable(name);
}

std::vector<Name> globalsToRemove;
for (auto& global : primary.globals) {
if (global->mutable_) {
assert(primary.features.hasMutableGlobals() &&
"TODO: add wrapper functions for disallowed mutable globals");
}

for (auto& global : primary.globals) {
if (!used.globals.count(global->name)) {
continue;
auto usingSecondaries =
getUsingSecondaries(global->name, &UsedNames::globals);
bool inPrimary = primaryUsed.globals.count(global->name);
if (!inPrimary && usingSecondaries.size() == 1) {
auto* secondary = usingSecondaries[0];
ModuleUtils::copyGlobal(global.get(), *secondary);
globalsToRemove.push_back(global->name);
// Import the global initializer's ref.func dependencies
if (global->init) {
for (auto* ref : FindAll<RefFunc>(global->init).list) {
// Here, ref->func is either a function in the primary module, or a
// trampoline created in indirectReferencesToSecondaryFunctions in
// case the original function is in one of the secondaries.
assert(primary.getFunctionOrNull(ref->func));
exportImportFunction(ref->func, {secondary});
}
}
if (global->mutable_) {
assert(primary.features.hasMutableGlobals() &&
"TODO: add wrapper functions for disallowed mutable globals");
} else {
for (auto* secondary : usingSecondaries) {
auto* secondaryGlobal =
ModuleUtils::copyGlobal(global.get(), *secondary);
makeImportExport(
*global, *secondaryGlobal, "global", ExternalKind::Global);
}
auto* secondaryGlobal = ModuleUtils::copyGlobal(global.get(), secondary);
makeImportExport(
*global, *secondaryGlobal, "global", ExternalKind::Global);
}
}
for (auto& name : globalsToRemove) {
primary.removeGlobal(name);
}

std::vector<Name> tagsToRemove;
for (auto& tag : primary.tags) {
auto usingSecondaries = getUsingSecondaries(tag->name, &UsedNames::tags);
bool inPrimary = primaryUsed.tags.count(tag->name);

for (auto& tag : primary.tags) {
if (!used.tags.count(tag->name)) {
continue;
if (!inPrimary && usingSecondaries.size() == 1) {
auto* secondary = usingSecondaries[0];
ModuleUtils::copyTag(tag.get(), *secondary);
tagsToRemove.push_back(tag->name);
} else {
for (auto* secondary : usingSecondaries) {
auto* secondaryTag = ModuleUtils::copyTag(tag.get(), *secondary);
makeImportExport(*tag, *secondaryTag, "tag", ExternalKind::Tag);
}
auto* secondaryTag = ModuleUtils::copyTag(tag.get(), secondary);
makeImportExport(*tag, *secondaryTag, "tag", ExternalKind::Tag);
}
}
for (auto& name : tagsToRemove) {
primary.removeTag(name);
}
}

} // anonymous namespace
Expand Down
38 changes: 38 additions & 0 deletions test/lit/wasm-split/global-funcref.wast
Original file line number Diff line number Diff line change
@@ -0,0 +1,38 @@
;; RUN: wasm-split %s -all -g -o1 %t.1.wasm -o2 %t.2.wasm --keep-funcs=keep
;; RUN: wasm-dis %t.1.wasm | filecheck %s --check-prefix PRIMARY
;; RUN: wasm-dis %t.2.wasm | filecheck %s --check-prefix SECONDARY

;; When the initializer of a split global ($a here) contains a ref.func of a
;; split function, we currently create a trampoline for that function in the
;; primary module and export it.
;; TODO Use $split in the secondary module directly in the split global

(module
;; PRIMARY: (export "trampoline_split" (func $trampoline_split))

;; PRIMARY: (func $keep
;; PRIMARY-NEXT: )
;; Named in --keep-funcs on the RUN line; the checks above expect it in the
;; primary module.
(func $keep)

;; PRIMARY: (func $trampoline_split
;; PRIMARY-NEXT: (call_indirect (type $0)
;; PRIMARY-NEXT: (i32.const 0)
;; PRIMARY-NEXT: )
;; PRIMARY-NEXT: )


;; SECONDARY: (import "primary" "trampoline_split" (func $trampoline_split (exact)))
;; SECONDARY: (global $a funcref (ref.func $trampoline_split))
;; The initializer names $split here, but the secondary-module check above
;; expects it to reference the imported $trampoline_split instead.
(global $a funcref (ref.func $split))

;; SECONDARY: (func $split
;; SECONDARY-NEXT: (drop
;; SECONDARY-NEXT: (global.get $a)
;; SECONDARY-NEXT: )
;; SECONDARY-NEXT: )
;; Reads $a; the checks above expect this function in the secondary module.
(func $split
(drop
(global.get $a)
)
)
)
57 changes: 0 additions & 57 deletions test/lit/wasm-split/selective-exports.wast

This file was deleted.

Loading
Loading