mirror of
https://github.com/llvm/llvm-project.git
synced 2025-04-24 00:36:04 +00:00

Change the global variable reference to a member access of another variable `ctx`. In the future, we may pass through `ctx` to functions to eliminate global variables. Pull Request: https://github.com/llvm/llvm-project/pull/119835
233 lines
7.3 KiB
C++
233 lines
7.3 KiB
C++
//===- MarkLive.cpp -------------------------------------------------------===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This file implements --gc-sections, which is a feature to remove unused
|
|
// chunks from the output. Unused chunks are those that are not reachable from
|
|
// known root symbols or chunks. This feature is implemented as a mark-sweep
|
|
// garbage collector.
|
|
//
|
|
// Here's how it works. Each InputChunk has a "Live" bit. The bit is off by
|
|
// default. Starting with the GC-roots, visit all reachable chunks and set their
|
|
// Live bits. The Writer will then ignore chunks whose Live bits are off, so
|
|
// that such chunk are not appear in the output.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "MarkLive.h"
|
|
#include "Config.h"
|
|
#include "InputChunks.h"
|
|
#include "InputElement.h"
|
|
#include "SymbolTable.h"
|
|
#include "Symbols.h"
|
|
|
|
#define DEBUG_TYPE "lld"
|
|
|
|
using namespace llvm;
|
|
using namespace llvm::wasm;
|
|
|
|
namespace lld::wasm {
|
|
|
|
namespace {
|
|
|
|
class MarkLive {
|
|
public:
|
|
void run();
|
|
|
|
private:
|
|
void enqueue(Symbol *sym);
|
|
void enqueue(InputChunk *chunk);
|
|
void enqueueInitFunctions(const ObjFile *sym);
|
|
void enqueueRetainedSegments(const ObjFile *file);
|
|
void mark();
|
|
bool isCallCtorsLive();
|
|
|
|
// A list of chunks to visit.
|
|
SmallVector<InputChunk *, 256> queue;
|
|
};
|
|
|
|
} // namespace
|
|
|
|
void MarkLive::enqueue(Symbol *sym) {
|
|
if (!sym || sym->isLive())
|
|
return;
|
|
LLVM_DEBUG(dbgs() << "markLive: " << sym->getName() << "\n");
|
|
|
|
InputFile *file = sym->getFile();
|
|
bool markImplicitDeps = file && !file->isLive() && sym->isDefined();
|
|
|
|
sym->markLive();
|
|
|
|
if (markImplicitDeps) {
|
|
if (auto obj = dyn_cast<ObjFile>(file)) {
|
|
// Mark as live the ctor functions in the object that defines this symbol.
|
|
// The ctor functions are all referenced by the synthetic callCtors
|
|
// function. However, this function does not contain relocations so we
|
|
// have to manually mark the ctors as live.
|
|
enqueueInitFunctions(obj);
|
|
// Mark retained segments in the object that defines this symbol live.
|
|
enqueueRetainedSegments(obj);
|
|
}
|
|
}
|
|
|
|
if (InputChunk *chunk = sym->getChunk())
|
|
queue.push_back(chunk);
|
|
}
|
|
|
|
void MarkLive::enqueue(InputChunk *chunk) {
|
|
LLVM_DEBUG(dbgs() << "markLive: " << toString(chunk) << "\n");
|
|
chunk->live = true;
|
|
queue.push_back(chunk);
|
|
}
|
|
|
|
// The ctor functions are all referenced by the synthetic callCtors
|
|
// function. However, this function does not contain relocations so we
|
|
// have to manually mark the ctors as live.
|
|
void MarkLive::enqueueInitFunctions(const ObjFile *obj) {
|
|
const WasmLinkingData &l = obj->getWasmObj()->linkingData();
|
|
for (const WasmInitFunc &f : l.InitFunctions) {
|
|
auto *initSym = obj->getFunctionSymbol(f.Symbol);
|
|
if (!initSym->isDiscarded())
|
|
enqueue(initSym);
|
|
}
|
|
}
|
|
|
|
// Mark segments flagged by segment-level no-strip. Segment-level no-strip is
|
|
// usually used to retain segments without having symbol table entry.
|
|
void MarkLive::enqueueRetainedSegments(const ObjFile *file) {
|
|
for (InputChunk *chunk : file->segments)
|
|
if (chunk->isRetained())
|
|
enqueue(chunk);
|
|
}
|
|
|
|
void MarkLive::run() {
|
|
// Add GC root symbols.
|
|
if (!ctx.arg.entry.empty())
|
|
enqueue(symtab->find(ctx.arg.entry));
|
|
|
|
// We need to preserve any no-strip or exported symbol
|
|
for (Symbol *sym : symtab->symbols())
|
|
if (sym->isNoStrip() || sym->isExported())
|
|
enqueue(sym);
|
|
|
|
if (WasmSym::callDtors)
|
|
enqueue(WasmSym::callDtors);
|
|
|
|
for (const ObjFile *obj : ctx.objectFiles)
|
|
if (obj->isLive()) {
|
|
// Enqueue constructors in objects explicitly live from the command-line.
|
|
enqueueInitFunctions(obj);
|
|
// Enqueue retained segments in objects explicitly live from the
|
|
// command-line.
|
|
enqueueRetainedSegments(obj);
|
|
}
|
|
|
|
mark();
|
|
|
|
// If we have any non-discarded init functions, mark `__wasm_call_ctors` as
|
|
// live so that we assign it an index and call it.
|
|
if (isCallCtorsLive())
|
|
WasmSym::callCtors->markLive();
|
|
}
|
|
|
|
void MarkLive::mark() {
|
|
// Follow relocations to mark all reachable chunks.
|
|
while (!queue.empty()) {
|
|
InputChunk *c = queue.pop_back_val();
|
|
|
|
for (const WasmRelocation reloc : c->getRelocations()) {
|
|
if (reloc.Type == R_WASM_TYPE_INDEX_LEB)
|
|
continue;
|
|
Symbol *sym = c->file->getSymbol(reloc.Index);
|
|
|
|
// If the function has been assigned the special index zero in the table,
|
|
// the relocation doesn't pull in the function body, since the function
|
|
// won't actually go in the table (the runtime will trap attempts to call
|
|
// that index, since we don't use it). A function with a table index of
|
|
// zero is only reachable via "call", not via "call_indirect". The stub
|
|
// functions used for weak-undefined symbols have this behaviour (compare
|
|
// equal to null pointer, only reachable via direct call).
|
|
if (reloc.Type == R_WASM_TABLE_INDEX_SLEB ||
|
|
reloc.Type == R_WASM_TABLE_INDEX_SLEB64 ||
|
|
reloc.Type == R_WASM_TABLE_INDEX_I32 ||
|
|
reloc.Type == R_WASM_TABLE_INDEX_I64) {
|
|
auto *funcSym = cast<FunctionSymbol>(sym);
|
|
if (funcSym->isStub)
|
|
continue;
|
|
}
|
|
|
|
enqueue(sym);
|
|
}
|
|
}
|
|
}
|
|
|
|
void markLive() {
|
|
if (!ctx.arg.gcSections)
|
|
return;
|
|
|
|
LLVM_DEBUG(dbgs() << "markLive\n");
|
|
|
|
MarkLive marker;
|
|
marker.run();
|
|
|
|
// Report garbage-collected sections.
|
|
if (ctx.arg.printGcSections) {
|
|
for (const ObjFile *obj : ctx.objectFiles) {
|
|
for (InputChunk *c : obj->functions)
|
|
if (!c->live)
|
|
message("removing unused section " + toString(c));
|
|
for (InputChunk *c : obj->segments)
|
|
if (!c->live)
|
|
message("removing unused section " + toString(c));
|
|
for (InputGlobal *g : obj->globals)
|
|
if (!g->live)
|
|
message("removing unused section " + toString(g));
|
|
for (InputTag *t : obj->tags)
|
|
if (!t->live)
|
|
message("removing unused section " + toString(t));
|
|
for (InputTable *t : obj->tables)
|
|
if (!t->live)
|
|
message("removing unused section " + toString(t));
|
|
}
|
|
for (InputChunk *c : ctx.syntheticFunctions)
|
|
if (!c->live)
|
|
message("removing unused section " + toString(c));
|
|
for (InputGlobal *g : ctx.syntheticGlobals)
|
|
if (!g->live)
|
|
message("removing unused section " + toString(g));
|
|
for (InputTable *t : ctx.syntheticTables)
|
|
if (!t->live)
|
|
message("removing unused section " + toString(t));
|
|
}
|
|
}
|
|
|
|
bool MarkLive::isCallCtorsLive() {
|
|
// In a reloctable link, we don't call `__wasm_call_ctors`.
|
|
if (ctx.arg.relocatable)
|
|
return false;
|
|
|
|
// In Emscripten-style PIC, we call `__wasm_call_ctors` which calls
|
|
// `__wasm_apply_data_relocs`.
|
|
if (ctx.isPic)
|
|
return true;
|
|
|
|
// If there are any init functions, mark `__wasm_call_ctors` live so that
|
|
// it can call them.
|
|
for (const ObjFile *file : ctx.objectFiles) {
|
|
const WasmLinkingData &l = file->getWasmObj()->linkingData();
|
|
for (const WasmInitFunc &f : l.InitFunctions) {
|
|
auto *sym = file->getFunctionSymbol(f.Symbol);
|
|
if (!sym->isDiscarded() && sym->isLive())
|
|
return true;
|
|
}
|
|
}
|
|
|
|
return false;
|
|
}
|
|
|
|
} // namespace lld::wasm
|