diff --git a/lld/test/wasm/no-strip-segment.s b/lld/test/wasm/no-strip-segment.s new file mode 100644 index 00000000000000..e70acae296d1a6 --- /dev/null +++ b/lld/test/wasm/no-strip-segment.s @@ -0,0 +1,62 @@ +# RUN: split-file %s %t +# RUN: llvm-mc -filetype=obj --triple=wasm32-unknown-unknown -o %t/main.o %t/main.s +# RUN: llvm-mc -filetype=obj --triple=wasm32-unknown-unknown -o %t/liba_x.o %t/liba_x.s +# RUN: llvm-mc -filetype=obj --triple=wasm32-unknown-unknown -o %t/liba_y.o %t/liba_y.s +# RUN: rm -f %t/liba.a +# RUN: llvm-ar rcs %t/liba.a %t/liba_x.o %t/liba_y.o +# RUN: wasm-ld %t/main.o %t/liba.a --gc-sections -o %t/main.wasm --print-gc-sections | FileCheck %s --check-prefix=GC +# RUN: obj2yaml %t/main.wasm | FileCheck %s + +# --gc-sections should remove non-retained and unused "weathers" section from live object liba_x.o +# GC: removing unused section {{.*}}/liba.a(liba_x.o):(weathers) +# Should not remove retained "greetings" sections from live objects main.o and liba_x.o +# GC-NOT: removing unused section %t/main.o:(greetings) +# GC-NOT: removing unused section %t/liba_x.o:(greetings) + +# Note: All symbols are private so that they don't join the symbol table. + +#--- main.s + .functype grab_liba () -> () + .globl _start +_start: + .functype _start () -> () + call grab_liba + end_function + + .section greetings,"R",@ + .asciz "hello" + .section weathers,"R",@ + .asciz "cloudy" + +#--- liba_x.s + .globl grab_liba +grab_liba: + .functype grab_liba () -> () + end_function + + .section greetings,"R",@ + .asciz "world" + .section weathers,"",@ + .asciz "rainy" + +#--- liba_y.s + .section greetings,"R",@ + .asciz "bye" + + +# "greetings" section +# CHECK: - Type: DATA +# CHECK: Segments: +# CHECK: - SectionOffset: 7 +# CHECK: InitFlags: 0 +# CHECK: Offset: +# CHECK: Opcode: I32_CONST +# CHECK: Value: 1024 +# CHECK: Content: 68656C6C6F00776F726C6400 +# "weahters" section. +# CHECK: - SectionOffset: 25 +# CHECK: InitFlags: 0 +# CHECK: Offset: +# CHECK: Opcode: I32_CONST +# CHECK: Value: 1036 +# CHECK: Content: 636C6F75647900 diff --git a/lld/wasm/InputChunks.h b/lld/wasm/InputChunks.h index 1e430832fb84c7..2ddf9232f01388 100644 --- a/lld/wasm/InputChunks.h +++ b/lld/wasm/InputChunks.h @@ -81,6 +81,7 @@ class InputChunk { void generateRelocationCode(raw_ostream &os) const; bool isTLS() const { return flags & llvm::wasm::WASM_SEG_FLAG_TLS; } + bool isRetained() const { return flags & llvm::wasm::WASM_SEG_FLAG_RETAIN; } ObjFile *file; OutputSection *outputSec = nullptr; diff --git a/lld/wasm/MarkLive.cpp b/lld/wasm/MarkLive.cpp index a59a80ad2cc3a7..085022b3d0c8cc 100644 --- a/lld/wasm/MarkLive.cpp +++ b/lld/wasm/MarkLive.cpp @@ -40,7 +40,9 @@ class MarkLive { private: void enqueue(Symbol *sym); + void enqueue(InputChunk *chunk); void enqueueInitFunctions(const ObjFile *sym); + void enqueueRetainedSegments(const ObjFile *file); void mark(); bool isCallCtorsLive(); @@ -56,21 +58,30 @@ void MarkLive::enqueue(Symbol *sym) { LLVM_DEBUG(dbgs() << "markLive: " << sym->getName() << "\n"); InputFile *file = sym->getFile(); - bool needInitFunctions = file && !file->isLive() && sym->isDefined(); + bool markImplicitDeps = file && !file->isLive() && sym->isDefined(); sym->markLive(); - // Mark ctor functions in the object that defines this symbol live. - // The ctor functions are all referenced by the synthetic callCtors - // function. However, this function does not contain relocations so we - // have to manually mark the ctors as live. - if (needInitFunctions) + if (markImplicitDeps) { + // Mark ctor functions in the object that defines this symbol live. + // The ctor functions are all referenced by the synthetic callCtors + // function. However, this function does not contain relocations so we + // have to manually mark the ctors as live. enqueueInitFunctions(cast(file)); + // Mark retained segments in the object that defines this symbol live. + enqueueRetainedSegments(cast(file)); + } if (InputChunk *chunk = sym->getChunk()) queue.push_back(chunk); } +void MarkLive::enqueue(InputChunk *chunk) { + LLVM_DEBUG(dbgs() << "markLive: " << toString(chunk) << "\n"); + chunk->live = true; + queue.push_back(chunk); +} + // The ctor functions are all referenced by the synthetic callCtors // function. However, this function does not contain relocations so we // have to manually mark the ctors as live. @@ -83,6 +94,14 @@ void MarkLive::enqueueInitFunctions(const ObjFile *obj) { } } +// Mark segments flagged by segment-level no-strip. Segment-level no-strip is +// usually used to retain segments without having symbol table entry. +void MarkLive::enqueueRetainedSegments(const ObjFile *file) { + for (InputChunk *chunk : file->segments) + if (chunk->isRetained()) + enqueue(chunk); +} + void MarkLive::run() { // Add GC root symbols. if (!config->entry.empty()) @@ -96,10 +115,14 @@ void MarkLive::run() { if (WasmSym::callDtors) enqueue(WasmSym::callDtors); - // Enqueue constructors in objects explicitly live from the command-line. for (const ObjFile *obj : symtab->objectFiles) - if (obj->isLive()) + if (obj->isLive()) { + // Enqueue constructors in objects explicitly live from the command-line. enqueueInitFunctions(obj); + // Enqueue retained segments in objects explicitly live from the + // command-line. + enqueueRetainedSegments(obj); + } mark(); diff --git a/llvm/include/llvm/BinaryFormat/Wasm.h b/llvm/include/llvm/BinaryFormat/Wasm.h index 48195af7def30e..3913a96d6c08db 100644 --- a/llvm/include/llvm/BinaryFormat/Wasm.h +++ b/llvm/include/llvm/BinaryFormat/Wasm.h @@ -391,6 +391,7 @@ enum WasmSymbolType : unsigned { enum WasmSegmentFlag : unsigned { WASM_SEG_FLAG_STRINGS = 0x1, WASM_SEG_FLAG_TLS = 0x2, + WASM_SEG_FLAG_RETAIN = 0x4, }; // Kinds of tag attributes. diff --git a/llvm/include/llvm/CodeGen/TargetLoweringObjectFileImpl.h b/llvm/include/llvm/CodeGen/TargetLoweringObjectFileImpl.h index 9f92b919824d2d..f76c137e40cc4b 100644 --- a/llvm/include/llvm/CodeGen/TargetLoweringObjectFileImpl.h +++ b/llvm/include/llvm/CodeGen/TargetLoweringObjectFileImpl.h @@ -207,11 +207,14 @@ class TargetLoweringObjectFileCOFF : public TargetLoweringObjectFile { class TargetLoweringObjectFileWasm : public TargetLoweringObjectFile { mutable unsigned NextUniqueID = 0; + SmallPtrSet Used; public: TargetLoweringObjectFileWasm() = default; ~TargetLoweringObjectFileWasm() override = default; + void getModuleMetadata(Module &M) override; + MCSection *getExplicitSectionGlobal(const GlobalObject *GO, SectionKind Kind, const TargetMachine &TM) const override; diff --git a/llvm/lib/CodeGen/TargetLoweringObjectFileImpl.cpp b/llvm/lib/CodeGen/TargetLoweringObjectFileImpl.cpp index 71c5521a3f2060..84ca6d8944774b 100644 --- a/llvm/lib/CodeGen/TargetLoweringObjectFileImpl.cpp +++ b/llvm/lib/CodeGen/TargetLoweringObjectFileImpl.cpp @@ -2128,7 +2128,7 @@ static const Comdat *getWasmComdat(const GlobalValue *GV) { return C; } -static unsigned getWasmSectionFlags(SectionKind K) { +static unsigned getWasmSectionFlags(SectionKind K, bool Retain) { unsigned Flags = 0; if (K.isThreadLocal()) @@ -2137,11 +2137,22 @@ static unsigned getWasmSectionFlags(SectionKind K) { if (K.isMergeableCString()) Flags |= wasm::WASM_SEG_FLAG_STRINGS; + if (Retain) + Flags |= wasm::WASM_SEG_FLAG_RETAIN; + // TODO(sbc): Add suport for K.isMergeableConst() return Flags; } +void TargetLoweringObjectFileWasm::getModuleMetadata(Module &M) { + SmallVector Vec; + collectUsedGlobalVariables(M, Vec, false); + for (GlobalValue *GV : Vec) + if (auto *GO = dyn_cast(GV)) + Used.insert(GO); +} + MCSection *TargetLoweringObjectFileWasm::getExplicitSectionGlobal( const GlobalObject *GO, SectionKind Kind, const TargetMachine &TM) const { // We don't support explict section names for functions in the wasm object @@ -2165,16 +2176,18 @@ MCSection *TargetLoweringObjectFileWasm::getExplicitSectionGlobal( Group = C->getName(); } - unsigned Flags = getWasmSectionFlags(Kind); + unsigned Flags = getWasmSectionFlags(Kind, Used.count(GO)); MCSectionWasm *Section = getContext().getWasmSection( Name, Kind, Flags, Group, MCContext::GenericSectionID); return Section; } -static MCSectionWasm *selectWasmSectionForGlobal( - MCContext &Ctx, const GlobalObject *GO, SectionKind Kind, Mangler &Mang, - const TargetMachine &TM, bool EmitUniqueSection, unsigned *NextUniqueID) { +static MCSectionWasm * +selectWasmSectionForGlobal(MCContext &Ctx, const GlobalObject *GO, + SectionKind Kind, Mangler &Mang, + const TargetMachine &TM, bool EmitUniqueSection, + unsigned *NextUniqueID, bool Retain) { StringRef Group = ""; if (const Comdat *C = getWasmComdat(GO)) { Group = C->getName(); @@ -2199,7 +2212,7 @@ static MCSectionWasm *selectWasmSectionForGlobal( (*NextUniqueID)++; } - unsigned Flags = getWasmSectionFlags(Kind); + unsigned Flags = getWasmSectionFlags(Kind, Retain); return Ctx.getWasmSection(Name, Kind, Flags, Group, UniqueID); } @@ -2217,9 +2230,11 @@ MCSection *TargetLoweringObjectFileWasm::SelectSectionForGlobal( else EmitUniqueSection = TM.getDataSections(); EmitUniqueSection |= GO->hasComdat(); + bool Retain = Used.count(GO); + EmitUniqueSection |= Retain; return selectWasmSectionForGlobal(getContext(), GO, Kind, getMangler(), TM, - EmitUniqueSection, &NextUniqueID); + EmitUniqueSection, &NextUniqueID, Retain); } bool TargetLoweringObjectFileWasm::shouldPutJumpTableInFunctionSection( diff --git a/llvm/lib/MC/MCParser/WasmAsmParser.cpp b/llvm/lib/MC/MCParser/WasmAsmParser.cpp index 97045495a60dec..b95ee33debc37b 100644 --- a/llvm/lib/MC/MCParser/WasmAsmParser.cpp +++ b/llvm/lib/MC/MCParser/WasmAsmParser.cpp @@ -115,6 +115,9 @@ class WasmAsmParser : public MCAsmParserExtension { case 'S': flags |= wasm::WASM_SEG_FLAG_STRINGS; break; + case 'R': + flags |= wasm::WASM_SEG_FLAG_RETAIN; + break; default: return -1U; } diff --git a/llvm/lib/MC/MCSectionWasm.cpp b/llvm/lib/MC/MCSectionWasm.cpp index e90f401b1efa1f..e3761820bb4c3e 100644 --- a/llvm/lib/MC/MCSectionWasm.cpp +++ b/llvm/lib/MC/MCSectionWasm.cpp @@ -70,6 +70,8 @@ void MCSectionWasm::printSwitchToSection(const MCAsmInfo &MAI, const Triple &T, OS << 'S'; if (SegmentFlags & wasm::WASM_SEG_FLAG_TLS) OS << 'T'; + if (SegmentFlags & wasm::WASM_SEG_FLAG_RETAIN) + OS << 'R'; OS << '"'; diff --git a/llvm/lib/ObjectYAML/WasmYAML.cpp b/llvm/lib/ObjectYAML/WasmYAML.cpp index ef47766a239420..69e59cc8612881 100644 --- a/llvm/lib/ObjectYAML/WasmYAML.cpp +++ b/llvm/lib/ObjectYAML/WasmYAML.cpp @@ -556,6 +556,7 @@ void ScalarBitSetTraits::bitset( #define BCase(X) IO.bitSetCase(Value, #X, wasm::WASM_SEG_FLAG_##X) BCase(STRINGS); BCase(TLS); + BCase(RETAIN); #undef BCase } diff --git a/llvm/test/CodeGen/WebAssembly/no-strip.ll b/llvm/test/CodeGen/WebAssembly/no-strip.ll new file mode 100644 index 00000000000000..e6206aebdce8e2 --- /dev/null +++ b/llvm/test/CodeGen/WebAssembly/no-strip.ll @@ -0,0 +1,22 @@ +; RUN: llc < %s --mtriple=wasm32-unknown-unknown | FileCheck %s + +@llvm.used = appending global [ + 5 x ptr +] [ + ptr @ga, ptr @gb, ptr @gc, ptr @gd, ptr @ge +], section "llvm.metadata" + +; CHECK: .section .data.ga,"R",@ +@ga = global i32 42 +; CHECK: .section .data.gb,"R",@ +@gb = internal global i32 41 +; CHECK: .section .data..Lgc,"R",@ +@gc = private global i32 40 +; CHECK: .section .rodata.gd,"R",@ +@gd = constant i32 39 + +; All sections with the same explicit name are flagged as retained if a part of them is retained. +; CHECK: .section dddd,"R",@ +@ge = global i32 38, section "dddd" +; CHECK: .section dddd,"R",@ +@gg = global i32 37, section "dddd" diff --git a/llvm/test/MC/WebAssembly/no-dead-strip.ll b/llvm/test/MC/WebAssembly/no-dead-strip.ll index 9b550ec6cefbc2..6b3f090d9cab8f 100644 --- a/llvm/test/MC/WebAssembly/no-dead-strip.ll +++ b/llvm/test/MC/WebAssembly/no-dead-strip.ll @@ -1,21 +1,69 @@ -; RUN: llc -filetype=obj -wasm-keep-registers %s -o - | llvm-readobj --symbols - | FileCheck %s +; RUN: llc < %s --mtriple=wasm32-unknown-unknown -filetype=obj -wasm-keep-registers -o - | obj2yaml - | FileCheck %s -target triple = "wasm32-unknown-unknown" - -@llvm.used = appending global [1 x ptr] [ptr @foo], section "llvm.metadata" +@llvm.used = appending global [5 x ptr] [ + ptr @foo, ptr @gv0, ptr @gv1, ptr @gv2, ptr @gv3 +], section "llvm.metadata" define i32 @foo() { entry: ret i32 0 } -; CHECK: Symbols [ -; CHECK-NEXT: Symbol { -; CHECK-NEXT: Name: foo -; CHECK-NEXT: Type: FUNCTION (0x0) -; CHECK-NEXT: Flags [ (0x80) -; CHECK-NEXT: NO_STRIP (0x80) -; CHECK-NEXT: ] -; CHECK-NEXT: ElementIndex: 0x0 -; CHECK-NEXT: } -; CHECK-NEXT: ] +; externally visible GV has NO_STRIP/RETAIN in both symtab entry and segment info +@gv0 = global i32 42 +; internal GV has NO_STRIP/RETAIN in both symtab entry and segment info +@gv1 = internal global i32 41 +; private GV has RETAIN in segment info only (no symtab entry) +@gv2 = private global i32 40 +; explicit section names +@gv3 = global i32 39, section "ddd.hello" +@gv4.not.used = global i64 38, section "ddd.hello" + +; CHECK: SymbolTable: +; CHECK-NEXT: - Index: 0 +; CHECK-NEXT: Kind: FUNCTION +; CHECK-NEXT: Name: foo +; CHECK-NEXT: Flags: [ NO_STRIP ] +; CHECK-NEXT: Function: 0 +; CHECK-NEXT: - Index: 1 +; CHECK-NEXT: Kind: DATA +; CHECK-NEXT: Name: gv0 +; CHECK-NEXT: Flags: [ NO_STRIP ] +; CHECK-NEXT: Segment: 0 +; CHECK-NEXT: Size: 4 +; CHECK-NEXT: - Index: 2 +; CHECK-NEXT: Kind: DATA +; CHECK-NEXT: Name: gv1 +; CHECK-NEXT: Flags: [ BINDING_LOCAL, NO_STRIP ] +; CHECK-NEXT: Segment: 1 +; CHECK-NEXT: Size: 4 +; CHECK-NEXT: - Index: 3 +; CHECK-NEXT: Kind: DATA +; CHECK-NEXT: Name: gv3 +; CHECK-NEXT: Flags: [ NO_STRIP ] +; CHECK-NEXT: Segment: 3 +; CHECK-NEXT: Size: 4 +; CHECK-NEXT: - Index: 4 +; CHECK-NEXT: Kind: DATA +; CHECK-NEXT: Name: gv4.not.used +; CHECK-NEXT: Flags: [ ] +; CHECK-NEXT: Segment: 3 +; CHECK-NEXT: Offset: 8 +; CHECK-NEXT: Size: 8 +; CHECK-NEXT: SegmentInfo: +; CHECK-NEXT: - Index: 0 +; CHECK-NEXT: Name: .data.gv0 +; CHECK-NEXT: Alignment: 2 +; CHECK-NEXT: Flags: [ RETAIN ] +; CHECK-NEXT: - Index: 1 +; CHECK-NEXT: Name: .data.gv1 +; CHECK-NEXT: Alignment: 2 +; CHECK-NEXT: Flags: [ RETAIN ] +; CHECK-NEXT: - Index: 2 +; CHECK-NEXT: Name: .data..Lgv2 +; CHECK-NEXT: Alignment: 2 +; CHECK-NEXT: Flags: [ RETAIN ] +; CHECK-NEXT: - Index: 3 +; CHECK-NEXT: Name: ddd.hello +; CHECK-NEXT: Alignment: 3 +; CHECK-NEXT: Flags: [ RETAIN ]