45#define DEBUG_TYPE "mc"
49 IndirectSymBase.clear();
50 IndirectSymbols.clear();
52 SectionAddress.
clear();
55 LocalSymbolData.clear();
56 ExternalSymbolData.clear();
57 UndefinedSymbolData.clear();
59 VersionInfo.Major = 0;
61 TargetVariantVersionInfo.Major = 0;
63 LinkerOptions.clear();
74 if (cast<MCSymbolMachO>(S).isWeakDefinition())
81bool MachObjectWriter::
82MachSymbolData::operator<(
const MachSymbolData &RHS)
const {
83 return Symbol->getName() <
RHS.Symbol->
getName();
97 Asm.getFragmentOffset(*Fragment);
106 return C->getValue();
114 if (
Target.getSymA() &&
Target.getSymA()->getSymbol().isUndefined())
117 if (
Target.getSymB() &&
Target.getSymB()->getSymbol().isUndefined())
130 Asm.getSymbolOffset(S);
136 unsigned Next = cast<MCSectionMachO>(Sec)->getLayoutOrder() + 1;
137 if (Next >= SectionOrder.
size())
140 const MCSection &NextSec = *SectionOrder[Next];
148 if (!Symbol.isTemporary())
151 if (Symbol.isUsedInReloc())
177 unsigned NumLoadCommands,
178 unsigned LoadCommandsSize,
179 bool SubsectionsViaSymbols) {
227 unsigned SegmentLoadCommandSize =
235 writeWithPadding(
Name, 16);
259 uint64_t FileOffset,
unsigned Flags,
261 unsigned NumRelocations) {
262 uint64_t SectionSize = Asm.getSectionAddressSize(Sec);
266 if (Section.isVirtualSection()) {
267 assert(Asm.getSectionFileSize(Sec) == 0 &&
"Invalid file size!");
277 writeWithPadding(Section.getName(), 16);
278 writeWithPadding(Section.getSegmentName(), 16);
286 assert(isUInt<32>(FileOffset) &&
"Cannot encode offset of section");
290 assert((!NumRelocations || isUInt<32>(RelocationsStart)) &&
291 "Cannot encode offset of relocations");
360MachObjectWriter::MachSymbolData *
361MachObjectWriter::findSymbolData(
const MCSymbol &
Sym) {
362 for (
auto *SymbolData :
363 {&LocalSymbolData, &ExternalSymbolData, &UndefinedSymbolData})
364 for (MachSymbolData &Entry : *SymbolData)
365 if (Entry.Symbol == &
Sym)
375 const auto *
Ref = dyn_cast<MCSymbolRefExpr>(
Value);
378 S = &
Ref->getSymbol();
384 const MCSymbol *Symbol = MSD.Symbol;
385 const auto &
Data = cast<MCSymbolMachO>(*Symbol);
387 uint8_t SectionIndex = MSD.SectionIndex;
390 bool IsAlias = Symbol != AliasedSymbol;
392 const MCSymbol &OrigSymbol = *Symbol;
393 MachSymbolData *AliaseeInfo;
395 AliaseeInfo = findSymbolData(*AliasedSymbol);
397 SectionIndex = AliaseeInfo->SectionIndex;
398 Symbol = AliasedSymbol;
405 if (IsAlias && Symbol->isUndefined())
407 else if (Symbol->isUndefined())
409 else if (Symbol->isAbsolute())
416 if (
Data.isPrivateExtern())
420 if (
Data.isExternal() || (!IsAlias && Symbol->isUndefined()))
424 if (IsAlias && Symbol->isUndefined())
425 Address = AliaseeInfo->StringIndex;
426 else if (Symbol->isDefined())
428 else if (Symbol->isCommon()) {
431 Address = Symbol->getCommonSize();
442 bool EncodeAsAltEntry =
443 IsAlias && cast<MCSymbolMachO>(OrigSymbol).isAltEntry();
444 W.
write<
uint16_t>(cast<MCSymbolMachO>(Symbol)->getEncodedFlags(EncodeAsAltEntry));
469 for (
const std::string &Option :
Options)
470 Size += Option.size() + 1;
475 const std::vector<std::string> &
Options)
485 for (
const std::string &Option :
Options) {
487 W.
OS << Option <<
'\0';
488 BytesWritten += Option.size() + 1;
511 Asm.getContext().reportError(
Fixup.getLoc(),
512 "unsupported relocation expression");
516 TargetObjectWriter->recordRelocation(
this, Asm, Fragment,
Fixup,
Target,
530 for (IndirectSymbolData &ISD : IndirectSymbols) {
531 const MCSectionMachO &Section = cast<MCSectionMachO>(*ISD.Section);
539 "' not in a symbol pointer or stub section");
544 for (
auto [IndirectIndex, ISD] :
enumerate(IndirectSymbols)) {
545 const auto &Section = cast<MCSectionMachO>(*ISD.Section);
552 IndirectSymBase.insert(std::make_pair(ISD.Section, IndirectIndex));
554 Asm.registerSymbol(*ISD.Symbol);
558 for (
auto [IndirectIndex, ISD] :
enumerate(IndirectSymbols)) {
559 const auto &Section = cast<MCSectionMachO>(*ISD.Section);
566 IndirectSymBase.insert(std::make_pair(ISD.Section, IndirectIndex));
571 if (Asm.registerSymbol(*ISD.Symbol))
572 cast<MCSymbolMachO>(ISD.Symbol)->setReferenceTypeUndefinedLazy(
true);
578 MCAssembler &Asm, std::vector<MachSymbolData> &LocalSymbolData,
579 std::vector<MachSymbolData> &ExternalSymbolData,
580 std::vector<MachSymbolData> &UndefinedSymbolData) {
585 SectionIndexMap[&Sec] =
Index++;
589 for (
const MCSymbol &Symbol : Asm.symbols()) {
593 StringTable.
add(Symbol.getName());
602 for (
const MCSymbol &Symbol : Asm.symbols()) {
607 if (!Symbol.isExternal() && !Symbol.isUndefined())
611 MSD.Symbol = &Symbol;
612 MSD.StringIndex = StringTable.
getOffset(Symbol.getName());
614 if (Symbol.isUndefined()) {
615 MSD.SectionIndex = 0;
616 UndefinedSymbolData.push_back(MSD);
617 }
else if (Symbol.isAbsolute()) {
618 MSD.SectionIndex = 0;
619 ExternalSymbolData.push_back(MSD);
621 MSD.SectionIndex = SectionIndexMap.
lookup(&Symbol.getSection());
622 assert(MSD.SectionIndex &&
"Invalid section index!");
623 ExternalSymbolData.push_back(MSD);
628 for (
const MCSymbol &Symbol : Asm.symbols()) {
633 if (Symbol.isExternal() || Symbol.isUndefined())
637 MSD.Symbol = &Symbol;
638 MSD.StringIndex = StringTable.
getOffset(Symbol.getName());
640 if (Symbol.isAbsolute()) {
641 MSD.SectionIndex = 0;
642 LocalSymbolData.push_back(MSD);
644 MSD.SectionIndex = SectionIndexMap.
lookup(&Symbol.getSection());
645 assert(MSD.SectionIndex &&
"Invalid section index!");
646 LocalSymbolData.push_back(MSD);
656 for (
auto *SymbolData :
657 {&LocalSymbolData, &ExternalSymbolData, &UndefinedSymbolData})
658 for (MachSymbolData &Entry : *SymbolData)
659 Entry.Symbol->setIndex(
Index++);
662 for (RelAndSymbol &Rel : Relocations[&Section]) {
667 unsigned Index = Rel.Sym->getIndex();
670 Rel.MRE.r_word1 = (Rel.MRE.r_word1 & (~0U << 24)) |
Index | (1 << 27);
672 Rel.MRE.r_word1 = (Rel.MRE.r_word1 & 0xff) |
Index << 8 | (1 << 4);
682 if (!Sec.isVirtualSection()) {
684 cast<MCSectionMachO>(Sec).setLayoutOrder(i++);
688 if (Sec.isVirtualSection()) {
690 cast<MCSectionMachO>(Sec).setLayoutOrder(i++);
695 for (
const MCSection *Sec : SectionOrder) {
696 StartAddress =
alignTo(StartAddress, Sec->getAlign());
697 SectionAddress[Sec] = StartAddress;
698 StartAddress += Asm.getSectionAddressSize(*Sec);
716 bool InSet,
bool IsPCRel)
const {
743 bool hasReliableSymbolDifference =
isX86_64();
744 if (!hasReliableSymbolDifference) {
773 Asm.getContext().getObjectFileInfo()->getAddrSigSection();
774 unsigned Log2Size =
is64Bit() ? 3 : 2;
776 if (!S->isRegistered())
787 auto NumBytesWritten = [&] {
return W.
OS.
tell() - StartOffset; };
793 UndefinedSymbolData);
796 MCSection *CGProfileSection = Asm.getContext().getMachOSection(
798 auto &Frag = cast<MCDataFragment>(*CGProfileSection->
begin());
799 Frag.getContents().clear();
802 uint32_t FromIndex = CGPE.From->getSymbol().getIndex();
803 uint32_t ToIndex = CGPE.To->getSymbol().getIndex();
810 unsigned NumSections = Asm.end() - Asm.begin();
814 unsigned NumLoadCommands = 1;
820 if (VersionInfo.Major != 0) {
822 if (VersionInfo.EmitBuildVersion)
829 if (TargetVariantVersionInfo.Major != 0) {
831 assert(TargetVariantVersionInfo.EmitBuildVersion &&
832 "target variant should use build version");
837 unsigned NumDataRegions = DataRegions.size();
838 if (NumDataRegions) {
852 unsigned NumSymbols = LocalSymbolData.size() + ExternalSymbolData.size() +
853 UndefinedSymbolData.size();
855 NumLoadCommands += 2;
861 for (
const auto &Option : LinkerOptions) {
876 uint64_t FileSize = Asm.getSectionFileSize(Sec);
881 if (Sec.isVirtualSection())
884 SectionDataSize = std::max(SectionDataSize,
Address +
Size);
885 SectionDataFileSize = std::max(SectionDataFileSize,
Address + FileSize);
891 unsigned SectionDataPadding =
893 SectionDataFileSize += SectionDataPadding;
901 SectionDataSize, Prot, Prot);
904 uint64_t RelocTableEnd = SectionDataStart + SectionDataFileSize;
906 const auto &Sec = cast<MCSectionMachO>(Section);
907 std::vector<RelAndSymbol> &Relocs = Relocations[&Sec];
908 unsigned NumRelocs = Relocs.size();
910 unsigned Flags = Sec.getTypeAndAttributes();
911 if (Sec.hasInstructions())
913 if (!cast<MCSectionMachO>(Sec).isVirtualSection() &&
914 !isUInt<32>(SectionStart)) {
915 Asm.getContext().reportError(
916 SMLoc(),
"cannot encode offset of section; object file too large");
917 return NumBytesWritten();
919 if (NumRelocs && !isUInt<32>(RelocTableEnd)) {
920 Asm.getContext().reportError(
922 "cannot encode offset of relocations; object file too large");
923 return NumBytesWritten();
926 RelocTableEnd, NumRelocs);
931 auto EmitDeploymentTargetVersion =
934 assert(!V.empty() &&
"empty version");
935 unsigned Update = V.getSubminor().value_or(0);
936 unsigned Minor = V.getMinor().value_or(0);
937 assert(
Update < 256 &&
"unencodable update target version");
938 assert(
Minor < 256 &&
"unencodable minor target version");
939 assert(V.getMajor() < 65536 &&
"unencodable major target version");
940 return Update | (
Minor << 8) | (V.getMajor() << 16);
943 VersionInfo.Major, VersionInfo.Minor, VersionInfo.Update));
945 ? EncodeVersion(VersionInfo.SDKVersion)
947 if (VersionInfo.EmitBuildVersion) {
964 if (VersionInfo.Major != 0)
965 EmitDeploymentTargetVersion(VersionInfo);
966 if (TargetVariantVersionInfo.Major != 0)
967 EmitDeploymentTargetVersion(TargetVariantVersionInfo);
970 uint64_t DataInCodeTableEnd = RelocTableEnd + NumDataRegions * 8;
971 if (NumDataRegions) {
972 uint64_t DataRegionsOffset = RelocTableEnd;
973 uint64_t DataRegionsSize = NumDataRegions * 8;
979 uint64_t LOHTableEnd = DataInCodeTableEnd + LOHSize;
982 DataInCodeTableEnd, LOHSize);
986 unsigned FirstLocalSymbol = 0;
987 unsigned NumLocalSymbols = LocalSymbolData.size();
988 unsigned FirstExternalSymbol = FirstLocalSymbol + NumLocalSymbols;
989 unsigned NumExternalSymbols = ExternalSymbolData.size();
990 unsigned FirstUndefinedSymbol = FirstExternalSymbol + NumExternalSymbols;
991 unsigned NumUndefinedSymbols = UndefinedSymbolData.size();
992 unsigned NumIndirectSymbols = IndirectSymbols.size();
993 unsigned NumSymTabSymbols =
994 NumLocalSymbols + NumExternalSymbols + NumUndefinedSymbols;
995 uint64_t IndirectSymbolSize = NumIndirectSymbols * 4;
999 if (NumIndirectSymbols)
1000 IndirectSymbolOffset = LOHTableEnd;
1003 uint64_t SymbolTableOffset = LOHTableEnd + IndirectSymbolSize;
1007 SymbolTableOffset + NumSymTabSymbols * (
is64Bit() ?
1011 StringTableOffset, StringTable.
getSize());
1014 FirstExternalSymbol, NumExternalSymbols,
1015 FirstUndefinedSymbol, NumUndefinedSymbols,
1016 IndirectSymbolOffset, NumIndirectSymbols);
1020 for (
const auto &Option : LinkerOptions)
1025 Asm.writeSectionData(
W.
OS, &Sec);
1038 std::vector<RelAndSymbol> &Relocs = Relocations[&Sec];
1055 <<
" start: " << Start <<
"(" <<
Data.Start->getName()
1056 <<
")" <<
" end: " <<
End <<
"(" <<
Data.End->getName()
1057 <<
")" <<
" size: " <<
End - Start <<
"\n");
1068 LOHContainer.
emit(Asm, *
this);
1078 for (
auto &ISD : IndirectSymbols) {
1085 if (ISD.Symbol->isDefined() && !ISD.Symbol->isExternal()) {
1087 if (ISD.Symbol->isAbsolute())
1100 for (
auto *SymbolData :
1101 {&LocalSymbolData, &ExternalSymbolData, &UndefinedSymbolData})
1102 for (MachSymbolData &Entry : *SymbolData)
1109 return NumBytesWritten();
This file defines the DenseMap class.
static unsigned ComputeLinkerOptionsLoadCommandSize(const std::vector< std::string > &Options, bool is64Bit)
static bool isFixupTargetValid(const MCValue &Target)
static MachO::LoadCommandType getLCFromMCVM(MCVersionMinType Type)
static bool isSymbolLinkerVisible(const MCSymbol &Symbol)
PowerPC TLS Dynamic Call Fixup
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())
static bool is64Bit(const char *name)
ValueT lookup(const_arg_type_t< KeyT > Val) const
lookup - Return the entry for the specified key, or a default constructed value if no such entry exis...
static bool isSectionAtomizableBySymbols(const MCSection &Section)
True if the section is atomized using the symbols in it.
Base class for the full range of assembler expressions which are needed for parsing.
bool evaluateAsRelocatable(MCValue &Res, const MCAssembler *Asm, const MCFixup *Fixup) const
Try to evaluate the expression to a relocatable value, i.e.
Encode information on a single operation to perform on a byte sequence (e.g., an encoded instruction)...
const MCSymbol * getAtom() const
MCSection * getParent() const
void emit(const MCAssembler &Asm, MachObjectWriter &ObjWriter) const
Emit all Linker Optimization Hints in one big table.
uint64_t getEmitSize(const MCAssembler &Asm, const MachObjectWriter &ObjWriter) const
Get the size of the directives if emitted.
SmallVector< CGProfileEntry, 0 > CGProfile
bool SubsectionsViaSymbols
std::vector< const MCSymbol * > & getAddrsigSyms()
virtual void reset()
lifetime management
This represents a section on a Mach-O system (used by Mac OS X).
Instances of this class represent a uniqued identifier for a section in the current translation unit.
bool isVirtualSection() const
Check whether this section is "virtual", that is has no actual object file contents.
MCSymbol - Instances of this class represent a symbol name in the MC file, and MCSymbols are created ...
const MCExpr * getVariableValue(bool SetUsed=true) const
getVariableValue - Get the value for variable symbols.
bool isInSection() const
isInSection - Check if this symbol is defined in some section (i.e., it is defined but not absolute).
StringRef getName() const
getName - Get the symbol name.
bool isVariable() const
isVariable - Check if this is a variable symbol.
bool isUndefined(bool SetUsed=true) const
isUndefined - Check if this symbol is undefined (i.e., implicitly defined).
MCSection & getSection() const
Get the section associated with a defined, non-absolute symbol.
bool isTemporary() const
isTemporary - Check if this is an assembler temporary symbol.
MCFragment * getFragment(bool SetUsed=true) const
This represents an "assembler immediate".
uint64_t getPaddingSize(const MCAssembler &Asm, const MCSection *SD) const
void computeSectionAddresses(const MCAssembler &Asm)
void writeSection(const MCAssembler &Asm, const MCSection &Sec, uint64_t VMAddr, uint64_t FileOffset, unsigned Flags, uint64_t RelocationsStart, unsigned NumRelocations)
bool doesSymbolRequireExternRelocation(const MCSymbol &S)
void computeSymbolTable(MCAssembler &Asm, std::vector< MachSymbolData > &LocalSymbolData, std::vector< MachSymbolData > &ExternalSymbolData, std::vector< MachSymbolData > &UndefinedSymbolData)
Compute the symbol table data.
uint64_t getFragmentAddress(const MCAssembler &Asm, const MCFragment *Fragment) const
{ bool EmitBuildVersion VersionInfoType
void executePostLayoutBinding(MCAssembler &Asm) override
Perform any late binding of symbols (for example, to assign symbol indices for use when generating re...
uint64_t getSectionAddress(const MCSection *Sec) const
void addRelocation(const MCSymbol *RelSymbol, const MCSection *Sec, MachO::any_relocation_info &MRE)
void populateAddrSigSection(MCAssembler &Asm)
bool isFixupKindPCRel(const MCAssembler &Asm, unsigned Kind)
support::endian::Writer W
void writeLinkerOptionsLoadCommand(const std::vector< std::string > &Options)
void recordRelocation(MCAssembler &Asm, const MCFragment *Fragment, const MCFixup &Fixup, MCValue Target, uint64_t &FixedValue) override
Record a relocation entry.
void writeNlist(MachSymbolData &MSD, const MCAssembler &Asm)
VersionTuple SDKVersion
An optional version of the SDK that was used to build the source.
bool isSymbolRefDifferenceFullyResolvedImpl(const MCAssembler &Asm, const MCSymbol &SymA, const MCFragment &FB, bool InSet, bool IsPCRel) const override
void writeDysymtabLoadCommand(uint32_t FirstLocalSymbol, uint32_t NumLocalSymbols, uint32_t FirstExternalSymbol, uint32_t NumExternalSymbols, uint32_t FirstUndefinedSymbol, uint32_t NumUndefinedSymbols, uint32_t IndirectSymbolOffset, uint32_t NumIndirectSymbols)
const MCSymbol & findAliasedSymbol(const MCSymbol &Sym) const
uint64_t getSymbolAddress(const MCSymbol &S, const MCAssembler &Asm) const
MCVersionMinType Type
Used when EmitBuildVersion==false.
void writeSegmentLoadCommand(StringRef Name, unsigned NumSections, uint64_t VMAddr, uint64_t VMSize, uint64_t SectionDataStartOffset, uint64_t SectionDataSize, uint32_t MaxProt, uint32_t InitProt)
Write a segment load command.
const MCSymbol * getAtom(const MCSymbol &S) const
void writeLinkeditLoadCommand(uint32_t Type, uint32_t DataOffset, uint32_t DataSize)
void writeHeader(MachO::HeaderFileType Type, unsigned NumLoadCommands, unsigned LoadCommandsSize, bool SubsectionsViaSymbols)
void reset() override
lifetime management
void writeSymtabLoadCommand(uint32_t SymbolOffset, uint32_t NumSymbols, uint32_t StringTableOffset, uint32_t StringTableSize)
void bindIndirectSymbols(MCAssembler &Asm)
uint64_t writeObject(MCAssembler &Asm) override
Write the object file and return the number of bytes written.
Represents a location in source code.
static SectionKind getMetadata()
void push_back(const T &Elt)
StringRef - Represent a constant reference to a string, i.e.
size_t getOffset(CachedHashStringRef S) const
Get the offset of a string in the string table.
void write(raw_ostream &OS) const
size_t add(CachedHashStringRef S)
Add a string to the builder.
void finalize()
Analyze the strings and build the final table.
Target - Wrapper for Target specific information.
const char * getName() const
getName - Get the target name.
The instances of the Type class are immutable: once they are created, they are never changed.
LLVM Value Representation.
StringRef getName() const
Return a constant reference to the value's name.
Represents a version number in the form major[.minor[.subminor[.build]]].
raw_ostream & write_zeros(unsigned NumZeros)
write_zeros - Insert 'NumZeros' nulls.
uint64_t tell() const
tell - Return the current offset within the file.
A raw_ostream that writes to an SmallVector or SmallString.
This provides a very simple, boring adaptor for a begin and end iterator into a range type.
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
@ C
The default llvm calling convention, compatible with C.
@ S_ATTR_SOME_INSTRUCTIONS
S_ATTR_SOME_INSTRUCTIONS - Section contains some machine instructions.
@ S_THREAD_LOCAL_VARIABLE_POINTERS
S_THREAD_LOCAL_VARIABLE_POINTERS - Section with pointers to thread local structures.
@ S_LAZY_SYMBOL_POINTERS
S_LAZY_SYMBOL_POINTERS - Section with lazy symbol pointers.
@ S_NON_LAZY_SYMBOL_POINTERS
S_NON_LAZY_SYMBOL_POINTERS - Section with non-lazy symbol pointers.
@ S_SYMBOL_STUBS
S_SYMBOL_STUBS - Section with symbol stubs, byte size of stub in the Reserved2 field.
@ MH_SUBSECTIONS_VIA_SYMBOLS
void write(void *memory, value_type value, endianness endian)
Write a value to memory with a particular endianness.
This is an optimization pass for GlobalISel generic memory operations.
auto enumerate(FirstRange &&First, RestRanges &&...Rest)
Given two or more input ranges, returns a new range whose values are tuples (A, B,...
auto reverse(ContainerTy &&C)
void sort(IteratorTy Start, IteratorTy End)
@ MCVM_WatchOSVersionMin
.watchos_version_min
@ MCVM_OSXVersionMin
.macosx_version_min
@ MCVM_TvOSVersionMin
.tvos_version_min
@ MCVM_IOSVersionMin
.ios_version_min
raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
void report_fatal_error(Error Err, bool gen_crash_diag=true)
Report a serious error, calling any installed error handler.
MCFixupKind
Extensible enumeration to represent the type of a fixup.
uint64_t offsetToAlignment(uint64_t Value, Align Alignment)
Returns the offset to the next integer (mod 2**64) that is greater than or equal to Value and is a mu...
@ Ref
The access may reference the value stored in memory.
uint64_t alignTo(uint64_t Size, Align A)
Returns a multiple of A needed to store Size bytes.
unsigned Log2(Align A)
Returns the log2 of the alignment.
This struct is a compact representation of a valid (non-zero power of two) alignment.
Target independent information on a fixup kind.
@ FKF_IsPCRel
Is this fixup kind PCrelative? This is used by the assembler backend to evaluate fixup values in a ta...
unsigned Flags
Flags describing additional information on this fixup kind.
void write(ArrayRef< value_type > Val)