blob: 189484deac7e56189636185f8de4b14541d151d2 [file] [log] [blame]
//===- MCSymbol.h - Machine Code Symbols ------------------------*- C++ -*-===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// This file contains the declaration of the MCSymbol class.
//
//===----------------------------------------------------------------------===//
12
13#ifndef LLVM_MC_MCSYMBOL_H
14#define LLVM_MC_MCSYMBOL_H
15
16#include "llvm/ADT/PointerIntPair.h"
17#include "llvm/ADT/StringMap.h"
18#include "llvm/ADT/StringRef.h"
19#include "llvm/MC/MCFragment.h"
20#include "llvm/Support/ErrorHandling.h"
21#include "llvm/Support/MathExtras.h"
22#include <cassert>
23#include <cstddef>
24#include <cstdint>
25
26namespace llvm {
27
// Forward declarations of types referenced by the declarations below.
class MCAsmInfo;
class MCContext;
class MCExpr;
class MCSection;
class raw_ostream;
33
34/// MCSymbol - Instances of this class represent a symbol name in the MC file,
35/// and MCSymbols are created and uniqued by the MCContext class. MCSymbols
36/// should only be constructed with valid names for the object file.
37///
38/// If the symbol is defined/emitted into the current translation unit, the
39/// Section member is set to indicate what section it lives in. Otherwise, if
40/// it is a reference to an external entity, it has a null section.
41class MCSymbol {
42protected:
43 /// The kind of the symbol. If it is any value other than unset then this
44 /// class is actually one of the appropriate subclasses of MCSymbol.
45 enum SymbolKind {
46 SymbolKindUnset,
47 SymbolKindCOFF,
48 SymbolKindELF,
49 SymbolKindMachO,
50 SymbolKindWasm,
Andrew Walbran3d2c1972020-04-07 12:24:26 +010051 SymbolKindXCOFF,
Andrew Scull5e1ddfa2018-08-14 10:06:54 +010052 };
53
54 /// A symbol can contain an Offset, or Value, or be Common, but never more
55 /// than one of these.
56 enum Contents : uint8_t {
57 SymContentsUnset,
58 SymContentsOffset,
59 SymContentsVariable,
60 SymContentsCommon,
Andrew Walbran3d2c1972020-04-07 12:24:26 +010061 SymContentsTargetCommon, // Index stores the section index
Andrew Scull5e1ddfa2018-08-14 10:06:54 +010062 };
63
64 // Special sentinal value for the absolute pseudo fragment.
65 static MCFragment *AbsolutePseudoFragment;
66
67 /// If a symbol has a Fragment, the section is implied, so we only need
68 /// one pointer.
69 /// The special AbsolutePseudoFragment value is for absolute symbols.
70 /// If this is a variable symbol, this caches the variable value's fragment.
71 /// FIXME: We might be able to simplify this by having the asm streamer create
72 /// dummy fragments.
73 /// If this is a section, then it gives the symbol is defined in. This is null
74 /// for undefined symbols.
75 ///
76 /// If this is a fragment, then it gives the fragment this symbol's value is
77 /// relative to, if any.
78 ///
79 /// For the 'HasName' integer, this is true if this symbol is named.
80 /// A named symbol will have a pointer to the name allocated in the bytes
81 /// immediately prior to the MCSymbol.
82 mutable PointerIntPair<MCFragment *, 1> FragmentAndHasName;
83
84 /// IsTemporary - True if this is an assembler temporary label, which
85 /// typically does not survive in the .o file's symbol table. Usually
86 /// "Lfoo" or ".foo".
87 unsigned IsTemporary : 1;
88
Andrew Scullcdfcccc2018-10-05 20:58:37 +010089 /// True if this symbol can be redefined.
Andrew Scull5e1ddfa2018-08-14 10:06:54 +010090 unsigned IsRedefinable : 1;
91
92 /// IsUsed - True if this symbol has been used.
93 mutable unsigned IsUsed : 1;
94
95 mutable unsigned IsRegistered : 1;
96
97 /// This symbol is visible outside this translation unit.
98 mutable unsigned IsExternal : 1;
99
100 /// This symbol is private extern.
101 mutable unsigned IsPrivateExtern : 1;
102
103 /// LLVM RTTI discriminator. This is actually a SymbolKind enumerator, but is
104 /// unsigned to avoid sign extension and achieve better bitpacking with MSVC.
105 unsigned Kind : 3;
106
107 /// True if we have created a relocation that uses this symbol.
108 mutable unsigned IsUsedInReloc : 1;
109
110 /// This is actually a Contents enumerator, but is unsigned to avoid sign
111 /// extension and achieve better bitpacking with MSVC.
Andrew Walbran3d2c1972020-04-07 12:24:26 +0100112 unsigned SymbolContents : 3;
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100113
114 /// The alignment of the symbol, if it is 'common', or -1.
115 ///
116 /// The alignment is stored as log2(align) + 1. This allows all values from
117 /// 0 to 2^31 to be stored which is every power of 2 representable by an
118 /// unsigned.
119 enum : unsigned { NumCommonAlignmentBits = 5 };
120 unsigned CommonAlignLog2 : NumCommonAlignmentBits;
121
122 /// The Flags field is used by object file implementations to store
123 /// additional per symbol information which is not easily classified.
124 enum : unsigned { NumFlagsBits = 16 };
125 mutable uint32_t Flags : NumFlagsBits;
126
127 /// Index field, for use by the object file implementation.
128 mutable uint32_t Index = 0;
129
130 union {
131 /// The offset to apply to the fragment address to form this symbol's value.
132 uint64_t Offset;
133
134 /// The size of the symbol, if it is 'common'.
135 uint64_t CommonSize;
136
137 /// If non-null, the value for a variable symbol.
138 const MCExpr *Value;
139 };
140
141 // MCContext creates and uniques these.
142 friend class MCExpr;
143 friend class MCContext;
144
Andrew Scullcdfcccc2018-10-05 20:58:37 +0100145 /// The name for a symbol.
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100146 /// MCSymbol contains a uint64_t so is probably aligned to 8. On a 32-bit
147 /// system, the name is a pointer so isn't going to satisfy the 8 byte
148 /// alignment of uint64_t. Account for that here.
149 using NameEntryStorageTy = union {
150 const StringMapEntry<bool> *NameEntry;
151 uint64_t AlignmentPadding;
152 };
153
154 MCSymbol(SymbolKind Kind, const StringMapEntry<bool> *Name, bool isTemporary)
155 : IsTemporary(isTemporary), IsRedefinable(false), IsUsed(false),
156 IsRegistered(false), IsExternal(false), IsPrivateExtern(false),
157 Kind(Kind), IsUsedInReloc(false), SymbolContents(SymContentsUnset),
158 CommonAlignLog2(0), Flags(0) {
159 Offset = 0;
160 FragmentAndHasName.setInt(!!Name);
161 if (Name)
162 getNameEntryPtr() = Name;
163 }
164
165 // Provide custom new/delete as we will only allocate space for a name
166 // if we need one.
167 void *operator new(size_t s, const StringMapEntry<bool> *Name,
168 MCContext &Ctx);
169
170private:
171 void operator delete(void *);
Andrew Scullcdfcccc2018-10-05 20:58:37 +0100172 /// Placement delete - required by std, but never called.
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100173 void operator delete(void*, unsigned) {
174 llvm_unreachable("Constructor throws?");
175 }
Andrew Scullcdfcccc2018-10-05 20:58:37 +0100176 /// Placement delete - required by std, but never called.
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100177 void operator delete(void*, unsigned, bool) {
178 llvm_unreachable("Constructor throws?");
179 }
180
181 MCSection *getSectionPtr() const {
182 if (MCFragment *F = getFragment()) {
183 assert(F != AbsolutePseudoFragment);
184 return F->getParent();
185 }
186 return nullptr;
187 }
188
Andrew Scullcdfcccc2018-10-05 20:58:37 +0100189 /// Get a reference to the name field. Requires that we have a name
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100190 const StringMapEntry<bool> *&getNameEntryPtr() {
191 assert(FragmentAndHasName.getInt() && "Name is required");
192 NameEntryStorageTy *Name = reinterpret_cast<NameEntryStorageTy *>(this);
193 return (*(Name - 1)).NameEntry;
194 }
195 const StringMapEntry<bool> *&getNameEntryPtr() const {
196 return const_cast<MCSymbol*>(this)->getNameEntryPtr();
197 }
198
199public:
200 MCSymbol(const MCSymbol &) = delete;
201 MCSymbol &operator=(const MCSymbol &) = delete;
202
203 /// getName - Get the symbol name.
204 StringRef getName() const {
205 if (!FragmentAndHasName.getInt())
206 return StringRef();
207
208 return getNameEntryPtr()->first();
209 }
210
211 bool isRegistered() const { return IsRegistered; }
212 void setIsRegistered(bool Value) const { IsRegistered = Value; }
213
214 void setUsedInReloc() const { IsUsedInReloc = true; }
215 bool isUsedInReloc() const { return IsUsedInReloc; }
216
217 /// \name Accessors
218 /// @{
219
220 /// isTemporary - Check if this is an assembler temporary symbol.
221 bool isTemporary() const { return IsTemporary; }
222
223 /// isUsed - Check if this is used.
224 bool isUsed() const { return IsUsed; }
225
Andrew Scullcdfcccc2018-10-05 20:58:37 +0100226 /// Check if this symbol is redefinable.
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100227 bool isRedefinable() const { return IsRedefinable; }
Andrew Scullcdfcccc2018-10-05 20:58:37 +0100228 /// Mark this symbol as redefinable.
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100229 void setRedefinable(bool Value) { IsRedefinable = Value; }
Andrew Scullcdfcccc2018-10-05 20:58:37 +0100230 /// Prepare this symbol to be redefined.
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100231 void redefineIfPossible() {
232 if (IsRedefinable) {
233 if (SymbolContents == SymContentsVariable) {
234 Value = nullptr;
235 SymbolContents = SymContentsUnset;
236 }
237 setUndefined();
238 IsRedefinable = false;
239 }
240 }
241
242 /// @}
243 /// \name Associated Sections
244 /// @{
245
246 /// isDefined - Check if this symbol is defined (i.e., it has an address).
247 ///
248 /// Defined symbols are either absolute or in some section.
249 bool isDefined() const { return !isUndefined(); }
250
251 /// isInSection - Check if this symbol is defined in some section (i.e., it
252 /// is defined but not absolute).
253 bool isInSection() const {
254 return isDefined() && !isAbsolute();
255 }
256
257 /// isUndefined - Check if this symbol undefined (i.e., implicitly defined).
258 bool isUndefined(bool SetUsed = true) const {
259 return getFragment(SetUsed) == nullptr;
260 }
261
262 /// isAbsolute - Check if this is an absolute symbol.
263 bool isAbsolute() const {
264 return getFragment() == AbsolutePseudoFragment;
265 }
266
267 /// Get the section associated with a defined, non-absolute symbol.
268 MCSection &getSection() const {
269 assert(isInSection() && "Invalid accessor!");
270 return *getSectionPtr();
271 }
272
273 /// Mark the symbol as defined in the fragment \p F.
274 void setFragment(MCFragment *F) const {
275 assert(!isVariable() && "Cannot set fragment of variable");
276 FragmentAndHasName.setPointer(F);
277 }
278
279 /// Mark the symbol as undefined.
280 void setUndefined() { FragmentAndHasName.setPointer(nullptr); }
281
282 bool isELF() const { return Kind == SymbolKindELF; }
283
284 bool isCOFF() const { return Kind == SymbolKindCOFF; }
285
286 bool isMachO() const { return Kind == SymbolKindMachO; }
287
288 bool isWasm() const { return Kind == SymbolKindWasm; }
289
Andrew Walbran3d2c1972020-04-07 12:24:26 +0100290 bool isXCOFF() const { return Kind == SymbolKindXCOFF; }
291
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100292 /// @}
293 /// \name Variable Symbols
294 /// @{
295
296 /// isVariable - Check if this is a variable symbol.
297 bool isVariable() const {
298 return SymbolContents == SymContentsVariable;
299 }
300
301 /// getVariableValue - Get the value for variable symbols.
302 const MCExpr *getVariableValue(bool SetUsed = true) const {
303 assert(isVariable() && "Invalid accessor!");
304 IsUsed |= SetUsed;
305 return Value;
306 }
307
308 void setVariableValue(const MCExpr *Value);
309
310 /// @}
311
312 /// Get the (implementation defined) index.
313 uint32_t getIndex() const {
314 return Index;
315 }
316
317 /// Set the (implementation defined) index.
318 void setIndex(uint32_t Value) const {
319 Index = Value;
320 }
321
Andrew Scullcdfcccc2018-10-05 20:58:37 +0100322 bool isUnset() const { return SymbolContents == SymContentsUnset; }
323
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100324 uint64_t getOffset() const {
325 assert((SymbolContents == SymContentsUnset ||
326 SymbolContents == SymContentsOffset) &&
327 "Cannot get offset for a common/variable symbol");
328 return Offset;
329 }
330 void setOffset(uint64_t Value) {
331 assert((SymbolContents == SymContentsUnset ||
332 SymbolContents == SymContentsOffset) &&
333 "Cannot set offset for a common/variable symbol");
334 Offset = Value;
335 SymbolContents = SymContentsOffset;
336 }
337
338 /// Return the size of a 'common' symbol.
339 uint64_t getCommonSize() const {
340 assert(isCommon() && "Not a 'common' symbol!");
341 return CommonSize;
342 }
343
344 /// Mark this symbol as being 'common'.
345 ///
346 /// \param Size - The size of the symbol.
347 /// \param Align - The alignment of the symbol.
Andrew Walbran3d2c1972020-04-07 12:24:26 +0100348 /// \param Target - Is the symbol a target-specific common-like symbol.
349 void setCommon(uint64_t Size, unsigned Align, bool Target = false) {
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100350 assert(getOffset() == 0);
351 CommonSize = Size;
Andrew Walbran3d2c1972020-04-07 12:24:26 +0100352 SymbolContents = Target ? SymContentsTargetCommon : SymContentsCommon;
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100353
354 assert((!Align || isPowerOf2_32(Align)) &&
355 "Alignment must be a power of 2");
356 unsigned Log2Align = Log2_32(Align) + 1;
357 assert(Log2Align < (1U << NumCommonAlignmentBits) &&
358 "Out of range alignment");
359 CommonAlignLog2 = Log2Align;
360 }
361
362 /// Return the alignment of a 'common' symbol.
363 unsigned getCommonAlignment() const {
364 assert(isCommon() && "Not a 'common' symbol!");
365 return CommonAlignLog2 ? (1U << (CommonAlignLog2 - 1)) : 0;
366 }
367
368 /// Declare this symbol as being 'common'.
369 ///
370 /// \param Size - The size of the symbol.
371 /// \param Align - The alignment of the symbol.
Andrew Walbran3d2c1972020-04-07 12:24:26 +0100372 /// \param Target - Is the symbol a target-specific common-like symbol.
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100373 /// \return True if symbol was already declared as a different type
Andrew Walbran3d2c1972020-04-07 12:24:26 +0100374 bool declareCommon(uint64_t Size, unsigned Align, bool Target = false) {
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100375 assert(isCommon() || getOffset() == 0);
376 if(isCommon()) {
Andrew Walbran3d2c1972020-04-07 12:24:26 +0100377 if (CommonSize != Size || getCommonAlignment() != Align ||
378 isTargetCommon() != Target)
379 return true;
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100380 } else
Andrew Walbran3d2c1972020-04-07 12:24:26 +0100381 setCommon(Size, Align, Target);
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100382 return false;
383 }
384
385 /// Is this a 'common' symbol.
386 bool isCommon() const {
Andrew Walbran3d2c1972020-04-07 12:24:26 +0100387 return SymbolContents == SymContentsCommon ||
388 SymbolContents == SymContentsTargetCommon;
389 }
390
391 /// Is this a target-specific common-like symbol.
392 bool isTargetCommon() const {
393 return SymbolContents == SymContentsTargetCommon;
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100394 }
395
396 MCFragment *getFragment(bool SetUsed = true) const {
397 MCFragment *Fragment = FragmentAndHasName.getPointer();
398 if (Fragment || !isVariable())
399 return Fragment;
400 Fragment = getVariableValue(SetUsed)->findAssociatedFragment();
401 FragmentAndHasName.setPointer(Fragment);
402 return Fragment;
403 }
404
405 bool isExternal() const { return IsExternal; }
406 void setExternal(bool Value) const { IsExternal = Value; }
407
408 bool isPrivateExtern() const { return IsPrivateExtern; }
409 void setPrivateExtern(bool Value) { IsPrivateExtern = Value; }
410
411 /// print - Print the value to the stream \p OS.
412 void print(raw_ostream &OS, const MCAsmInfo *MAI) const;
413
414 /// dump - Print the value to stderr.
415 void dump() const;
416
417protected:
418 /// Get the (implementation defined) symbol flags.
419 uint32_t getFlags() const { return Flags; }
420
421 /// Set the (implementation defined) symbol flags.
422 void setFlags(uint32_t Value) const {
423 assert(Value < (1U << NumFlagsBits) && "Out of range flags");
424 Flags = Value;
425 }
426
427 /// Modify the flags via a mask
428 void modifyFlags(uint32_t Value, uint32_t Mask) const {
429 assert(Value < (1U << NumFlagsBits) && "Out of range flags");
430 Flags = (Flags & ~Mask) | Value;
431 }
432};
433
434inline raw_ostream &operator<<(raw_ostream &OS, const MCSymbol &Sym) {
435 Sym.print(OS, nullptr);
436 return OS;
437}
438
439} // end namespace llvm
440
441#endif // LLVM_MC_MCSYMBOL_H