1 //===- ELFAsmParser.cpp - ELF Assembly Parser -----------------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8
9 #include "llvm/ADT/StringRef.h"
10 #include "llvm/ADT/StringSwitch.h"
11 #include "llvm/BinaryFormat/ELF.h"
12 #include "llvm/MC/MCAsmInfo.h"
13 #include "llvm/MC/MCContext.h"
14 #include "llvm/MC/MCDirectives.h"
15 #include "llvm/MC/MCExpr.h"
16 #include "llvm/MC/MCParser/MCAsmLexer.h"
17 #include "llvm/MC/MCParser/MCAsmParser.h"
18 #include "llvm/MC/MCParser/MCAsmParserExtension.h"
19 #include "llvm/MC/MCSection.h"
20 #include "llvm/MC/MCSectionELF.h"
21 #include "llvm/MC/MCStreamer.h"
22 #include "llvm/MC/MCSymbol.h"
23 #include "llvm/MC/MCSymbolELF.h"
24 #include "llvm/MC/SectionKind.h"
25 #include "llvm/Support/Casting.h"
26 #include "llvm/Support/MathExtras.h"
27 #include "llvm/Support/SMLoc.h"
28 #include <cassert>
29 #include <cstdint>
30 #include <utility>
31
32 using namespace llvm;
33
34 namespace {
35
36 class ELFAsmParser : public MCAsmParserExtension {
37 template<bool (ELFAsmParser::*HandlerMethod)(StringRef, SMLoc)>
addDirectiveHandler(StringRef Directive)38 void addDirectiveHandler(StringRef Directive) {
39 MCAsmParser::ExtensionDirectiveHandler Handler = std::make_pair(
40 this, HandleDirective<ELFAsmParser, HandlerMethod>);
41
42 getParser().addDirectiveHandler(Directive, Handler);
43 }
44
45 bool ParseSectionSwitch(StringRef Section, unsigned Type, unsigned Flags,
46 SectionKind Kind);
47
48 public:
ELFAsmParser()49 ELFAsmParser() { BracketExpressionsSupported = true; }
50
Initialize(MCAsmParser & Parser)51 void Initialize(MCAsmParser &Parser) override {
52 // Call the base implementation.
53 this->MCAsmParserExtension::Initialize(Parser);
54
55 addDirectiveHandler<&ELFAsmParser::ParseSectionDirectiveData>(".data");
56 addDirectiveHandler<&ELFAsmParser::ParseSectionDirectiveText>(".text");
57 addDirectiveHandler<&ELFAsmParser::ParseSectionDirectiveBSS>(".bss");
58 addDirectiveHandler<&ELFAsmParser::ParseSectionDirectiveRoData>(".rodata");
59 addDirectiveHandler<&ELFAsmParser::ParseSectionDirectiveTData>(".tdata");
60 addDirectiveHandler<&ELFAsmParser::ParseSectionDirectiveTBSS>(".tbss");
61 addDirectiveHandler<
62 &ELFAsmParser::ParseSectionDirectiveDataRel>(".data.rel");
63 addDirectiveHandler<
64 &ELFAsmParser::ParseSectionDirectiveDataRelRo>(".data.rel.ro");
65 addDirectiveHandler<
66 &ELFAsmParser::ParseSectionDirectiveEhFrame>(".eh_frame");
67 addDirectiveHandler<&ELFAsmParser::ParseDirectiveSection>(".section");
68 addDirectiveHandler<
69 &ELFAsmParser::ParseDirectivePushSection>(".pushsection");
70 addDirectiveHandler<&ELFAsmParser::ParseDirectivePopSection>(".popsection");
71 addDirectiveHandler<&ELFAsmParser::ParseDirectiveSize>(".size");
72 addDirectiveHandler<&ELFAsmParser::ParseDirectivePrevious>(".previous");
73 addDirectiveHandler<&ELFAsmParser::ParseDirectiveType>(".type");
74 addDirectiveHandler<&ELFAsmParser::ParseDirectiveIdent>(".ident");
75 addDirectiveHandler<&ELFAsmParser::ParseDirectiveSymver>(".symver");
76 addDirectiveHandler<&ELFAsmParser::ParseDirectiveVersion>(".version");
77 addDirectiveHandler<&ELFAsmParser::ParseDirectiveWeakref>(".weakref");
78 addDirectiveHandler<&ELFAsmParser::ParseDirectiveSymbolAttribute>(".weak");
79 addDirectiveHandler<&ELFAsmParser::ParseDirectiveSymbolAttribute>(".local");
80 addDirectiveHandler<
81 &ELFAsmParser::ParseDirectiveSymbolAttribute>(".protected");
82 addDirectiveHandler<
83 &ELFAsmParser::ParseDirectiveSymbolAttribute>(".internal");
84 addDirectiveHandler<
85 &ELFAsmParser::ParseDirectiveSymbolAttribute>(".hidden");
86 addDirectiveHandler<&ELFAsmParser::ParseDirectiveSubsection>(".subsection");
87 addDirectiveHandler<&ELFAsmParser::ParseDirectiveCGProfile>(".cg_profile");
88 }
89
90 // FIXME: Part of this logic is duplicated in the MCELFStreamer. What is
91 // the best way for us to get access to it?
ParseSectionDirectiveData(StringRef,SMLoc)92 bool ParseSectionDirectiveData(StringRef, SMLoc) {
93 return ParseSectionSwitch(".data", ELF::SHT_PROGBITS,
94 ELF::SHF_WRITE | ELF::SHF_ALLOC,
95 SectionKind::getData());
96 }
ParseSectionDirectiveText(StringRef,SMLoc)97 bool ParseSectionDirectiveText(StringRef, SMLoc) {
98 return ParseSectionSwitch(".text", ELF::SHT_PROGBITS,
99 ELF::SHF_EXECINSTR |
100 ELF::SHF_ALLOC, SectionKind::getText());
101 }
ParseSectionDirectiveBSS(StringRef,SMLoc)102 bool ParseSectionDirectiveBSS(StringRef, SMLoc) {
103 return ParseSectionSwitch(".bss", ELF::SHT_NOBITS,
104 ELF::SHF_WRITE |
105 ELF::SHF_ALLOC, SectionKind::getBSS());
106 }
ParseSectionDirectiveRoData(StringRef,SMLoc)107 bool ParseSectionDirectiveRoData(StringRef, SMLoc) {
108 return ParseSectionSwitch(".rodata", ELF::SHT_PROGBITS,
109 ELF::SHF_ALLOC,
110 SectionKind::getReadOnly());
111 }
ParseSectionDirectiveTData(StringRef,SMLoc)112 bool ParseSectionDirectiveTData(StringRef, SMLoc) {
113 return ParseSectionSwitch(".tdata", ELF::SHT_PROGBITS,
114 ELF::SHF_ALLOC |
115 ELF::SHF_TLS | ELF::SHF_WRITE,
116 SectionKind::getThreadData());
117 }
ParseSectionDirectiveTBSS(StringRef,SMLoc)118 bool ParseSectionDirectiveTBSS(StringRef, SMLoc) {
119 return ParseSectionSwitch(".tbss", ELF::SHT_NOBITS,
120 ELF::SHF_ALLOC |
121 ELF::SHF_TLS | ELF::SHF_WRITE,
122 SectionKind::getThreadBSS());
123 }
ParseSectionDirectiveDataRel(StringRef,SMLoc)124 bool ParseSectionDirectiveDataRel(StringRef, SMLoc) {
125 return ParseSectionSwitch(".data.rel", ELF::SHT_PROGBITS,
126 ELF::SHF_ALLOC | ELF::SHF_WRITE,
127 SectionKind::getData());
128 }
ParseSectionDirectiveDataRelRo(StringRef,SMLoc)129 bool ParseSectionDirectiveDataRelRo(StringRef, SMLoc) {
130 return ParseSectionSwitch(".data.rel.ro", ELF::SHT_PROGBITS,
131 ELF::SHF_ALLOC |
132 ELF::SHF_WRITE,
133 SectionKind::getReadOnlyWithRel());
134 }
ParseSectionDirectiveEhFrame(StringRef,SMLoc)135 bool ParseSectionDirectiveEhFrame(StringRef, SMLoc) {
136 return ParseSectionSwitch(".eh_frame", ELF::SHT_PROGBITS,
137 ELF::SHF_ALLOC | ELF::SHF_WRITE,
138 SectionKind::getData());
139 }
140 bool ParseDirectivePushSection(StringRef, SMLoc);
141 bool ParseDirectivePopSection(StringRef, SMLoc);
142 bool ParseDirectiveSection(StringRef, SMLoc);
143 bool ParseDirectiveSize(StringRef, SMLoc);
144 bool ParseDirectivePrevious(StringRef, SMLoc);
145 bool ParseDirectiveType(StringRef, SMLoc);
146 bool ParseDirectiveIdent(StringRef, SMLoc);
147 bool ParseDirectiveSymver(StringRef, SMLoc);
148 bool ParseDirectiveVersion(StringRef, SMLoc);
149 bool ParseDirectiveWeakref(StringRef, SMLoc);
150 bool ParseDirectiveSymbolAttribute(StringRef, SMLoc);
151 bool ParseDirectiveSubsection(StringRef, SMLoc);
152 bool ParseDirectiveCGProfile(StringRef, SMLoc);
153
154 private:
155 bool ParseSectionName(StringRef &SectionName);
156 bool ParseSectionArguments(bool IsPush, SMLoc loc);
157 unsigned parseSunStyleSectionFlags();
158 bool maybeParseSectionType(StringRef &TypeName);
159 bool parseMergeSize(int64_t &Size);
160 bool parseGroup(StringRef &GroupName, bool &IsComdat);
161 bool parseLinkedToSym(MCSymbolELF *&LinkedToSym);
162 bool maybeParseUniqueID(int64_t &UniqueID);
163 };
164
165 } // end anonymous namespace
166
167 /// ParseDirectiveSymbolAttribute
168 /// ::= { ".local", ".weak", ... } [ identifier ( , identifier )* ]
ParseDirectiveSymbolAttribute(StringRef Directive,SMLoc)169 bool ELFAsmParser::ParseDirectiveSymbolAttribute(StringRef Directive, SMLoc) {
170 MCSymbolAttr Attr = StringSwitch<MCSymbolAttr>(Directive)
171 .Case(".weak", MCSA_Weak)
172 .Case(".local", MCSA_Local)
173 .Case(".hidden", MCSA_Hidden)
174 .Case(".internal", MCSA_Internal)
175 .Case(".protected", MCSA_Protected)
176 .Default(MCSA_Invalid);
177 assert(Attr != MCSA_Invalid && "unexpected symbol attribute directive!");
178 if (getLexer().isNot(AsmToken::EndOfStatement)) {
179 while (true) {
180 StringRef Name;
181
182 if (getParser().parseIdentifier(Name))
183 return TokError("expected identifier in directive");
184
185 if (getParser().discardLTOSymbol(Name)) {
186 if (getLexer().is(AsmToken::EndOfStatement))
187 break;
188 continue;
189 }
190
191 MCSymbol *Sym = getContext().getOrCreateSymbol(Name);
192
193 getStreamer().emitSymbolAttribute(Sym, Attr);
194
195 if (getLexer().is(AsmToken::EndOfStatement))
196 break;
197
198 if (getLexer().isNot(AsmToken::Comma))
199 return TokError("unexpected token in directive");
200 Lex();
201 }
202 }
203
204 Lex();
205 return false;
206 }
207
ParseSectionSwitch(StringRef Section,unsigned Type,unsigned Flags,SectionKind Kind)208 bool ELFAsmParser::ParseSectionSwitch(StringRef Section, unsigned Type,
209 unsigned Flags, SectionKind Kind) {
210 const MCExpr *Subsection = nullptr;
211 if (getLexer().isNot(AsmToken::EndOfStatement)) {
212 if (getParser().parseExpression(Subsection))
213 return true;
214 }
215 Lex();
216
217 getStreamer().SwitchSection(getContext().getELFSection(Section, Type, Flags),
218 Subsection);
219
220 return false;
221 }
222
ParseDirectiveSize(StringRef,SMLoc)223 bool ELFAsmParser::ParseDirectiveSize(StringRef, SMLoc) {
224 StringRef Name;
225 if (getParser().parseIdentifier(Name))
226 return TokError("expected identifier in directive");
227 MCSymbolELF *Sym = cast<MCSymbolELF>(getContext().getOrCreateSymbol(Name));
228
229 if (getLexer().isNot(AsmToken::Comma))
230 return TokError("unexpected token in directive");
231 Lex();
232
233 const MCExpr *Expr;
234 if (getParser().parseExpression(Expr))
235 return true;
236
237 if (getLexer().isNot(AsmToken::EndOfStatement))
238 return TokError("unexpected token in directive");
239 Lex();
240
241 getStreamer().emitELFSize(Sym, Expr);
242 return false;
243 }
244
ParseSectionName(StringRef & SectionName)245 bool ELFAsmParser::ParseSectionName(StringRef &SectionName) {
246 // A section name can contain -, so we cannot just use
247 // parseIdentifier.
248 SMLoc FirstLoc = getLexer().getLoc();
249 unsigned Size = 0;
250
251 if (getLexer().is(AsmToken::String)) {
252 SectionName = getTok().getIdentifier();
253 Lex();
254 return false;
255 }
256
257 while (!getParser().hasPendingError()) {
258 SMLoc PrevLoc = getLexer().getLoc();
259 if (getLexer().is(AsmToken::Comma) ||
260 getLexer().is(AsmToken::EndOfStatement))
261 break;
262
263 unsigned CurSize;
264 if (getLexer().is(AsmToken::String)) {
265 CurSize = getTok().getIdentifier().size() + 2;
266 Lex();
267 } else if (getLexer().is(AsmToken::Identifier)) {
268 CurSize = getTok().getIdentifier().size();
269 Lex();
270 } else {
271 CurSize = getTok().getString().size();
272 Lex();
273 }
274 Size += CurSize;
275 SectionName = StringRef(FirstLoc.getPointer(), Size);
276
277 // Make sure the following token is adjacent.
278 if (PrevLoc.getPointer() + CurSize != getTok().getLoc().getPointer())
279 break;
280 }
281 if (Size == 0)
282 return true;
283
284 return false;
285 }
286
parseSectionFlags(StringRef flagsStr,bool * UseLastGroup)287 static unsigned parseSectionFlags(StringRef flagsStr, bool *UseLastGroup) {
288 unsigned flags = 0;
289
290 // If a valid numerical value is set for the section flag, use it verbatim
291 if (!flagsStr.getAsInteger(0, flags))
292 return flags;
293
294 for (char i : flagsStr) {
295 switch (i) {
296 case 'a':
297 flags |= ELF::SHF_ALLOC;
298 break;
299 case 'e':
300 flags |= ELF::SHF_EXCLUDE;
301 break;
302 case 'x':
303 flags |= ELF::SHF_EXECINSTR;
304 break;
305 case 'w':
306 flags |= ELF::SHF_WRITE;
307 break;
308 case 'o':
309 flags |= ELF::SHF_LINK_ORDER;
310 break;
311 case 'M':
312 flags |= ELF::SHF_MERGE;
313 break;
314 case 'S':
315 flags |= ELF::SHF_STRINGS;
316 break;
317 case 'T':
318 flags |= ELF::SHF_TLS;
319 break;
320 case 'c':
321 flags |= ELF::XCORE_SHF_CP_SECTION;
322 break;
323 case 'd':
324 flags |= ELF::XCORE_SHF_DP_SECTION;
325 break;
326 case 'y':
327 flags |= ELF::SHF_ARM_PURECODE;
328 break;
329 case 's':
330 flags |= ELF::SHF_HEX_GPREL;
331 break;
332 case 'G':
333 flags |= ELF::SHF_GROUP;
334 break;
335 case 'R':
336 flags |= ELF::SHF_GNU_RETAIN;
337 break;
338 case '?':
339 *UseLastGroup = true;
340 break;
341 default:
342 return -1U;
343 }
344 }
345
346 return flags;
347 }
348
parseSunStyleSectionFlags()349 unsigned ELFAsmParser::parseSunStyleSectionFlags() {
350 unsigned flags = 0;
351 while (getLexer().is(AsmToken::Hash)) {
352 Lex(); // Eat the #.
353
354 if (!getLexer().is(AsmToken::Identifier))
355 return -1U;
356
357 StringRef flagId = getTok().getIdentifier();
358 if (flagId == "alloc")
359 flags |= ELF::SHF_ALLOC;
360 else if (flagId == "execinstr")
361 flags |= ELF::SHF_EXECINSTR;
362 else if (flagId == "write")
363 flags |= ELF::SHF_WRITE;
364 else if (flagId == "tls")
365 flags |= ELF::SHF_TLS;
366 else
367 return -1U;
368
369 Lex(); // Eat the flag.
370
371 if (!getLexer().is(AsmToken::Comma))
372 break;
373 Lex(); // Eat the comma.
374 }
375 return flags;
376 }
377
378
ParseDirectivePushSection(StringRef s,SMLoc loc)379 bool ELFAsmParser::ParseDirectivePushSection(StringRef s, SMLoc loc) {
380 getStreamer().PushSection();
381
382 if (ParseSectionArguments(/*IsPush=*/true, loc)) {
383 getStreamer().PopSection();
384 return true;
385 }
386
387 return false;
388 }
389
ParseDirectivePopSection(StringRef,SMLoc)390 bool ELFAsmParser::ParseDirectivePopSection(StringRef, SMLoc) {
391 if (!getStreamer().PopSection())
392 return TokError(".popsection without corresponding .pushsection");
393 return false;
394 }
395
ParseDirectiveSection(StringRef,SMLoc loc)396 bool ELFAsmParser::ParseDirectiveSection(StringRef, SMLoc loc) {
397 return ParseSectionArguments(/*IsPush=*/false, loc);
398 }
399
maybeParseSectionType(StringRef & TypeName)400 bool ELFAsmParser::maybeParseSectionType(StringRef &TypeName) {
401 MCAsmLexer &L = getLexer();
402 if (L.isNot(AsmToken::Comma))
403 return false;
404 Lex();
405 if (L.isNot(AsmToken::At) && L.isNot(AsmToken::Percent) &&
406 L.isNot(AsmToken::String)) {
407 if (L.getAllowAtInIdentifier())
408 return TokError("expected '@<type>', '%<type>' or \"<type>\"");
409 else
410 return TokError("expected '%<type>' or \"<type>\"");
411 }
412 if (!L.is(AsmToken::String))
413 Lex();
414 if (L.is(AsmToken::Integer)) {
415 TypeName = getTok().getString();
416 Lex();
417 } else if (getParser().parseIdentifier(TypeName))
418 return TokError("expected identifier in directive");
419 return false;
420 }
421
parseMergeSize(int64_t & Size)422 bool ELFAsmParser::parseMergeSize(int64_t &Size) {
423 if (getLexer().isNot(AsmToken::Comma))
424 return TokError("expected the entry size");
425 Lex();
426 if (getParser().parseAbsoluteExpression(Size))
427 return true;
428 if (Size <= 0)
429 return TokError("entry size must be positive");
430 return false;
431 }
432
parseGroup(StringRef & GroupName,bool & IsComdat)433 bool ELFAsmParser::parseGroup(StringRef &GroupName, bool &IsComdat) {
434 MCAsmLexer &L = getLexer();
435 if (L.isNot(AsmToken::Comma))
436 return TokError("expected group name");
437 Lex();
438 if (L.is(AsmToken::Integer)) {
439 GroupName = getTok().getString();
440 Lex();
441 } else if (getParser().parseIdentifier(GroupName)) {
442 return TokError("invalid group name");
443 }
444 if (L.is(AsmToken::Comma)) {
445 Lex();
446 StringRef Linkage;
447 if (getParser().parseIdentifier(Linkage))
448 return TokError("invalid linkage");
449 if (Linkage != "comdat")
450 return TokError("Linkage must be 'comdat'");
451 IsComdat = true;
452 } else {
453 IsComdat = false;
454 }
455 return false;
456 }
457
parseLinkedToSym(MCSymbolELF * & LinkedToSym)458 bool ELFAsmParser::parseLinkedToSym(MCSymbolELF *&LinkedToSym) {
459 MCAsmLexer &L = getLexer();
460 if (L.isNot(AsmToken::Comma))
461 return TokError("expected linked-to symbol");
462 Lex();
463 StringRef Name;
464 SMLoc StartLoc = L.getLoc();
465 if (getParser().parseIdentifier(Name)) {
466 if (getParser().getTok().getString() == "0") {
467 getParser().Lex();
468 LinkedToSym = nullptr;
469 return false;
470 }
471 return TokError("invalid linked-to symbol");
472 }
473 LinkedToSym = dyn_cast_or_null<MCSymbolELF>(getContext().lookupSymbol(Name));
474 if (!LinkedToSym || !LinkedToSym->isInSection())
475 return Error(StartLoc, "linked-to symbol is not in a section: " + Name);
476 return false;
477 }
478
maybeParseUniqueID(int64_t & UniqueID)479 bool ELFAsmParser::maybeParseUniqueID(int64_t &UniqueID) {
480 MCAsmLexer &L = getLexer();
481 if (L.isNot(AsmToken::Comma))
482 return false;
483 Lex();
484 StringRef UniqueStr;
485 if (getParser().parseIdentifier(UniqueStr))
486 return TokError("expected identifier in directive");
487 if (UniqueStr != "unique")
488 return TokError("expected 'unique'");
489 if (L.isNot(AsmToken::Comma))
490 return TokError("expected commma");
491 Lex();
492 if (getParser().parseAbsoluteExpression(UniqueID))
493 return true;
494 if (UniqueID < 0)
495 return TokError("unique id must be positive");
496 if (!isUInt<32>(UniqueID) || UniqueID == ~0U)
497 return TokError("unique id is too large");
498 return false;
499 }
500
hasPrefix(StringRef SectionName,StringRef Prefix)501 static bool hasPrefix(StringRef SectionName, StringRef Prefix) {
502 return SectionName.startswith(Prefix) || SectionName == Prefix.drop_back();
503 }
504
allowSectionTypeMismatch(const Triple & TT,StringRef SectionName,unsigned Type)505 static bool allowSectionTypeMismatch(const Triple &TT, StringRef SectionName,
506 unsigned Type) {
507 if (TT.getArch() == Triple::x86_64) {
508 // x86-64 psABI names SHT_X86_64_UNWIND as the canonical type for .eh_frame,
509 // but GNU as emits SHT_PROGBITS .eh_frame for .cfi_* directives. Don't
510 // error for SHT_PROGBITS .eh_frame
511 return SectionName == ".eh_frame" && Type == ELF::SHT_PROGBITS;
512 }
513 if (TT.isMIPS()) {
514 // MIPS .debug_* sections should have SHT_MIPS_DWARF section type to
515 // distinguish among sections contain DWARF and ECOFF debug formats,
516 // but in assembly files these sections have SHT_PROGBITS type.
517 return hasPrefix(SectionName, ".debug_") && Type == ELF::SHT_PROGBITS;
518 }
519 return false;
520 }
521
ParseSectionArguments(bool IsPush,SMLoc loc)522 bool ELFAsmParser::ParseSectionArguments(bool IsPush, SMLoc loc) {
523 StringRef SectionName;
524
525 if (ParseSectionName(SectionName))
526 return TokError("expected identifier in directive");
527
528 StringRef TypeName;
529 int64_t Size = 0;
530 StringRef GroupName;
531 bool IsComdat = false;
532 unsigned Flags = 0;
533 unsigned extraFlags = 0;
534 const MCExpr *Subsection = nullptr;
535 bool UseLastGroup = false;
536 MCSymbolELF *LinkedToSym = nullptr;
537 int64_t UniqueID = ~0;
538
539 // Set the defaults first.
540 if (hasPrefix(SectionName, ".rodata.") || SectionName == ".rodata1")
541 Flags |= ELF::SHF_ALLOC;
542 else if (SectionName == ".fini" || SectionName == ".init" ||
543 hasPrefix(SectionName, ".text."))
544 Flags |= ELF::SHF_ALLOC | ELF::SHF_EXECINSTR;
545 else if (hasPrefix(SectionName, ".data.") || SectionName == ".data1" ||
546 hasPrefix(SectionName, ".bss.") ||
547 hasPrefix(SectionName, ".init_array.") ||
548 hasPrefix(SectionName, ".fini_array.") ||
549 hasPrefix(SectionName, ".preinit_array."))
550 Flags |= ELF::SHF_ALLOC | ELF::SHF_WRITE;
551 else if (hasPrefix(SectionName, ".tdata.") ||
552 hasPrefix(SectionName, ".tbss."))
553 Flags |= ELF::SHF_ALLOC | ELF::SHF_WRITE | ELF::SHF_TLS;
554
555 if (getLexer().is(AsmToken::Comma)) {
556 Lex();
557
558 if (IsPush && getLexer().isNot(AsmToken::String)) {
559 if (getParser().parseExpression(Subsection))
560 return true;
561 if (getLexer().isNot(AsmToken::Comma))
562 goto EndStmt;
563 Lex();
564 }
565
566 if (getLexer().isNot(AsmToken::String)) {
567 if (!getContext().getAsmInfo()->usesSunStyleELFSectionSwitchSyntax()
568 || getLexer().isNot(AsmToken::Hash))
569 return TokError("expected string in directive");
570 extraFlags = parseSunStyleSectionFlags();
571 } else {
572 StringRef FlagsStr = getTok().getStringContents();
573 Lex();
574 extraFlags = parseSectionFlags(FlagsStr, &UseLastGroup);
575 }
576
577 if (extraFlags == -1U)
578 return TokError("unknown flag");
579 Flags |= extraFlags;
580
581 bool Mergeable = Flags & ELF::SHF_MERGE;
582 bool Group = Flags & ELF::SHF_GROUP;
583 if (Group && UseLastGroup)
584 return TokError("Section cannot specifiy a group name while also acting "
585 "as a member of the last group");
586
587 if (maybeParseSectionType(TypeName))
588 return true;
589
590 MCAsmLexer &L = getLexer();
591 if (TypeName.empty()) {
592 if (Mergeable)
593 return TokError("Mergeable section must specify the type");
594 if (Group)
595 return TokError("Group section must specify the type");
596 if (L.isNot(AsmToken::EndOfStatement))
597 return TokError("unexpected token in directive");
598 }
599
600 if (Mergeable)
601 if (parseMergeSize(Size))
602 return true;
603 if (Group)
604 if (parseGroup(GroupName, IsComdat))
605 return true;
606 if (Flags & ELF::SHF_LINK_ORDER)
607 if (parseLinkedToSym(LinkedToSym))
608 return true;
609 if (maybeParseUniqueID(UniqueID))
610 return true;
611 }
612
613 EndStmt:
614 if (getLexer().isNot(AsmToken::EndOfStatement))
615 return TokError("unexpected token in directive");
616 Lex();
617
618 unsigned Type = ELF::SHT_PROGBITS;
619
620 if (TypeName.empty()) {
621 if (SectionName.startswith(".note"))
622 Type = ELF::SHT_NOTE;
623 else if (hasPrefix(SectionName, ".init_array."))
624 Type = ELF::SHT_INIT_ARRAY;
625 else if (hasPrefix(SectionName, ".bss."))
626 Type = ELF::SHT_NOBITS;
627 else if (hasPrefix(SectionName, ".tbss."))
628 Type = ELF::SHT_NOBITS;
629 else if (hasPrefix(SectionName, ".fini_array."))
630 Type = ELF::SHT_FINI_ARRAY;
631 else if (hasPrefix(SectionName, ".preinit_array."))
632 Type = ELF::SHT_PREINIT_ARRAY;
633 } else {
634 if (TypeName == "init_array")
635 Type = ELF::SHT_INIT_ARRAY;
636 else if (TypeName == "fini_array")
637 Type = ELF::SHT_FINI_ARRAY;
638 else if (TypeName == "preinit_array")
639 Type = ELF::SHT_PREINIT_ARRAY;
640 else if (TypeName == "nobits")
641 Type = ELF::SHT_NOBITS;
642 else if (TypeName == "progbits")
643 Type = ELF::SHT_PROGBITS;
644 else if (TypeName == "note")
645 Type = ELF::SHT_NOTE;
646 else if (TypeName == "unwind")
647 Type = ELF::SHT_X86_64_UNWIND;
648 else if (TypeName == "llvm_odrtab")
649 Type = ELF::SHT_LLVM_ODRTAB;
650 else if (TypeName == "llvm_linker_options")
651 Type = ELF::SHT_LLVM_LINKER_OPTIONS;
652 else if (TypeName == "llvm_call_graph_profile")
653 Type = ELF::SHT_LLVM_CALL_GRAPH_PROFILE;
654 else if (TypeName == "llvm_dependent_libraries")
655 Type = ELF::SHT_LLVM_DEPENDENT_LIBRARIES;
656 else if (TypeName == "llvm_sympart")
657 Type = ELF::SHT_LLVM_SYMPART;
658 else if (TypeName == "llvm_bb_addr_map")
659 Type = ELF::SHT_LLVM_BB_ADDR_MAP;
660 else if (TypeName.getAsInteger(0, Type))
661 return TokError("unknown section type");
662 }
663
664 if (UseLastGroup) {
665 MCSectionSubPair CurrentSection = getStreamer().getCurrentSection();
666 if (const MCSectionELF *Section =
667 cast_or_null<MCSectionELF>(CurrentSection.first))
668 if (const MCSymbol *Group = Section->getGroup()) {
669 GroupName = Group->getName();
670 IsComdat = Section->isComdat();
671 Flags |= ELF::SHF_GROUP;
672 }
673 }
674
675 MCSectionELF *Section =
676 getContext().getELFSection(SectionName, Type, Flags, Size, GroupName,
677 IsComdat, UniqueID, LinkedToSym);
678 getStreamer().SwitchSection(Section, Subsection);
679 // Check that flags are used consistently. However, the GNU assembler permits
680 // to leave out in subsequent uses of the same sections; for compatibility,
681 // do likewise.
682 if (!TypeName.empty() && Section->getType() != Type &&
683 !allowSectionTypeMismatch(getContext().getTargetTriple(), SectionName,
684 Type))
685 Error(loc, "changed section type for " + SectionName + ", expected: 0x" +
686 utohexstr(Section->getType()));
687 if ((extraFlags || Size || !TypeName.empty()) && Section->getFlags() != Flags)
688 Error(loc, "changed section flags for " + SectionName + ", expected: 0x" +
689 utohexstr(Section->getFlags()));
690 if ((extraFlags || Size || !TypeName.empty()) &&
691 Section->getEntrySize() != Size)
692 Error(loc, "changed section entsize for " + SectionName +
693 ", expected: " + Twine(Section->getEntrySize()));
694
695 if (getContext().getGenDwarfForAssembly() &&
696 (Section->getFlags() & ELF::SHF_ALLOC) &&
697 (Section->getFlags() & ELF::SHF_EXECINSTR)) {
698 bool InsertResult = getContext().addGenDwarfSection(Section);
699 if (InsertResult) {
700 if (getContext().getDwarfVersion() <= 2)
701 Warning(loc, "DWARF2 only supports one section per compilation unit");
702
703 if (!Section->getBeginSymbol()) {
704 MCSymbol *SectionStartSymbol = getContext().createTempSymbol();
705 getStreamer().emitLabel(SectionStartSymbol);
706 Section->setBeginSymbol(SectionStartSymbol);
707 }
708 }
709 }
710
711 return false;
712 }
713
ParseDirectivePrevious(StringRef DirName,SMLoc)714 bool ELFAsmParser::ParseDirectivePrevious(StringRef DirName, SMLoc) {
715 MCSectionSubPair PreviousSection = getStreamer().getPreviousSection();
716 if (PreviousSection.first == nullptr)
717 return TokError(".previous without corresponding .section");
718 getStreamer().SwitchSection(PreviousSection.first, PreviousSection.second);
719
720 return false;
721 }
722
MCAttrForString(StringRef Type)723 static MCSymbolAttr MCAttrForString(StringRef Type) {
724 return StringSwitch<MCSymbolAttr>(Type)
725 .Cases("STT_FUNC", "function", MCSA_ELF_TypeFunction)
726 .Cases("STT_OBJECT", "object", MCSA_ELF_TypeObject)
727 .Cases("STT_TLS", "tls_object", MCSA_ELF_TypeTLS)
728 .Cases("STT_COMMON", "common", MCSA_ELF_TypeCommon)
729 .Cases("STT_NOTYPE", "notype", MCSA_ELF_TypeNoType)
730 .Cases("STT_GNU_IFUNC", "gnu_indirect_function",
731 MCSA_ELF_TypeIndFunction)
732 .Case("gnu_unique_object", MCSA_ELF_TypeGnuUniqueObject)
733 .Default(MCSA_Invalid);
734 }
735
736 /// ParseDirectiveELFType
737 /// ::= .type identifier , STT_<TYPE_IN_UPPER_CASE>
738 /// ::= .type identifier , #attribute
739 /// ::= .type identifier , @attribute
740 /// ::= .type identifier , %attribute
741 /// ::= .type identifier , "attribute"
ParseDirectiveType(StringRef,SMLoc)742 bool ELFAsmParser::ParseDirectiveType(StringRef, SMLoc) {
743 StringRef Name;
744 if (getParser().parseIdentifier(Name))
745 return TokError("expected identifier in directive");
746
747 // Handle the identifier as the key symbol.
748 MCSymbol *Sym = getContext().getOrCreateSymbol(Name);
749
750 // NOTE the comma is optional in all cases. It is only documented as being
751 // optional in the first case, however, GAS will silently treat the comma as
752 // optional in all cases. Furthermore, although the documentation states that
753 // the first form only accepts STT_<TYPE_IN_UPPER_CASE>, in reality, GAS
754 // accepts both the upper case name as well as the lower case aliases.
755 if (getLexer().is(AsmToken::Comma))
756 Lex();
757
758 if (getLexer().isNot(AsmToken::Identifier) &&
759 getLexer().isNot(AsmToken::Hash) &&
760 getLexer().isNot(AsmToken::Percent) &&
761 getLexer().isNot(AsmToken::String)) {
762 if (!getLexer().getAllowAtInIdentifier())
763 return TokError("expected STT_<TYPE_IN_UPPER_CASE>, '#<type>', "
764 "'%<type>' or \"<type>\"");
765 else if (getLexer().isNot(AsmToken::At))
766 return TokError("expected STT_<TYPE_IN_UPPER_CASE>, '#<type>', '@<type>', "
767 "'%<type>' or \"<type>\"");
768 }
769
770 if (getLexer().isNot(AsmToken::String) &&
771 getLexer().isNot(AsmToken::Identifier))
772 Lex();
773
774 SMLoc TypeLoc = getLexer().getLoc();
775
776 StringRef Type;
777 if (getParser().parseIdentifier(Type))
778 return TokError("expected symbol type in directive");
779
780 MCSymbolAttr Attr = MCAttrForString(Type);
781 if (Attr == MCSA_Invalid)
782 return Error(TypeLoc, "unsupported attribute in '.type' directive");
783
784 if (getLexer().isNot(AsmToken::EndOfStatement))
785 return TokError("unexpected token in '.type' directive");
786 Lex();
787
788 getStreamer().emitSymbolAttribute(Sym, Attr);
789
790 return false;
791 }
792
793 /// ParseDirectiveIdent
794 /// ::= .ident string
ParseDirectiveIdent(StringRef,SMLoc)795 bool ELFAsmParser::ParseDirectiveIdent(StringRef, SMLoc) {
796 if (getLexer().isNot(AsmToken::String))
797 return TokError("unexpected token in '.ident' directive");
798
799 StringRef Data = getTok().getIdentifier();
800
801 Lex();
802
803 if (getLexer().isNot(AsmToken::EndOfStatement))
804 return TokError("unexpected token in '.ident' directive");
805 Lex();
806
807 getStreamer().emitIdent(Data);
808 return false;
809 }
810
811 /// ParseDirectiveSymver
812 /// ::= .symver foo, bar2@zed
ParseDirectiveSymver(StringRef,SMLoc)813 bool ELFAsmParser::ParseDirectiveSymver(StringRef, SMLoc) {
814 StringRef OriginalName, Name, Action;
815 if (getParser().parseIdentifier(OriginalName))
816 return TokError("expected identifier in directive");
817
818 if (getLexer().isNot(AsmToken::Comma))
819 return TokError("expected a comma");
820
821 // ARM assembly uses @ for a comment...
822 // except when parsing the second parameter of the .symver directive.
823 // Force the next symbol to allow @ in the identifier, which is
824 // required for this directive and then reset it to its initial state.
825 const bool AllowAtInIdentifier = getLexer().getAllowAtInIdentifier();
826 getLexer().setAllowAtInIdentifier(true);
827 Lex();
828 getLexer().setAllowAtInIdentifier(AllowAtInIdentifier);
829
830 if (getParser().parseIdentifier(Name))
831 return TokError("expected identifier in directive");
832
833 if (Name.find('@') == StringRef::npos)
834 return TokError("expected a '@' in the name");
835 bool KeepOriginalSym = !Name.contains("@@@");
836 if (parseOptionalToken(AsmToken::Comma)) {
837 if (getParser().parseIdentifier(Action) || Action != "remove")
838 return TokError("expected 'remove'");
839 KeepOriginalSym = false;
840 }
841 (void)parseOptionalToken(AsmToken::EndOfStatement);
842
843 getStreamer().emitELFSymverDirective(
844 getContext().getOrCreateSymbol(OriginalName), Name, KeepOriginalSym);
845 return false;
846 }
847
848 /// ParseDirectiveVersion
849 /// ::= .version string
ParseDirectiveVersion(StringRef,SMLoc)850 bool ELFAsmParser::ParseDirectiveVersion(StringRef, SMLoc) {
851 if (getLexer().isNot(AsmToken::String))
852 return TokError("unexpected token in '.version' directive");
853
854 StringRef Data = getTok().getIdentifier();
855
856 Lex();
857
858 MCSection *Note = getContext().getELFSection(".note", ELF::SHT_NOTE, 0);
859
860 getStreamer().PushSection();
861 getStreamer().SwitchSection(Note);
862 getStreamer().emitInt32(Data.size() + 1); // namesz
863 getStreamer().emitInt32(0); // descsz = 0 (no description).
864 getStreamer().emitInt32(1); // type = NT_VERSION
865 getStreamer().emitBytes(Data); // name
866 getStreamer().emitInt8(0); // NUL
867 getStreamer().emitValueToAlignment(4);
868 getStreamer().PopSection();
869 return false;
870 }
871
872 /// ParseDirectiveWeakref
873 /// ::= .weakref foo, bar
ParseDirectiveWeakref(StringRef,SMLoc)874 bool ELFAsmParser::ParseDirectiveWeakref(StringRef, SMLoc) {
875 // FIXME: Share code with the other alias building directives.
876
877 StringRef AliasName;
878 if (getParser().parseIdentifier(AliasName))
879 return TokError("expected identifier in directive");
880
881 if (getLexer().isNot(AsmToken::Comma))
882 return TokError("expected a comma");
883
884 Lex();
885
886 StringRef Name;
887 if (getParser().parseIdentifier(Name))
888 return TokError("expected identifier in directive");
889
890 MCSymbol *Alias = getContext().getOrCreateSymbol(AliasName);
891
892 MCSymbol *Sym = getContext().getOrCreateSymbol(Name);
893
894 getStreamer().emitWeakReference(Alias, Sym);
895 return false;
896 }
897
ParseDirectiveSubsection(StringRef,SMLoc)898 bool ELFAsmParser::ParseDirectiveSubsection(StringRef, SMLoc) {
899 const MCExpr *Subsection = nullptr;
900 if (getLexer().isNot(AsmToken::EndOfStatement)) {
901 if (getParser().parseExpression(Subsection))
902 return true;
903 }
904
905 if (getLexer().isNot(AsmToken::EndOfStatement))
906 return TokError("unexpected token in directive");
907
908 Lex();
909
910 getStreamer().SubSection(Subsection);
911 return false;
912 }
913
ParseDirectiveCGProfile(StringRef S,SMLoc Loc)914 bool ELFAsmParser::ParseDirectiveCGProfile(StringRef S, SMLoc Loc) {
915 return MCAsmParserExtension::ParseDirectiveCGProfile(S, Loc);
916 }
917
918 namespace llvm {
919
createELFAsmParser()920 MCAsmParserExtension *createELFAsmParser() {
921 return new ELFAsmParser;
922 }
923
924 } // end namespace llvm
925