295 lines
		
	
	
		
			9.9 KiB
		
	
	
	
		
			C++
		
	
	
	
			
		
		
	
	
			295 lines
		
	
	
		
			9.9 KiB
		
	
	
	
		
			C++
		
	
	
	
//===- WasmAsmParser.cpp - Wasm Assembly Parser -----------------------------===//
 | 
						|
//
 | 
						|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 | 
						|
// See https://llvm.org/LICENSE.txt for license information.
 | 
						|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
 | 
						|
//
 | 
						|
// --
 | 
						|
//
 | 
						|
// Note, this is for wasm, the binary format (analogous to ELF), not wasm,
 | 
						|
// the instruction set (analogous to x86), for which parsing code lives in
 | 
						|
// WebAssemblyAsmParser.
 | 
						|
//
 | 
						|
// This file contains processing for generic directives implemented using
 | 
						|
// MCTargetStreamer, the ones that depend on WebAssemblyTargetStreamer are in
 | 
						|
// WebAssemblyAsmParser.
 | 
						|
//
 | 
						|
//===----------------------------------------------------------------------===//
 | 
						|
 | 
						|
#include "llvm/BinaryFormat/Wasm.h"
 | 
						|
#include "llvm/MC/MCContext.h"
 | 
						|
#include "llvm/MC/MCParser/MCAsmLexer.h"
 | 
						|
#include "llvm/MC/MCParser/MCAsmParser.h"
 | 
						|
#include "llvm/MC/MCParser/MCAsmParserExtension.h"
 | 
						|
#include "llvm/MC/MCSectionWasm.h"
 | 
						|
#include "llvm/MC/MCStreamer.h"
 | 
						|
#include "llvm/MC/MCSymbol.h"
 | 
						|
#include "llvm/MC/MCSymbolWasm.h"
 | 
						|
#include "llvm/Support/MachineValueType.h"
 | 
						|
 | 
						|
using namespace llvm;
 | 
						|
 | 
						|
namespace {
 | 
						|
 | 
						|
class WasmAsmParser : public MCAsmParserExtension {
 | 
						|
  MCAsmParser *Parser = nullptr;
 | 
						|
  MCAsmLexer *Lexer = nullptr;
 | 
						|
 | 
						|
  template<bool (WasmAsmParser::*HandlerMethod)(StringRef, SMLoc)>
 | 
						|
  void addDirectiveHandler(StringRef Directive) {
 | 
						|
    MCAsmParser::ExtensionDirectiveHandler Handler = std::make_pair(
 | 
						|
        this, HandleDirective<WasmAsmParser, HandlerMethod>);
 | 
						|
 | 
						|
    getParser().addDirectiveHandler(Directive, Handler);
 | 
						|
  }
 | 
						|
 | 
						|
public:
 | 
						|
  WasmAsmParser() { BracketExpressionsSupported = true; }
 | 
						|
 | 
						|
  void Initialize(MCAsmParser &P) override {
 | 
						|
    Parser = &P;
 | 
						|
    Lexer = &Parser->getLexer();
 | 
						|
    // Call the base implementation.
 | 
						|
    this->MCAsmParserExtension::Initialize(*Parser);
 | 
						|
 | 
						|
    addDirectiveHandler<&WasmAsmParser::parseSectionDirectiveText>(".text");
 | 
						|
    addDirectiveHandler<&WasmAsmParser::parseSectionDirective>(".section");
 | 
						|
    addDirectiveHandler<&WasmAsmParser::parseDirectiveSize>(".size");
 | 
						|
    addDirectiveHandler<&WasmAsmParser::parseDirectiveType>(".type");
 | 
						|
    addDirectiveHandler<&WasmAsmParser::ParseDirectiveIdent>(".ident");
 | 
						|
    addDirectiveHandler<
 | 
						|
      &WasmAsmParser::ParseDirectiveSymbolAttribute>(".weak");
 | 
						|
    addDirectiveHandler<
 | 
						|
      &WasmAsmParser::ParseDirectiveSymbolAttribute>(".local");
 | 
						|
    addDirectiveHandler<
 | 
						|
      &WasmAsmParser::ParseDirectiveSymbolAttribute>(".internal");
 | 
						|
    addDirectiveHandler<
 | 
						|
      &WasmAsmParser::ParseDirectiveSymbolAttribute>(".hidden");
 | 
						|
  }
 | 
						|
 | 
						|
  bool error(const StringRef &Msg, const AsmToken &Tok) {
 | 
						|
    return Parser->Error(Tok.getLoc(), Msg + Tok.getString());
 | 
						|
  }
 | 
						|
 | 
						|
  bool isNext(AsmToken::TokenKind Kind) {
 | 
						|
    auto Ok = Lexer->is(Kind);
 | 
						|
    if (Ok)
 | 
						|
      Lex();
 | 
						|
    return Ok;
 | 
						|
  }
 | 
						|
 | 
						|
  bool expect(AsmToken::TokenKind Kind, const char *KindName) {
 | 
						|
    if (!isNext(Kind))
 | 
						|
      return error(std::string("Expected ") + KindName + ", instead got: ",
 | 
						|
                   Lexer->getTok());
 | 
						|
    return false;
 | 
						|
  }
 | 
						|
 | 
						|
  bool parseSectionDirectiveText(StringRef, SMLoc) {
 | 
						|
    // FIXME: .text currently no-op.
 | 
						|
    return false;
 | 
						|
  }
 | 
						|
 | 
						|
  bool parseSectionFlags(StringRef FlagStr, bool &Passive, bool &Group) {
 | 
						|
    for (char C : FlagStr) {
 | 
						|
      switch (C) {
 | 
						|
      case 'p':
 | 
						|
        Passive = true;
 | 
						|
        break;
 | 
						|
      case 'G':
 | 
						|
        Group = true;
 | 
						|
        break;
 | 
						|
      default:
 | 
						|
        return Parser->Error(getTok().getLoc(),
 | 
						|
                             StringRef("Unexepcted section flag: ") + FlagStr);
 | 
						|
      }
 | 
						|
    }
 | 
						|
    return false;
 | 
						|
  }
 | 
						|
 | 
						|
  bool parseGroup(StringRef &GroupName) {
 | 
						|
    if (Lexer->isNot(AsmToken::Comma))
 | 
						|
      return TokError("expected group name");
 | 
						|
    Lex();
 | 
						|
    if (Lexer->is(AsmToken::Integer)) {
 | 
						|
      GroupName = getTok().getString();
 | 
						|
      Lex();
 | 
						|
    } else if (Parser->parseIdentifier(GroupName)) {
 | 
						|
      return TokError("invalid group name");
 | 
						|
    }
 | 
						|
    if (Lexer->is(AsmToken::Comma)) {
 | 
						|
      Lex();
 | 
						|
      StringRef Linkage;
 | 
						|
      if (Parser->parseIdentifier(Linkage))
 | 
						|
        return TokError("invalid linkage");
 | 
						|
      if (Linkage != "comdat")
 | 
						|
        return TokError("Linkage must be 'comdat'");
 | 
						|
    }
 | 
						|
    return false;
 | 
						|
  }
 | 
						|
 | 
						|
  bool parseSectionDirective(StringRef, SMLoc) {
 | 
						|
    StringRef Name;
 | 
						|
    if (Parser->parseIdentifier(Name))
 | 
						|
      return TokError("expected identifier in directive");
 | 
						|
 | 
						|
    if (expect(AsmToken::Comma, ","))
 | 
						|
      return true;
 | 
						|
 | 
						|
    if (Lexer->isNot(AsmToken::String))
 | 
						|
      return error("expected string in directive, instead got: ", Lexer->getTok());
 | 
						|
 | 
						|
    auto Kind = StringSwitch<Optional<SectionKind>>(Name)
 | 
						|
                    .StartsWith(".data", SectionKind::getData())
 | 
						|
                    .StartsWith(".tdata", SectionKind::getThreadData())
 | 
						|
                    .StartsWith(".tbss", SectionKind::getThreadBSS())
 | 
						|
                    .StartsWith(".rodata", SectionKind::getReadOnly())
 | 
						|
                    .StartsWith(".text", SectionKind::getText())
 | 
						|
                    .StartsWith(".custom_section", SectionKind::getMetadata())
 | 
						|
                    .StartsWith(".bss", SectionKind::getBSS())
 | 
						|
                    // See use of .init_array in WasmObjectWriter and
 | 
						|
                    // TargetLoweringObjectFileWasm
 | 
						|
                    .StartsWith(".init_array", SectionKind::getData())
 | 
						|
                    .StartsWith(".debug_", SectionKind::getMetadata())
 | 
						|
                    .Default(Optional<SectionKind>());
 | 
						|
    if (!Kind.hasValue())
 | 
						|
      return Parser->Error(Lexer->getLoc(), "unknown section kind: " + Name);
 | 
						|
 | 
						|
 | 
						|
    // Update section flags if present in this .section directive
 | 
						|
    bool Passive = false;
 | 
						|
    bool Group = false;
 | 
						|
    if (parseSectionFlags(getTok().getStringContents(), Passive, Group))
 | 
						|
      return true;
 | 
						|
 | 
						|
    Lex();
 | 
						|
 | 
						|
    if (expect(AsmToken::Comma, ",") || expect(AsmToken::At, "@"))
 | 
						|
      return true;
 | 
						|
 | 
						|
    StringRef GroupName;
 | 
						|
    if (Group && parseGroup(GroupName))
 | 
						|
      return true;
 | 
						|
 | 
						|
    if (expect(AsmToken::EndOfStatement, "eol"))
 | 
						|
      return true;
 | 
						|
 | 
						|
    // TODO: Parse UniqueID
 | 
						|
    MCSectionWasm *WS = getContext().getWasmSection(
 | 
						|
        Name, Kind.getValue(), GroupName, MCContext::GenericSectionID);
 | 
						|
    if (Passive) {
 | 
						|
      if (!WS->isWasmData())
 | 
						|
        return Parser->Error(getTok().getLoc(),
 | 
						|
                             "Only data sections can be passive");
 | 
						|
      WS->setPassive();
 | 
						|
    }
 | 
						|
    getStreamer().SwitchSection(WS);
 | 
						|
    return false;
 | 
						|
  }
 | 
						|
 | 
						|
  // TODO: This function is almost the same as ELFAsmParser::ParseDirectiveSize
 | 
						|
  // so maybe could be shared somehow.
 | 
						|
  bool parseDirectiveSize(StringRef, SMLoc) {
 | 
						|
    StringRef Name;
 | 
						|
    if (Parser->parseIdentifier(Name))
 | 
						|
      return TokError("expected identifier in directive");
 | 
						|
    auto Sym = getContext().getOrCreateSymbol(Name);
 | 
						|
    if (expect(AsmToken::Comma, ","))
 | 
						|
      return true;
 | 
						|
    const MCExpr *Expr;
 | 
						|
    if (Parser->parseExpression(Expr))
 | 
						|
      return true;
 | 
						|
    if (expect(AsmToken::EndOfStatement, "eol"))
 | 
						|
      return true;
 | 
						|
    // This is done automatically by the assembler for functions currently,
 | 
						|
    // so this is only currently needed for data sections:
 | 
						|
    getStreamer().emitELFSize(Sym, Expr);
 | 
						|
    return false;
 | 
						|
  }
 | 
						|
 | 
						|
  bool parseDirectiveType(StringRef, SMLoc) {
 | 
						|
    // This could be the start of a function, check if followed by
 | 
						|
    // "label,@function"
 | 
						|
    if (!Lexer->is(AsmToken::Identifier))
 | 
						|
      return error("Expected label after .type directive, got: ",
 | 
						|
                   Lexer->getTok());
 | 
						|
    auto WasmSym = cast<MCSymbolWasm>(
 | 
						|
                     getStreamer().getContext().getOrCreateSymbol(
 | 
						|
                       Lexer->getTok().getString()));
 | 
						|
    Lex();
 | 
						|
    if (!(isNext(AsmToken::Comma) && isNext(AsmToken::At) &&
 | 
						|
          Lexer->is(AsmToken::Identifier)))
 | 
						|
      return error("Expected label,@type declaration, got: ", Lexer->getTok());
 | 
						|
    auto TypeName = Lexer->getTok().getString();
 | 
						|
    if (TypeName == "function") {
 | 
						|
      WasmSym->setType(wasm::WASM_SYMBOL_TYPE_FUNCTION);
 | 
						|
      auto *Current =
 | 
						|
          cast<MCSectionWasm>(getStreamer().getCurrentSection().first);
 | 
						|
      if (Current->getGroup())
 | 
						|
        WasmSym->setComdat(true);
 | 
						|
    } else if (TypeName == "global")
 | 
						|
      WasmSym->setType(wasm::WASM_SYMBOL_TYPE_GLOBAL);
 | 
						|
    else if (TypeName == "object")
 | 
						|
      WasmSym->setType(wasm::WASM_SYMBOL_TYPE_DATA);
 | 
						|
    else
 | 
						|
      return error("Unknown WASM symbol type: ", Lexer->getTok());
 | 
						|
    Lex();
 | 
						|
    return expect(AsmToken::EndOfStatement, "EOL");
 | 
						|
  }
 | 
						|
 | 
						|
  // FIXME: Shared with ELF.
 | 
						|
  /// ParseDirectiveIdent
 | 
						|
  ///  ::= .ident string
 | 
						|
  bool ParseDirectiveIdent(StringRef, SMLoc) {
 | 
						|
    if (getLexer().isNot(AsmToken::String))
 | 
						|
      return TokError("unexpected token in '.ident' directive");
 | 
						|
    StringRef Data = getTok().getIdentifier();
 | 
						|
    Lex();
 | 
						|
    if (getLexer().isNot(AsmToken::EndOfStatement))
 | 
						|
      return TokError("unexpected token in '.ident' directive");
 | 
						|
    Lex();
 | 
						|
    getStreamer().emitIdent(Data);
 | 
						|
    return false;
 | 
						|
  }
 | 
						|
 | 
						|
  // FIXME: Shared with ELF.
 | 
						|
  /// ParseDirectiveSymbolAttribute
 | 
						|
  ///  ::= { ".local", ".weak", ... } [ identifier ( , identifier )* ]
 | 
						|
  bool ParseDirectiveSymbolAttribute(StringRef Directive, SMLoc) {
 | 
						|
    MCSymbolAttr Attr = StringSwitch<MCSymbolAttr>(Directive)
 | 
						|
      .Case(".weak", MCSA_Weak)
 | 
						|
      .Case(".local", MCSA_Local)
 | 
						|
      .Case(".hidden", MCSA_Hidden)
 | 
						|
      .Case(".internal", MCSA_Internal)
 | 
						|
      .Case(".protected", MCSA_Protected)
 | 
						|
      .Default(MCSA_Invalid);
 | 
						|
    assert(Attr != MCSA_Invalid && "unexpected symbol attribute directive!");
 | 
						|
    if (getLexer().isNot(AsmToken::EndOfStatement)) {
 | 
						|
      while (true) {
 | 
						|
        StringRef Name;
 | 
						|
        if (getParser().parseIdentifier(Name))
 | 
						|
          return TokError("expected identifier in directive");
 | 
						|
        MCSymbol *Sym = getContext().getOrCreateSymbol(Name);
 | 
						|
        getStreamer().emitSymbolAttribute(Sym, Attr);
 | 
						|
        if (getLexer().is(AsmToken::EndOfStatement))
 | 
						|
          break;
 | 
						|
        if (getLexer().isNot(AsmToken::Comma))
 | 
						|
          return TokError("unexpected token in directive");
 | 
						|
        Lex();
 | 
						|
      }
 | 
						|
    }
 | 
						|
    Lex();
 | 
						|
    return false;
 | 
						|
  }
 | 
						|
};
 | 
						|
 | 
						|
} // end anonymous namespace
 | 
						|
 | 
						|
namespace llvm {
 | 
						|
 | 
						|
MCAsmParserExtension *createWasmAsmParser() {
 | 
						|
  return new WasmAsmParser;
 | 
						|
}
 | 
						|
 | 
						|
} // end namespace llvm
 |