1 //===-- llvm-ml.cpp - masm-compatible assembler -----------------*- C++ -*-===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 // 9 // A simple driver around MasmParser; based on llvm-mc. 10 // 11 //===----------------------------------------------------------------------===// 12 13 #include "llvm/ADT/StringSwitch.h" 14 #include "llvm/MC/MCAsmBackend.h" 15 #include "llvm/MC/MCAsmInfo.h" 16 #include "llvm/MC/MCCodeEmitter.h" 17 #include "llvm/MC/MCContext.h" 18 #include "llvm/MC/MCInstPrinter.h" 19 #include "llvm/MC/MCInstrInfo.h" 20 #include "llvm/MC/MCObjectFileInfo.h" 21 #include "llvm/MC/MCObjectWriter.h" 22 #include "llvm/MC/MCParser/AsmLexer.h" 23 #include "llvm/MC/MCParser/MCTargetAsmParser.h" 24 #include "llvm/MC/MCRegisterInfo.h" 25 #include "llvm/MC/MCStreamer.h" 26 #include "llvm/MC/MCSubtargetInfo.h" 27 #include "llvm/MC/MCSymbol.h" 28 #include "llvm/MC/MCTargetOptionsCommandFlags.h" 29 #include "llvm/MC/TargetRegistry.h" 30 #include "llvm/Option/Arg.h" 31 #include "llvm/Option/ArgList.h" 32 #include "llvm/Option/Option.h" 33 #include "llvm/Support/Compression.h" 34 #include "llvm/Support/FileUtilities.h" 35 #include "llvm/Support/FormatVariadic.h" 36 #include "llvm/Support/FormattedStream.h" 37 #include "llvm/Support/Host.h" 38 #include "llvm/Support/InitLLVM.h" 39 #include "llvm/Support/MemoryBuffer.h" 40 #include "llvm/Support/Path.h" 41 #include "llvm/Support/Process.h" 42 #include "llvm/Support/SourceMgr.h" 43 #include "llvm/Support/TargetSelect.h" 44 #include "llvm/Support/ToolOutputFile.h" 45 #include "llvm/Support/WithColor.h" 46 #include <ctime> 47 48 using namespace llvm; 49 using namespace llvm::opt; 50 51 namespace { 52 53 enum ID { 54 OPT_INVALID = 0, // This is not an option ID. 55 #define OPTION(PREFIX, NAME, ID, KIND, GROUP, ALIAS, ALIASARGS, FLAGS, PARAM, \ 56 HELPTEXT, METAVAR, VALUES) \ 57 OPT_##ID, 58 #include "Opts.inc" 59 #undef OPTION 60 }; 61 62 #define PREFIX(NAME, VALUE) const char *const NAME[] = VALUE; 63 #include "Opts.inc" 64 #undef PREFIX 65 66 const opt::OptTable::Info InfoTable[] = { 67 #define OPTION(PREFIX, NAME, ID, KIND, GROUP, ALIAS, ALIASARGS, FLAGS, PARAM, \ 68 HELPTEXT, METAVAR, VALUES) \ 69 { \ 70 PREFIX, NAME, HELPTEXT, \ 71 METAVAR, OPT_##ID, opt::Option::KIND##Class, \ 72 PARAM, FLAGS, OPT_##GROUP, \ 73 OPT_##ALIAS, ALIASARGS, VALUES}, 74 #include "Opts.inc" 75 #undef OPTION 76 }; 77 78 class MLOptTable : public opt::OptTable { 79 public: 80 MLOptTable() : OptTable(InfoTable, /*IgnoreCase=*/false) {} 81 }; 82 } // namespace 83 84 static Triple GetTriple(StringRef ProgName, opt::InputArgList &Args) { 85 // Figure out the target triple. 86 StringRef DefaultBitness = "32"; 87 SmallString<255> Program = ProgName; 88 sys::path::replace_extension(Program, ""); 89 if (Program.endswith("ml64")) 90 DefaultBitness = "64"; 91 92 StringRef TripleName = 93 StringSwitch<StringRef>(Args.getLastArgValue(OPT_bitness, DefaultBitness)) 94 .Case("32", "i386-pc-windows") 95 .Case("64", "x86_64-pc-windows") 96 .Default(""); 97 return Triple(Triple::normalize(TripleName)); 98 } 99 100 static std::unique_ptr<ToolOutputFile> GetOutputStream(StringRef Path) { 101 std::error_code EC; 102 auto Out = std::make_unique<ToolOutputFile>(Path, EC, sys::fs::OF_None); 103 if (EC) { 104 WithColor::error() << EC.message() << '\n'; 105 return nullptr; 106 } 107 108 return Out; 109 } 110 111 static int AsLexInput(SourceMgr &SrcMgr, MCAsmInfo &MAI, raw_ostream &OS) { 112 AsmLexer Lexer(MAI); 113 Lexer.setBuffer(SrcMgr.getMemoryBuffer(SrcMgr.getMainFileID())->getBuffer()); 114 Lexer.setLexMasmIntegers(true); 115 Lexer.useMasmDefaultRadix(true); 116 Lexer.setLexMasmHexFloats(true); 117 Lexer.setLexMasmStrings(true); 118 119 bool Error = false; 120 while (Lexer.Lex().isNot(AsmToken::Eof)) { 121 Lexer.getTok().dump(OS); 122 OS << "\n"; 123 if (Lexer.getTok().getKind() == AsmToken::Error) 124 Error = true; 125 } 126 127 return Error; 128 } 129 130 static int AssembleInput(StringRef ProgName, const Target *TheTarget, 131 SourceMgr &SrcMgr, MCContext &Ctx, MCStreamer &Str, 132 MCAsmInfo &MAI, MCSubtargetInfo &STI, 133 MCInstrInfo &MCII, MCTargetOptions &MCOptions, 134 const opt::ArgList &InputArgs) { 135 struct tm TM; 136 time_t Timestamp; 137 if (InputArgs.hasArg(OPT_timestamp)) { 138 StringRef TimestampStr = InputArgs.getLastArgValue(OPT_timestamp); 139 int64_t IntTimestamp; 140 if (TimestampStr.getAsInteger(10, IntTimestamp)) { 141 WithColor::error(errs(), ProgName) 142 << "invalid timestamp '" << TimestampStr 143 << "'; must be expressed in seconds since the UNIX epoch.\n"; 144 return 1; 145 } 146 Timestamp = IntTimestamp; 147 } else { 148 Timestamp = time(nullptr); 149 } 150 if (InputArgs.hasArg(OPT_utc)) { 151 // Not thread-safe. 152 TM = *gmtime(&Timestamp); 153 } else { 154 // Not thread-safe. 155 TM = *localtime(&Timestamp); 156 } 157 158 std::unique_ptr<MCAsmParser> Parser( 159 createMCMasmParser(SrcMgr, Ctx, Str, MAI, TM, 0)); 160 std::unique_ptr<MCTargetAsmParser> TAP( 161 TheTarget->createMCAsmParser(STI, *Parser, MCII, MCOptions)); 162 163 if (!TAP) { 164 WithColor::error(errs(), ProgName) 165 << "this target does not support assembly parsing.\n"; 166 return 1; 167 } 168 169 Parser->setShowParsedOperands(InputArgs.hasArg(OPT_show_inst_operands)); 170 Parser->setTargetParser(*TAP); 171 Parser->getLexer().setLexMasmIntegers(true); 172 Parser->getLexer().useMasmDefaultRadix(true); 173 Parser->getLexer().setLexMasmHexFloats(true); 174 Parser->getLexer().setLexMasmStrings(true); 175 176 auto Defines = InputArgs.getAllArgValues(OPT_define); 177 for (StringRef Define : Defines) { 178 const auto NameValue = Define.split('='); 179 StringRef Name = NameValue.first, Value = NameValue.second; 180 if (Parser->defineMacro(Name, Value)) { 181 WithColor::error(errs(), ProgName) 182 << "can't define macro '" << Name << "' = '" << Value << "'\n"; 183 return 1; 184 } 185 } 186 187 int Res = Parser->Run(/*NoInitialTextSection=*/true); 188 189 return Res; 190 } 191 192 int main(int Argc, char **Argv) { 193 InitLLVM X(Argc, Argv); 194 StringRef ProgName = sys::path::filename(Argv[0]); 195 196 // Initialize targets and assembly printers/parsers. 197 llvm::InitializeAllTargetInfos(); 198 llvm::InitializeAllTargetMCs(); 199 llvm::InitializeAllAsmParsers(); 200 llvm::InitializeAllDisassemblers(); 201 202 MLOptTable T; 203 unsigned MissingArgIndex, MissingArgCount; 204 ArrayRef<const char *> ArgsArr = makeArrayRef(Argv + 1, Argc - 1); 205 opt::InputArgList InputArgs = 206 T.ParseArgs(ArgsArr, MissingArgIndex, MissingArgCount); 207 208 std::string InputFilename; 209 for (auto *Arg : InputArgs.filtered(OPT_INPUT)) { 210 std::string ArgString = Arg->getAsString(InputArgs); 211 if (ArgString == "-" || StringRef(ArgString).endswith(".asm")) { 212 if (!InputFilename.empty()) { 213 WithColor::warning(errs(), ProgName) 214 << "does not support multiple assembly files in one command; " 215 << "ignoring '" << InputFilename << "'\n"; 216 } 217 InputFilename = ArgString; 218 } else { 219 std::string Diag; 220 raw_string_ostream OS(Diag); 221 OS << "invalid option '" << ArgString << "'"; 222 223 std::string Nearest; 224 if (T.findNearest(ArgString, Nearest) < 2) 225 OS << ", did you mean '" << Nearest << "'?"; 226 227 WithColor::error(errs(), ProgName) << OS.str() << '\n'; 228 exit(1); 229 } 230 } 231 for (auto *Arg : InputArgs.filtered(OPT_assembly_file)) { 232 if (!InputFilename.empty()) { 233 WithColor::warning(errs(), ProgName) 234 << "does not support multiple assembly files in one command; " 235 << "ignoring '" << InputFilename << "'\n"; 236 } 237 InputFilename = Arg->getAsString(InputArgs); 238 } 239 240 for (auto *Arg : InputArgs.filtered(OPT_unsupported_Group)) { 241 WithColor::warning(errs(), ProgName) 242 << "ignoring unsupported '" << Arg->getOption().getName() 243 << "' option\n"; 244 } 245 246 if (InputArgs.hasArg(OPT_debug)) { 247 DebugFlag = true; 248 } 249 for (auto *Arg : InputArgs.filtered(OPT_debug_only)) { 250 setCurrentDebugTypes(Arg->getValues().data(), Arg->getNumValues()); 251 } 252 253 if (InputArgs.hasArg(OPT_help)) { 254 std::string Usage = llvm::formatv("{0} [ /options ] file", ProgName).str(); 255 T.printHelp(outs(), Usage.c_str(), "LLVM MASM Assembler", 256 /*ShowHidden=*/false); 257 return 0; 258 } else if (InputFilename.empty()) { 259 outs() << "USAGE: " << ProgName << " [ /options ] file\n" 260 << "Run \"" << ProgName << " /?\" or \"" << ProgName 261 << " /help\" for more info.\n"; 262 return 0; 263 } 264 265 MCTargetOptions MCOptions; 266 MCOptions.AssemblyLanguage = "masm"; 267 MCOptions.MCFatalWarnings = InputArgs.hasArg(OPT_fatal_warnings); 268 269 Triple TheTriple = GetTriple(ProgName, InputArgs); 270 std::string Error; 271 const Target *TheTarget = TargetRegistry::lookupTarget("", TheTriple, Error); 272 if (!TheTarget) { 273 WithColor::error(errs(), ProgName) << Error; 274 return 1; 275 } 276 const std::string &TripleName = TheTriple.getTriple(); 277 278 bool SafeSEH = InputArgs.hasArg(OPT_safeseh); 279 if (SafeSEH && !(TheTriple.isArch32Bit() && TheTriple.isX86())) { 280 WithColor::warning() 281 << "/safeseh applies only to 32-bit X86 platforms; ignoring.\n"; 282 SafeSEH = false; 283 } 284 285 ErrorOr<std::unique_ptr<MemoryBuffer>> BufferPtr = 286 MemoryBuffer::getFileOrSTDIN(InputFilename); 287 if (std::error_code EC = BufferPtr.getError()) { 288 WithColor::error(errs(), ProgName) 289 << InputFilename << ": " << EC.message() << '\n'; 290 return 1; 291 } 292 293 SourceMgr SrcMgr; 294 295 // Tell SrcMgr about this buffer, which is what the parser will pick up. 296 SrcMgr.AddNewSourceBuffer(std::move(*BufferPtr), SMLoc()); 297 298 // Record the location of the include directories so that the lexer can find 299 // included files later. 300 std::vector<std::string> IncludeDirs = 301 InputArgs.getAllArgValues(OPT_include_path); 302 if (!InputArgs.hasArg(OPT_ignore_include_envvar)) { 303 if (llvm::Optional<std::string> IncludeEnvVar = 304 llvm::sys::Process::GetEnv("INCLUDE")) { 305 SmallVector<StringRef, 8> Dirs; 306 StringRef(*IncludeEnvVar) 307 .split(Dirs, ";", /*MaxSplit=*/-1, /*KeepEmpty=*/false); 308 IncludeDirs.reserve(IncludeDirs.size() + Dirs.size()); 309 for (StringRef Dir : Dirs) 310 IncludeDirs.push_back(Dir.str()); 311 } 312 } 313 SrcMgr.setIncludeDirs(IncludeDirs); 314 315 std::unique_ptr<MCRegisterInfo> MRI(TheTarget->createMCRegInfo(TripleName)); 316 assert(MRI && "Unable to create target register info!"); 317 318 std::unique_ptr<MCAsmInfo> MAI( 319 TheTarget->createMCAsmInfo(*MRI, TripleName, MCOptions)); 320 assert(MAI && "Unable to create target asm info!"); 321 322 MAI->setPreserveAsmComments(InputArgs.hasArg(OPT_preserve_comments)); 323 324 std::unique_ptr<MCSubtargetInfo> STI(TheTarget->createMCSubtargetInfo( 325 TripleName, /*CPU=*/"", /*Features=*/"")); 326 assert(STI && "Unable to create subtarget info!"); 327 328 // FIXME: This is not pretty. MCContext has a ptr to MCObjectFileInfo and 329 // MCObjectFileInfo needs a MCContext reference in order to initialize itself. 330 MCContext Ctx(TheTriple, MAI.get(), MRI.get(), STI.get(), &SrcMgr); 331 std::unique_ptr<MCObjectFileInfo> MOFI(TheTarget->createMCObjectFileInfo( 332 Ctx, /*PIC=*/false, /*LargeCodeModel=*/true)); 333 Ctx.setObjectFileInfo(MOFI.get()); 334 335 if (InputArgs.hasArg(OPT_save_temp_labels)) 336 Ctx.setAllowTemporaryLabels(false); 337 338 // Set compilation information. 339 SmallString<128> CWD; 340 if (!sys::fs::current_path(CWD)) 341 Ctx.setCompilationDir(CWD); 342 Ctx.setMainFileName(InputFilename); 343 344 StringRef FileType = InputArgs.getLastArgValue(OPT_filetype, "obj"); 345 SmallString<255> DefaultOutputFilename; 346 if (InputArgs.hasArg(OPT_as_lex)) { 347 DefaultOutputFilename = "-"; 348 } else { 349 DefaultOutputFilename = InputFilename; 350 sys::path::replace_extension(DefaultOutputFilename, FileType); 351 } 352 const StringRef OutputFilename = 353 InputArgs.getLastArgValue(OPT_output_file, DefaultOutputFilename); 354 std::unique_ptr<ToolOutputFile> Out = GetOutputStream(OutputFilename); 355 if (!Out) 356 return 1; 357 358 std::unique_ptr<buffer_ostream> BOS; 359 raw_pwrite_stream *OS = &Out->os(); 360 std::unique_ptr<MCStreamer> Str; 361 362 std::unique_ptr<MCInstrInfo> MCII(TheTarget->createMCInstrInfo()); 363 assert(MCII && "Unable to create instruction info!"); 364 365 MCInstPrinter *IP = nullptr; 366 if (FileType == "s") { 367 const bool OutputATTAsm = InputArgs.hasArg(OPT_output_att_asm); 368 const unsigned OutputAsmVariant = OutputATTAsm ? 0U // ATT dialect 369 : 1U; // Intel dialect 370 IP = TheTarget->createMCInstPrinter(TheTriple, OutputAsmVariant, *MAI, 371 *MCII, *MRI); 372 373 if (!IP) { 374 WithColor::error() 375 << "unable to create instruction printer for target triple '" 376 << TheTriple.normalize() << "' with " 377 << (OutputATTAsm ? "ATT" : "Intel") << " assembly variant.\n"; 378 return 1; 379 } 380 381 // Set the display preference for hex vs. decimal immediates. 382 IP->setPrintImmHex(InputArgs.hasArg(OPT_print_imm_hex)); 383 384 // Set up the AsmStreamer. 385 std::unique_ptr<MCCodeEmitter> CE; 386 if (InputArgs.hasArg(OPT_show_encoding)) 387 CE.reset(TheTarget->createMCCodeEmitter(*MCII, Ctx)); 388 389 std::unique_ptr<MCAsmBackend> MAB( 390 TheTarget->createMCAsmBackend(*STI, *MRI, MCOptions)); 391 auto FOut = std::make_unique<formatted_raw_ostream>(*OS); 392 Str.reset(TheTarget->createAsmStreamer( 393 Ctx, std::move(FOut), /*asmverbose*/ true, 394 /*useDwarfDirectory*/ true, IP, std::move(CE), std::move(MAB), 395 InputArgs.hasArg(OPT_show_inst))); 396 397 } else if (FileType == "null") { 398 Str.reset(TheTarget->createNullStreamer(Ctx)); 399 } else if (FileType == "obj") { 400 if (!Out->os().supportsSeeking()) { 401 BOS = std::make_unique<buffer_ostream>(Out->os()); 402 OS = BOS.get(); 403 } 404 405 MCCodeEmitter *CE = TheTarget->createMCCodeEmitter(*MCII, Ctx); 406 MCAsmBackend *MAB = TheTarget->createMCAsmBackend(*STI, *MRI, MCOptions); 407 Str.reset(TheTarget->createMCObjectStreamer( 408 TheTriple, Ctx, std::unique_ptr<MCAsmBackend>(MAB), 409 MAB->createObjectWriter(*OS), std::unique_ptr<MCCodeEmitter>(CE), *STI, 410 MCOptions.MCRelaxAll, MCOptions.MCIncrementalLinkerCompatible, 411 /*DWARFMustBeAtTheEnd*/ false)); 412 } else { 413 llvm_unreachable("Invalid file type!"); 414 } 415 416 if (TheTriple.isOSBinFormatCOFF()) { 417 // Emit an absolute @feat.00 symbol. This is a features bitfield read by 418 // link.exe. 419 int64_t Feat00Flags = 0x2; 420 if (SafeSEH) { 421 // According to the PE-COFF spec, the LSB of this value marks the object 422 // for "registered SEH". This means that all SEH handler entry points 423 // must be registered in .sxdata. Use of any unregistered handlers will 424 // cause the process to terminate immediately. 425 Feat00Flags |= 0x1; 426 } 427 MCSymbol *Feat00Sym = Ctx.getOrCreateSymbol("@feat.00"); 428 Feat00Sym->setRedefinable(true); 429 Str->emitSymbolAttribute(Feat00Sym, MCSA_Global); 430 Str->emitAssignment(Feat00Sym, MCConstantExpr::create(Feat00Flags, Ctx)); 431 } 432 433 // Use Assembler information for parsing. 434 Str->setUseAssemblerInfoForParsing(true); 435 436 int Res = 1; 437 if (InputArgs.hasArg(OPT_as_lex)) { 438 // -as-lex; Lex only, and output a stream of tokens 439 Res = AsLexInput(SrcMgr, *MAI, Out->os()); 440 } else { 441 Res = AssembleInput(ProgName, TheTarget, SrcMgr, Ctx, *Str, *MAI, *STI, 442 *MCII, MCOptions, InputArgs); 443 } 444 445 // Keep output if no errors. 446 if (Res == 0) 447 Out->keep(); 448 return Res; 449 } 450