10b57cec5SDimitry Andric //===--- COFFModuleDefinition.cpp - Simple DEF parser ---------------------===// 20b57cec5SDimitry Andric // 30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information. 50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 60b57cec5SDimitry Andric // 70b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 80b57cec5SDimitry Andric // 90b57cec5SDimitry Andric // Windows-specific. 100b57cec5SDimitry Andric // A parser for the module-definition file (.def file). 110b57cec5SDimitry Andric // 120b57cec5SDimitry Andric // The format of module-definition files are described in this document: 130b57cec5SDimitry Andric // https://msdn.microsoft.com/en-us/library/28d6s79h.aspx 140b57cec5SDimitry Andric // 150b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 160b57cec5SDimitry Andric 170b57cec5SDimitry Andric #include "llvm/Object/COFFModuleDefinition.h" 180b57cec5SDimitry Andric #include "llvm/ADT/StringRef.h" 190b57cec5SDimitry Andric #include "llvm/ADT/StringSwitch.h" 200b57cec5SDimitry Andric #include "llvm/Object/COFFImportFile.h" 210b57cec5SDimitry Andric #include "llvm/Object/Error.h" 220b57cec5SDimitry Andric #include "llvm/Support/Error.h" 230b57cec5SDimitry Andric #include "llvm/Support/Path.h" 240b57cec5SDimitry Andric 250b57cec5SDimitry Andric using namespace llvm::COFF; 260b57cec5SDimitry Andric using namespace llvm; 270b57cec5SDimitry Andric 280b57cec5SDimitry Andric namespace llvm { 290b57cec5SDimitry Andric namespace object { 300b57cec5SDimitry Andric 310b57cec5SDimitry Andric enum Kind { 320b57cec5SDimitry Andric Unknown, 330b57cec5SDimitry Andric Eof, 340b57cec5SDimitry Andric Identifier, 350b57cec5SDimitry Andric Comma, 360b57cec5SDimitry Andric Equal, 370b57cec5SDimitry Andric EqualEqual, 380b57cec5SDimitry Andric KwBase, 390b57cec5SDimitry Andric KwConstant, 400b57cec5SDimitry Andric KwData, 410b57cec5SDimitry Andric KwExports, 42*0fca6ea1SDimitry Andric KwExportAs, 430b57cec5SDimitry Andric KwHeapsize, 440b57cec5SDimitry Andric KwLibrary, 450b57cec5SDimitry Andric KwName, 460b57cec5SDimitry Andric KwNoname, 470b57cec5SDimitry Andric KwPrivate, 480b57cec5SDimitry Andric KwStacksize, 490b57cec5SDimitry Andric KwVersion, 500b57cec5SDimitry Andric }; 510b57cec5SDimitry Andric 520b57cec5SDimitry Andric struct Token { 530b57cec5SDimitry Andric explicit Token(Kind T = Unknown, StringRef S = "") : K(T), Value(S) {} 540b57cec5SDimitry Andric Kind K; 550b57cec5SDimitry Andric StringRef Value; 560b57cec5SDimitry Andric }; 570b57cec5SDimitry Andric 580b57cec5SDimitry Andric static bool isDecorated(StringRef Sym, bool MingwDef) { 590b57cec5SDimitry Andric // In def files, the symbols can either be listed decorated or undecorated. 600b57cec5SDimitry Andric // 610b57cec5SDimitry Andric // - For cdecl symbols, only the undecorated form is allowed. 620b57cec5SDimitry Andric // - For fastcall and vectorcall symbols, both fully decorated or 630b57cec5SDimitry Andric // undecorated forms can be present. 640b57cec5SDimitry Andric // - For stdcall symbols in non-MinGW environments, the decorated form is 650b57cec5SDimitry Andric // fully decorated with leading underscore and trailing stack argument 660b57cec5SDimitry Andric // size - like "_Func@0". 670b57cec5SDimitry Andric // - In MinGW def files, a decorated stdcall symbol does not include the 680b57cec5SDimitry Andric // leading underscore though, like "Func@0". 690b57cec5SDimitry Andric 700b57cec5SDimitry Andric // This function controls whether a leading underscore should be added to 710b57cec5SDimitry Andric // the given symbol name or not. For MinGW, treat a stdcall symbol name such 720b57cec5SDimitry Andric // as "Func@0" as undecorated, i.e. a leading underscore must be added. 730b57cec5SDimitry Andric // For non-MinGW, look for '@' in the whole string and consider "_Func@0" 740b57cec5SDimitry Andric // as decorated, i.e. don't add any more leading underscores. 750b57cec5SDimitry Andric // We can't check for a leading underscore here, since function names 760b57cec5SDimitry Andric // themselves can start with an underscore, while a second one still needs 770b57cec5SDimitry Andric // to be added. 785f757f3fSDimitry Andric return Sym.starts_with("@") || Sym.contains("@@") || Sym.starts_with("?") || 790b57cec5SDimitry Andric (!MingwDef && Sym.contains('@')); 800b57cec5SDimitry Andric } 810b57cec5SDimitry Andric 820b57cec5SDimitry Andric class Lexer { 830b57cec5SDimitry Andric public: 840b57cec5SDimitry Andric Lexer(StringRef S) : Buf(S) {} 850b57cec5SDimitry Andric 860b57cec5SDimitry Andric Token lex() { 870b57cec5SDimitry Andric Buf = Buf.trim(); 880b57cec5SDimitry Andric if (Buf.empty()) 890b57cec5SDimitry Andric return Token(Eof); 900b57cec5SDimitry Andric 910b57cec5SDimitry Andric switch (Buf[0]) { 920b57cec5SDimitry Andric case '\0': 930b57cec5SDimitry Andric return Token(Eof); 940b57cec5SDimitry Andric case ';': { 950b57cec5SDimitry Andric size_t End = Buf.find('\n'); 960b57cec5SDimitry Andric Buf = (End == Buf.npos) ? "" : Buf.drop_front(End); 970b57cec5SDimitry Andric return lex(); 980b57cec5SDimitry Andric } 990b57cec5SDimitry Andric case '=': 1000b57cec5SDimitry Andric Buf = Buf.drop_front(); 101*0fca6ea1SDimitry Andric if (Buf.consume_front("=")) 1020b57cec5SDimitry Andric return Token(EqualEqual, "=="); 1030b57cec5SDimitry Andric return Token(Equal, "="); 1040b57cec5SDimitry Andric case ',': 1050b57cec5SDimitry Andric Buf = Buf.drop_front(); 1060b57cec5SDimitry Andric return Token(Comma, ","); 1070b57cec5SDimitry Andric case '"': { 1080b57cec5SDimitry Andric StringRef S; 1090b57cec5SDimitry Andric std::tie(S, Buf) = Buf.substr(1).split('"'); 1100b57cec5SDimitry Andric return Token(Identifier, S); 1110b57cec5SDimitry Andric } 1120b57cec5SDimitry Andric default: { 1130b57cec5SDimitry Andric size_t End = Buf.find_first_of("=,;\r\n \t\v"); 1140b57cec5SDimitry Andric StringRef Word = Buf.substr(0, End); 1150b57cec5SDimitry Andric Kind K = llvm::StringSwitch<Kind>(Word) 1160b57cec5SDimitry Andric .Case("BASE", KwBase) 1170b57cec5SDimitry Andric .Case("CONSTANT", KwConstant) 1180b57cec5SDimitry Andric .Case("DATA", KwData) 1190b57cec5SDimitry Andric .Case("EXPORTS", KwExports) 120*0fca6ea1SDimitry Andric .Case("EXPORTAS", KwExportAs) 1210b57cec5SDimitry Andric .Case("HEAPSIZE", KwHeapsize) 1220b57cec5SDimitry Andric .Case("LIBRARY", KwLibrary) 1230b57cec5SDimitry Andric .Case("NAME", KwName) 1240b57cec5SDimitry Andric .Case("NONAME", KwNoname) 1250b57cec5SDimitry Andric .Case("PRIVATE", KwPrivate) 1260b57cec5SDimitry Andric .Case("STACKSIZE", KwStacksize) 1270b57cec5SDimitry Andric .Case("VERSION", KwVersion) 1280b57cec5SDimitry Andric .Default(Identifier); 1290b57cec5SDimitry Andric Buf = (End == Buf.npos) ? "" : Buf.drop_front(End); 1300b57cec5SDimitry Andric return Token(K, Word); 1310b57cec5SDimitry Andric } 1320b57cec5SDimitry Andric } 1330b57cec5SDimitry Andric } 1340b57cec5SDimitry Andric 1350b57cec5SDimitry Andric private: 1360b57cec5SDimitry Andric StringRef Buf; 1370b57cec5SDimitry Andric }; 1380b57cec5SDimitry Andric 1390b57cec5SDimitry Andric class Parser { 1400b57cec5SDimitry Andric public: 14106c3fb27SDimitry Andric explicit Parser(StringRef S, MachineTypes M, bool B, bool AU) 14206c3fb27SDimitry Andric : Lex(S), Machine(M), MingwDef(B), AddUnderscores(AU) { 14306c3fb27SDimitry Andric if (Machine != IMAGE_FILE_MACHINE_I386) 14406c3fb27SDimitry Andric AddUnderscores = false; 14506c3fb27SDimitry Andric } 1460b57cec5SDimitry Andric 1470b57cec5SDimitry Andric Expected<COFFModuleDefinition> parse() { 1480b57cec5SDimitry Andric do { 1490b57cec5SDimitry Andric if (Error Err = parseOne()) 1500b57cec5SDimitry Andric return std::move(Err); 1510b57cec5SDimitry Andric } while (Tok.K != Eof); 1520b57cec5SDimitry Andric return Info; 1530b57cec5SDimitry Andric } 1540b57cec5SDimitry Andric 1550b57cec5SDimitry Andric private: 1560b57cec5SDimitry Andric void read() { 1570b57cec5SDimitry Andric if (Stack.empty()) { 1580b57cec5SDimitry Andric Tok = Lex.lex(); 1590b57cec5SDimitry Andric return; 1600b57cec5SDimitry Andric } 1610b57cec5SDimitry Andric Tok = Stack.back(); 1620b57cec5SDimitry Andric Stack.pop_back(); 1630b57cec5SDimitry Andric } 1640b57cec5SDimitry Andric 1650b57cec5SDimitry Andric Error readAsInt(uint64_t *I) { 1660b57cec5SDimitry Andric read(); 1670b57cec5SDimitry Andric if (Tok.K != Identifier || Tok.Value.getAsInteger(10, *I)) 1680b57cec5SDimitry Andric return createError("integer expected"); 1690b57cec5SDimitry Andric return Error::success(); 1700b57cec5SDimitry Andric } 1710b57cec5SDimitry Andric 1720b57cec5SDimitry Andric Error expect(Kind Expected, StringRef Msg) { 1730b57cec5SDimitry Andric read(); 1740b57cec5SDimitry Andric if (Tok.K != Expected) 1750b57cec5SDimitry Andric return createError(Msg); 1760b57cec5SDimitry Andric return Error::success(); 1770b57cec5SDimitry Andric } 1780b57cec5SDimitry Andric 1790b57cec5SDimitry Andric void unget() { Stack.push_back(Tok); } 1800b57cec5SDimitry Andric 1810b57cec5SDimitry Andric Error parseOne() { 1820b57cec5SDimitry Andric read(); 1830b57cec5SDimitry Andric switch (Tok.K) { 1840b57cec5SDimitry Andric case Eof: 1850b57cec5SDimitry Andric return Error::success(); 1860b57cec5SDimitry Andric case KwExports: 1870b57cec5SDimitry Andric for (;;) { 1880b57cec5SDimitry Andric read(); 1890b57cec5SDimitry Andric if (Tok.K != Identifier) { 1900b57cec5SDimitry Andric unget(); 1910b57cec5SDimitry Andric return Error::success(); 1920b57cec5SDimitry Andric } 1930b57cec5SDimitry Andric if (Error Err = parseExport()) 1940b57cec5SDimitry Andric return Err; 1950b57cec5SDimitry Andric } 1960b57cec5SDimitry Andric case KwHeapsize: 1970b57cec5SDimitry Andric return parseNumbers(&Info.HeapReserve, &Info.HeapCommit); 1980b57cec5SDimitry Andric case KwStacksize: 1990b57cec5SDimitry Andric return parseNumbers(&Info.StackReserve, &Info.StackCommit); 2000b57cec5SDimitry Andric case KwLibrary: 2010b57cec5SDimitry Andric case KwName: { 2020b57cec5SDimitry Andric bool IsDll = Tok.K == KwLibrary; // Check before parseName. 2030b57cec5SDimitry Andric std::string Name; 2040b57cec5SDimitry Andric if (Error Err = parseName(&Name, &Info.ImageBase)) 2050b57cec5SDimitry Andric return Err; 2060b57cec5SDimitry Andric 2070b57cec5SDimitry Andric Info.ImportName = Name; 2080b57cec5SDimitry Andric 2090b57cec5SDimitry Andric // Set the output file, but don't override /out if it was already passed. 2100b57cec5SDimitry Andric if (Info.OutputFile.empty()) { 2110b57cec5SDimitry Andric Info.OutputFile = Name; 2120b57cec5SDimitry Andric // Append the appropriate file extension if not already present. 2130b57cec5SDimitry Andric if (!sys::path::has_extension(Name)) 2140b57cec5SDimitry Andric Info.OutputFile += IsDll ? ".dll" : ".exe"; 2150b57cec5SDimitry Andric } 2160b57cec5SDimitry Andric 2170b57cec5SDimitry Andric return Error::success(); 2180b57cec5SDimitry Andric } 2190b57cec5SDimitry Andric case KwVersion: 2200b57cec5SDimitry Andric return parseVersion(&Info.MajorImageVersion, &Info.MinorImageVersion); 2210b57cec5SDimitry Andric default: 2220b57cec5SDimitry Andric return createError("unknown directive: " + Tok.Value); 2230b57cec5SDimitry Andric } 2240b57cec5SDimitry Andric } 2250b57cec5SDimitry Andric 2260b57cec5SDimitry Andric Error parseExport() { 2270b57cec5SDimitry Andric COFFShortExport E; 2285ffd83dbSDimitry Andric E.Name = std::string(Tok.Value); 2290b57cec5SDimitry Andric read(); 2300b57cec5SDimitry Andric if (Tok.K == Equal) { 2310b57cec5SDimitry Andric read(); 2320b57cec5SDimitry Andric if (Tok.K != Identifier) 2330b57cec5SDimitry Andric return createError("identifier expected, but got " + Tok.Value); 2340b57cec5SDimitry Andric E.ExtName = E.Name; 2355ffd83dbSDimitry Andric E.Name = std::string(Tok.Value); 2360b57cec5SDimitry Andric } else { 2370b57cec5SDimitry Andric unget(); 2380b57cec5SDimitry Andric } 2390b57cec5SDimitry Andric 24006c3fb27SDimitry Andric if (AddUnderscores) { 2410b57cec5SDimitry Andric if (!isDecorated(E.Name, MingwDef)) 2420b57cec5SDimitry Andric E.Name = (std::string("_").append(E.Name)); 2430b57cec5SDimitry Andric if (!E.ExtName.empty() && !isDecorated(E.ExtName, MingwDef)) 2440b57cec5SDimitry Andric E.ExtName = (std::string("_").append(E.ExtName)); 2450b57cec5SDimitry Andric } 2460b57cec5SDimitry Andric 2470b57cec5SDimitry Andric for (;;) { 2480b57cec5SDimitry Andric read(); 2490b57cec5SDimitry Andric if (Tok.K == Identifier && Tok.Value[0] == '@') { 2500b57cec5SDimitry Andric if (Tok.Value == "@") { 2510b57cec5SDimitry Andric // "foo @ 10" 2520b57cec5SDimitry Andric read(); 2530b57cec5SDimitry Andric Tok.Value.getAsInteger(10, E.Ordinal); 2540b57cec5SDimitry Andric } else if (Tok.Value.drop_front().getAsInteger(10, E.Ordinal)) { 2550b57cec5SDimitry Andric // "foo \n @bar" - Not an ordinal modifier at all, but the next 2560b57cec5SDimitry Andric // export (fastcall decorated) - complete the current one. 2570b57cec5SDimitry Andric unget(); 2580b57cec5SDimitry Andric Info.Exports.push_back(E); 2590b57cec5SDimitry Andric return Error::success(); 2600b57cec5SDimitry Andric } 2610b57cec5SDimitry Andric // "foo @10" 2620b57cec5SDimitry Andric read(); 2630b57cec5SDimitry Andric if (Tok.K == KwNoname) { 2640b57cec5SDimitry Andric E.Noname = true; 2650b57cec5SDimitry Andric } else { 2660b57cec5SDimitry Andric unget(); 2670b57cec5SDimitry Andric } 2680b57cec5SDimitry Andric continue; 2690b57cec5SDimitry Andric } 2700b57cec5SDimitry Andric if (Tok.K == KwData) { 2710b57cec5SDimitry Andric E.Data = true; 2720b57cec5SDimitry Andric continue; 2730b57cec5SDimitry Andric } 2740b57cec5SDimitry Andric if (Tok.K == KwConstant) { 2750b57cec5SDimitry Andric E.Constant = true; 2760b57cec5SDimitry Andric continue; 2770b57cec5SDimitry Andric } 2780b57cec5SDimitry Andric if (Tok.K == KwPrivate) { 2790b57cec5SDimitry Andric E.Private = true; 2800b57cec5SDimitry Andric continue; 2810b57cec5SDimitry Andric } 2820b57cec5SDimitry Andric if (Tok.K == EqualEqual) { 2830b57cec5SDimitry Andric read(); 284*0fca6ea1SDimitry Andric E.ImportName = std::string(Tok.Value); 2850b57cec5SDimitry Andric continue; 2860b57cec5SDimitry Andric } 287*0fca6ea1SDimitry Andric // EXPORTAS must be at the end of export definition 288*0fca6ea1SDimitry Andric if (Tok.K == KwExportAs) { 289*0fca6ea1SDimitry Andric read(); 290*0fca6ea1SDimitry Andric if (Tok.K == Eof) 291*0fca6ea1SDimitry Andric return createError( 292*0fca6ea1SDimitry Andric "unexpected end of file, EXPORTAS identifier expected"); 293*0fca6ea1SDimitry Andric E.ExportAs = std::string(Tok.Value); 294*0fca6ea1SDimitry Andric } else { 2950b57cec5SDimitry Andric unget(); 296*0fca6ea1SDimitry Andric } 2970b57cec5SDimitry Andric Info.Exports.push_back(E); 2980b57cec5SDimitry Andric return Error::success(); 2990b57cec5SDimitry Andric } 3000b57cec5SDimitry Andric } 3010b57cec5SDimitry Andric 3020b57cec5SDimitry Andric // HEAPSIZE/STACKSIZE reserve[,commit] 3030b57cec5SDimitry Andric Error parseNumbers(uint64_t *Reserve, uint64_t *Commit) { 3040b57cec5SDimitry Andric if (Error Err = readAsInt(Reserve)) 3050b57cec5SDimitry Andric return Err; 3060b57cec5SDimitry Andric read(); 3070b57cec5SDimitry Andric if (Tok.K != Comma) { 3080b57cec5SDimitry Andric unget(); 3090b57cec5SDimitry Andric Commit = nullptr; 3100b57cec5SDimitry Andric return Error::success(); 3110b57cec5SDimitry Andric } 3120b57cec5SDimitry Andric if (Error Err = readAsInt(Commit)) 3130b57cec5SDimitry Andric return Err; 3140b57cec5SDimitry Andric return Error::success(); 3150b57cec5SDimitry Andric } 3160b57cec5SDimitry Andric 3170b57cec5SDimitry Andric // NAME outputPath [BASE=address] 3180b57cec5SDimitry Andric Error parseName(std::string *Out, uint64_t *Baseaddr) { 3190b57cec5SDimitry Andric read(); 3200b57cec5SDimitry Andric if (Tok.K == Identifier) { 3215ffd83dbSDimitry Andric *Out = std::string(Tok.Value); 3220b57cec5SDimitry Andric } else { 3230b57cec5SDimitry Andric *Out = ""; 3240b57cec5SDimitry Andric unget(); 3250b57cec5SDimitry Andric return Error::success(); 3260b57cec5SDimitry Andric } 3270b57cec5SDimitry Andric read(); 3280b57cec5SDimitry Andric if (Tok.K == KwBase) { 3290b57cec5SDimitry Andric if (Error Err = expect(Equal, "'=' expected")) 3300b57cec5SDimitry Andric return Err; 3310b57cec5SDimitry Andric if (Error Err = readAsInt(Baseaddr)) 3320b57cec5SDimitry Andric return Err; 3330b57cec5SDimitry Andric } else { 3340b57cec5SDimitry Andric unget(); 3350b57cec5SDimitry Andric *Baseaddr = 0; 3360b57cec5SDimitry Andric } 3370b57cec5SDimitry Andric return Error::success(); 3380b57cec5SDimitry Andric } 3390b57cec5SDimitry Andric 3400b57cec5SDimitry Andric // VERSION major[.minor] 3410b57cec5SDimitry Andric Error parseVersion(uint32_t *Major, uint32_t *Minor) { 3420b57cec5SDimitry Andric read(); 3430b57cec5SDimitry Andric if (Tok.K != Identifier) 3440b57cec5SDimitry Andric return createError("identifier expected, but got " + Tok.Value); 3450b57cec5SDimitry Andric StringRef V1, V2; 3460b57cec5SDimitry Andric std::tie(V1, V2) = Tok.Value.split('.'); 3470b57cec5SDimitry Andric if (V1.getAsInteger(10, *Major)) 3480b57cec5SDimitry Andric return createError("integer expected, but got " + Tok.Value); 3490b57cec5SDimitry Andric if (V2.empty()) 3500b57cec5SDimitry Andric *Minor = 0; 3510b57cec5SDimitry Andric else if (V2.getAsInteger(10, *Minor)) 3520b57cec5SDimitry Andric return createError("integer expected, but got " + Tok.Value); 3530b57cec5SDimitry Andric return Error::success(); 3540b57cec5SDimitry Andric } 3550b57cec5SDimitry Andric 3560b57cec5SDimitry Andric Lexer Lex; 3570b57cec5SDimitry Andric Token Tok; 3580b57cec5SDimitry Andric std::vector<Token> Stack; 3590b57cec5SDimitry Andric MachineTypes Machine; 3600b57cec5SDimitry Andric COFFModuleDefinition Info; 3610b57cec5SDimitry Andric bool MingwDef; 36206c3fb27SDimitry Andric bool AddUnderscores; 3630b57cec5SDimitry Andric }; 3640b57cec5SDimitry Andric 3650b57cec5SDimitry Andric Expected<COFFModuleDefinition> parseCOFFModuleDefinition(MemoryBufferRef MB, 3660b57cec5SDimitry Andric MachineTypes Machine, 36706c3fb27SDimitry Andric bool MingwDef, 36806c3fb27SDimitry Andric bool AddUnderscores) { 36906c3fb27SDimitry Andric return Parser(MB.getBuffer(), Machine, MingwDef, AddUnderscores).parse(); 3700b57cec5SDimitry Andric } 3710b57cec5SDimitry Andric 3720b57cec5SDimitry Andric } // namespace object 3730b57cec5SDimitry Andric } // namespace llvm 374