123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383 |
- //===- unittests/Lex/LexerTest.cpp ------ Lexer tests ---------------------===//
- //
- // The LLVM Compiler Infrastructure
- //
- // This file is distributed under the University of Illinois Open Source
- // License. See LICENSE.TXT for details.
- //
- //===----------------------------------------------------------------------===//
- #include "clang/Lex/Lexer.h"
- #include "clang/Basic/Diagnostic.h"
- #include "clang/Basic/DiagnosticOptions.h"
- #include "clang/Basic/FileManager.h"
- #include "clang/Basic/LangOptions.h"
- #include "clang/Basic/SourceManager.h"
- #include "clang/Basic/TargetInfo.h"
- #include "clang/Basic/TargetOptions.h"
- #include "clang/Lex/HeaderSearch.h"
- #include "clang/Lex/HeaderSearchOptions.h"
- #include "clang/Lex/ModuleLoader.h"
- #include "clang/Lex/Preprocessor.h"
- #include "clang/Lex/PreprocessorOptions.h"
- #include "gtest/gtest.h"
- using namespace clang;
- namespace {
- class VoidModuleLoader : public ModuleLoader {
- ModuleLoadResult loadModule(SourceLocation ImportLoc,
- ModuleIdPath Path,
- Module::NameVisibilityKind Visibility,
- bool IsInclusionDirective) override {
- return ModuleLoadResult();
- }
- void makeModuleVisible(Module *Mod,
- Module::NameVisibilityKind Visibility,
- SourceLocation ImportLoc) override { }
- GlobalModuleIndex *loadGlobalModuleIndex(SourceLocation TriggerLoc) override
- { return nullptr; }
- bool lookupMissingImports(StringRef Name, SourceLocation TriggerLoc) override
- { return 0; }
- };
- // The test fixture.
- class LexerTest : public ::testing::Test {
- protected:
- LexerTest()
- : FileMgr(FileMgrOpts),
- DiagID(new DiagnosticIDs()),
- Diags(DiagID, new DiagnosticOptions, new IgnoringDiagConsumer()),
- SourceMgr(Diags, FileMgr),
- TargetOpts(new TargetOptions)
- {
- TargetOpts->Triple = "x86_64-apple-darwin11.1.0";
- Target = TargetInfo::CreateTargetInfo(Diags, TargetOpts);
- }
- std::vector<Token> Lex(StringRef Source) {
- std::unique_ptr<llvm::MemoryBuffer> Buf =
- llvm::MemoryBuffer::getMemBuffer(Source);
- SourceMgr.setMainFileID(SourceMgr.createFileID(std::move(Buf)));
- VoidModuleLoader ModLoader;
- HeaderSearch HeaderInfo(std::make_shared<HeaderSearchOptions>(), SourceMgr,
- Diags, LangOpts, Target.get());
- Preprocessor PP(std::make_shared<PreprocessorOptions>(), Diags, LangOpts,
- SourceMgr, HeaderInfo, ModLoader, /*IILookup =*/nullptr,
- /*OwnsHeaderSearch =*/false);
- PP.Initialize(*Target);
- PP.EnterMainSourceFile();
- std::vector<Token> toks;
- while (1) {
- Token tok;
- PP.Lex(tok);
- if (tok.is(tok::eof))
- break;
- toks.push_back(tok);
- }
- return toks;
- }
- std::vector<Token> CheckLex(StringRef Source,
- ArrayRef<tok::TokenKind> ExpectedTokens) {
- auto toks = Lex(Source);
- EXPECT_EQ(ExpectedTokens.size(), toks.size());
- for (unsigned i = 0, e = ExpectedTokens.size(); i != e; ++i) {
- EXPECT_EQ(ExpectedTokens[i], toks[i].getKind());
- }
- return toks;
- }
- std::string getSourceText(Token Begin, Token End) {
- bool Invalid;
- StringRef Str =
- Lexer::getSourceText(CharSourceRange::getTokenRange(SourceRange(
- Begin.getLocation(), End.getLocation())),
- SourceMgr, LangOpts, &Invalid);
- if (Invalid)
- return "<INVALID>";
- return Str;
- }
- FileSystemOptions FileMgrOpts;
- FileManager FileMgr;
- IntrusiveRefCntPtr<DiagnosticIDs> DiagID;
- DiagnosticsEngine Diags;
- SourceManager SourceMgr;
- LangOptions LangOpts;
- std::shared_ptr<TargetOptions> TargetOpts;
- IntrusiveRefCntPtr<TargetInfo> Target;
- };
- TEST_F(LexerTest, GetSourceTextExpandsToMaximumInMacroArgument) {
- std::vector<tok::TokenKind> ExpectedTokens;
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::l_paren);
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::r_paren);
- std::vector<Token> toks = CheckLex("#define M(x) x\n"
- "M(f(M(i)))",
- ExpectedTokens);
- EXPECT_EQ("M(i)", getSourceText(toks[2], toks[2]));
- }
- TEST_F(LexerTest, GetSourceTextExpandsToMaximumInMacroArgumentForEndOfMacro) {
- std::vector<tok::TokenKind> ExpectedTokens;
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::identifier);
- std::vector<Token> toks = CheckLex("#define M(x) x\n"
- "M(M(i) c)",
- ExpectedTokens);
- EXPECT_EQ("M(i)", getSourceText(toks[0], toks[0]));
- }
- TEST_F(LexerTest, GetSourceTextExpandsInMacroArgumentForBeginOfMacro) {
- std::vector<tok::TokenKind> ExpectedTokens;
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::identifier);
- std::vector<Token> toks = CheckLex("#define M(x) x\n"
- "M(c c M(i))",
- ExpectedTokens);
- EXPECT_EQ("c M(i)", getSourceText(toks[1], toks[2]));
- }
- TEST_F(LexerTest, GetSourceTextExpandsInMacroArgumentForEndOfMacro) {
- std::vector<tok::TokenKind> ExpectedTokens;
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::identifier);
- std::vector<Token> toks = CheckLex("#define M(x) x\n"
- "M(M(i) c c)",
- ExpectedTokens);
- EXPECT_EQ("M(i) c", getSourceText(toks[0], toks[1]));
- }
- TEST_F(LexerTest, GetSourceTextInSeparateFnMacros) {
- std::vector<tok::TokenKind> ExpectedTokens;
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::identifier);
- std::vector<Token> toks = CheckLex("#define M(x) x\n"
- "M(c M(i)) M(M(i) c)",
- ExpectedTokens);
- EXPECT_EQ("<INVALID>", getSourceText(toks[1], toks[2]));
- }
- TEST_F(LexerTest, GetSourceTextWorksAcrossTokenPastes) {
- std::vector<tok::TokenKind> ExpectedTokens;
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::l_paren);
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::r_paren);
- std::vector<Token> toks = CheckLex("#define M(x) x\n"
- "#define C(x) M(x##c)\n"
- "M(f(C(i)))",
- ExpectedTokens);
- EXPECT_EQ("C(i)", getSourceText(toks[2], toks[2]));
- }
- TEST_F(LexerTest, GetSourceTextExpandsAcrossMultipleMacroCalls) {
- std::vector<tok::TokenKind> ExpectedTokens;
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::l_paren);
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::r_paren);
- std::vector<Token> toks = CheckLex("#define M(x) x\n"
- "f(M(M(i)))",
- ExpectedTokens);
- EXPECT_EQ("M(M(i))", getSourceText(toks[2], toks[2]));
- }
- TEST_F(LexerTest, GetSourceTextInMiddleOfMacroArgument) {
- std::vector<tok::TokenKind> ExpectedTokens;
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::l_paren);
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::r_paren);
- std::vector<Token> toks = CheckLex("#define M(x) x\n"
- "M(f(i))",
- ExpectedTokens);
- EXPECT_EQ("i", getSourceText(toks[2], toks[2]));
- }
- TEST_F(LexerTest, GetSourceTextExpandsAroundDifferentMacroCalls) {
- std::vector<tok::TokenKind> ExpectedTokens;
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::l_paren);
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::r_paren);
- std::vector<Token> toks = CheckLex("#define M(x) x\n"
- "#define C(x) x\n"
- "f(C(M(i)))",
- ExpectedTokens);
- EXPECT_EQ("C(M(i))", getSourceText(toks[2], toks[2]));
- }
- TEST_F(LexerTest, GetSourceTextOnlyExpandsIfFirstTokenInMacro) {
- std::vector<tok::TokenKind> ExpectedTokens;
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::l_paren);
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::r_paren);
- std::vector<Token> toks = CheckLex("#define M(x) x\n"
- "#define C(x) c x\n"
- "f(C(M(i)))",
- ExpectedTokens);
- EXPECT_EQ("M(i)", getSourceText(toks[3], toks[3]));
- }
- TEST_F(LexerTest, GetSourceTextExpandsRecursively) {
- std::vector<tok::TokenKind> ExpectedTokens;
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::l_paren);
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::r_paren);
- std::vector<Token> toks = CheckLex("#define M(x) x\n"
- "#define C(x) c M(x)\n"
- "C(f(M(i)))",
- ExpectedTokens);
- EXPECT_EQ("M(i)", getSourceText(toks[3], toks[3]));
- }
- TEST_F(LexerTest, LexAPI) {
- std::vector<tok::TokenKind> ExpectedTokens;
- ExpectedTokens.push_back(tok::l_square);
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::r_square);
- ExpectedTokens.push_back(tok::l_square);
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::r_square);
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::identifier);
- ExpectedTokens.push_back(tok::identifier);
- std::vector<Token> toks = CheckLex("#define M(x) [x]\n"
- "#define N(x) x\n"
- "#define INN(x) x\n"
- "#define NOF1 INN(val)\n"
- "#define NOF2 val\n"
- "M(foo) N([bar])\n"
- "N(INN(val)) N(NOF1) N(NOF2) N(val)",
- ExpectedTokens);
- SourceLocation lsqrLoc = toks[0].getLocation();
- SourceLocation idLoc = toks[1].getLocation();
- SourceLocation rsqrLoc = toks[2].getLocation();
- std::pair<SourceLocation,SourceLocation>
- macroPair = SourceMgr.getExpansionRange(lsqrLoc);
- SourceRange macroRange = SourceRange(macroPair.first, macroPair.second);
- SourceLocation Loc;
- EXPECT_TRUE(Lexer::isAtStartOfMacroExpansion(lsqrLoc, SourceMgr, LangOpts, &Loc));
- EXPECT_EQ(Loc, macroRange.getBegin());
- EXPECT_FALSE(Lexer::isAtStartOfMacroExpansion(idLoc, SourceMgr, LangOpts));
- EXPECT_FALSE(Lexer::isAtEndOfMacroExpansion(idLoc, SourceMgr, LangOpts));
- EXPECT_TRUE(Lexer::isAtEndOfMacroExpansion(rsqrLoc, SourceMgr, LangOpts, &Loc));
- EXPECT_EQ(Loc, macroRange.getEnd());
- CharSourceRange range = Lexer::makeFileCharRange(
- CharSourceRange::getTokenRange(lsqrLoc, idLoc), SourceMgr, LangOpts);
- EXPECT_TRUE(range.isInvalid());
- range = Lexer::makeFileCharRange(CharSourceRange::getTokenRange(idLoc, rsqrLoc),
- SourceMgr, LangOpts);
- EXPECT_TRUE(range.isInvalid());
- range = Lexer::makeFileCharRange(CharSourceRange::getTokenRange(lsqrLoc, rsqrLoc),
- SourceMgr, LangOpts);
- EXPECT_TRUE(!range.isTokenRange());
- EXPECT_EQ(range.getAsRange(),
- SourceRange(macroRange.getBegin(),
- macroRange.getEnd().getLocWithOffset(1)));
- StringRef text = Lexer::getSourceText(
- CharSourceRange::getTokenRange(lsqrLoc, rsqrLoc),
- SourceMgr, LangOpts);
- EXPECT_EQ(text, "M(foo)");
- SourceLocation macroLsqrLoc = toks[3].getLocation();
- SourceLocation macroIdLoc = toks[4].getLocation();
- SourceLocation macroRsqrLoc = toks[5].getLocation();
- SourceLocation fileLsqrLoc = SourceMgr.getSpellingLoc(macroLsqrLoc);
- SourceLocation fileIdLoc = SourceMgr.getSpellingLoc(macroIdLoc);
- SourceLocation fileRsqrLoc = SourceMgr.getSpellingLoc(macroRsqrLoc);
- range = Lexer::makeFileCharRange(
- CharSourceRange::getTokenRange(macroLsqrLoc, macroIdLoc),
- SourceMgr, LangOpts);
- EXPECT_EQ(SourceRange(fileLsqrLoc, fileIdLoc.getLocWithOffset(3)),
- range.getAsRange());
- range = Lexer::makeFileCharRange(CharSourceRange::getTokenRange(macroIdLoc, macroRsqrLoc),
- SourceMgr, LangOpts);
- EXPECT_EQ(SourceRange(fileIdLoc, fileRsqrLoc.getLocWithOffset(1)),
- range.getAsRange());
- macroPair = SourceMgr.getExpansionRange(macroLsqrLoc);
- range = Lexer::makeFileCharRange(
- CharSourceRange::getTokenRange(macroLsqrLoc, macroRsqrLoc),
- SourceMgr, LangOpts);
- EXPECT_EQ(SourceRange(macroPair.first, macroPair.second.getLocWithOffset(1)),
- range.getAsRange());
- text = Lexer::getSourceText(
- CharSourceRange::getTokenRange(SourceRange(macroLsqrLoc, macroIdLoc)),
- SourceMgr, LangOpts);
- EXPECT_EQ(text, "[bar");
- SourceLocation idLoc1 = toks[6].getLocation();
- SourceLocation idLoc2 = toks[7].getLocation();
- SourceLocation idLoc3 = toks[8].getLocation();
- SourceLocation idLoc4 = toks[9].getLocation();
- EXPECT_EQ("INN", Lexer::getImmediateMacroName(idLoc1, SourceMgr, LangOpts));
- EXPECT_EQ("INN", Lexer::getImmediateMacroName(idLoc2, SourceMgr, LangOpts));
- EXPECT_EQ("NOF2", Lexer::getImmediateMacroName(idLoc3, SourceMgr, LangOpts));
- EXPECT_EQ("N", Lexer::getImmediateMacroName(idLoc4, SourceMgr, LangOpts));
- }
- TEST_F(LexerTest, DontMergeMacroArgsFromDifferentMacroFiles) {
- std::vector<Token> toks =
- Lex("#define helper1 0\n"
- "void helper2(const char *, ...);\n"
- "#define M1(a, ...) helper2(a, ##__VA_ARGS__)\n"
- "#define M2(a, ...) M1(a, helper1, ##__VA_ARGS__)\n"
- "void f1() { M2(\"a\", \"b\"); }");
- // Check the file corresponding to the "helper1" macro arg in M2.
- //
- // The lexer used to report its size as 31, meaning that the end of the
- // expansion would be on the *next line* (just past `M2("a", "b")`). Make
- // sure that we get the correct end location (the comma after "helper1").
- SourceLocation helper1ArgLoc = toks[20].getLocation();
- EXPECT_EQ(SourceMgr.getFileIDSize(SourceMgr.getFileID(helper1ArgLoc)), 8U);
- }
- } // anonymous namespace
|