123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845 |
- //===- unittests/AST/CommentLexer.cpp ------ Comment lexer tests ----------===//
- //
- // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
- // See https://llvm.org/LICENSE.txt for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- //
- //===----------------------------------------------------------------------===//
- #include "clang/AST/CommentLexer.h"
- #include "clang/AST/CommentCommandTraits.h"
- #include "clang/Basic/CommentOptions.h"
- #include "clang/Basic/Diagnostic.h"
- #include "clang/Basic/DiagnosticOptions.h"
- #include "clang/Basic/FileManager.h"
- #include "clang/Basic/SourceManager.h"
- #include "llvm/ADT/STLExtras.h"
- #include "gtest/gtest.h"
- #include <vector>
- using namespace llvm;
- using namespace clang;
- namespace clang {
- namespace comments {
- namespace {
- class CommentLexerTest : public ::testing::Test {
- protected:
- CommentLexerTest()
- : FileMgr(FileMgrOpts),
- DiagID(new DiagnosticIDs()),
- Diags(DiagID, new DiagnosticOptions, new IgnoringDiagConsumer()),
- SourceMgr(Diags, FileMgr),
- Traits(Allocator, CommentOptions()) {
- }
- FileSystemOptions FileMgrOpts;
- FileManager FileMgr;
- IntrusiveRefCntPtr<DiagnosticIDs> DiagID;
- DiagnosticsEngine Diags;
- SourceManager SourceMgr;
- llvm::BumpPtrAllocator Allocator;
- CommandTraits Traits;
- void lexString(const char *Source, std::vector<Token> &Toks);
- StringRef getCommandName(const Token &Tok) {
- return Traits.getCommandInfo(Tok.getCommandID())->Name;
- }
- StringRef getVerbatimBlockName(const Token &Tok) {
- return Traits.getCommandInfo(Tok.getVerbatimBlockID())->Name;
- }
- StringRef getVerbatimLineName(const Token &Tok) {
- return Traits.getCommandInfo(Tok.getVerbatimLineID())->Name;
- }
- };
- void CommentLexerTest::lexString(const char *Source,
- std::vector<Token> &Toks) {
- std::unique_ptr<MemoryBuffer> Buf = MemoryBuffer::getMemBuffer(Source);
- FileID File = SourceMgr.createFileID(std::move(Buf));
- SourceLocation Begin = SourceMgr.getLocForStartOfFile(File);
- Lexer L(Allocator, Diags, Traits, Begin, Source, Source + strlen(Source));
- while (1) {
- Token Tok;
- L.lex(Tok);
- if (Tok.is(tok::eof))
- break;
- Toks.push_back(Tok);
- }
- }
- } // unnamed namespace
- // Empty source range should be handled.
- TEST_F(CommentLexerTest, Basic1) {
- const char *Source = "";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(0U, Toks.size());
- }
- // Empty comments should be handled.
- TEST_F(CommentLexerTest, Basic2) {
- const char *Sources[] = {
- "//", "///", "//!", "///<", "//!<"
- };
- for (size_t i = 0, e = array_lengthof(Sources); i != e; i++) {
- std::vector<Token> Toks;
- lexString(Sources[i], Toks);
- ASSERT_EQ(1U, Toks.size());
- ASSERT_EQ(tok::newline, Toks[0].getKind());
- }
- }
- // Empty comments should be handled.
- TEST_F(CommentLexerTest, Basic3) {
- const char *Sources[] = {
- "/**/", "/***/", "/*!*/", "/**<*/", "/*!<*/"
- };
- for (size_t i = 0, e = array_lengthof(Sources); i != e; i++) {
- std::vector<Token> Toks;
- lexString(Sources[i], Toks);
- ASSERT_EQ(2U, Toks.size());
- ASSERT_EQ(tok::newline, Toks[0].getKind());
- ASSERT_EQ(tok::newline, Toks[1].getKind());
- }
- }
- // Single comment with plain text.
- TEST_F(CommentLexerTest, Basic4) {
- const char *Sources[] = {
- "// Meow", "/// Meow", "//! Meow",
- "// Meow\n", "// Meow\r\n", "//! Meow\r",
- };
- for (size_t i = 0, e = array_lengthof(Sources); i != e; i++) {
- std::vector<Token> Toks;
- lexString(Sources[i], Toks);
- ASSERT_EQ(2U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" Meow"), Toks[0].getText());
- ASSERT_EQ(tok::newline, Toks[1].getKind());
- }
- }
- // Single comment with plain text.
- TEST_F(CommentLexerTest, Basic5) {
- const char *Sources[] = {
- "/* Meow*/", "/** Meow*/", "/*! Meow*/"
- };
- for (size_t i = 0, e = array_lengthof(Sources); i != e; i++) {
- std::vector<Token> Toks;
- lexString(Sources[i], Toks);
- ASSERT_EQ(3U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" Meow"), Toks[0].getText());
- ASSERT_EQ(tok::newline, Toks[1].getKind());
- ASSERT_EQ(tok::newline, Toks[2].getKind());
- }
- }
- // Test newline escaping.
- TEST_F(CommentLexerTest, Basic6) {
- const char *Sources[] = {
- "// Aaa\\\n" " Bbb\\ \n" " Ccc?" "?/\n",
- "// Aaa\\\r\n" " Bbb\\ \r\n" " Ccc?" "?/\r\n",
- "// Aaa\\\r" " Bbb\\ \r" " Ccc?" "?/\r"
- };
- for (size_t i = 0, e = array_lengthof(Sources); i != e; i++) {
- std::vector<Token> Toks;
- lexString(Sources[i], Toks);
- ASSERT_EQ(10U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" Aaa"), Toks[0].getText());
- ASSERT_EQ(tok::text, Toks[1].getKind());
- ASSERT_EQ(StringRef("\\"), Toks[1].getText());
- ASSERT_EQ(tok::newline, Toks[2].getKind());
- ASSERT_EQ(tok::text, Toks[3].getKind());
- ASSERT_EQ(StringRef(" Bbb"), Toks[3].getText());
- ASSERT_EQ(tok::text, Toks[4].getKind());
- ASSERT_EQ(StringRef("\\"), Toks[4].getText());
- ASSERT_EQ(tok::text, Toks[5].getKind());
- ASSERT_EQ(StringRef(" "), Toks[5].getText());
- ASSERT_EQ(tok::newline, Toks[6].getKind());
- ASSERT_EQ(tok::text, Toks[7].getKind());
- ASSERT_EQ(StringRef(" Ccc?" "?/"), Toks[7].getText());
- ASSERT_EQ(tok::newline, Toks[8].getKind());
- ASSERT_EQ(tok::newline, Toks[9].getKind());
- }
- }
- // Check that we skip C-style aligned stars correctly.
- TEST_F(CommentLexerTest, Basic7) {
- const char *Source =
- "/* Aaa\n"
- " * Bbb\r\n"
- "\t* Ccc\n"
- " ! Ddd\n"
- " * Eee\n"
- " ** Fff\n"
- " */";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(15U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" Aaa"), Toks[0].getText());
- ASSERT_EQ(tok::newline, Toks[1].getKind());
- ASSERT_EQ(tok::text, Toks[2].getKind());
- ASSERT_EQ(StringRef(" Bbb"), Toks[2].getText());
- ASSERT_EQ(tok::newline, Toks[3].getKind());
- ASSERT_EQ(tok::text, Toks[4].getKind());
- ASSERT_EQ(StringRef(" Ccc"), Toks[4].getText());
- ASSERT_EQ(tok::newline, Toks[5].getKind());
- ASSERT_EQ(tok::text, Toks[6].getKind());
- ASSERT_EQ(StringRef(" ! Ddd"), Toks[6].getText());
- ASSERT_EQ(tok::newline, Toks[7].getKind());
- ASSERT_EQ(tok::text, Toks[8].getKind());
- ASSERT_EQ(StringRef(" Eee"), Toks[8].getText());
- ASSERT_EQ(tok::newline, Toks[9].getKind());
- ASSERT_EQ(tok::text, Toks[10].getKind());
- ASSERT_EQ(StringRef("* Fff"), Toks[10].getText());
- ASSERT_EQ(tok::newline, Toks[11].getKind());
- ASSERT_EQ(tok::text, Toks[12].getKind());
- ASSERT_EQ(StringRef(" "), Toks[12].getText());
- ASSERT_EQ(tok::newline, Toks[13].getKind());
- ASSERT_EQ(tok::newline, Toks[14].getKind());
- }
- // A command marker followed by comment end.
- TEST_F(CommentLexerTest, DoxygenCommand1) {
- const char *Sources[] = { "//@", "///@", "//!@" };
- for (size_t i = 0, e = array_lengthof(Sources); i != e; i++) {
- std::vector<Token> Toks;
- lexString(Sources[i], Toks);
- ASSERT_EQ(2U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef("@"), Toks[0].getText());
- ASSERT_EQ(tok::newline, Toks[1].getKind());
- }
- }
- // A command marker followed by comment end.
- TEST_F(CommentLexerTest, DoxygenCommand2) {
- const char *Sources[] = { "/*@*/", "/**@*/", "/*!@*/"};
- for (size_t i = 0, e = array_lengthof(Sources); i != e; i++) {
- std::vector<Token> Toks;
- lexString(Sources[i], Toks);
- ASSERT_EQ(3U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef("@"), Toks[0].getText());
- ASSERT_EQ(tok::newline, Toks[1].getKind());
- ASSERT_EQ(tok::newline, Toks[2].getKind());
- }
- }
- // A command marker followed by comment end.
- TEST_F(CommentLexerTest, DoxygenCommand3) {
- const char *Sources[] = { "/*\\*/", "/**\\*/" };
- for (size_t i = 0, e = array_lengthof(Sources); i != e; i++) {
- std::vector<Token> Toks;
- lexString(Sources[i], Toks);
- ASSERT_EQ(3U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef("\\"), Toks[0].getText());
- ASSERT_EQ(tok::newline, Toks[1].getKind());
- ASSERT_EQ(tok::newline, Toks[2].getKind());
- }
- }
- // Doxygen escape sequences.
- TEST_F(CommentLexerTest, DoxygenCommand4) {
- const char *Sources[] = {
- "/// \\\\ \\@ \\& \\$ \\# \\< \\> \\% \\\" \\. \\::",
- "/// @\\ @@ @& @$ @# @< @> @% @\" @. @::"
- };
- const char *Text[] = {
- " ",
- "\\", " ", "@", " ", "&", " ", "$", " ", "#", " ",
- "<", " ", ">", " ", "%", " ", "\"", " ", ".", " ",
- "::", ""
- };
- for (size_t i = 0, e = array_lengthof(Sources); i != e; i++) {
- std::vector<Token> Toks;
- lexString(Sources[i], Toks);
- ASSERT_EQ(array_lengthof(Text), Toks.size());
- for (size_t j = 0, e = Toks.size(); j != e; j++) {
- if(Toks[j].is(tok::text)) {
- ASSERT_EQ(StringRef(Text[j]), Toks[j].getText())
- << "index " << i;
- }
- }
- }
- }
- // A command marker followed by a non-letter that is not a part of an escape
- // sequence.
- TEST_F(CommentLexerTest, DoxygenCommand5) {
- const char *Source = "/// \\^ \\0";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(6U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::text, Toks[1].getKind());
- ASSERT_EQ(StringRef("\\"), Toks[1].getText());
- ASSERT_EQ(tok::text, Toks[2].getKind());
- ASSERT_EQ(StringRef("^ "), Toks[2].getText());
- ASSERT_EQ(tok::text, Toks[3].getKind());
- ASSERT_EQ(StringRef("\\"), Toks[3].getText());
- ASSERT_EQ(tok::text, Toks[4].getKind());
- ASSERT_EQ(StringRef("0"), Toks[4].getText());
- ASSERT_EQ(tok::newline, Toks[5].getKind());
- }
- TEST_F(CommentLexerTest, DoxygenCommand6) {
- const char *Source = "/// \\brief Aaa.";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(4U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::backslash_command, Toks[1].getKind());
- ASSERT_EQ(StringRef("brief"), getCommandName(Toks[1]));
- ASSERT_EQ(tok::text, Toks[2].getKind());
- ASSERT_EQ(StringRef(" Aaa."), Toks[2].getText());
- ASSERT_EQ(tok::newline, Toks[3].getKind());
- }
- TEST_F(CommentLexerTest, DoxygenCommand7) {
- const char *Source = "/// \\em\\em \\em\t\\em\n";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(8U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::backslash_command, Toks[1].getKind());
- ASSERT_EQ(StringRef("em"), getCommandName(Toks[1]));
- ASSERT_EQ(tok::backslash_command, Toks[2].getKind());
- ASSERT_EQ(StringRef("em"), getCommandName(Toks[2]));
- ASSERT_EQ(tok::text, Toks[3].getKind());
- ASSERT_EQ(StringRef(" "), Toks[3].getText());
- ASSERT_EQ(tok::backslash_command, Toks[4].getKind());
- ASSERT_EQ(StringRef("em"), getCommandName(Toks[4]));
- ASSERT_EQ(tok::text, Toks[5].getKind());
- ASSERT_EQ(StringRef("\t"), Toks[5].getText());
- ASSERT_EQ(tok::backslash_command, Toks[6].getKind());
- ASSERT_EQ(StringRef("em"), getCommandName(Toks[6]));
- ASSERT_EQ(tok::newline, Toks[7].getKind());
- }
- TEST_F(CommentLexerTest, DoxygenCommand8) {
- const char *Source = "/// @em@em @em\t@em\n";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(8U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::at_command, Toks[1].getKind());
- ASSERT_EQ(StringRef("em"), getCommandName(Toks[1]));
- ASSERT_EQ(tok::at_command, Toks[2].getKind());
- ASSERT_EQ(StringRef("em"), getCommandName(Toks[2]));
- ASSERT_EQ(tok::text, Toks[3].getKind());
- ASSERT_EQ(StringRef(" "), Toks[3].getText());
- ASSERT_EQ(tok::at_command, Toks[4].getKind());
- ASSERT_EQ(StringRef("em"), getCommandName(Toks[4]));
- ASSERT_EQ(tok::text, Toks[5].getKind());
- ASSERT_EQ(StringRef("\t"), Toks[5].getText());
- ASSERT_EQ(tok::at_command, Toks[6].getKind());
- ASSERT_EQ(StringRef("em"), getCommandName(Toks[6]));
- ASSERT_EQ(tok::newline, Toks[7].getKind());
- }
- TEST_F(CommentLexerTest, DoxygenCommand9) {
- const char *Source = "/// \\aaa\\bbb \\ccc\t\\ddd\n";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(8U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::unknown_command, Toks[1].getKind());
- ASSERT_EQ(StringRef("aaa"), Toks[1].getUnknownCommandName());
- ASSERT_EQ(tok::unknown_command, Toks[2].getKind());
- ASSERT_EQ(StringRef("bbb"), Toks[2].getUnknownCommandName());
- ASSERT_EQ(tok::text, Toks[3].getKind());
- ASSERT_EQ(StringRef(" "), Toks[3].getText());
- ASSERT_EQ(tok::unknown_command, Toks[4].getKind());
- ASSERT_EQ(StringRef("ccc"), Toks[4].getUnknownCommandName());
- ASSERT_EQ(tok::text, Toks[5].getKind());
- ASSERT_EQ(StringRef("\t"), Toks[5].getText());
- ASSERT_EQ(tok::unknown_command, Toks[6].getKind());
- ASSERT_EQ(StringRef("ddd"), Toks[6].getUnknownCommandName());
- ASSERT_EQ(tok::newline, Toks[7].getKind());
- }
- TEST_F(CommentLexerTest, DoxygenCommand10) {
- const char *Source = "// \\c\n";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(3U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::backslash_command, Toks[1].getKind());
- ASSERT_EQ(StringRef("c"), getCommandName(Toks[1]));
- ASSERT_EQ(tok::newline, Toks[2].getKind());
- }
- TEST_F(CommentLexerTest, RegisterCustomBlockCommand) {
- const char *Source =
- "/// \\NewBlockCommand Aaa.\n"
- "/// @NewBlockCommand Aaa.\n";
- Traits.registerBlockCommand(StringRef("NewBlockCommand"));
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(8U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::backslash_command, Toks[1].getKind());
- ASSERT_EQ(StringRef("NewBlockCommand"), getCommandName(Toks[1]));
- ASSERT_EQ(tok::text, Toks[2].getKind());
- ASSERT_EQ(StringRef(" Aaa."), Toks[2].getText());
- ASSERT_EQ(tok::newline, Toks[3].getKind());
- ASSERT_EQ(tok::text, Toks[4].getKind());
- ASSERT_EQ(StringRef(" "), Toks[4].getText());
- ASSERT_EQ(tok::at_command, Toks[5].getKind());
- ASSERT_EQ(StringRef("NewBlockCommand"), getCommandName(Toks[5]));
- ASSERT_EQ(tok::text, Toks[6].getKind());
- ASSERT_EQ(StringRef(" Aaa."), Toks[6].getText());
- ASSERT_EQ(tok::newline, Toks[7].getKind());
- }
- TEST_F(CommentLexerTest, RegisterMultipleBlockCommands) {
- const char *Source =
- "/// \\Foo\n"
- "/// \\Bar Baz\n"
- "/// \\Blech quux=corge\n";
- Traits.registerBlockCommand(StringRef("Foo"));
- Traits.registerBlockCommand(StringRef("Bar"));
- Traits.registerBlockCommand(StringRef("Blech"));
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(11U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::backslash_command, Toks[1].getKind());
- ASSERT_EQ(StringRef("Foo"), getCommandName(Toks[1]));
- ASSERT_EQ(tok::newline, Toks[2].getKind());
- ASSERT_EQ(tok::text, Toks[3].getKind());
- ASSERT_EQ(StringRef(" "), Toks[3].getText());
- ASSERT_EQ(tok::backslash_command, Toks[4].getKind());
- ASSERT_EQ(StringRef("Bar"), getCommandName(Toks[4]));
- ASSERT_EQ(tok::text, Toks[5].getKind());
- ASSERT_EQ(StringRef(" Baz"), Toks[5].getText());
- ASSERT_EQ(tok::newline, Toks[6].getKind());
- ASSERT_EQ(tok::text, Toks[7].getKind());
- ASSERT_EQ(StringRef(" "), Toks[7].getText());
- ASSERT_EQ(tok::backslash_command, Toks[8].getKind());
- ASSERT_EQ(StringRef("Blech"), getCommandName(Toks[8]));
- ASSERT_EQ(tok::text, Toks[9].getKind());
- ASSERT_EQ(StringRef(" quux=corge"), Toks[9].getText());
- ASSERT_EQ(tok::newline, Toks[10].getKind());
- }
- // Empty verbatim block.
- TEST_F(CommentLexerTest, VerbatimBlock1) {
- const char *Sources[] = {
- "/// \\verbatim\\endverbatim\n//",
- "/** \\verbatim\\endverbatim*/"
- };
- for (size_t i = 0, e = array_lengthof(Sources); i != e; i++) {
- std::vector<Token> Toks;
- lexString(Sources[i], Toks);
- ASSERT_EQ(5U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::verbatim_block_begin, Toks[1].getKind());
- ASSERT_EQ(StringRef("verbatim"), getVerbatimBlockName(Toks[1]));
- ASSERT_EQ(tok::verbatim_block_end, Toks[2].getKind());
- ASSERT_EQ(StringRef("endverbatim"), getVerbatimBlockName(Toks[2]));
- ASSERT_EQ(tok::newline, Toks[3].getKind());
- ASSERT_EQ(tok::newline, Toks[4].getKind());
- }
- }
- // Empty verbatim block without an end command.
- TEST_F(CommentLexerTest, VerbatimBlock2) {
- const char *Source = "/// \\verbatim";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(3U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::verbatim_block_begin, Toks[1].getKind());
- ASSERT_EQ(StringRef("verbatim"), getVerbatimBlockName(Toks[1]));
- ASSERT_EQ(tok::newline, Toks[2].getKind());
- }
- // Empty verbatim block without an end command.
- TEST_F(CommentLexerTest, VerbatimBlock3) {
- const char *Source = "/** \\verbatim*/";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(4U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::verbatim_block_begin, Toks[1].getKind());
- ASSERT_EQ(StringRef("verbatim"), getVerbatimBlockName(Toks[1]));
- ASSERT_EQ(tok::newline, Toks[2].getKind());
- ASSERT_EQ(tok::newline, Toks[3].getKind());
- }
- // Single-line verbatim block.
- TEST_F(CommentLexerTest, VerbatimBlock4) {
- const char *Sources[] = {
- "/// Meow \\verbatim aaa \\endverbatim\n//",
- "/** Meow \\verbatim aaa \\endverbatim*/"
- };
- for (size_t i = 0, e = array_lengthof(Sources); i != e; i++) {
- std::vector<Token> Toks;
- lexString(Sources[i], Toks);
- ASSERT_EQ(6U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" Meow "), Toks[0].getText());
- ASSERT_EQ(tok::verbatim_block_begin, Toks[1].getKind());
- ASSERT_EQ(StringRef("verbatim"), getVerbatimBlockName(Toks[1]));
- ASSERT_EQ(tok::verbatim_block_line, Toks[2].getKind());
- ASSERT_EQ(StringRef(" aaa "), Toks[2].getVerbatimBlockText());
- ASSERT_EQ(tok::verbatim_block_end, Toks[3].getKind());
- ASSERT_EQ(StringRef("endverbatim"), getVerbatimBlockName(Toks[3]));
- ASSERT_EQ(tok::newline, Toks[4].getKind());
- ASSERT_EQ(tok::newline, Toks[5].getKind());
- }
- }
- // Single-line verbatim block without an end command.
- TEST_F(CommentLexerTest, VerbatimBlock5) {
- const char *Sources[] = {
- "/// Meow \\verbatim aaa \n//",
- "/** Meow \\verbatim aaa */"
- };
- for (size_t i = 0, e = array_lengthof(Sources); i != e; i++) {
- std::vector<Token> Toks;
- lexString(Sources[i], Toks);
- ASSERT_EQ(5U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" Meow "), Toks[0].getText());
- ASSERT_EQ(tok::verbatim_block_begin, Toks[1].getKind());
- ASSERT_EQ(StringRef("verbatim"), getVerbatimBlockName(Toks[1]));
- ASSERT_EQ(tok::verbatim_block_line, Toks[2].getKind());
- ASSERT_EQ(StringRef(" aaa "), Toks[2].getVerbatimBlockText());
- ASSERT_EQ(tok::newline, Toks[3].getKind());
- ASSERT_EQ(tok::newline, Toks[4].getKind());
- }
- }
- TEST_F(CommentLexerTest, VerbatimBlock6) {
- const char *Source =
- "// \\verbatim\n"
- "// Aaa\n"
- "//\n"
- "// Bbb\n"
- "// \\endverbatim\n";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(10U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::verbatim_block_begin, Toks[1].getKind());
- ASSERT_EQ(StringRef("verbatim"), getVerbatimBlockName(Toks[1]));
- ASSERT_EQ(tok::newline, Toks[2].getKind());
- ASSERT_EQ(tok::verbatim_block_line, Toks[3].getKind());
- ASSERT_EQ(StringRef(" Aaa"), Toks[3].getVerbatimBlockText());
- ASSERT_EQ(tok::newline, Toks[4].getKind());
- ASSERT_EQ(tok::newline, Toks[5].getKind());
- ASSERT_EQ(tok::verbatim_block_line, Toks[6].getKind());
- ASSERT_EQ(StringRef(" Bbb"), Toks[6].getVerbatimBlockText());
- ASSERT_EQ(tok::newline, Toks[7].getKind());
- ASSERT_EQ(tok::verbatim_block_end, Toks[8].getKind());
- ASSERT_EQ(StringRef("endverbatim"), getVerbatimBlockName(Toks[8]));
- ASSERT_EQ(tok::newline, Toks[9].getKind());
- }
- TEST_F(CommentLexerTest, VerbatimBlock7) {
- const char *Source =
- "/* \\verbatim\n"
- " * Aaa\n"
- " *\n"
- " * Bbb\n"
- " * \\endverbatim\n"
- " */";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(10U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::verbatim_block_begin, Toks[1].getKind());
- ASSERT_EQ(StringRef("verbatim"), getVerbatimBlockName(Toks[1]));
- ASSERT_EQ(tok::verbatim_block_line, Toks[2].getKind());
- ASSERT_EQ(StringRef(" Aaa"), Toks[2].getVerbatimBlockText());
- ASSERT_EQ(tok::verbatim_block_line, Toks[3].getKind());
- ASSERT_EQ(StringRef(""), Toks[3].getVerbatimBlockText());
- ASSERT_EQ(tok::verbatim_block_line, Toks[4].getKind());
- ASSERT_EQ(StringRef(" Bbb"), Toks[4].getVerbatimBlockText());
- ASSERT_EQ(tok::verbatim_block_end, Toks[5].getKind());
- ASSERT_EQ(StringRef("endverbatim"), getVerbatimBlockName(Toks[5]));
- ASSERT_EQ(tok::newline, Toks[6].getKind());
- ASSERT_EQ(tok::text, Toks[7].getKind());
- ASSERT_EQ(StringRef(" "), Toks[7].getText());
- ASSERT_EQ(tok::newline, Toks[8].getKind());
- ASSERT_EQ(tok::newline, Toks[9].getKind());
- }
- // Complex test for verbatim blocks.
- TEST_F(CommentLexerTest, VerbatimBlock8) {
- const char *Source =
- "/* Meow \\verbatim aaa\\$\\@\n"
- "bbb \\endverbati\r"
- "ccc\r\n"
- "ddd \\endverbatim Blah \\verbatim eee\n"
- "\\endverbatim BlahBlah*/";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(14U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" Meow "), Toks[0].getText());
- ASSERT_EQ(tok::verbatim_block_begin, Toks[1].getKind());
- ASSERT_EQ(StringRef("verbatim"), getVerbatimBlockName(Toks[1]));
- ASSERT_EQ(tok::verbatim_block_line, Toks[2].getKind());
- ASSERT_EQ(StringRef(" aaa\\$\\@"), Toks[2].getVerbatimBlockText());
- ASSERT_EQ(tok::verbatim_block_line, Toks[3].getKind());
- ASSERT_EQ(StringRef("bbb \\endverbati"), Toks[3].getVerbatimBlockText());
- ASSERT_EQ(tok::verbatim_block_line, Toks[4].getKind());
- ASSERT_EQ(StringRef("ccc"), Toks[4].getVerbatimBlockText());
- ASSERT_EQ(tok::verbatim_block_line, Toks[5].getKind());
- ASSERT_EQ(StringRef("ddd "), Toks[5].getVerbatimBlockText());
- ASSERT_EQ(tok::verbatim_block_end, Toks[6].getKind());
- ASSERT_EQ(StringRef("endverbatim"), getVerbatimBlockName(Toks[6]));
- ASSERT_EQ(tok::text, Toks[7].getKind());
- ASSERT_EQ(StringRef(" Blah "), Toks[7].getText());
- ASSERT_EQ(tok::verbatim_block_begin, Toks[8].getKind());
- ASSERT_EQ(StringRef("verbatim"), getVerbatimBlockName(Toks[8]));
- ASSERT_EQ(tok::verbatim_block_line, Toks[9].getKind());
- ASSERT_EQ(StringRef(" eee"), Toks[9].getVerbatimBlockText());
- ASSERT_EQ(tok::verbatim_block_end, Toks[10].getKind());
- ASSERT_EQ(StringRef("endverbatim"), getVerbatimBlockName(Toks[10]));
- ASSERT_EQ(tok::text, Toks[11].getKind());
- ASSERT_EQ(StringRef(" BlahBlah"), Toks[11].getText());
- ASSERT_EQ(tok::newline, Toks[12].getKind());
- ASSERT_EQ(tok::newline, Toks[13].getKind());
- }
- // LaTeX verbatim blocks.
- TEST_F(CommentLexerTest, VerbatimBlock9) {
- const char *Source =
- "/// \\f$ Aaa \\f$ \\f[ Bbb \\f] \\f{ Ccc \\f}";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(13U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::verbatim_block_begin, Toks[1].getKind());
- ASSERT_EQ(StringRef("f$"), getVerbatimBlockName(Toks[1]));
- ASSERT_EQ(tok::verbatim_block_line, Toks[2].getKind());
- ASSERT_EQ(StringRef(" Aaa "), Toks[2].getVerbatimBlockText());
- ASSERT_EQ(tok::verbatim_block_end, Toks[3].getKind());
- ASSERT_EQ(StringRef("f$"), getVerbatimBlockName(Toks[3]));
- ASSERT_EQ(tok::text, Toks[4].getKind());
- ASSERT_EQ(StringRef(" "), Toks[4].getText());
- ASSERT_EQ(tok::verbatim_block_begin, Toks[5].getKind());
- ASSERT_EQ(StringRef("f["), getVerbatimBlockName(Toks[5]));
- ASSERT_EQ(tok::verbatim_block_line, Toks[6].getKind());
- ASSERT_EQ(StringRef(" Bbb "), Toks[6].getVerbatimBlockText());
- ASSERT_EQ(tok::verbatim_block_end, Toks[7].getKind());
- ASSERT_EQ(StringRef("f]"), getVerbatimBlockName(Toks[7]));
- ASSERT_EQ(tok::text, Toks[8].getKind());
- ASSERT_EQ(StringRef(" "), Toks[8].getText());
- ASSERT_EQ(tok::verbatim_block_begin, Toks[9].getKind());
- ASSERT_EQ(StringRef("f{"), getVerbatimBlockName(Toks[9]));
- ASSERT_EQ(tok::verbatim_block_line, Toks[10].getKind());
- ASSERT_EQ(StringRef(" Ccc "), Toks[10].getVerbatimBlockText());
- ASSERT_EQ(tok::verbatim_block_end, Toks[11].getKind());
- ASSERT_EQ(StringRef("f}"), getVerbatimBlockName(Toks[11]));
- ASSERT_EQ(tok::newline, Toks[12].getKind());
- }
- // Empty verbatim line.
- TEST_F(CommentLexerTest, VerbatimLine1) {
- const char *Sources[] = {
- "/// \\fn\n//",
- "/** \\fn*/"
- };
- for (size_t i = 0, e = array_lengthof(Sources); i != e; i++) {
- std::vector<Token> Toks;
- lexString(Sources[i], Toks);
- ASSERT_EQ(4U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::verbatim_line_name, Toks[1].getKind());
- ASSERT_EQ(StringRef("fn"), getVerbatimLineName(Toks[1]));
- ASSERT_EQ(tok::newline, Toks[2].getKind());
- ASSERT_EQ(tok::newline, Toks[3].getKind());
- }
- }
- // Verbatim line with Doxygen escape sequences, which should not be expanded.
- TEST_F(CommentLexerTest, VerbatimLine2) {
- const char *Sources[] = {
- "/// \\fn void *foo(const char *zzz = \"\\$\");\n//",
- "/** \\fn void *foo(const char *zzz = \"\\$\");*/"
- };
- for (size_t i = 0, e = array_lengthof(Sources); i != e; i++) {
- std::vector<Token> Toks;
- lexString(Sources[i], Toks);
- ASSERT_EQ(5U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::verbatim_line_name, Toks[1].getKind());
- ASSERT_EQ(StringRef("fn"), getVerbatimLineName(Toks[1]));
- ASSERT_EQ(tok::verbatim_line_text, Toks[2].getKind());
- ASSERT_EQ(StringRef(" void *foo(const char *zzz = \"\\$\");"),
- Toks[2].getVerbatimLineText());
- ASSERT_EQ(tok::newline, Toks[3].getKind());
- ASSERT_EQ(tok::newline, Toks[4].getKind());
- }
- }
- // Verbatim line should not eat anything from next source line.
- TEST_F(CommentLexerTest, VerbatimLine3) {
- const char *Source =
- "/** \\fn void *foo(const char *zzz = \"\\$\");\n"
- " * Meow\n"
- " */";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(9U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::verbatim_line_name, Toks[1].getKind());
- ASSERT_EQ(StringRef("fn"), getVerbatimLineName(Toks[1]));
- ASSERT_EQ(tok::verbatim_line_text, Toks[2].getKind());
- ASSERT_EQ(StringRef(" void *foo(const char *zzz = \"\\$\");"),
- Toks[2].getVerbatimLineText());
- ASSERT_EQ(tok::newline, Toks[3].getKind());
- ASSERT_EQ(tok::text, Toks[4].getKind());
- ASSERT_EQ(StringRef(" Meow"), Toks[4].getText());
- ASSERT_EQ(tok::newline, Toks[5].getKind());
- ASSERT_EQ(tok::text, Toks[6].getKind());
- ASSERT_EQ(StringRef(" "), Toks[6].getText());
- ASSERT_EQ(tok::newline, Toks[7].getKind());
- ASSERT_EQ(tok::newline, Toks[8].getKind());
- }
- TEST_F(CommentLexerTest, HTML1) {
- const char *Source =
- "// <";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(3U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::text, Toks[1].getKind());
- ASSERT_EQ(StringRef("<"), Toks[1].getText());
- ASSERT_EQ(tok::newline, Toks[2].getKind());
- }
- TEST_F(CommentLexerTest, HTML2) {
- const char *Source =
- "// a<2";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(4U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" a"), Toks[0].getText());
- ASSERT_EQ(tok::text, Toks[1].getKind());
- ASSERT_EQ(StringRef("<"), Toks[1].getText());
- ASSERT_EQ(tok::text, Toks[2].getKind());
- ASSERT_EQ(StringRef("2"), Toks[2].getText());
- ASSERT_EQ(tok::newline, Toks[3].getKind());
- }
- TEST_F(CommentLexerTest, HTML3) {
- const char *Source =
- "// < img";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(4U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::text, Toks[1].getKind());
- ASSERT_EQ(StringRef("<"), Toks[1].getText());
- ASSERT_EQ(tok::text, Toks[2].getKind());
- ASSERT_EQ(StringRef(" img"), Toks[2].getText());
- ASSERT_EQ(tok::newline, Toks[3].getKind());
- }
- TEST_F(CommentLexerTest, HTML4) {
- const char *Sources[] = {
- "// <img",
- "// <img "
- };
- for (size_t i = 0, e = array_lengthof(Sources); i != e; i++) {
- std::vector<Token> Toks;
- lexString(Sources[i], Toks);
- ASSERT_EQ(3U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::html_start_tag, Toks[1].getKind());
- ASSERT_EQ(StringRef("img"), Toks[1].getHTMLTagStartName());
- ASSERT_EQ(tok::newline, Toks[2].getKind());
- }
- }
- TEST_F(CommentLexerTest, HTML5) {
- const char *Source =
- "// <img 42";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(4U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::html_start_tag, Toks[1].getKind());
- ASSERT_EQ(StringRef("img"), Toks[1].getHTMLTagStartName());
- ASSERT_EQ(tok::text, Toks[2].getKind());
- ASSERT_EQ(StringRef("42"), Toks[2].getText());
- ASSERT_EQ(tok::newline, Toks[3].getKind());
- }
- TEST_F(CommentLexerTest, HTML6) {
- const char *Source = "// <img> Meow";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(5U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::html_start_tag, Toks[1].getKind());
- ASSERT_EQ(StringRef("img"), Toks[1].getHTMLTagStartName());
- ASSERT_EQ(tok::html_greater, Toks[2].getKind());
- ASSERT_EQ(tok::text, Toks[3].getKind());
- ASSERT_EQ(StringRef(" Meow"), Toks[3].getText());
- ASSERT_EQ(tok::newline, Toks[4].getKind());
- }
- TEST_F(CommentLexerTest, HTML7) {
- const char *Source = "// <img=";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(4U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::html_start_tag, Toks[1].getKind());
- ASSERT_EQ(StringRef("img"), Toks[1].getHTMLTagStartName());
- ASSERT_EQ(tok::text, Toks[2].getKind());
- ASSERT_EQ(StringRef("="), Toks[2].getText());
- ASSERT_EQ(tok::newline, Toks[3].getKind());
- }
- TEST_F(CommentLexerTest, HTML8) {
- const char *Source = "// <img src=> Meow";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(7U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::html_start_tag, Toks[1].getKind());
- ASSERT_EQ(StringRef("img"), Toks[1].getHTMLTagStartName());
- ASSERT_EQ(tok::html_ident, Toks[2].getKind());
- ASSERT_EQ(StringRef("src"), Toks[2].getHTMLIdent());
- ASSERT_EQ(tok::html_equals, Toks[3].getKind());
- ASSERT_EQ(tok::html_greater, Toks[4].getKind());
- ASSERT_EQ(tok::text, Toks[5].getKind());
- ASSERT_EQ(StringRef(" Meow"), Toks[5].getText());
- ASSERT_EQ(tok::newline, Toks[6].getKind());
- }
- TEST_F(CommentLexerTest, HTML9) {
- const char *Sources[] = {
- "// <img src",
- "// <img src "
- };
- for (size_t i = 0, e = array_lengthof(Sources); i != e; i++) {
- std::vector<Token> Toks;
- lexString(Sources[i], Toks);
- ASSERT_EQ(4U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::html_start_tag, Toks[1].getKind());
- ASSERT_EQ(StringRef("img"), Toks[1].getHTMLTagStartName());
- ASSERT_EQ(tok::html_ident, Toks[2].getKind());
- ASSERT_EQ(StringRef("src"), Toks[2].getHTMLIdent());
- ASSERT_EQ(tok::newline, Toks[3].getKind());
- }
- }
- TEST_F(CommentLexerTest, HTML10) {
- const char *Sources[] = {
- "// <img src=",
- "// <img src ="
- };
- for (size_t i = 0, e = array_lengthof(Sources); i != e; i++) {
- std::vector<Token> Toks;
- lexString(Sources[i], Toks);
- ASSERT_EQ(5U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::html_start_tag, Toks[1].getKind());
- ASSERT_EQ(StringRef("img"), Toks[1].getHTMLTagStartName());
- ASSERT_EQ(tok::html_ident, Toks[2].getKind());
- ASSERT_EQ(StringRef("src"), Toks[2].getHTMLIdent());
- ASSERT_EQ(tok::html_equals, Toks[3].getKind());
- ASSERT_EQ(tok::newline, Toks[4].getKind());
- }
- }
- TEST_F(CommentLexerTest, HTML11) {
- const char *Sources[] = {
- "// <img src=\"",
- "// <img src = \"",
- "// <img src=\'",
- "// <img src = \'"
- };
- for (size_t i = 0, e = array_lengthof(Sources); i != e; i++) {
- std::vector<Token> Toks;
- lexString(Sources[i], Toks);
- ASSERT_EQ(6U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::html_start_tag, Toks[1].getKind());
- ASSERT_EQ(StringRef("img"), Toks[1].getHTMLTagStartName());
- ASSERT_EQ(tok::html_ident, Toks[2].getKind());
- ASSERT_EQ(StringRef("src"), Toks[2].getHTMLIdent());
- ASSERT_EQ(tok::html_equals, Toks[3].getKind());
- ASSERT_EQ(tok::html_quoted_string, Toks[4].getKind());
- ASSERT_EQ(StringRef(""), Toks[4].getHTMLQuotedString());
- ASSERT_EQ(tok::newline, Toks[5].getKind());
- }
- }
- TEST_F(CommentLexerTest, HTML12) {
- const char *Source = "// <img src=@";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(6U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::html_start_tag, Toks[1].getKind());
- ASSERT_EQ(StringRef("img"), Toks[1].getHTMLTagStartName());
- ASSERT_EQ(tok::html_ident, Toks[2].getKind());
- ASSERT_EQ(StringRef("src"), Toks[2].getHTMLIdent());
- ASSERT_EQ(tok::html_equals, Toks[3].getKind());
- ASSERT_EQ(tok::text, Toks[4].getKind());
- ASSERT_EQ(StringRef("@"), Toks[4].getText());
- ASSERT_EQ(tok::newline, Toks[5].getKind());
- }
- TEST_F(CommentLexerTest, HTML13) {
- const char *Sources[] = {
- "// <img src=\"val\\\"\\'val",
- "// <img src=\"val\\\"\\'val\"",
- "// <img src=\'val\\\"\\'val",
- "// <img src=\'val\\\"\\'val\'"
- };
- for (size_t i = 0, e = array_lengthof(Sources); i != e; i++) {
- std::vector<Token> Toks;
- lexString(Sources[i], Toks);
- ASSERT_EQ(6U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::html_start_tag, Toks[1].getKind());
- ASSERT_EQ(StringRef("img"), Toks[1].getHTMLTagStartName());
- ASSERT_EQ(tok::html_ident, Toks[2].getKind());
- ASSERT_EQ(StringRef("src"), Toks[2].getHTMLIdent());
- ASSERT_EQ(tok::html_equals, Toks[3].getKind());
- ASSERT_EQ(tok::html_quoted_string, Toks[4].getKind());
- ASSERT_EQ(StringRef("val\\\"\\'val"), Toks[4].getHTMLQuotedString());
- ASSERT_EQ(tok::newline, Toks[5].getKind());
- }
- }
- TEST_F(CommentLexerTest, HTML14) {
- const char *Sources[] = {
- "// <img src=\"val\\\"\\'val\">",
- "// <img src=\'val\\\"\\'val\'>"
- };
- for (size_t i = 0, e = array_lengthof(Sources); i != e; i++) {
- std::vector<Token> Toks;
- lexString(Sources[i], Toks);
- ASSERT_EQ(7U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::html_start_tag, Toks[1].getKind());
- ASSERT_EQ(StringRef("img"), Toks[1].getHTMLTagStartName());
- ASSERT_EQ(tok::html_ident, Toks[2].getKind());
- ASSERT_EQ(StringRef("src"), Toks[2].getHTMLIdent());
- ASSERT_EQ(tok::html_equals, Toks[3].getKind());
- ASSERT_EQ(tok::html_quoted_string, Toks[4].getKind());
- ASSERT_EQ(StringRef("val\\\"\\'val"), Toks[4].getHTMLQuotedString());
- ASSERT_EQ(tok::html_greater, Toks[5].getKind());
- ASSERT_EQ(tok::newline, Toks[6].getKind());
- }
- }
- TEST_F(CommentLexerTest, HTML15) {
- const char *Sources[] = {
- "// <img/>",
- "// <img />"
- };
- for (size_t i = 0, e = array_lengthof(Sources); i != e; i++) {
- std::vector<Token> Toks;
- lexString(Sources[i], Toks);
- ASSERT_EQ(4U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::html_start_tag, Toks[1].getKind());
- ASSERT_EQ(StringRef("img"), Toks[1].getHTMLTagStartName());
- ASSERT_EQ(tok::html_slash_greater, Toks[2].getKind());
- ASSERT_EQ(tok::newline, Toks[3].getKind());
- }
- }
- TEST_F(CommentLexerTest, HTML16) {
- const char *Sources[] = {
- "// <img/ Aaa",
- "// <img / Aaa"
- };
- for (size_t i = 0, e = array_lengthof(Sources); i != e; i++) {
- std::vector<Token> Toks;
- lexString(Sources[i], Toks);
- ASSERT_EQ(5U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::html_start_tag, Toks[1].getKind());
- ASSERT_EQ(StringRef("img"), Toks[1].getHTMLTagStartName());
- ASSERT_EQ(tok::text, Toks[2].getKind());
- ASSERT_EQ(StringRef("/"), Toks[2].getText());
- ASSERT_EQ(tok::text, Toks[3].getKind());
- ASSERT_EQ(StringRef(" Aaa"), Toks[3].getText());
- ASSERT_EQ(tok::newline, Toks[4].getKind());
- }
- }
- TEST_F(CommentLexerTest, HTML17) {
- const char *Source = "// </";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(3U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::text, Toks[1].getKind());
- ASSERT_EQ(StringRef("</"), Toks[1].getText());
- ASSERT_EQ(tok::newline, Toks[2].getKind());
- }
- TEST_F(CommentLexerTest, HTML18) {
- const char *Source = "// </@";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(4U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::text, Toks[1].getKind());
- ASSERT_EQ(StringRef("</"), Toks[1].getText());
- ASSERT_EQ(tok::text, Toks[2].getKind());
- ASSERT_EQ(StringRef("@"), Toks[2].getText());
- ASSERT_EQ(tok::newline, Toks[3].getKind());
- }
- TEST_F(CommentLexerTest, HTML19) {
- const char *Source = "// </img";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(3U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::html_end_tag, Toks[1].getKind());
- ASSERT_EQ(StringRef("img"), Toks[1].getHTMLTagEndName());
- ASSERT_EQ(tok::newline, Toks[2].getKind());
- }
- TEST_F(CommentLexerTest, NotAKnownHTMLTag1) {
- const char *Source = "// <tag>";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(4U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::text, Toks[1].getKind());
- ASSERT_EQ(StringRef("<tag"), Toks[1].getText());
- ASSERT_EQ(tok::text, Toks[2].getKind());
- ASSERT_EQ(StringRef(">"), Toks[2].getText());
- ASSERT_EQ(tok::newline, Toks[3].getKind());
- }
- TEST_F(CommentLexerTest, NotAKnownHTMLTag2) {
- const char *Source = "// </tag>";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(4U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::text, Toks[1].getKind());
- ASSERT_EQ(StringRef("</tag"), Toks[1].getText());
- ASSERT_EQ(tok::text, Toks[2].getKind());
- ASSERT_EQ(StringRef(">"), Toks[2].getText());
- ASSERT_EQ(tok::newline, Toks[3].getKind());
- }
- TEST_F(CommentLexerTest, HTMLCharacterReferences1) {
- const char *Source = "// &";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(3U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::text, Toks[1].getKind());
- ASSERT_EQ(StringRef("&"), Toks[1].getText());
- ASSERT_EQ(tok::newline, Toks[2].getKind());
- }
- TEST_F(CommentLexerTest, HTMLCharacterReferences2) {
- const char *Source = "// &!";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(4U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::text, Toks[1].getKind());
- ASSERT_EQ(StringRef("&"), Toks[1].getText());
- ASSERT_EQ(tok::text, Toks[2].getKind());
- ASSERT_EQ(StringRef("!"), Toks[2].getText());
- ASSERT_EQ(tok::newline, Toks[3].getKind());
- }
- TEST_F(CommentLexerTest, HTMLCharacterReferences3) {
- const char *Source = "// &";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(3U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::text, Toks[1].getKind());
- ASSERT_EQ(StringRef("&"), Toks[1].getText());
- ASSERT_EQ(tok::newline, Toks[2].getKind());
- }
- TEST_F(CommentLexerTest, HTMLCharacterReferences4) {
- const char *Source = "// &!";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(4U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::text, Toks[1].getKind());
- ASSERT_EQ(StringRef("&"), Toks[1].getText());
- ASSERT_EQ(tok::text, Toks[2].getKind());
- ASSERT_EQ(StringRef("!"), Toks[2].getText());
- ASSERT_EQ(tok::newline, Toks[3].getKind());
- }
- TEST_F(CommentLexerTest, HTMLCharacterReferences5) {
- const char *Source = "// &#";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(3U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::text, Toks[1].getKind());
- ASSERT_EQ(StringRef("&#"), Toks[1].getText());
- ASSERT_EQ(tok::newline, Toks[2].getKind());
- }
- TEST_F(CommentLexerTest, HTMLCharacterReferences6) {
- const char *Source = "// &#a";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(4U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::text, Toks[1].getKind());
- ASSERT_EQ(StringRef("&#"), Toks[1].getText());
- ASSERT_EQ(tok::text, Toks[2].getKind());
- ASSERT_EQ(StringRef("a"), Toks[2].getText());
- ASSERT_EQ(tok::newline, Toks[3].getKind());
- }
- TEST_F(CommentLexerTest, HTMLCharacterReferences7) {
- const char *Source = "// *";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(3U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::text, Toks[1].getKind());
- ASSERT_EQ(StringRef("*"), Toks[1].getText());
- ASSERT_EQ(tok::newline, Toks[2].getKind());
- }
- TEST_F(CommentLexerTest, HTMLCharacterReferences8) {
- const char *Source = "// *a";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(4U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::text, Toks[1].getKind());
- ASSERT_EQ(StringRef("*"), Toks[1].getText());
- ASSERT_EQ(tok::text, Toks[2].getKind());
- ASSERT_EQ(StringRef("a"), Toks[2].getText());
- ASSERT_EQ(tok::newline, Toks[3].getKind());
- }
- TEST_F(CommentLexerTest, HTMLCharacterReferences9) {
- const char *Source = "// &#x";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(3U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::text, Toks[1].getKind());
- ASSERT_EQ(StringRef("&#x"), Toks[1].getText());
- ASSERT_EQ(tok::newline, Toks[2].getKind());
- }
- TEST_F(CommentLexerTest, HTMLCharacterReferences10) {
- const char *Source = "// &#xz";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(4U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::text, Toks[1].getKind());
- ASSERT_EQ(StringRef("&#x"), Toks[1].getText());
- ASSERT_EQ(tok::text, Toks[2].getKind());
- ASSERT_EQ(StringRef("z"), Toks[2].getText());
- ASSERT_EQ(tok::newline, Toks[3].getKind());
- }
- TEST_F(CommentLexerTest, HTMLCharacterReferences11) {
- const char *Source = "// «";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(3U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::text, Toks[1].getKind());
- ASSERT_EQ(StringRef("«"), Toks[1].getText());
- ASSERT_EQ(tok::newline, Toks[2].getKind());
- }
- TEST_F(CommentLexerTest, HTMLCharacterReferences12) {
- const char *Source = "// «z";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(4U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::text, Toks[1].getKind());
- ASSERT_EQ(StringRef("«"), Toks[1].getText());
- ASSERT_EQ(tok::text, Toks[2].getKind());
- ASSERT_EQ(StringRef("z"), Toks[2].getText());
- ASSERT_EQ(tok::newline, Toks[3].getKind());
- }
- TEST_F(CommentLexerTest, HTMLCharacterReferences13) {
- const char *Source = "// &";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(3U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::text, Toks[1].getKind());
- ASSERT_EQ(StringRef("&"), Toks[1].getText());
- ASSERT_EQ(tok::newline, Toks[2].getKind());
- }
- TEST_F(CommentLexerTest, HTMLCharacterReferences14) {
- const char *Source = "// &<";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(4U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::text, Toks[1].getKind());
- ASSERT_EQ(StringRef("&"), Toks[1].getText());
- ASSERT_EQ(tok::text, Toks[2].getKind());
- ASSERT_EQ(StringRef("<"), Toks[2].getText());
- ASSERT_EQ(tok::newline, Toks[3].getKind());
- }
- TEST_F(CommentLexerTest, HTMLCharacterReferences15) {
- const char *Source = "// & meow";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(4U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::text, Toks[1].getKind());
- ASSERT_EQ(StringRef("&"), Toks[1].getText());
- ASSERT_EQ(tok::text, Toks[2].getKind());
- ASSERT_EQ(StringRef(" meow"), Toks[2].getText());
- ASSERT_EQ(tok::newline, Toks[3].getKind());
- }
- TEST_F(CommentLexerTest, HTMLCharacterReferences16) {
- const char *Sources[] = {
- "// =",
- "// =",
- "// =",
- "// ="
- };
- for (size_t i = 0, e = array_lengthof(Sources); i != e; i++) {
- std::vector<Token> Toks;
- lexString(Sources[i], Toks);
- ASSERT_EQ(3U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" "), Toks[0].getText());
- ASSERT_EQ(tok::text, Toks[1].getKind());
- ASSERT_EQ(StringRef("="), Toks[1].getText());
- ASSERT_EQ(tok::newline, Toks[2].getKind());
- }
- }
- TEST_F(CommentLexerTest, MultipleComments) {
- const char *Source =
- "// Aaa\n"
- "/// Bbb\n"
- "/* Ccc\n"
- " * Ddd*/\n"
- "/** Eee*/";
- std::vector<Token> Toks;
- lexString(Source, Toks);
- ASSERT_EQ(12U, Toks.size());
- ASSERT_EQ(tok::text, Toks[0].getKind());
- ASSERT_EQ(StringRef(" Aaa"), Toks[0].getText());
- ASSERT_EQ(tok::newline, Toks[1].getKind());
- ASSERT_EQ(tok::text, Toks[2].getKind());
- ASSERT_EQ(StringRef(" Bbb"), Toks[2].getText());
- ASSERT_EQ(tok::newline, Toks[3].getKind());
- ASSERT_EQ(tok::text, Toks[4].getKind());
- ASSERT_EQ(StringRef(" Ccc"), Toks[4].getText());
- ASSERT_EQ(tok::newline, Toks[5].getKind());
- ASSERT_EQ(tok::text, Toks[6].getKind());
- ASSERT_EQ(StringRef(" Ddd"), Toks[6].getText());
- ASSERT_EQ(tok::newline, Toks[7].getKind());
- ASSERT_EQ(tok::newline, Toks[8].getKind());
- ASSERT_EQ(tok::text, Toks[9].getKind());
- ASSERT_EQ(StringRef(" Eee"), Toks[9].getText());
- ASSERT_EQ(tok::newline, Toks[10].getKind());
- ASSERT_EQ(tok::newline, Toks[11].getKind());
- }
- } // end namespace comments
- } // end namespace clang
|