123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370 |
- //===--- SourceManager.cpp - Track and cache source files -----------------===//
- //
- // The LLVM Compiler Infrastructure
- //
- // This file was developed by Chris Lattner and is distributed under
- // the University of Illinois Open Source License. See LICENSE.TXT for details.
- //
- //===----------------------------------------------------------------------===//
- //
- // This file implements the SourceManager interface.
- //
- //===----------------------------------------------------------------------===//
- #include "clang/Basic/SourceManager.h"
- #include "clang/Basic/FileManager.h"
- #include "llvm/Support/MemoryBuffer.h"
- #include "llvm/System/Path.h"
- #include <algorithm>
- #include <iostream>
- using namespace clang;
- using namespace SrcMgr;
- using llvm::MemoryBuffer;
- SourceManager::~SourceManager() {
- for (std::map<const FileEntry *, FileInfo>::iterator I = FileInfos.begin(),
- E = FileInfos.end(); I != E; ++I) {
- delete I->second.Buffer;
- delete[] I->second.SourceLineCache;
- }
-
- for (std::list<InfoRec>::iterator I = MemBufferInfos.begin(),
- E = MemBufferInfos.end(); I != E; ++I) {
- delete I->second.Buffer;
- delete[] I->second.SourceLineCache;
- }
- }
- // FIXME: REMOVE THESE
- #include <unistd.h>
- #include <sys/types.h>
- #include <sys/uio.h>
- #include <sys/fcntl.h>
- #include <cerrno>
- static const MemoryBuffer *ReadFileFast(const FileEntry *FileEnt) {
- #if 0
- // FIXME: Reintroduce this and zap this function once the common llvm stuff
- // is fast for the small case.
- return MemoryBuffer::getFile(FileEnt->getName(), strlen(FileEnt->getName()),
- FileEnt->getSize());
- #endif
-
- // If the file is larger than some threshold, use 'read', otherwise use mmap.
- if (FileEnt->getSize() >= 4096*4)
- return MemoryBuffer::getFile(FileEnt->getName(), strlen(FileEnt->getName()),
- 0, FileEnt->getSize());
-
- MemoryBuffer *SB = MemoryBuffer::getNewUninitMemBuffer(FileEnt->getSize(),
- FileEnt->getName());
- char *BufPtr = const_cast<char*>(SB->getBufferStart());
-
- int FD = ::open(FileEnt->getName(), O_RDONLY);
- if (FD == -1) {
- delete SB;
- return 0;
- }
-
- unsigned BytesLeft = FileEnt->getSize();
- while (BytesLeft) {
- ssize_t NumRead = ::read(FD, BufPtr, BytesLeft);
- if (NumRead != -1) {
- BytesLeft -= NumRead;
- BufPtr += NumRead;
- } else if (errno == EINTR) {
- // try again
- } else {
- // error reading.
- close(FD);
- delete SB;
- return 0;
- }
- }
- close(FD);
-
- return SB;
- }
- /// getFileInfo - Create or return a cached FileInfo for the specified file.
- ///
- const InfoRec *
- SourceManager::getInfoRec(const FileEntry *FileEnt) {
- assert(FileEnt && "Didn't specify a file entry to use?");
- // Do we already have information about this file?
- std::map<const FileEntry *, FileInfo>::iterator I =
- FileInfos.lower_bound(FileEnt);
- if (I != FileInfos.end() && I->first == FileEnt)
- return &*I;
-
- // Nope, get information.
- const MemoryBuffer *File = ReadFileFast(FileEnt);
- if (File == 0)
- return 0;
- const InfoRec &Entry =
- *FileInfos.insert(I, std::make_pair(FileEnt, FileInfo()));
- FileInfo &Info = const_cast<FileInfo &>(Entry.second);
- Info.Buffer = File;
- Info.SourceLineCache = 0;
- Info.NumLines = 0;
- return &Entry;
- }
- /// createMemBufferInfoRec - Create a new info record for the specified memory
- /// buffer. This does no caching.
- const InfoRec *
- SourceManager::createMemBufferInfoRec(const MemoryBuffer *Buffer) {
- // Add a new info record to the MemBufferInfos list and return it.
- FileInfo FI;
- FI.Buffer = Buffer;
- FI.SourceLineCache = 0;
- FI.NumLines = 0;
- MemBufferInfos.push_back(InfoRec(0, FI));
- return &MemBufferInfos.back();
- }
- /// createFileID - Create a new fileID for the specified InfoRec and include
- /// position. This works regardless of whether the InfoRec corresponds to a
- /// file or some other input source.
- unsigned SourceManager::createFileID(const InfoRec *File,
- SourceLocation IncludePos) {
- // If FileEnt is really large (e.g. it's a large .i file), we may not be able
- // to fit an arbitrary position in the file in the FilePos field. To handle
- // this, we create one FileID for each chunk of the file that fits in a
- // FilePos field.
- unsigned FileSize = File->second.Buffer->getBufferSize();
- if (FileSize+1 < (1 << SourceLocation::FilePosBits)) {
- FileIDs.push_back(FileIDInfo::getNormalBuffer(IncludePos, 0, File));
- assert(FileIDs.size() < (1 << SourceLocation::FileIDBits) &&
- "Ran out of file ID's!");
- return FileIDs.size();
- }
-
- // Create one FileID for each chunk of the file.
- unsigned Result = FileIDs.size()+1;
- unsigned ChunkNo = 0;
- while (1) {
- FileIDs.push_back(FileIDInfo::getNormalBuffer(IncludePos, ChunkNo++, File));
- if (FileSize+1 < (1 << SourceLocation::FilePosBits)) break;
- FileSize -= (1 << SourceLocation::FilePosBits);
- }
- assert(FileIDs.size() < (1 << SourceLocation::FileIDBits) &&
- "Ran out of file ID's!");
- return Result;
- }
- /// getInstantiationLoc - Return a new SourceLocation that encodes the fact
- /// that a token from physloc PhysLoc should actually be referenced from
- /// InstantiationLoc.
- SourceLocation SourceManager::getInstantiationLoc(SourceLocation PhysLoc,
- SourceLocation InstantLoc) {
- assert(getFIDInfo(PhysLoc.getFileID())->IDType !=
- SrcMgr::FileIDInfo::MacroExpansion &&
- "Location instantiated in a macro?");
-
- // Resolve InstantLoc down to a real logical location.
- InstantLoc = getLogicalLoc(InstantLoc);
-
- unsigned InstantiationFileID;
- // If this is the same instantiation as was requested last time, return this
- // immediately.
- if (PhysLoc.getFileID() == LastInstantiationLoc_MacroFID &&
- InstantLoc == LastInstantiationLoc_InstantLoc) {
- InstantiationFileID = LastInstantiationLoc_Result;
- } else {
- // Add a FileID for this. FIXME: should cache these!
- FileIDs.push_back(FileIDInfo::getMacroExpansion(InstantLoc,
- PhysLoc.getFileID()));
- InstantiationFileID = FileIDs.size();
-
- // Remember this in the single-entry cache for next time.
- LastInstantiationLoc_MacroFID = PhysLoc.getFileID();
- LastInstantiationLoc_InstantLoc = InstantLoc;
- LastInstantiationLoc_Result = InstantiationFileID;
- }
- return SourceLocation(InstantiationFileID, PhysLoc.getRawFilePos());
- }
- /// getCharacterData - Return a pointer to the start of the specified location
- /// in the appropriate MemoryBuffer.
- const char *SourceManager::getCharacterData(SourceLocation SL) const {
- // Note that this is a hot function in the getSpelling() path, which is
- // heavily used by -E mode.
- unsigned FileID = SL.getFileID();
- assert(FileID && "Invalid source location!");
-
- return getFileInfo(FileID)->Buffer->getBufferStart() + getFilePos(SL);
- }
- /// getIncludeLoc - Return the location of the #include for the specified
- /// FileID.
- SourceLocation SourceManager::getIncludeLoc(unsigned FileID) const {
- const SrcMgr::FileIDInfo *FIDInfo = getFIDInfo(FileID);
- // For Macros, the physical loc is specified by the MacroTokenFileID.
- if (FIDInfo->IDType == SrcMgr::FileIDInfo::MacroExpansion)
- FIDInfo = &FileIDs[FIDInfo->u.MacroTokenFileID-1];
-
- return FIDInfo->IncludeLoc;
- }
- /// getColumnNumber - Return the column # for the specified include position.
- /// this is significantly cheaper to compute than the line number. This returns
- /// zero if the column number isn't known.
- unsigned SourceManager::getColumnNumber(SourceLocation Loc) const {
- Loc = getLogicalLoc(Loc);
- unsigned FileID = Loc.getFileID();
- if (FileID == 0) return 0;
-
- unsigned FilePos = getFilePos(Loc);
- const MemoryBuffer *Buffer = getBuffer(FileID);
- const char *Buf = Buffer->getBufferStart();
- unsigned LineStart = FilePos;
- while (LineStart && Buf[LineStart-1] != '\n' && Buf[LineStart-1] != '\r')
- --LineStart;
- return FilePos-LineStart+1;
- }
- /// getSourceName - This method returns the name of the file or buffer that
- /// the SourceLocation specifies. This can be modified with #line directives,
- /// etc.
- std::string SourceManager::getSourceName(SourceLocation Loc) {
- Loc = getLogicalLoc(Loc);
- unsigned FileID = Loc.getFileID();
- if (FileID == 0) return "";
- return getFileInfo(FileID)->Buffer->getBufferIdentifier();
- }
- /// getLineNumber - Given a SourceLocation, return the physical line number
- /// for the position indicated. This requires building and caching a table of
- /// line offsets for the MemoryBuffer, so this is not cheap: use only when
- /// about to emit a diagnostic.
- unsigned SourceManager::getLineNumber(SourceLocation Loc) {
- Loc = getLogicalLoc(Loc);
- unsigned FileID = Loc.getFileID();
- if (FileID == 0) return 0;
- FileInfo *FileInfo = getFileInfo(FileID);
-
- // If this is the first use of line information for this buffer, compute the
- /// SourceLineCache for it on demand.
- if (FileInfo->SourceLineCache == 0) {
- const MemoryBuffer *Buffer = FileInfo->Buffer;
-
- // Find the file offsets of all of the *physical* source lines. This does
- // not look at trigraphs, escaped newlines, or anything else tricky.
- std::vector<unsigned> LineOffsets;
-
- // Line #1 starts at char 0.
- LineOffsets.push_back(0);
-
- const unsigned char *Buf = (const unsigned char *)Buffer->getBufferStart();
- const unsigned char *End = (const unsigned char *)Buffer->getBufferEnd();
- unsigned Offs = 0;
- while (1) {
- // Skip over the contents of the line.
- // TODO: Vectorize this? This is very performance sensitive for programs
- // with lots of diagnostics and in -E mode.
- const unsigned char *NextBuf = (const unsigned char *)Buf;
- while (*NextBuf != '\n' && *NextBuf != '\r' && *NextBuf != '\0')
- ++NextBuf;
- Offs += NextBuf-Buf;
- Buf = NextBuf;
-
- if (Buf[0] == '\n' || Buf[0] == '\r') {
- // If this is \n\r or \r\n, skip both characters.
- if ((Buf[1] == '\n' || Buf[1] == '\r') && Buf[0] != Buf[1])
- ++Offs, ++Buf;
- ++Offs, ++Buf;
- LineOffsets.push_back(Offs);
- } else {
- // Otherwise, this is a null. If end of file, exit.
- if (Buf == End) break;
- // Otherwise, skip the null.
- ++Offs, ++Buf;
- }
- }
- LineOffsets.push_back(Offs);
-
- // Copy the offsets into the FileInfo structure.
- FileInfo->NumLines = LineOffsets.size();
- FileInfo->SourceLineCache = new unsigned[LineOffsets.size()];
- std::copy(LineOffsets.begin(), LineOffsets.end(),
- FileInfo->SourceLineCache);
- }
- // Okay, we know we have a line number table. Do a binary search to find the
- // line number that this character position lands on.
- unsigned NumLines = FileInfo->NumLines;
- unsigned *SourceLineCache = FileInfo->SourceLineCache;
-
- // TODO: If this is performance sensitive, we could try doing simple radix
- // type approaches to make good (tight?) initial guesses based on the
- // assumption that all lines are the same average size.
- unsigned *Pos = std::lower_bound(SourceLineCache, SourceLineCache+NumLines,
- getFilePos(Loc)+1);
- return Pos-SourceLineCache;
- }
- /// getSourceFilePos - This method returns the *logical* offset from the start
- /// of the file that the specified SourceLocation represents. This returns
- /// the location of the *logical* character data, not the physical file
- /// position. In the case of macros, for example, this returns where the
- /// macro was instantiated, not where the characters for the macro can be
- /// found.
- unsigned SourceManager::getSourceFilePos(SourceLocation Loc) const {
-
- // If this is a macro, we need to get the instantiation location.
- const SrcMgr::FileIDInfo *FIDInfo = getFIDInfo(Loc.getFileID());
- while (FIDInfo->IDType == SrcMgr::FileIDInfo::MacroExpansion) {
- Loc = FIDInfo->IncludeLoc;
- FIDInfo = getFIDInfo(Loc.getFileID());
- }
-
- return getFilePos(Loc);
- }
- /// PrintStats - Print statistics to stderr.
- ///
- void SourceManager::PrintStats() const {
- std::cerr << "\n*** Source Manager Stats:\n";
- std::cerr << FileInfos.size() << " files mapped, " << MemBufferInfos.size()
- << " mem buffers mapped, " << FileIDs.size()
- << " file ID's allocated.\n";
- unsigned NumBuffers = 0, NumMacros = 0;
- for (unsigned i = 0, e = FileIDs.size(); i != e; ++i) {
- if (FileIDs[i].IDType == FileIDInfo::NormalBuffer)
- ++NumBuffers;
- else if (FileIDs[i].IDType == FileIDInfo::MacroExpansion)
- ++NumMacros;
- else
- assert(0 && "Unknown FileID!");
- }
- std::cerr << " " << NumBuffers << " normal buffer FileID's, "
- << NumMacros << " macro expansion FileID's.\n";
-
-
-
- unsigned NumLineNumsComputed = 0;
- unsigned NumFileBytesMapped = 0;
- for (std::map<const FileEntry *, FileInfo>::const_iterator I =
- FileInfos.begin(), E = FileInfos.end(); I != E; ++I) {
- NumLineNumsComputed += I->second.SourceLineCache != 0;
- NumFileBytesMapped += I->second.Buffer->getBufferSize();
- }
- std::cerr << NumFileBytesMapped << " bytes of files mapped, "
- << NumLineNumsComputed << " files with line #'s computed.\n";
- }
|