mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-23 11:13:28 +01:00
cded1d3751
Summary: The LLVM SourceMgr class (which is used indirectly by Swift, though not Clang) has a routine for looking up line numbers of SMLocs. This routine uses a shared, special-purpose cache that handles exactly one access pattern efficiently: looking up the line number of an SMLoc that points into the same buffer as the last query made to the SourceMgr, at a location in the buffer at or ahead of the last query. When this works it's fine, but when it fails it's catastrophic for performancer: one recent out-of-order access from a Swift utility routine ran for tens of seconds, spending 99% of its time repeatedly scanning buffers for '\n'. This change removes the shared cache from the SourceMgr and installs a new cache in each SrcBuffer. The per-SrcBuffer caches are also "full", in the sense that rather than caching a single last-query pointer, they cache _all_ the line-ending offsets, in a binary-searchable array, such that once it's populated (on first access), all subsequent access patterns run at the same speed. Performance measurements I've done show this is actually a little bit faster on real codebases (though only a couple fractions of a percent). Memory usage is up by a few tens to hundreds of bytes per SrcBuffer that has a line lookup done on it; I've attempted to minimize this by using dynamic selection of integer sized when storing offset arrays. But the main motive here is to make-impossible the cases we don't always see, that show up by surprise when there is an out-of-order access pattern. Reviewers: jordan_rose Reviewed By: jordan_rose Subscribers: probinson, llvm-commits Differential Revision: https://reviews.llvm.org/D45003 llvm-svn: 329470
310 lines
11 KiB
C++
310 lines
11 KiB
C++
//===- SourceMgr.h - Manager for Source Buffers & Diagnostics ---*- C++ -*-===//
|
|
//
|
|
// The LLVM Compiler Infrastructure
|
|
//
|
|
// This file is distributed under the University of Illinois Open Source
|
|
// License. See LICENSE.TXT for details.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This file declares the SMDiagnostic and SourceMgr classes. This
|
|
// provides a simple substrate for diagnostics, #include handling, and other low
|
|
// level things for simple parsers.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#ifndef LLVM_SUPPORT_SOURCEMGR_H
|
|
#define LLVM_SUPPORT_SOURCEMGR_H
|
|
|
|
#include "llvm/ADT/ArrayRef.h"
|
|
#include "llvm/ADT/None.h"
|
|
#include "llvm/ADT/PointerUnion.h"
|
|
#include "llvm/ADT/SmallVector.h"
|
|
#include "llvm/ADT/StringRef.h"
|
|
#include "llvm/ADT/Twine.h"
|
|
#include "llvm/Support/MemoryBuffer.h"
|
|
#include "llvm/Support/SMLoc.h"
|
|
#include <algorithm>
|
|
#include <cassert>
|
|
#include <memory>
|
|
#include <string>
|
|
#include <utility>
|
|
#include <vector>
|
|
|
|
namespace llvm {
|
|
|
|
class raw_ostream;
|
|
class SMDiagnostic;
|
|
class SMFixIt;
|
|
|
|
/// This owns the files read by a parser, handles include stacks,
|
|
/// and handles diagnostic wrangling.
|
|
class SourceMgr {
|
|
public:
|
|
enum DiagKind {
|
|
DK_Error,
|
|
DK_Warning,
|
|
DK_Remark,
|
|
DK_Note,
|
|
};
|
|
|
|
/// Clients that want to handle their own diagnostics in a custom way can
|
|
/// register a function pointer+context as a diagnostic handler.
|
|
/// It gets called each time PrintMessage is invoked.
|
|
using DiagHandlerTy = void (*)(const SMDiagnostic &, void *Context);
|
|
|
|
private:
|
|
struct SrcBuffer {
|
|
/// The memory buffer for the file.
|
|
std::unique_ptr<MemoryBuffer> Buffer;
|
|
|
|
/// Helper type for OffsetCache below: since we're storing many offsets
|
|
/// into relatively small files (often smaller than 2^8 or 2^16 bytes),
|
|
/// we select the offset vector element type dynamically based on the
|
|
/// size of Buffer.
|
|
using VariableSizeOffsets = PointerUnion4<std::vector<uint8_t> *,
|
|
std::vector<uint16_t> *,
|
|
std::vector<uint32_t> *,
|
|
std::vector<uint64_t> *>;
|
|
|
|
/// Vector of offsets into Buffer at which there are line-endings
|
|
/// (lazily populated). Once populated, the '\n' that marks the end of
|
|
/// line number N from [1..] is at Buffer[OffsetCache[N-1]]. Since
|
|
/// these offsets are in sorted (ascending) order, they can be
|
|
/// binary-searched for the first one after any given offset (eg. an
|
|
/// offset corresponding to a particular SMLoc).
|
|
mutable VariableSizeOffsets OffsetCache;
|
|
|
|
/// Populate \c OffsetCache and look up a given \p Ptr in it, assuming
|
|
/// it points somewhere into \c Buffer. The static type parameter \p T
|
|
/// must be an unsigned integer type from uint{8,16,32,64}_t large
|
|
/// enough to store offsets inside \c Buffer.
|
|
template<typename T>
|
|
unsigned getLineNumber(const char *Ptr) const;
|
|
|
|
/// This is the location of the parent include, or null if at the top level.
|
|
SMLoc IncludeLoc;
|
|
|
|
SrcBuffer() = default;
|
|
SrcBuffer(SrcBuffer &&);
|
|
SrcBuffer(const SrcBuffer &) = delete;
|
|
SrcBuffer &operator=(const SrcBuffer &) = delete;
|
|
~SrcBuffer();
|
|
};
|
|
|
|
/// This is all of the buffers that we are reading from.
|
|
std::vector<SrcBuffer> Buffers;
|
|
|
|
// This is the list of directories we should search for include files in.
|
|
std::vector<std::string> IncludeDirectories;
|
|
|
|
DiagHandlerTy DiagHandler = nullptr;
|
|
void *DiagContext = nullptr;
|
|
|
|
bool isValidBufferID(unsigned i) const { return i && i <= Buffers.size(); }
|
|
|
|
public:
|
|
SourceMgr() = default;
|
|
SourceMgr(const SourceMgr &) = delete;
|
|
SourceMgr &operator=(const SourceMgr &) = delete;
|
|
~SourceMgr() = default;
|
|
|
|
void setIncludeDirs(const std::vector<std::string> &Dirs) {
|
|
IncludeDirectories = Dirs;
|
|
}
|
|
|
|
/// Specify a diagnostic handler to be invoked every time PrintMessage is
|
|
/// called. \p Ctx is passed into the handler when it is invoked.
|
|
void setDiagHandler(DiagHandlerTy DH, void *Ctx = nullptr) {
|
|
DiagHandler = DH;
|
|
DiagContext = Ctx;
|
|
}
|
|
|
|
DiagHandlerTy getDiagHandler() const { return DiagHandler; }
|
|
void *getDiagContext() const { return DiagContext; }
|
|
|
|
const SrcBuffer &getBufferInfo(unsigned i) const {
|
|
assert(isValidBufferID(i));
|
|
return Buffers[i - 1];
|
|
}
|
|
|
|
const MemoryBuffer *getMemoryBuffer(unsigned i) const {
|
|
assert(isValidBufferID(i));
|
|
return Buffers[i - 1].Buffer.get();
|
|
}
|
|
|
|
unsigned getNumBuffers() const {
|
|
return Buffers.size();
|
|
}
|
|
|
|
unsigned getMainFileID() const {
|
|
assert(getNumBuffers());
|
|
return 1;
|
|
}
|
|
|
|
SMLoc getParentIncludeLoc(unsigned i) const {
|
|
assert(isValidBufferID(i));
|
|
return Buffers[i - 1].IncludeLoc;
|
|
}
|
|
|
|
/// Add a new source buffer to this source manager. This takes ownership of
|
|
/// the memory buffer.
|
|
unsigned AddNewSourceBuffer(std::unique_ptr<MemoryBuffer> F,
|
|
SMLoc IncludeLoc) {
|
|
SrcBuffer NB;
|
|
NB.Buffer = std::move(F);
|
|
NB.IncludeLoc = IncludeLoc;
|
|
Buffers.push_back(std::move(NB));
|
|
return Buffers.size();
|
|
}
|
|
|
|
/// Search for a file with the specified name in the current directory or in
|
|
/// one of the IncludeDirs.
|
|
///
|
|
/// If no file is found, this returns 0, otherwise it returns the buffer ID
|
|
/// of the stacked file. The full path to the included file can be found in
|
|
/// \p IncludedFile.
|
|
unsigned AddIncludeFile(const std::string &Filename, SMLoc IncludeLoc,
|
|
std::string &IncludedFile);
|
|
|
|
/// Return the ID of the buffer containing the specified location.
|
|
///
|
|
/// 0 is returned if the buffer is not found.
|
|
unsigned FindBufferContainingLoc(SMLoc Loc) const;
|
|
|
|
/// Find the line number for the specified location in the specified file.
|
|
/// This is not a fast method.
|
|
unsigned FindLineNumber(SMLoc Loc, unsigned BufferID = 0) const {
|
|
return getLineAndColumn(Loc, BufferID).first;
|
|
}
|
|
|
|
/// Find the line and column number for the specified location in the
|
|
/// specified file. This is not a fast method.
|
|
std::pair<unsigned, unsigned> getLineAndColumn(SMLoc Loc,
|
|
unsigned BufferID = 0) const;
|
|
|
|
/// Emit a message about the specified location with the specified string.
|
|
///
|
|
/// \param ShowColors Display colored messages if output is a terminal and
|
|
/// the default error handler is used.
|
|
void PrintMessage(raw_ostream &OS, SMLoc Loc, DiagKind Kind,
|
|
const Twine &Msg,
|
|
ArrayRef<SMRange> Ranges = None,
|
|
ArrayRef<SMFixIt> FixIts = None,
|
|
bool ShowColors = true) const;
|
|
|
|
/// Emits a diagnostic to llvm::errs().
|
|
void PrintMessage(SMLoc Loc, DiagKind Kind, const Twine &Msg,
|
|
ArrayRef<SMRange> Ranges = None,
|
|
ArrayRef<SMFixIt> FixIts = None,
|
|
bool ShowColors = true) const;
|
|
|
|
/// Emits a manually-constructed diagnostic to the given output stream.
|
|
///
|
|
/// \param ShowColors Display colored messages if output is a terminal and
|
|
/// the default error handler is used.
|
|
void PrintMessage(raw_ostream &OS, const SMDiagnostic &Diagnostic,
|
|
bool ShowColors = true) const;
|
|
|
|
/// Return an SMDiagnostic at the specified location with the specified
|
|
/// string.
|
|
///
|
|
/// \param Msg If non-null, the kind of message (e.g., "error") which is
|
|
/// prefixed to the message.
|
|
SMDiagnostic GetMessage(SMLoc Loc, DiagKind Kind, const Twine &Msg,
|
|
ArrayRef<SMRange> Ranges = None,
|
|
ArrayRef<SMFixIt> FixIts = None) const;
|
|
|
|
/// Prints the names of included files and the line of the file they were
|
|
/// included from. A diagnostic handler can use this before printing its
|
|
/// custom formatted message.
|
|
///
|
|
/// \param IncludeLoc The location of the include.
|
|
/// \param OS the raw_ostream to print on.
|
|
void PrintIncludeStack(SMLoc IncludeLoc, raw_ostream &OS) const;
|
|
};
|
|
|
|
/// Represents a single fixit, a replacement of one range of text with another.
|
|
class SMFixIt {
|
|
SMRange Range;
|
|
|
|
std::string Text;
|
|
|
|
public:
|
|
// FIXME: Twine.str() is not very efficient.
|
|
SMFixIt(SMLoc Loc, const Twine &Insertion)
|
|
: Range(Loc, Loc), Text(Insertion.str()) {
|
|
assert(Loc.isValid());
|
|
}
|
|
|
|
// FIXME: Twine.str() is not very efficient.
|
|
SMFixIt(SMRange R, const Twine &Replacement)
|
|
: Range(R), Text(Replacement.str()) {
|
|
assert(R.isValid());
|
|
}
|
|
|
|
StringRef getText() const { return Text; }
|
|
SMRange getRange() const { return Range; }
|
|
|
|
bool operator<(const SMFixIt &Other) const {
|
|
if (Range.Start.getPointer() != Other.Range.Start.getPointer())
|
|
return Range.Start.getPointer() < Other.Range.Start.getPointer();
|
|
if (Range.End.getPointer() != Other.Range.End.getPointer())
|
|
return Range.End.getPointer() < Other.Range.End.getPointer();
|
|
return Text < Other.Text;
|
|
}
|
|
};
|
|
|
|
/// Instances of this class encapsulate one diagnostic report, allowing
|
|
/// printing to a raw_ostream as a caret diagnostic.
|
|
class SMDiagnostic {
|
|
const SourceMgr *SM = nullptr;
|
|
SMLoc Loc;
|
|
std::string Filename;
|
|
int LineNo = 0;
|
|
int ColumnNo = 0;
|
|
SourceMgr::DiagKind Kind = SourceMgr::DK_Error;
|
|
std::string Message, LineContents;
|
|
std::vector<std::pair<unsigned, unsigned>> Ranges;
|
|
SmallVector<SMFixIt, 4> FixIts;
|
|
|
|
public:
|
|
// Null diagnostic.
|
|
SMDiagnostic() = default;
|
|
// Diagnostic with no location (e.g. file not found, command line arg error).
|
|
SMDiagnostic(StringRef filename, SourceMgr::DiagKind Knd, StringRef Msg)
|
|
: Filename(filename), LineNo(-1), ColumnNo(-1), Kind(Knd), Message(Msg) {}
|
|
|
|
// Diagnostic with a location.
|
|
SMDiagnostic(const SourceMgr &sm, SMLoc L, StringRef FN,
|
|
int Line, int Col, SourceMgr::DiagKind Kind,
|
|
StringRef Msg, StringRef LineStr,
|
|
ArrayRef<std::pair<unsigned,unsigned>> Ranges,
|
|
ArrayRef<SMFixIt> FixIts = None);
|
|
|
|
const SourceMgr *getSourceMgr() const { return SM; }
|
|
SMLoc getLoc() const { return Loc; }
|
|
StringRef getFilename() const { return Filename; }
|
|
int getLineNo() const { return LineNo; }
|
|
int getColumnNo() const { return ColumnNo; }
|
|
SourceMgr::DiagKind getKind() const { return Kind; }
|
|
StringRef getMessage() const { return Message; }
|
|
StringRef getLineContents() const { return LineContents; }
|
|
ArrayRef<std::pair<unsigned, unsigned>> getRanges() const { return Ranges; }
|
|
|
|
void addFixIt(const SMFixIt &Hint) {
|
|
FixIts.push_back(Hint);
|
|
}
|
|
|
|
ArrayRef<SMFixIt> getFixIts() const {
|
|
return FixIts;
|
|
}
|
|
|
|
void print(const char *ProgName, raw_ostream &S, bool ShowColors = true,
|
|
bool ShowKindLabel = true) const;
|
|
};
|
|
|
|
} // end namespace llvm
|
|
|
|
#endif // LLVM_SUPPORT_SOURCEMGR_H
|