2019-03-05 21:45:17 +01:00
|
|
|
//===- RemarkParser.cpp --------------------------------------------------===//
|
2018-10-10 20:43:42 +02:00
|
|
|
//
|
2019-01-19 11:56:40 +01:00
|
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
2018-10-10 20:43:42 +02:00
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
//
|
|
|
|
// This file provides utility methods used by clients that want to use the
|
2019-03-05 21:45:17 +01:00
|
|
|
// parser for remark diagnostics in LLVM.
|
2018-10-10 20:43:42 +02:00
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
2019-03-19 22:11:07 +01:00
|
|
|
#include "llvm/Remarks/RemarkParser.h"
|
|
|
|
#include "YAMLRemarkParser.h"
|
2019-03-05 21:45:17 +01:00
|
|
|
#include "llvm-c/Remarks.h"
|
2018-10-10 20:43:42 +02:00
|
|
|
#include "llvm/ADT/STLExtras.h"
|
2019-03-19 22:11:07 +01:00
|
|
|
#include "llvm/Support/CBindingWrapping.h"
|
2018-10-10 20:43:42 +02:00
|
|
|
|
|
|
|
using namespace llvm;
|
2019-03-19 22:11:07 +01:00
|
|
|
using namespace llvm::remarks;
|
2018-10-10 20:43:42 +02:00
|
|
|
|
2019-07-16 17:24:59 +02:00
|
|
|
static std::unique_ptr<ParserImpl> formatToParserImpl(Format ParserFormat,
|
2019-07-04 02:31:03 +02:00
|
|
|
StringRef Buf) {
|
2019-07-16 17:24:59 +02:00
|
|
|
switch (ParserFormat) {
|
|
|
|
case Format::YAML:
|
2019-07-04 02:31:03 +02:00
|
|
|
return llvm::make_unique<YAMLParserImpl>(Buf);
|
2019-07-16 17:24:59 +02:00
|
|
|
case Format::Unknown:
|
|
|
|
llvm_unreachable("Unhandled llvm::remarks::ParserFormat enum");
|
|
|
|
return nullptr;
|
2019-07-04 02:31:03 +02:00
|
|
|
};
|
|
|
|
}
|
|
|
|
|
|
|
|
static std::unique_ptr<ParserImpl>
|
2019-07-16 17:24:59 +02:00
|
|
|
formatToParserImpl(Format ParserFormat, StringRef Buf,
|
2019-07-04 02:31:03 +02:00
|
|
|
const ParsedStringTable &StrTab) {
|
2019-07-16 17:24:59 +02:00
|
|
|
switch (ParserFormat) {
|
|
|
|
case Format::YAML:
|
2019-07-04 02:31:03 +02:00
|
|
|
return llvm::make_unique<YAMLParserImpl>(Buf, &StrTab);
|
2019-07-16 17:24:59 +02:00
|
|
|
case Format::Unknown:
|
|
|
|
llvm_unreachable("Unhandled llvm::remarks::ParserFormat enum");
|
|
|
|
return nullptr;
|
2019-07-04 02:31:03 +02:00
|
|
|
};
|
|
|
|
}
|
|
|
|
|
2019-07-16 17:24:59 +02:00
|
|
|
Parser::Parser(Format ParserFormat, StringRef Buf)
|
|
|
|
: Impl(formatToParserImpl(ParserFormat, Buf)) {}
|
2018-10-10 20:43:42 +02:00
|
|
|
|
2019-07-16 17:24:59 +02:00
|
|
|
Parser::Parser(Format ParserFormat, StringRef Buf,
|
2019-07-04 02:31:03 +02:00
|
|
|
const ParsedStringTable &StrTab)
|
2019-07-16 17:24:59 +02:00
|
|
|
: Impl(formatToParserImpl(ParserFormat, Buf, StrTab)) {}
|
[Remarks] Add string deduplication using a string table
* Add support for uniquing strings in the remark streamer and emitting the string table in the remarks section.
* Add parsing support for the string table in the RemarkParser.
From this remark:
```
--- !Missed
Pass: inline
Name: NoDefinition
DebugLoc: { File: 'test-suite/SingleSource/UnitTests/2002-04-17-PrintfChar.c',
Line: 7, Column: 3 }
Function: printArgsNoRet
Args:
- Callee: printf
- String: ' will not be inlined into '
- Caller: printArgsNoRet
DebugLoc: { File: 'test-suite/SingleSource/UnitTests/2002-04-17-PrintfChar.c',
Line: 6, Column: 0 }
- String: ' because its definition is unavailable'
...
```
to:
```
--- !Missed
Pass: 0
Name: 1
DebugLoc: { File: 3, Line: 7, Column: 3 }
Function: 2
Args:
- Callee: 4
- String: 5
- Caller: 2
DebugLoc: { File: 3, Line: 6, Column: 0 }
- String: 6
...
```
And the string table in the .remarks/__remarks section containing:
```
inline\0NoDefinition\0printArgsNoRet\0
test-suite/SingleSource/UnitTests/2002-04-17-PrintfChar.c\0printf\0
will not be inlined into \0 because its definition is unavailable\0
```
This is mostly supposed to be used for testing purposes, but it gives us
a 2x reduction in the remark size, and is an incremental change for the
updates to the remarks file format.
Differential Revision: https://reviews.llvm.org/D60227
llvm-svn: 359050
2019-04-24 02:06:24 +02:00
|
|
|
|
2019-03-19 22:11:07 +01:00
|
|
|
Parser::~Parser() = default;
|
2018-10-10 20:43:42 +02:00
|
|
|
|
2019-03-19 22:11:07 +01:00
|
|
|
static Expected<const Remark *> getNextYAML(YAMLParserImpl &Impl) {
|
|
|
|
YAMLRemarkParser &YAMLParser = Impl.YAMLParser;
|
|
|
|
// Check for EOF.
|
|
|
|
if (Impl.YAMLIt == Impl.YAMLParser.Stream.end())
|
|
|
|
return nullptr;
|
2019-03-19 19:21:43 +01:00
|
|
|
|
2019-03-19 22:11:07 +01:00
|
|
|
auto CurrentIt = Impl.YAMLIt;
|
2019-03-19 19:21:43 +01:00
|
|
|
|
2019-03-19 22:11:07 +01:00
|
|
|
// Try to parse an entry.
|
|
|
|
if (Error E = YAMLParser.parseYAMLElement(*CurrentIt)) {
|
|
|
|
// Set the iterator to the end, in case the user calls getNext again.
|
|
|
|
Impl.YAMLIt = Impl.YAMLParser.Stream.end();
|
|
|
|
return std::move(E);
|
2019-03-19 19:21:43 +01:00
|
|
|
}
|
|
|
|
|
2019-03-19 22:11:07 +01:00
|
|
|
// Move on.
|
|
|
|
++Impl.YAMLIt;
|
2019-03-19 19:21:43 +01:00
|
|
|
|
2019-03-19 22:11:07 +01:00
|
|
|
// Return the just-parsed remark.
|
|
|
|
if (const Optional<YAMLRemarkParser::ParseState> &State = YAMLParser.State)
|
|
|
|
return &State->TheRemark;
|
|
|
|
else
|
|
|
|
return createStringError(std::make_error_code(std::errc::invalid_argument),
|
|
|
|
"unexpected error while parsing.");
|
2019-03-19 19:21:43 +01:00
|
|
|
}
|
|
|
|
|
2019-03-19 22:11:07 +01:00
|
|
|
Expected<const Remark *> Parser::getNext() const {
|
|
|
|
if (auto *Impl = dyn_cast<YAMLParserImpl>(this->Impl.get()))
|
|
|
|
return getNextYAML(*Impl);
|
|
|
|
llvm_unreachable("Get next called with an unknown parsing implementation.");
|
2018-10-10 20:43:42 +02:00
|
|
|
}
|
2019-03-19 19:21:43 +01:00
|
|
|
|
[Remarks] Add string deduplication using a string table
* Add support for uniquing strings in the remark streamer and emitting the string table in the remarks section.
* Add parsing support for the string table in the RemarkParser.
From this remark:
```
--- !Missed
Pass: inline
Name: NoDefinition
DebugLoc: { File: 'test-suite/SingleSource/UnitTests/2002-04-17-PrintfChar.c',
Line: 7, Column: 3 }
Function: printArgsNoRet
Args:
- Callee: printf
- String: ' will not be inlined into '
- Caller: printArgsNoRet
DebugLoc: { File: 'test-suite/SingleSource/UnitTests/2002-04-17-PrintfChar.c',
Line: 6, Column: 0 }
- String: ' because its definition is unavailable'
...
```
to:
```
--- !Missed
Pass: 0
Name: 1
DebugLoc: { File: 3, Line: 7, Column: 3 }
Function: 2
Args:
- Callee: 4
- String: 5
- Caller: 2
DebugLoc: { File: 3, Line: 6, Column: 0 }
- String: 6
...
```
And the string table in the .remarks/__remarks section containing:
```
inline\0NoDefinition\0printArgsNoRet\0
test-suite/SingleSource/UnitTests/2002-04-17-PrintfChar.c\0printf\0
will not be inlined into \0 because its definition is unavailable\0
```
This is mostly supposed to be used for testing purposes, but it gives us
a 2x reduction in the remark size, and is an incremental change for the
updates to the remarks file format.
Differential Revision: https://reviews.llvm.org/D60227
llvm-svn: 359050
2019-04-24 02:06:24 +02:00
|
|
|
ParsedStringTable::ParsedStringTable(StringRef InBuffer) : Buffer(InBuffer) {
|
|
|
|
while (!InBuffer.empty()) {
|
|
|
|
// Strings are separated by '\0' bytes.
|
|
|
|
std::pair<StringRef, StringRef> Split = InBuffer.split('\0');
|
|
|
|
// We only store the offset from the beginning of the buffer.
|
|
|
|
Offsets.push_back(Split.first.data() - Buffer.data());
|
|
|
|
InBuffer = Split.second;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-07-04 02:30:58 +02:00
|
|
|
Expected<StringRef> ParsedStringTable::operator[](size_t Index) const {
|
[Remarks] Add string deduplication using a string table
* Add support for uniquing strings in the remark streamer and emitting the string table in the remarks section.
* Add parsing support for the string table in the RemarkParser.
From this remark:
```
--- !Missed
Pass: inline
Name: NoDefinition
DebugLoc: { File: 'test-suite/SingleSource/UnitTests/2002-04-17-PrintfChar.c',
Line: 7, Column: 3 }
Function: printArgsNoRet
Args:
- Callee: printf
- String: ' will not be inlined into '
- Caller: printArgsNoRet
DebugLoc: { File: 'test-suite/SingleSource/UnitTests/2002-04-17-PrintfChar.c',
Line: 6, Column: 0 }
- String: ' because its definition is unavailable'
...
```
to:
```
--- !Missed
Pass: 0
Name: 1
DebugLoc: { File: 3, Line: 7, Column: 3 }
Function: 2
Args:
- Callee: 4
- String: 5
- Caller: 2
DebugLoc: { File: 3, Line: 6, Column: 0 }
- String: 6
...
```
And the string table in the .remarks/__remarks section containing:
```
inline\0NoDefinition\0printArgsNoRet\0
test-suite/SingleSource/UnitTests/2002-04-17-PrintfChar.c\0printf\0
will not be inlined into \0 because its definition is unavailable\0
```
This is mostly supposed to be used for testing purposes, but it gives us
a 2x reduction in the remark size, and is an incremental change for the
updates to the remarks file format.
Differential Revision: https://reviews.llvm.org/D60227
llvm-svn: 359050
2019-04-24 02:06:24 +02:00
|
|
|
if (Index >= Offsets.size())
|
|
|
|
return createStringError(
|
|
|
|
std::make_error_code(std::errc::invalid_argument),
|
|
|
|
"String with index %u is out of bounds (size = %u).", Index,
|
|
|
|
Offsets.size());
|
|
|
|
|
|
|
|
size_t Offset = Offsets[Index];
|
|
|
|
// If it's the last offset, we can't use the next offset to know the size of
|
|
|
|
// the string.
|
|
|
|
size_t NextOffset =
|
|
|
|
(Index == Offsets.size() - 1) ? Buffer.size() : Offsets[Index + 1];
|
|
|
|
return StringRef(Buffer.data() + Offset, NextOffset - Offset - 1);
|
|
|
|
}
|
|
|
|
|
2019-03-19 19:21:43 +01:00
|
|
|
// Create wrappers for C Binding types (see CBindingWrapping.h).
|
2019-03-19 22:11:07 +01:00
|
|
|
DEFINE_SIMPLE_CONVERSION_FUNCTIONS(remarks::Parser, LLVMRemarkParserRef)
|
2018-10-10 20:43:42 +02:00
|
|
|
|
2019-03-19 22:11:07 +01:00
|
|
|
extern "C" LLVMRemarkParserRef LLVMRemarkParserCreateYAML(const void *Buf,
|
|
|
|
uint64_t Size) {
|
2019-07-16 17:24:59 +02:00
|
|
|
return wrap(new remarks::Parser(
|
|
|
|
remarks::Format::YAML, StringRef(static_cast<const char *>(Buf), Size)));
|
2019-03-19 19:09:51 +01:00
|
|
|
}
|
2018-10-10 20:43:42 +02:00
|
|
|
|
2019-03-19 22:11:07 +01:00
|
|
|
static void handleYAMLError(remarks::YAMLParserImpl &Impl, Error E) {
|
|
|
|
handleAllErrors(
|
|
|
|
std::move(E),
|
|
|
|
[&](const YAMLParseError &PE) {
|
|
|
|
Impl.YAMLParser.Stream.printError(&PE.getNode(),
|
|
|
|
Twine(PE.getMessage()) + Twine('\n'));
|
|
|
|
},
|
|
|
|
[&](const ErrorInfoBase &EIB) { EIB.log(Impl.YAMLParser.ErrorStream); });
|
|
|
|
Impl.HasErrors = true;
|
|
|
|
}
|
2018-10-10 20:43:42 +02:00
|
|
|
|
2019-03-19 22:11:07 +01:00
|
|
|
extern "C" LLVMRemarkEntryRef
|
|
|
|
LLVMRemarkParserGetNext(LLVMRemarkParserRef Parser) {
|
|
|
|
remarks::Parser &TheParser = *unwrap(Parser);
|
|
|
|
|
|
|
|
Expected<const remarks::Remark *> RemarkOrErr = TheParser.getNext();
|
|
|
|
if (!RemarkOrErr) {
|
|
|
|
// Error during parsing.
|
|
|
|
if (auto *Impl = dyn_cast<remarks::YAMLParserImpl>(TheParser.Impl.get()))
|
|
|
|
handleYAMLError(*Impl, RemarkOrErr.takeError());
|
|
|
|
else
|
|
|
|
llvm_unreachable("unkown parser implementation.");
|
2019-03-19 19:09:51 +01:00
|
|
|
return nullptr;
|
2019-03-19 19:21:43 +01:00
|
|
|
}
|
|
|
|
|
2019-03-19 22:11:07 +01:00
|
|
|
if (*RemarkOrErr == nullptr)
|
|
|
|
return nullptr;
|
|
|
|
// Valid remark.
|
|
|
|
return wrap(*RemarkOrErr);
|
2018-10-10 20:43:42 +02:00
|
|
|
}
|
|
|
|
|
2019-03-05 21:45:17 +01:00
|
|
|
extern "C" LLVMBool LLVMRemarkParserHasError(LLVMRemarkParserRef Parser) {
|
2019-03-19 22:11:07 +01:00
|
|
|
if (auto *Impl =
|
|
|
|
dyn_cast<remarks::YAMLParserImpl>(unwrap(Parser)->Impl.get()))
|
|
|
|
return Impl->HasErrors;
|
|
|
|
llvm_unreachable("unkown parser implementation.");
|
2018-10-10 20:43:42 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
extern "C" const char *
|
2019-03-05 21:45:17 +01:00
|
|
|
LLVMRemarkParserGetErrorMessage(LLVMRemarkParserRef Parser) {
|
2019-03-19 22:11:07 +01:00
|
|
|
if (auto *Impl =
|
|
|
|
dyn_cast<remarks::YAMLParserImpl>(unwrap(Parser)->Impl.get()))
|
|
|
|
return Impl->YAMLParser.ErrorStream.str().c_str();
|
|
|
|
llvm_unreachable("unkown parser implementation.");
|
2018-10-10 20:43:42 +02:00
|
|
|
}
|
|
|
|
|
2019-03-05 21:45:17 +01:00
|
|
|
extern "C" void LLVMRemarkParserDispose(LLVMRemarkParserRef Parser) {
|
2018-10-10 20:43:42 +02:00
|
|
|
delete unwrap(Parser);
|
|
|
|
}
|