2020-11-16 15:44:35 +01:00
|
|
|
//===-- yaml-parser-fuzzer.cpp - Fuzzer for YAML parser -------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
#include "llvm/ADT/StringRef.h"
|
|
|
|
#include "llvm/Support/YAMLParser.h"
|
|
|
|
|
|
|
|
using namespace llvm;
|
|
|
|
|
|
|
|
static bool isValidYaml(const uint8_t *Data, size_t Size) {
|
|
|
|
SourceMgr SM;
|
|
|
|
yaml::Stream Stream(StringRef(reinterpret_cast<const char *>(Data), Size),
|
|
|
|
SM);
|
|
|
|
return Stream.validate();
|
|
|
|
}
|
|
|
|
|
|
|
|
extern "C" int LLVMFuzzerTestOneInput(const uint8_t *Data, size_t Size) {
|
|
|
|
std::vector<uint8_t> Input(Data, Data + Size);
|
|
|
|
|
2020-11-16 20:05:06 +01:00
|
|
|
// Ensure we don't crash on any arbitrary byte string.
|
|
|
|
isValidYaml(Input.data(), Input.size());
|
|
|
|
|
|
|
|
// Ensure we don't crash on byte strings with no null characters.
|
2021-01-02 18:24:15 +01:00
|
|
|
llvm::erase_value(Input, 0);
|
2020-11-16 20:05:06 +01:00
|
|
|
Input.shrink_to_fit();
|
|
|
|
bool IsValidWithout0s = isValidYaml(Input.data(), Input.size());
|
|
|
|
|
2020-11-16 15:44:35 +01:00
|
|
|
// Ensure we don't crash on byte strings where the only null character is
|
|
|
|
// one-past-the-end of the actual input to the parser.
|
|
|
|
Input.push_back(0);
|
|
|
|
Input.shrink_to_fit();
|
2020-11-16 20:05:06 +01:00
|
|
|
bool IsValidWhen0Terminated = isValidYaml(Input.data(), Input.size() - 1);
|
|
|
|
|
|
|
|
// Ensure we don't crash on byte strings with no null characters, but with
|
|
|
|
// an invalid character one-past-the-end of the actual input to the parser.
|
|
|
|
Input.back() = 1;
|
|
|
|
bool IsValidWhen1Terminated = isValidYaml(Input.data(), Input.size() - 1);
|
|
|
|
|
|
|
|
// The parser should either accept all of these inputs, or reject all of
|
|
|
|
// them, because the parser sees an identical byte string in each case. This
|
|
|
|
// should hopefully catch some cases where the parser is sensitive to what is
|
|
|
|
// present one-past-the-end of the actual input.
|
|
|
|
if (IsValidWithout0s != IsValidWhen0Terminated ||
|
|
|
|
IsValidWhen0Terminated != IsValidWhen1Terminated)
|
|
|
|
LLVM_BUILTIN_TRAP;
|
2020-11-16 15:44:35 +01:00
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|