2018-10-12 00:33:50 +02:00
|
|
|
//===- CopyConfig.h -------------------------------------------------------===//
|
|
|
|
//
|
2019-01-19 09:50:56 +01:00
|
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
2018-10-12 00:33:50 +02:00
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
#ifndef LLVM_TOOLS_LLVM_OBJCOPY_COPY_CONFIG_H
|
|
|
|
#define LLVM_TOOLS_LLVM_OBJCOPY_COPY_CONFIG_H
|
|
|
|
|
[llvm-objcopy] Refactor ELF-specific config out to ELFCopyConfig. NFC.
Summary:
This patch splits the command-line parsing into two phases:
First, parse cross-platform options and leave ELF-specific options unparsed.
Second, in the ELF implementation, parse ELF-specific options and construct ELFCopyConfig.
Reviewers: espindola, alexshap, rupprecht, jhenderson, jakehehrlich, MaskRay
Reviewed By: alexshap, jhenderson, jakehehrlich, MaskRay
Subscribers: mgorny, emaste, arichardson, jakehehrlich, MaskRay, abrachet, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D67139
llvm-svn: 372712
2019-09-24 11:38:23 +02:00
|
|
|
#include "ELF/ELFConfig.h"
|
2018-10-12 00:33:50 +02:00
|
|
|
#include "llvm/ADT/ArrayRef.h"
|
2019-03-28 19:27:00 +01:00
|
|
|
#include "llvm/ADT/BitmaskEnum.h"
|
2018-10-12 00:33:50 +02:00
|
|
|
#include "llvm/ADT/Optional.h"
|
|
|
|
#include "llvm/ADT/SmallVector.h"
|
|
|
|
#include "llvm/ADT/StringMap.h"
|
|
|
|
#include "llvm/ADT/StringRef.h"
|
2019-02-25 15:12:41 +01:00
|
|
|
#include "llvm/Object/ELFTypes.h"
|
2019-02-04 19:38:00 +01:00
|
|
|
#include "llvm/Support/Allocator.h"
|
2019-02-21 18:05:19 +01:00
|
|
|
#include "llvm/Support/Error.h"
|
2019-02-06 12:00:07 +01:00
|
|
|
#include "llvm/Support/Regex.h"
|
2018-10-12 00:33:50 +02:00
|
|
|
// Necessary for llvm::DebugCompressionType::None
|
|
|
|
#include "llvm/Target/TargetOptions.h"
|
|
|
|
#include <vector>
|
|
|
|
|
|
|
|
namespace llvm {
|
|
|
|
namespace objcopy {
|
|
|
|
|
2019-07-05 07:28:38 +02:00
|
|
|
// File formats that can be recorded in CopyConfig::InputFormat and
// CopyConfig::OutputFormat. Unspecified is the first enumerator and therefore
// the value produced by value-initialization.
enum class FileFormat {
  Unspecified,
  ELF,
  Binary,
  IHex,
};
|
|
|
|
|
2018-10-12 00:33:50 +02:00
|
|
|
// This type keeps track of the machine info for various architectures. This
|
|
|
|
// lets us map architecture names to ELF types and the e_machine value of the
|
|
|
|
// ELF file.
|
|
|
|
struct MachineInfo {
|
[llvm-objcopy] Support full list of bfd targets that lld uses.
Summary:
This change takes the full list of bfd targets that lld supports (see `ScriptParser.cpp`), including generic handling for `*-freebsd` targets (which uses the same settings but with a FreeBSD OSABI). In particular this adds mips support for `--output-target` (but not yet via `--binary-architecture`).
lld and llvm-objcopy use their own different custom data structures, so I'd prefer to check this in as-is (add support directly in llvm-objcopy, including all the test coverage) and do a separate NFC patch(s) that consolidate the two by putting this mapping into libobject.
See [[ https://bugs.llvm.org/show_bug.cgi?id=41462 | PR41462 ]].
Reviewers: jhenderson, jakehehrlich, espindola, alexshap, arichardson
Reviewed By: arichardson
Subscribers: fedor.sergeev, emaste, sdardis, krytarowski, atanasyan, llvm-commits, MaskRay, arichardson
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D60773
llvm-svn: 358562
2019-04-17 09:42:31 +02:00
|
|
|
MachineInfo(uint16_t EM, uint8_t ABI, bool Is64, bool IsLittle)
|
|
|
|
: EMachine(EM), OSABI(ABI), Is64Bit(Is64), IsLittleEndian(IsLittle) {}
|
|
|
|
// Alternative constructor that defaults to NONE for OSABI.
|
|
|
|
MachineInfo(uint16_t EM, bool Is64, bool IsLittle)
|
|
|
|
: MachineInfo(EM, ELF::ELFOSABI_NONE, Is64, IsLittle) {}
|
|
|
|
// Default constructor for unset fields.
|
|
|
|
MachineInfo() : MachineInfo(0, 0, false, false) {}
|
2018-10-12 00:33:50 +02:00
|
|
|
uint16_t EMachine;
|
2019-03-22 11:21:09 +01:00
|
|
|
uint8_t OSABI;
|
2018-10-12 00:33:50 +02:00
|
|
|
bool Is64Bit;
|
|
|
|
bool IsLittleEndian;
|
|
|
|
};
|
|
|
|
|
2019-03-28 19:27:00 +01:00
|
|
|
// Flags set by --set-section-flags or --rename-section. Interpretation of these
|
|
|
|
// is format-specific and not all flags are meaningful for all object file
|
|
|
|
// formats. This is a bitmask; many section flags may be set.
|
|
|
|
enum SectionFlag {
|
|
|
|
SecNone = 0,
|
|
|
|
SecAlloc = 1 << 0,
|
|
|
|
SecLoad = 1 << 1,
|
|
|
|
SecNoload = 1 << 2,
|
|
|
|
SecReadonly = 1 << 3,
|
|
|
|
SecDebug = 1 << 4,
|
|
|
|
SecCode = 1 << 5,
|
|
|
|
SecData = 1 << 6,
|
|
|
|
SecRom = 1 << 7,
|
|
|
|
SecMerge = 1 << 8,
|
|
|
|
SecStrings = 1 << 9,
|
|
|
|
SecContents = 1 << 10,
|
|
|
|
SecShare = 1 << 11,
|
|
|
|
LLVM_MARK_AS_BITMASK_ENUM(/* LargestValue = */ SecShare)
|
|
|
|
};
|
|
|
|
|
2018-10-12 00:33:50 +02:00
|
|
|
struct SectionRename {
|
|
|
|
StringRef OriginalName;
|
|
|
|
StringRef NewName;
|
2019-03-28 19:27:00 +01:00
|
|
|
Optional<SectionFlag> NewFlags;
|
2018-10-12 00:33:50 +02:00
|
|
|
};
|
|
|
|
|
[llvm-objcopy] Implement --set-section-flags.
Summary:
--set-section-flags is used to change the section flags (e.g. SHF_ALLOC) for given sections. The flags allowed are the same from the existing --rename-section=.old=.new[,flags] feature.
Additionally, make sure that --set-section-flag cannot be used with --rename-section (either the source or destination), since --rename-section accepts flags. This avoids ambiguity for something like "--rename-section=.foo=.bar,alloc --set-section-flag=.bar,code".
Reviewers: jhenderson, jakehehrlich, alexshap, espindola
Reviewed By: jhenderson, jakehehrlich
Subscribers: llvm-commits, emaste, arichardson
Differential Revision: https://reviews.llvm.org/D57198
llvm-svn: 352505
2019-01-29 16:05:38 +01:00
|
|
|
struct SectionFlagsUpdate {
|
|
|
|
StringRef Name;
|
2019-03-28 19:27:00 +01:00
|
|
|
SectionFlag NewFlags;
|
[llvm-objcopy] Implement --set-section-flags.
Summary:
--set-section-flags is used to change the section flags (e.g. SHF_ALLOC) for given sections. The flags allowed are the same from the existing --rename-section=.old=.new[,flags] feature.
Additionally, make sure that --set-section-flag cannot be used with --rename-section (either the source or destination), since --rename-section accepts flags. This avoids ambiguity for something like "--rename-section=.foo=.bar,alloc --set-section-flag=.bar,code".
Reviewers: jhenderson, jakehehrlich, alexshap, espindola
Reviewed By: jhenderson, jakehehrlich
Subscribers: llvm-commits, emaste, arichardson
Differential Revision: https://reviews.llvm.org/D57198
llvm-svn: 352505
2019-01-29 16:05:38 +01:00
|
|
|
};
|
|
|
|
|
[llvm-objcopy] Support -X|--discard-locals.
Summary:
This adds support for the --discard-locals flag, which acts similarly to --discard-all, except it only applies to compiler-generated symbols (i.e. symbols starting with `.L` in ELF).
I am not sure about COFF local symbols: those appear to also use `.L` in most cases, but also use just `L` in other cases, so for now I am just leaving it unimplemented there.
Fixes PR36160
Reviewers: jhenderson, alexshap, jakehehrlich, mstorsjo, espindola
Reviewed By: jhenderson
Subscribers: llvm-commits, emaste, arichardson
Differential Revision: https://reviews.llvm.org/D57248
llvm-svn: 352626
2019-01-30 15:58:13 +01:00
|
|
|
// Which symbol-discarding mode was requested on the command line.
enum class DiscardType {
  None,   // Default
  All,    // --discard-all (-x)
  Locals, // --discard-locals (-X)
};
|
|
|
|
|
2019-02-06 12:00:07 +01:00
|
|
|
class NameOrRegex {
|
|
|
|
StringRef Name;
|
|
|
|
// Regex is shared between multiple CopyConfig instances.
|
|
|
|
std::shared_ptr<Regex> R;
|
|
|
|
|
|
|
|
public:
|
|
|
|
NameOrRegex(StringRef Pattern, bool IsRegex);
|
|
|
|
bool operator==(StringRef S) const { return R ? R->match(S) : Name == S; }
|
|
|
|
bool operator!=(StringRef S) const { return !operator==(S); }
|
|
|
|
};
|
|
|
|
|
[llvm-objcopy][NFC] Refactor symbol/section matching
Summary:
The matchers for section/symbol related flags (e.g. `--keep-symbol=Name` or `--regex --keep-symbol=foo.*`) are currently just vectors that are matched linearly. However, adding wildcard support would require negative matching too, e.g. a symbol should be removed if it matches a wildcard *but* doesn't match some other wildcard.
To make the next patch simpler, consolidate matching logic to a class defined in CopyConfig that takes care of matching.
Reviewers: jhenderson, seiya, MaskRay, espindola, alexshap
Reviewed By: jhenderson, MaskRay
Subscribers: emaste, arichardson, jakehehrlich, abrachet, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D66432
llvm-svn: 369689
2019-08-22 21:17:50 +02:00
|
|
|
// Matcher that checks symbol or section names against the command line flags
|
|
|
|
// provided for that option.
|
|
|
|
class NameMatcher {
|
|
|
|
std::vector<NameOrRegex> Matchers;
|
|
|
|
|
|
|
|
public:
|
|
|
|
void addMatcher(NameOrRegex Matcher) {
|
|
|
|
Matchers.push_back(std::move(Matcher));
|
|
|
|
}
|
|
|
|
bool matches(StringRef S) const { return is_contained(Matchers, S); }
|
|
|
|
bool empty() const { return Matchers.empty(); }
|
|
|
|
};
|
|
|
|
|
2018-10-12 00:33:50 +02:00
|
|
|
// Configuration for copying/stripping a single file.
|
|
|
|
struct CopyConfig {
|
[llvm-objcopy] Refactor ELF-specific config out to ELFCopyConfig. NFC.
Summary:
This patch splits the command-line parsing into two phases:
First, parse cross-platform options and leave ELF-specific options unparsed.
Second, in the ELF implementation, parse ELF-specific options and construct ELFCopyConfig.
Reviewers: espindola, alexshap, rupprecht, jhenderson, jakehehrlich, MaskRay
Reviewed By: alexshap, jhenderson, jakehehrlich, MaskRay
Subscribers: mgorny, emaste, arichardson, jakehehrlich, MaskRay, abrachet, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D67139
llvm-svn: 372712
2019-09-24 11:38:23 +02:00
|
|
|
// Format-specific options to be initialized lazily when needed.
|
|
|
|
Optional<elf::ELFCopyConfig> ELF;
|
|
|
|
|
2018-10-12 00:33:50 +02:00
|
|
|
// Main input/output options
|
|
|
|
StringRef InputFilename;
|
2019-07-05 07:28:38 +02:00
|
|
|
FileFormat InputFormat;
|
2018-10-12 00:33:50 +02:00
|
|
|
StringRef OutputFilename;
|
2019-07-05 07:28:38 +02:00
|
|
|
FileFormat OutputFormat;
|
2018-10-12 00:33:50 +02:00
|
|
|
|
2019-01-07 17:59:12 +01:00
|
|
|
// Only applicable when --output-format!=binary (e.g. elf64-x86-64).
|
|
|
|
Optional<MachineInfo> OutputArch;
|
2018-10-12 00:33:50 +02:00
|
|
|
|
|
|
|
// Advanced options
|
|
|
|
StringRef AddGnuDebugLink;
|
2019-05-14 12:59:04 +02:00
|
|
|
// Cached gnu_debuglink's target CRC
|
|
|
|
uint32_t GnuDebugLinkCRC32;
|
2018-12-03 20:49:23 +01:00
|
|
|
StringRef BuildIdLinkDir;
|
|
|
|
Optional<StringRef> BuildIdLinkInput;
|
|
|
|
Optional<StringRef> BuildIdLinkOutput;
|
2019-06-07 19:57:48 +02:00
|
|
|
Optional<StringRef> ExtractPartition;
|
2018-10-12 00:33:50 +02:00
|
|
|
StringRef SplitDWO;
|
|
|
|
StringRef SymbolsPrefix;
|
2019-05-08 11:49:35 +02:00
|
|
|
StringRef AllocSectionsPrefix;
|
[llvm-objcopy] Support -X|--discard-locals.
Summary:
This adds support for the --discard-locals flag, which acts similarly to --discard-all, except it only applies to compiler-generated symbols (i.e. symbols starting with `.L` in ELF).
I am not sure about COFF local symbols: those appear to also use `.L` in most cases, but also use just `L` in other cases, so for now I am just leaving it unimplemented there.
Fixes PR36160
Reviewers: jhenderson, alexshap, jakehehrlich, mstorsjo, espindola
Reviewed By: jhenderson
Subscribers: llvm-commits, emaste, arichardson
Differential Revision: https://reviews.llvm.org/D57248
llvm-svn: 352626
2019-01-30 15:58:13 +01:00
|
|
|
DiscardType DiscardMode = DiscardType::None;
|
[llvm-objcopy] Refactor ELF-specific config out to ELFCopyConfig. NFC.
Summary:
This patch splits the command-line parsing into two phases:
First, parse cross-platform options and leave ELF-specific options unparsed.
Second, in the ELF implementation, parse ELF-specific options and construct ELFCopyConfig.
Reviewers: espindola, alexshap, rupprecht, jhenderson, jakehehrlich, MaskRay
Reviewed By: alexshap, jhenderson, jakehehrlich, MaskRay
Subscribers: mgorny, emaste, arichardson, jakehehrlich, MaskRay, abrachet, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D67139
llvm-svn: 372712
2019-09-24 11:38:23 +02:00
|
|
|
Optional<StringRef> NewSymbolVisibility;
|
2018-10-12 00:33:50 +02:00
|
|
|
|
|
|
|
// Repeated options
|
|
|
|
std::vector<StringRef> AddSection;
|
|
|
|
std::vector<StringRef> DumpSection;
|
[llvm-objcopy] Refactor ELF-specific config out to ELFCopyConfig. NFC.
Summary:
This patch splits the command-line parsing into two phases:
First, parse cross-platform options and leave ELF-specific options unparsed.
Second, in the ELF implementation, parse ELF-specific options and construct ELFCopyConfig.
Reviewers: espindola, alexshap, rupprecht, jhenderson, jakehehrlich, MaskRay
Reviewed By: alexshap, jhenderson, jakehehrlich, MaskRay
Subscribers: mgorny, emaste, arichardson, jakehehrlich, MaskRay, abrachet, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D67139
llvm-svn: 372712
2019-09-24 11:38:23 +02:00
|
|
|
std::vector<StringRef> SymbolsToAdd;
|
[llvm-objcopy][NFC] Refactor symbol/section matching
Summary:
The matchers for section/symbol related flags (e.g. `--keep-symbol=Name` or `--regex --keep-symbol=foo.*`) are currently just vectors that are matched linearlly. However, adding wildcard support would require negative matching too, e.g. a symbol should be removed if it matches a wildcard *but* doesn't match some other wildcard.
To make the next patch simpler, consolidate matching logic to a class defined in CopyConfig that takes care of matching.
Reviewers: jhenderson, seiya, MaskRay, espindola, alexshap
Reviewed By: jhenderson, MaskRay
Subscribers: emaste, arichardson, jakehehrlich, abrachet, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D66432
llvm-svn: 369689
2019-08-22 21:17:50 +02:00
|
|
|
|
|
|
|
// Section matchers
|
|
|
|
NameMatcher KeepSection;
|
|
|
|
NameMatcher OnlySection;
|
|
|
|
NameMatcher ToRemove;
|
|
|
|
|
|
|
|
// Symbol matchers
|
|
|
|
NameMatcher SymbolsToGlobalize;
|
|
|
|
NameMatcher SymbolsToKeep;
|
|
|
|
NameMatcher SymbolsToLocalize;
|
|
|
|
NameMatcher SymbolsToRemove;
|
|
|
|
NameMatcher UnneededSymbolsToRemove;
|
|
|
|
NameMatcher SymbolsToWeaken;
|
|
|
|
NameMatcher SymbolsToKeepGlobal;
|
2018-10-12 00:33:50 +02:00
|
|
|
|
|
|
|
// Map options
|
|
|
|
StringMap<SectionRename> SectionsToRename;
|
[llvm-objcopy] Implement --set-section-flags.
Summary:
--set-section-flags is used to change the section flags (e.g. SHF_ALLOC) for given sections. The flags allowed are the same from the existing --rename-section=.old=.new[,flags] feature.
Additionally, make sure that --set-section-flag cannot be used with --rename-section (either the source or destination), since --rename-section accepts flags. This avoids ambiguity for something like "--rename-section=.foo=.bar,alloc --set-section-flag=.bar,code".
Reviewers: jhenderson, jakehehrlich, alexshap, espindola
Reviewed By: jhenderson, jakehehrlich
Subscribers: llvm-commits, emaste, arichardson
Differential Revision: https://reviews.llvm.org/D57198
llvm-svn: 352505
2019-01-29 16:05:38 +01:00
|
|
|
StringMap<SectionFlagsUpdate> SetSectionFlags;
|
2018-10-12 00:33:50 +02:00
|
|
|
StringMap<StringRef> SymbolsToRename;
|
|
|
|
|
2019-02-26 10:24:22 +01:00
|
|
|
// ELF entry point address expression. The input parameter is an entry point
|
|
|
|
// address in the input ELF file. The entry address in the output file is
|
|
|
|
// calculated with EntryExpr(input_address), when either --set-start or
|
|
|
|
// --change-start is used.
|
|
|
|
std::function<uint64_t(uint64_t)> EntryExpr;
|
|
|
|
|
2018-10-12 00:33:50 +02:00
|
|
|
// Boolean options
|
2019-04-18 11:13:30 +02:00
|
|
|
bool AllowBrokenLinks = false;
|
2018-11-01 18:36:37 +01:00
|
|
|
bool DeterministicArchives = true;
|
2018-10-12 00:33:50 +02:00
|
|
|
bool ExtractDWO = false;
|
2019-06-07 19:57:48 +02:00
|
|
|
bool ExtractMainPartition = false;
|
2018-10-12 00:33:50 +02:00
|
|
|
bool KeepFileSymbols = false;
|
|
|
|
bool LocalizeHidden = false;
|
|
|
|
bool OnlyKeepDebug = false;
|
|
|
|
bool PreserveDates = false;
|
|
|
|
bool StripAll = false;
|
|
|
|
bool StripAllGNU = false;
|
|
|
|
bool StripDWO = false;
|
|
|
|
bool StripDebug = false;
|
|
|
|
bool StripNonAlloc = false;
|
|
|
|
bool StripSections = false;
|
|
|
|
bool StripUnneeded = false;
|
|
|
|
bool Weaken = false;
|
|
|
|
bool DecompressDebugSections = false;
|
|
|
|
DebugCompressionType CompressionType = DebugCompressionType::None;
|
[llvm-objcopy] Refactor ELF-specific config out to ELFCopyConfig. NFC.
Summary:
This patch splits the command-line parsing into two phases:
First, parse cross-platform options and leave ELF-specific options unparsed.
Second, in the ELF implementation, parse ELF-specific options and construct ELFCopyConfig.
Reviewers: espindola, alexshap, rupprecht, jhenderson, jakehehrlich, MaskRay
Reviewed By: alexshap, jhenderson, jakehehrlich, MaskRay
Subscribers: mgorny, emaste, arichardson, jakehehrlich, MaskRay, abrachet, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D67139
llvm-svn: 372712
2019-09-24 11:38:23 +02:00
|
|
|
|
|
|
|
// parseELFConfig performs ELF-specific command-line parsing. Fills `ELF` on
|
|
|
|
// success or returns an Error otherwise.
|
|
|
|
Error parseELFConfig() {
|
|
|
|
if (!ELF) {
|
|
|
|
Expected<elf::ELFCopyConfig> ELFConfig = elf::parseConfig(*this);
|
|
|
|
if (!ELFConfig)
|
|
|
|
return ELFConfig.takeError();
|
|
|
|
ELF = *ELFConfig;
|
|
|
|
}
|
|
|
|
return Error::success();
|
|
|
|
}
|
2018-10-12 00:33:50 +02:00
|
|
|
};
|
|
|
|
|
|
|
|
// Configuration for the overall invocation of this tool. When invoked as
|
|
|
|
// objcopy, will always contain exactly one CopyConfig. When invoked as strip,
|
|
|
|
// will contain one or more CopyConfigs.
|
|
|
|
struct DriverConfig {
|
|
|
|
SmallVector<CopyConfig, 1> CopyConfigs;
|
2019-02-04 19:38:00 +01:00
|
|
|
BumpPtrAllocator Alloc;
|
2018-10-12 00:33:50 +02:00
|
|
|
};
|
|
|
|
|
|
|
|
// ParseObjcopyOptions returns the config and sets the input arguments. If a
|
|
|
|
// help flag is set then ParseObjcopyOptions will print the help messege and
|
|
|
|
// exit.
|
2019-02-21 18:05:19 +01:00
|
|
|
Expected<DriverConfig> parseObjcopyOptions(ArrayRef<const char *> ArgsArr);
|
2018-10-12 00:33:50 +02:00
|
|
|
|
|
|
|
// ParseStripOptions returns the config and sets the input arguments. If a
|
|
|
|
// help flag is set then ParseStripOptions will print the help messege and
|
2019-06-18 02:39:10 +02:00
|
|
|
// exit. ErrorCallback is used to handle recoverable errors. An Error returned
|
|
|
|
// by the callback aborts the parsing and is then returned by this function.
|
|
|
|
Expected<DriverConfig>
|
|
|
|
parseStripOptions(ArrayRef<const char *> ArgsArr,
|
|
|
|
std::function<Error(Error)> ErrorCallback);
|
2018-10-12 00:33:50 +02:00
|
|
|
|
|
|
|
} // namespace objcopy
|
|
|
|
} // namespace llvm
|
|
|
|
|
|
|
|
#endif
|