1//===- CodeGenDataReader.cpp ----------------------------------------------===//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7//===----------------------------------------------------------------------===//
9// This file contains support for reading codegen data.
11//===----------------------------------------------------------------------===//
19 #define DEBUG_TYPE "cg-data-reader"
25 cl::desc(
"Read function map names in indexed CodeGenData. Can be "
26 "disabled to save memory and time for final consumption of the "
27 "indexed CodeGenData in production."));
34 "Lazily load indexed CodeGenData. Enable to save memory and time "
35 "for final consumption of the indexed CodeGenData in production."));
40 : FS.getBufferForFile(Filename);
41 if (std::error_code EC = BufferOrErr.getError())
43 return std::move(BufferOrErr.get());
56 auto processSectionContents = [&](
const StringRef &Name,
58 if (Name != CGOutlineName && Name != CGMergeName)
62 auto *
Data =
reinterpret_cast<const unsigned char *
>(Contents.data());
63 auto *EndData =
Data + Contents.size();
64 // In case dealing with an executable that has concatenated cgdata,
65 // we want to merge them into a single cgdata.
66 // Although it's not a typical workflow, we support this scenario
67 // by looping over all data in the sections.
68 if (Name == CGOutlineName) {
69 while (
Data != EndData) {
72 GlobalOutlineRecord.
merge(LocalOutlineRecord);
74 }
else if (Name == CGMergeName) {
75 while (
Data != EndData) {
78 GlobalFunctionMapRecord.
merge(LocalFunctionMapRecord);
83 for (
auto &Section : Obj->
sections()) {
90 processSectionContents(*NameOrErr, *ContentsOrErr);
99 // The smallest header with the version 1 is 24 bytes.
100 // Do not update this value even with the new version of the header.
101 const unsigned MinHeaderSize = 24;
102 if (DataBuffer->getBufferSize() < MinHeaderSize)
106 reinterpret_cast<const unsigned char *
>(DataBuffer->getBufferStart());
108 reinterpret_cast<const unsigned char *
>(DataBuffer->getBufferEnd());
113 const unsigned char *
Ptr = Start + Header.OutlinedHashTreeOffset;
119 // TODO: lazy loading support for outlined hash tree.
120 std::shared_ptr<MemoryBuffer> SharedDataBuffer = std::move(DataBuffer);
122 const unsigned char *
Ptr = Start + Header.StableFunctionMapOffset;
129 Header.StableFunctionMapOffset);
139 // Set up the buffer to read.
141 if (
Error E = BufferOrError.takeError())
148 if (Buffer->getBufferSize() == 0)
151 std::unique_ptr<CodeGenDataReader> Reader;
152 // Create the reader.
154 Reader = std::make_unique<IndexedCodeGenDataReader>(std::move(Buffer));
156 Reader = std::make_unique<TextCodeGenDataReader>(std::move(Buffer));
160 // Initialize the reader and return the result.
161 if (
Error E = Reader->read())
164 return std::move(Reader);
174 // Verify that it's magical.
179 // Verify that this really looks like plain ASCII text by checking a
180 // 'reasonable' number of characters (up to the magic size).
187 // Parse the custom header line by line.
188 for (; !Line.is_at_eof(); ++Line) {
189 // Skip empty or whitespace-only lines
190 if (Line->trim().empty())
193 if (!Line->starts_with(
":"))
196 if (Str.equals_insensitive(
"outlined_hash_tree"))
198 else if (Str.equals_insensitive(
"stable_function_map"))
204 // We treat an empty header (that is a comment # only) as a valid header.
205 if (Line.is_at_eof()) {
211 // The YAML docs follow after the header.
212 const char *Pos = Line->data();
213 size_t Size =
reinterpret_cast<size_t>(DataBuffer->getBufferEnd()) -
214 reinterpret_cast<size_t>(Pos);
223}
// end namespace llvm
static cl::opt< bool > IndexedCodeGenDataReadFunctionMapNames("indexed-codegen-data-read-function-map-names", cl::init(true), cl::Hidden, cl::desc("Read function map names in indexed CodeGenData. Can be " "disabled to save memory and time for final consumption of the " "indexed CodeGenData in production."))
Error success()
Clear the current error and return a successful one.
OutlinedHashTreeRecord HashTreeRecord
The outlined hash tree that has been read.
static LLVM_ABI Expected< std::unique_ptr< CodeGenDataReader > > create(const Twine &Path, vfs::FileSystem &FS)
Factory method to create an appropriately typed reader for the given codegen data file path and file ...
StableFunctionMapRecord FunctionMapRecord
The stable function map that has been read. When it's released by.
static LLVM_ABI Error mergeFromObjectFile(const object::ObjectFile *Obj, OutlinedHashTreeRecord &GlobalOutlineRecord, StableFunctionMapRecord &GlobalFunctionMapRecord, stable_hash *CombinedHash=nullptr)
Extract the cgdata embedded in sections from the given object file and merge them into the GlobalOutl...
Lightweight error class with error context and mandatory checking.
static ErrorSuccess success()
Create a success value.
Tagged union holding either a T or a Error.
Error takeError()
Take ownership of the stored error.
static bool hasFormat(const MemoryBuffer &Buffer)
Return true if the given buffer is in binary codegen data format.
Error read() override
Read the contents including the header.
bool hasStableFunctionMap() const override
Return true if the header indicates the data has a stable function map.
bool hasOutlinedHashTree() const override
Return true if the header indicates the data has an outlined hash tree.
This interface provides simple read-only access to a block of memory, and provides simple methods for...
StringRef getBuffer() const
static ErrorOr< std::unique_ptr< MemoryBuffer > > getSTDIN()
Read all of stdin into a file buffer, and return it.
StringRef - Represent a constant reference to a string, i.e.
StringRef drop_front(size_t N=1) const
Return a StringRef equal to 'this' but with the first N elements dropped.
StringRef rtrim(char Char) const
Return string with consecutive Char characters starting from the right removed.
StringRef take_front(size_t N=1) const
Return a StringRef equal to 'this' but with only the first N elements remaining.
static bool hasFormat(const MemoryBuffer &Buffer)
Return true if the given buffer is in text codegen data format.
bool hasStableFunctionMap() const override
Return true if the header indicates the data has a stable function map.
bool hasOutlinedHashTree() const override
Return true if the header indicates the data has an outlined hash tree.
Error read() override
Read the contents including the header.
Triple - Helper class for working with autoconf configuration names.
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
This class is the base class for all object file types.
Triple makeTriple() const
Create a triple from the data in this object file.
section_iterator_range sections() const
The virtual file system interface.
initializer< Ty > init(const Ty &Val)
value_type read(const void *memory, endianness endian)
Read a value of a particular endianness from memory.
This is an optimization pass for GlobalISel generic memory operations.
@ StableFunctionMergingMap
@ FunctionOutlinedHashTree
static Expected< std::unique_ptr< MemoryBuffer > > setupMemoryBuffer(const Twine &Filename, vfs::FileSystem &FS)
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
LLVM_ABI uint64_t xxh3_64bits(ArrayRef< uint8_t > data)
cl::opt< bool > IndexedCodeGenDataLazyLoading("indexed-codegen-data-lazy-loading", cl::init(false), cl::Hidden, cl::desc("Lazily load indexed CodeGenData. Enable to save memory and time " "for final consumption of the indexed CodeGenData in production."))
uint64_t stable_hash
An opaque object representing a stable hash code.
Error make_error(ArgTs &&... Args)
Make a Error instance representing failure using the given error info type.
FunctionAddr VTableAddr uintptr_t uintptr_t Data
bool isPrint(char C)
Checks whether character C is printable.
bool isSpace(char C)
Checks whether character C is whitespace in the "C" locale.
LLVM_ABI Error errorCodeToError(std::error_code EC)
Helper for converting an std::error_code to a Error.
stable_hash stable_hash_combine(ArrayRef< stable_hash > Buffer)
LLVM_ABI std::string getCodeGenDataSectionName(CGDataSectKind CGSK, Triple::ObjectFormatType OF, bool AddSegmentInfo=true)
LLVM_ABI void deserialize(const unsigned char *&Ptr)
Deserialize the outlined hash tree from a raw_ostream.
void merge(const OutlinedHashTreeRecord &Other)
Merge the other outlined hash tree into this one.
The structure of the serialized stable function map is as follows:
void merge(const StableFunctionMapRecord &Other)
Merge the stable function map into this one.
LLVM_ABI void deserialize(const unsigned char *&Ptr)
Deserialize the stable function map from a raw_ostream.