Viewing file: BitcodeReader.h (12.69 KB) -rw-r--r-- Select action/file-type: (+) | (+) | (+) | Code (+) | Session (+) | (+) | SDB (+) | (+) | (+) | (+) | (+) | (+) |
//===- llvm/Bitcode/BitcodeReader.h - Bitcode reader ------------*- C++ -*-===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// // // This header defines interfaces to read LLVM bitcode files/streams. // //===----------------------------------------------------------------------===//
#ifndef LLVM_BITCODE_BITCODEREADER_H #define LLVM_BITCODE_BITCODEREADER_H
#include "llvm/ADT/ArrayRef.h" #include "llvm/ADT/StringRef.h" #include "llvm/Bitstream/BitCodeEnums.h" #include "llvm/IR/GlobalValue.h" #include "llvm/Support/Endian.h" #include "llvm/Support/Error.h" #include "llvm/Support/ErrorOr.h" #include "llvm/Support/MemoryBufferRef.h" #include <cstdint> #include <memory> #include <optional> #include <string> #include <system_error> #include <vector> namespace llvm {
class LLVMContext; class Module; class MemoryBuffer; class Metadata; class ModuleSummaryIndex; class Type; class Value;
// Callback to override the data layout string of an imported bitcode module. // The first argument is the target triple, the second argument the data layout // string from the input, or a default string. It will be used if the callback // returns std::nullopt. typedef std::function<std::optional<std::string>(StringRef, StringRef)> DataLayoutCallbackFuncTy;
typedef std::function<Type *(unsigned)> GetTypeByIDTy;
typedef std::function<unsigned(unsigned, unsigned)> GetContainedTypeIDTy;
typedef std::function<void(Value *, unsigned, GetTypeByIDTy, GetContainedTypeIDTy)> ValueTypeCallbackTy;
typedef std::function<void(Metadata **, unsigned, GetTypeByIDTy, GetContainedTypeIDTy)> MDTypeCallbackTy;
// These functions are for converting Expected/Error values to // ErrorOr/std::error_code for compatibility with legacy clients. FIXME: // Remove these functions once no longer needed by the C and libLTO APIs.
std::error_code errorToErrorCodeAndEmitErrors(LLVMContext &Ctx, Error Err);
template <typename T> ErrorOr<T> expectedToErrorOrAndEmitErrors(LLVMContext &Ctx, Expected<T> Val) { if (!Val) return errorToErrorCodeAndEmitErrors(Ctx, Val.takeError()); return std::move(*Val); }
struct ParserCallbacks { std::optional<DataLayoutCallbackFuncTy> DataLayout; /// The ValueType callback is called for every function definition or /// declaration and allows accessing the type information, also behind /// pointers. This can be useful, when the opaque pointer upgrade cleans all /// type information behind pointers. /// The second argument to ValueTypeCallback is the type ID of the /// function, the two passed functions can be used to extract type /// information. std::optional<ValueTypeCallbackTy> ValueType; /// The MDType callback is called for every value in metadata. std::optional<MDTypeCallbackTy> MDType;
ParserCallbacks() = default; explicit ParserCallbacks(DataLayoutCallbackFuncTy DataLayout) : DataLayout(DataLayout) {} };
struct BitcodeFileContents;
/// Basic information extracted from a bitcode module to be used for LTO. struct BitcodeLTOInfo { bool IsThinLTO; bool HasSummary; bool EnableSplitLTOUnit; bool UnifiedLTO; };
/// Represents a module in a bitcode file. class BitcodeModule { // This covers the identification (if present) and module blocks. ArrayRef<uint8_t> Buffer; StringRef ModuleIdentifier;
// The string table used to interpret this module. StringRef Strtab;
// The bitstream location of the IDENTIFICATION_BLOCK. uint64_t IdentificationBit;
// The bitstream location of this module's MODULE_BLOCK. uint64_t ModuleBit;
BitcodeModule(ArrayRef<uint8_t> Buffer, StringRef ModuleIdentifier, uint64_t IdentificationBit, uint64_t ModuleBit) : Buffer(Buffer), ModuleIdentifier(ModuleIdentifier), IdentificationBit(IdentificationBit), ModuleBit(ModuleBit) {}
// Calls the ctor. friend Expected<BitcodeFileContents> getBitcodeFileContents(MemoryBufferRef Buffer);
Expected<std::unique_ptr<Module>> getModuleImpl(LLVMContext &Context, bool MaterializeAll, bool ShouldLazyLoadMetadata, bool IsImporting, ParserCallbacks Callbacks = {});
public: StringRef getBuffer() const { return StringRef((const char *)Buffer.begin(), Buffer.size()); }
StringRef getStrtab() const { return Strtab; }
StringRef getModuleIdentifier() const { return ModuleIdentifier; }
/// Read the bitcode module and prepare for lazy deserialization of function /// bodies. If ShouldLazyLoadMetadata is true, lazily load metadata as well. /// If IsImporting is true, this module is being parsed for ThinLTO /// importing into another module. Expected<std::unique_ptr<Module>> getLazyModule(LLVMContext &Context, bool ShouldLazyLoadMetadata, bool IsImporting, ParserCallbacks Callbacks = {});
/// Read the entire bitcode module and return it. Expected<std::unique_ptr<Module>> parseModule(LLVMContext &Context, ParserCallbacks Callbacks = {});
/// Returns information about the module to be used for LTO: whether to /// compile with ThinLTO, and whether it has a summary. Expected<BitcodeLTOInfo> getLTOInfo();
/// Parse the specified bitcode buffer, returning the module summary index. Expected<std::unique_ptr<ModuleSummaryIndex>> getSummary();
/// Parse the specified bitcode buffer and merge its module summary index /// into CombinedIndex. Error readSummary(ModuleSummaryIndex &CombinedIndex, StringRef ModulePath, std::function<bool(GlobalValue::GUID)> IsPrevailing = nullptr); };
struct BitcodeFileContents { std::vector<BitcodeModule> Mods; StringRef Symtab, StrtabForSymtab; };
/// Returns the contents of a bitcode file. This includes the raw contents of /// the symbol table embedded in the bitcode file. Clients which require a /// symbol table should prefer to use irsymtab::read instead of this function /// because it creates a reader for the irsymtab and handles upgrading bitcode /// files without a symbol table or with an old symbol table. Expected<BitcodeFileContents> getBitcodeFileContents(MemoryBufferRef Buffer);
/// Returns a list of modules in the specified bitcode buffer. Expected<std::vector<BitcodeModule>> getBitcodeModuleList(MemoryBufferRef Buffer);
/// Read the header of the specified bitcode buffer and prepare for lazy /// deserialization of function bodies. If ShouldLazyLoadMetadata is true, /// lazily load metadata as well. If IsImporting is true, this module is /// being parsed for ThinLTO importing into another module. Expected<std::unique_ptr<Module>> getLazyBitcodeModule(MemoryBufferRef Buffer, LLVMContext &Context, bool ShouldLazyLoadMetadata = false, bool IsImporting = false, ParserCallbacks Callbacks = {});
/// Like getLazyBitcodeModule, except that the module takes ownership of /// the memory buffer if successful. If successful, this moves Buffer. On /// error, this *does not* move Buffer. If IsImporting is true, this module is /// being parsed for ThinLTO importing into another module. Expected<std::unique_ptr<Module>> getOwningLazyBitcodeModule( std::unique_ptr<MemoryBuffer> &&Buffer, LLVMContext &Context, bool ShouldLazyLoadMetadata = false, bool IsImporting = false, ParserCallbacks Callbacks = {});
/// Read the header of the specified bitcode buffer and extract just the /// triple information. If successful, this returns a string. On error, this /// returns "". Expected<std::string> getBitcodeTargetTriple(MemoryBufferRef Buffer);
/// Return true if \p Buffer contains a bitcode file with ObjC code (category /// or class) in it. Expected<bool> isBitcodeContainingObjCCategory(MemoryBufferRef Buffer);
/// Read the header of the specified bitcode buffer and extract just the /// producer string information. If successful, this returns a string. On /// error, this returns "". Expected<std::string> getBitcodeProducerString(MemoryBufferRef Buffer);
/// Read the specified bitcode file, returning the module. Expected<std::unique_ptr<Module>> parseBitcodeFile(MemoryBufferRef Buffer, LLVMContext &Context, ParserCallbacks Callbacks = {});
/// Returns LTO information for the specified bitcode file. Expected<BitcodeLTOInfo> getBitcodeLTOInfo(MemoryBufferRef Buffer);
/// Parse the specified bitcode buffer, returning the module summary index. Expected<std::unique_ptr<ModuleSummaryIndex>> getModuleSummaryIndex(MemoryBufferRef Buffer);
/// Parse the specified bitcode buffer and merge the index into CombinedIndex. Error readModuleSummaryIndex(MemoryBufferRef Buffer, ModuleSummaryIndex &CombinedIndex);
/// Parse the module summary index out of an IR file and return the module /// summary index object if found, or an empty summary if not. If Path refers /// to an empty file and IgnoreEmptyThinLTOIndexFile is true, then /// this function will return nullptr. Expected<std::unique_ptr<ModuleSummaryIndex>> getModuleSummaryIndexForFile(StringRef Path, bool IgnoreEmptyThinLTOIndexFile = false);
/// isBitcodeWrapper - Return true if the given bytes are the magic bytes /// for an LLVM IR bitcode wrapper. inline bool isBitcodeWrapper(const unsigned char *BufPtr, const unsigned char *BufEnd) { // See if you can find the hidden message in the magic bytes :-). // (Hint: it's a little-endian encoding.) return BufPtr != BufEnd && BufPtr[0] == 0xDE && BufPtr[1] == 0xC0 && BufPtr[2] == 0x17 && BufPtr[3] == 0x0B; }
/// isRawBitcode - Return true if the given bytes are the magic bytes for /// raw LLVM IR bitcode (without a wrapper). inline bool isRawBitcode(const unsigned char *BufPtr, const unsigned char *BufEnd) { // These bytes sort of have a hidden message, but it's not in // little-endian this time, and it's a little redundant. return BufPtr != BufEnd && BufPtr[0] == 'B' && BufPtr[1] == 'C' && BufPtr[2] == 0xc0 && BufPtr[3] == 0xde; }
/// isBitcode - Return true if the given bytes are the magic bytes for /// LLVM IR bitcode, either with or without a wrapper. inline bool isBitcode(const unsigned char *BufPtr, const unsigned char *BufEnd) { return isBitcodeWrapper(BufPtr, BufEnd) || isRawBitcode(BufPtr, BufEnd); }
/// SkipBitcodeWrapperHeader - Some systems wrap bc files with a special /// header for padding or other reasons. The format of this header is: /// /// struct bc_header { /// uint32_t Magic; // 0x0B17C0DE /// uint32_t Version; // Version, currently always 0. /// uint32_t BitcodeOffset; // Offset to traditional bitcode file. /// uint32_t BitcodeSize; // Size of traditional bitcode file. /// ... potentially other gunk ... /// }; /// /// This function is called when we find a file with a matching magic number. /// In this case, skip down to the subsection of the file that is actually a /// BC file. /// If 'VerifyBufferSize' is true, check that the buffer is large enough to /// contain the whole bitcode file. inline bool SkipBitcodeWrapperHeader(const unsigned char *&BufPtr, const unsigned char *&BufEnd, bool VerifyBufferSize) { // Must contain the offset and size field! if (unsigned(BufEnd - BufPtr) < BWH_SizeField + 4) return true;
unsigned Offset = support::endian::read32le(&BufPtr[BWH_OffsetField]); unsigned Size = support::endian::read32le(&BufPtr[BWH_SizeField]); uint64_t BitcodeOffsetEnd = (uint64_t)Offset + (uint64_t)Size;
// Verify that Offset+Size fits in the file. if (VerifyBufferSize && BitcodeOffsetEnd > uint64_t(BufEnd-BufPtr)) return true; BufPtr += Offset; BufEnd = BufPtr+Size; return false; }
APInt readWideAPInt(ArrayRef<uint64_t> Vals, unsigned TypeBits);
const std::error_category &BitcodeErrorCategory(); enum class BitcodeError { CorruptedBitcode = 1 }; inline std::error_code make_error_code(BitcodeError E) { return std::error_code(static_cast<int>(E), BitcodeErrorCategory()); }
} // end namespace llvm
namespace std {
template <> struct is_error_code_enum<llvm::BitcodeError> : std::true_type {};
} // end namespace std
#endif // LLVM_BITCODE_BITCODEREADER_H
|