c33b9395b1
When opaque pointers are enabled and old IR with typed pointers is read, the BitcodeReader automatically upgrades all typed pointers to opaque pointers. This is a lossy conversion, i.e. when a function argument is a pointer and unused, it’s impossible to reconstruct the original type behind the pointer. There are cases where the type information of pointers is needed. One is reading DXIL, which is bitcode of old LLVM IR and makes a lot of use of pointers in function signatures. We’d like to keep using up-to-date LLVM to read in and process DXIL, so in the face of opaque pointers, we need some way to access the type information of pointers from the read bitcode. This patch allows extracting type information by supplying functions to parseBitcodeFile that get called for each function signature or metadata value. The function can access the type information via the reader’s type IDs and the getTypeByID and getContainedTypeID functions. The tests show, by example, how type info from pointers can be stored in metadata for use after the BitcodeReader has finished. Differential Revision: https://reviews.llvm.org/D127728
136 lines
5.0 KiB
C++
136 lines
5.0 KiB
C++
//===---- IRReader.cpp - Reader for LLVM IR files -------------------------===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "llvm/IRReader/IRReader.h"
|
|
#include "llvm-c/IRReader.h"
|
|
#include "llvm/AsmParser/Parser.h"
|
|
#include "llvm/Bitcode/BitcodeReader.h"
|
|
#include "llvm/IR/LLVMContext.h"
|
|
#include "llvm/IR/Module.h"
|
|
#include "llvm/Support/MemoryBuffer.h"
|
|
#include "llvm/Support/SourceMgr.h"
|
|
#include "llvm/Support/Timer.h"
|
|
#include "llvm/Support/raw_ostream.h"
|
|
#include <optional>
|
|
#include <system_error>
|
|
|
|
using namespace llvm;
|
|
|
|
namespace llvm {
// Declared here and defined in another translation unit. parseIR passes this
// flag as the last argument of its NamedRegionTimer.
extern bool TimePassesIsEnabled;
} // namespace llvm

// Timer and timer-group labels handed to the NamedRegionTimer in parseIR.
// They are only used inside this file, so they are given explicit internal
// linkage.
static constexpr char TimeIRParsingGroupName[] = "irparse";
static constexpr char TimeIRParsingGroupDescription[] = "LLVM IR Parsing";
static constexpr char TimeIRParsingName[] = "parse";
static constexpr char TimeIRParsingDescription[] = "Parse IR";
|
|
|
|
std::unique_ptr<Module>
|
|
llvm::getLazyIRModule(std::unique_ptr<MemoryBuffer> Buffer, SMDiagnostic &Err,
|
|
LLVMContext &Context, bool ShouldLazyLoadMetadata) {
|
|
if (isBitcode((const unsigned char *)Buffer->getBufferStart(),
|
|
(const unsigned char *)Buffer->getBufferEnd())) {
|
|
Expected<std::unique_ptr<Module>> ModuleOrErr = getOwningLazyBitcodeModule(
|
|
std::move(Buffer), Context, ShouldLazyLoadMetadata);
|
|
if (Error E = ModuleOrErr.takeError()) {
|
|
handleAllErrors(std::move(E), [&](ErrorInfoBase &EIB) {
|
|
Err = SMDiagnostic(Buffer->getBufferIdentifier(), SourceMgr::DK_Error,
|
|
EIB.message());
|
|
});
|
|
return nullptr;
|
|
}
|
|
return std::move(ModuleOrErr.get());
|
|
}
|
|
|
|
return parseAssembly(Buffer->getMemBufferRef(), Err, Context);
|
|
}
|
|
|
|
/// Read \p Filename with MemoryBuffer::getFileOrSTDIN and lazily load the
/// result through getLazyIRModule.
///
/// \returns the module produced by getLazyIRModule, or nullptr if the input
/// could not be read, in which case \p Err is set to a
/// "Could not open input file: ..." diagnostic for \p Filename.
std::unique_ptr<Module> llvm::getLazyIRFileModule(StringRef Filename,
                                                  SMDiagnostic &Err,
                                                  LLVMContext &Context,
                                                  bool ShouldLazyLoadMetadata) {
  ErrorOr<std::unique_ptr<MemoryBuffer>> Input =
      MemoryBuffer::getFileOrSTDIN(Filename);

  const std::error_code OpenError = Input.getError();
  if (!OpenError) {
    // Ownership of the buffer is transferred to getLazyIRModule.
    return getLazyIRModule(std::move(Input.get()), Err, Context,
                           ShouldLazyLoadMetadata);
  }

  Err = SMDiagnostic(Filename, SourceMgr::DK_Error,
                     "Could not open input file: " + OpenError.message());
  return nullptr;
}
|
|
|
|
/// Parse \p Buffer into a module, eagerly.
///
/// Input recognised by isBitcode is read with parseBitcodeFile, which receives
/// \p Callbacks as-is. Any other input goes to parseAssembly, which receives
/// only Callbacks.DataLayout (or a callback returning std::nullopt when none
/// was supplied). The whole function body runs under a NamedRegionTimer
/// controlled by TimePassesIsEnabled.
///
/// \returns the module, or nullptr when the bitcode reader reports an error,
/// in which case \p Err is set to an SMDiagnostic carrying the buffer
/// identifier and the error message. For non-bitcode input the result and
/// \p Err are whatever parseAssembly produces.
std::unique_ptr<Module> llvm::parseIR(MemoryBufferRef Buffer, SMDiagnostic &Err,
                                      LLVMContext &Context,
                                      ParserCallbacks Callbacks) {
  NamedRegionTimer ParseTimer(TimeIRParsingName, TimeIRParsingDescription,
                              TimeIRParsingGroupName,
                              TimeIRParsingGroupDescription,
                              TimePassesIsEnabled);

  const auto *Begin =
      reinterpret_cast<const unsigned char *>(Buffer.getBufferStart());
  const auto *End =
      reinterpret_cast<const unsigned char *>(Buffer.getBufferEnd());

  if (!isBitcode(Begin, End)) {
    // The fallback callback is kept inside the call expression so that any
    // temporaries it creates live for the duration of parseAssembly.
    return parseAssembly(Buffer, Err, Context, nullptr,
                         Callbacks.DataLayout.value_or(
                             [](StringRef, StringRef) { return std::nullopt; }));
  }

  Expected<std::unique_ptr<Module>> Parsed =
      parseBitcodeFile(Buffer, Context, Callbacks);
  Error ReadError = Parsed.takeError();
  if (!ReadError)
    return std::move(Parsed.get());

  // Turn the reader's error into a diagnostic for the caller.
  handleAllErrors(std::move(ReadError), [&](ErrorInfoBase &Info) {
    Err = SMDiagnostic(Buffer.getBufferIdentifier(), SourceMgr::DK_Error,
                       Info.message());
  });
  return nullptr;
}
|
|
|
|
/// Read \p Filename with MemoryBuffer::getFileOrSTDIN (requested with
/// IsText=true) and parse it through parseIR, forwarding \p Callbacks.
///
/// \returns the module produced by parseIR, or nullptr if the input could not
/// be read, in which case \p Err is set to a
/// "Could not open input file: ..." diagnostic for \p Filename.
std::unique_ptr<Module> llvm::parseIRFile(StringRef Filename, SMDiagnostic &Err,
                                          LLVMContext &Context,
                                          ParserCallbacks Callbacks) {
  ErrorOr<std::unique_ptr<MemoryBuffer>> Input =
      MemoryBuffer::getFileOrSTDIN(Filename, /*IsText=*/true);

  const std::error_code OpenError = Input.getError();
  if (OpenError) {
    Err = SMDiagnostic(Filename, SourceMgr::DK_Error,
                       "Could not open input file: " + OpenError.message());
    return nullptr;
  }

  // The buffer stays owned by Input for the duration of the parse; parseIR
  // only receives a non-owning reference to it.
  MemoryBuffer &Contents = *Input.get();
  return parseIR(Contents.getMemBufferRef(), Err, Context, Callbacks);
}
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// C API.
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
/// C API entry point: parse the IR held in \p MemBuf inside \p ContextRef.
///
/// The unwrapped buffer is placed in a std::unique_ptr, so it is destroyed
/// before this function returns, on success and on failure alike.
///
/// \param OutM        Receives the wrapped module, or a null reference if
///                    parsing failed.
/// \param OutMessage  If non-null and parsing failed, receives a strdup'ed
///                    copy of the printed diagnostic.
///                    NOTE(review): presumably the caller releases it with
///                    LLVMDisposeMessage -- confirm against the C API header.
/// \returns 0 on success and 1 on failure.
LLVMBool LLVMParseIRInContext(LLVMContextRef ContextRef,
                              LLVMMemoryBufferRef MemBuf, LLVMModuleRef *OutM,
                              char **OutMessage) {
  SMDiagnostic Diag;

  std::unique_ptr<MemoryBuffer> OwnedBuffer(unwrap(MemBuf));
  std::unique_ptr<Module> Parsed =
      parseIR(OwnedBuffer->getMemBufferRef(), Diag, *unwrap(ContextRef));
  *OutM = wrap(Parsed.release());

  if (*OutM)
    return 0;

  if (OutMessage) {
    std::string Text;
    raw_string_ostream Stream(Text);

    Diag.print(nullptr, Stream, false);
    // Make sure everything printed so far has reached Text before copying.
    Stream.flush();

    *OutMessage = strdup(Text.c_str());
  }
  return 1;
}
|