This PR changes how `ModuleManager` deduplicates module files. Previously, `ModuleManager` used `FileEntry` to assign a unique identity to module files. This works fine for explicitly-built modules because they don't change during the lifetime of a single Clang instance. For implicitly-built modules, however, there are two issues: (1) The `FileEntry` objects are deduplicated by `FileManager` based on the inode number. Some file systems reuse the inode numbers of previously removed files. Because implicitly-built module files are rapidly removed and created, this deduplication breaks, and compilations may fail spuriously when inode numbers are recycled during the lifetime of a single Clang instance. (2) The first thing `ModuleManager` does when loading a module file is consult the `FileManager` and check that the file size and modification time match the expectation of the importer. This is done even when the module file already lives in the `InMemoryModuleCache`. This introduces racy behavior into the mechanism that explicitly tries to solve race conditions, and may lead to spurious compilation failures. This PR identifies implicitly-built module files by a pair consisting of the `DirectoryEntry` of the module cache path and the path suffix `<context-hash>/<module-name>-<module-map-path-hash>.pcm`. This gives us canonicalization of the user-provided module cache path without turning to `FileEntry` for the PCM file. The path suffix is Clang-generated and is already canonical. Some tests needed to be updated because the module cache directory was also used as an include directory. This PR relies on the non-existence of the module cache directory not being cached in the `FileManager`. When other parts of Clang look up the same path and cache its non-existence, things break. This is probably very specific to some of our tests and not how users set up their compilations.
203 lines
8.0 KiB
C++
203 lines
8.0 KiB
C++
//===- ChainedIncludesSource.cpp - Chained PCHs in Memory -------*- C++ -*-===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This file defines the ChainedIncludesSource class, which converts headers
|
|
// to chained PCHs in memory, mainly used for testing.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "clang/Basic/Builtins.h"
|
|
#include "clang/Basic/TargetInfo.h"
|
|
#include "clang/Frontend/ASTUnit.h"
|
|
#include "clang/Frontend/CompilerInstance.h"
|
|
#include "clang/Frontend/TextDiagnosticPrinter.h"
|
|
#include "clang/Lex/Preprocessor.h"
|
|
#include "clang/Lex/PreprocessorOptions.h"
|
|
#include "clang/Parse/ParseAST.h"
|
|
#include "clang/Sema/MultiplexExternalSemaSource.h"
|
|
#include "clang/Serialization/ASTReader.h"
|
|
#include "clang/Serialization/ASTWriter.h"
|
|
#include "llvm/Support/MemoryBuffer.h"
|
|
|
|
using namespace clang;
|
|
|
|
namespace {
|
|
class ChainedIncludesSource : public ExternalSemaSource {
|
|
public:
|
|
ChainedIncludesSource(std::vector<std::unique_ptr<CompilerInstance>> CIs)
|
|
: CIs(std::move(CIs)) {}
|
|
|
|
protected:
|
|
//===--------------------------------------------------------------------===//
|
|
// ExternalASTSource interface.
|
|
//===--------------------------------------------------------------------===//
|
|
|
|
/// Return the amount of memory used by memory buffers, breaking down
|
|
/// by heap-backed versus mmap'ed memory.
|
|
void getMemoryBufferSizes(MemoryBufferSizes &sizes) const override {
|
|
for (unsigned i = 0, e = CIs.size(); i != e; ++i) {
|
|
if (const ExternalASTSource *eSrc =
|
|
CIs[i]->getASTContext().getExternalSource()) {
|
|
eSrc->getMemoryBufferSizes(sizes);
|
|
}
|
|
}
|
|
}
|
|
|
|
private:
|
|
std::vector<std::unique_ptr<CompilerInstance>> CIs;
|
|
};
|
|
} // end anonymous namespace
|
|
|
|
/// Create an ASTReader for \p CI, register the supplied in-memory buffers with
/// it, and read \p pchFile as a PCH.
///
/// \param CI               compiler instance supplying the preprocessor,
///                         module cache, AST context, PCH container reader
///                         and codegen options for the reader.
/// \param pchFile          name of the PCH to read.
/// \param MemBufs          buffers to register with the reader. The first
///                         bufNames.size() elements are moved from.
/// \param bufNames         names under which the buffers are registered;
///                         bufNames[i] names MemBufs[i].
/// \param deserialListener listener installed on the reader before reading;
///                         may be null.
/// \returns the reader if ReadAST reports Success, otherwise null.
static llvm::IntrusiveRefCntPtr<ASTReader>
createASTReader(CompilerInstance &CI, StringRef pchFile,
                SmallVectorImpl<std::unique_ptr<llvm::MemoryBuffer>> &MemBufs,
                SmallVectorImpl<std::string> &bufNames,
                ASTDeserializationListener *deserialListener = nullptr) {
  // The two containers are indexed in lock-step below, so every name must
  // have a buffer to go with it.
  assert(bufNames.size() <= MemBufs.size() &&
         "in-memory buffer name without a matching buffer");

  Preprocessor &PP = CI.getPreprocessor();
  auto Reader = llvm::makeIntrusiveRefCnt<ASTReader>(
      PP, CI.getModuleCache(), &CI.getASTContext(), CI.getPCHContainerReader(),
      CI.getCodeGenOpts(),
      /*Extensions=*/ArrayRef<std::shared_ptr<ModuleFileExtension>>(),
      /*isysroot=*/"", DisableValidationForModuleKind::PCH);

  for (unsigned Idx = 0; Idx < bufNames.size(); ++Idx) {
    // A named StringRef lvalue is kept here, as in the original code, rather
    // than passing the std::string directly.
    StringRef Name(bufNames[Idx]);
    Reader->addInMemoryBuffer(Name, std::move(MemBufs[Idx]));
  }

  Reader->setDeserializationListener(deserialListener);

  const auto ReadResult =
      Reader->ReadAST(ModuleFileName::makeExplicit(pchFile),
                      serialization::MK_PCH, SourceLocation(),
                      ASTReader::ARR_None);
  switch (ReadResult) {
  case ASTReader::Success:
    // Set the predefines buffer as suggested by the PCH reader.
    PP.setPredefines(Reader->getSuggestedPredefines());
    return Reader;

  // Every non-success result is listed explicitly (no default) and is
  // reported to the caller as a null reader.
  case ASTReader::Failure:
  case ASTReader::Missing:
  case ASTReader::OutOfDate:
  case ASTReader::VersionMismatch:
  case ASTReader::ConfigurationMismatch:
  case ASTReader::HadErrors:
    break;
  }
  return nullptr;
}
|
|
|
|
/// Build the external sema source for the headers listed in
/// PreprocessorOptions::ChainedIncludes.
///
/// Each listed header is parsed by its own CompilerInstance and serialized
/// into an in-memory PCH buffer. Every instance after the first is given an
/// ASTReader over all buffers produced so far. Finally a reader over the whole
/// chain is created for \p CI and stored in \p OutReader.
///
/// \returns a MultiplexExternalSemaSource combining the owner of the
/// intermediate instances with \p OutReader, or null if creating a reader or
/// initializing a source manager fails.
IntrusiveRefCntPtr<ExternalSemaSource>
clang::createChainedIncludesSource(CompilerInstance &CI,
                                   IntrusiveRefCntPtr<ASTReader> &OutReader) {
  std::vector<std::string> &ChainedHeaders =
      CI.getPreprocessorOpts().ChainedIncludes;
  assert(!ChainedHeaders.empty() && "No '-chain-include' in options!");

  std::vector<std::unique_ptr<CompilerInstance>> Instances;
  InputKind Kind = CI.getFrontendOpts().Inputs[0].getKind();

  // Serialized PCH contents and the names they are registered under, in
  // chain order.
  SmallVector<std::unique_ptr<llvm::MemoryBuffer>, 4> PCHBuffers;
  SmallVector<std::string, 4> PCHNames;

  for (unsigned Idx = 0, Count = ChainedHeaders.size(); Idx != Count; ++Idx) {
    // Start from a copy of the outer invocation and strip everything that
    // would pull in extra input for this link of the chain.
    auto Invocation = std::make_unique<CompilerInvocation>(CI.getInvocation());

    auto &PPOpts = Invocation->getPreprocessorOpts();
    PPOpts.ChainedIncludes.clear();
    PPOpts.ImplicitPCHInclude.clear();
    PPOpts.DisablePCHOrModuleValidation = DisableValidationForModuleKind::PCH;
    PPOpts.Includes.clear();
    PPOpts.MacroIncludes.clear();
    PPOpts.Macros.clear();

    // The chained header itself is the only input of this instance.
    auto &FEOpts = Invocation->getFrontendOpts();
    FEOpts.Inputs.clear();
    FrontendInputFile InputFile(ChainedHeaders[Idx], Kind);
    FEOpts.Inputs.push_back(InputFile);

    // The printer is handed to the DiagnosticsEngine created right below.
    auto *Printer =
        new TextDiagnosticPrinter(llvm::errs(), CI.getDiagnosticOpts());
    auto Diags = llvm::makeIntrusiveRefCnt<DiagnosticsEngine>(
        DiagnosticIDs::create(), CI.getDiagnosticOpts(), Printer);

    auto Clang = std::make_unique<CompilerInstance>(
        std::move(Invocation), CI.getPCHContainerOperations());
    // Inherit the VFS as-is: code below does not make changes to the VFS or to
    // the VFS-affecting options.
    Clang->setVirtualFileSystem(CI.getVirtualFileSystemPtr());
    Clang->setDiagnostics(Diags);
    Clang->setTarget(TargetInfo::CreateTargetInfo(
        Clang->getDiagnostics(), Clang->getInvocation().getTargetOpts()));
    Clang->createFileManager();
    Clang->createSourceManager();
    Clang->createPreprocessor(TU_Prefix);
    Clang->getDiagnosticClient().BeginSourceFile(Clang->getLangOpts(),
                                                 &Clang->getPreprocessor());
    Clang->createASTContext();

    // The PCH generator writes the serialized AST into this shared buffer.
    auto Buffer = std::make_shared<PCHBuffer>();
    ArrayRef<std::shared_ptr<ModuleFileExtension>> Extensions;
    auto Generator = std::make_unique<PCHGenerator>(
        Clang->getPreprocessor(), Clang->getModuleCache(), "-", /*isysroot=*/"",
        Buffer, Clang->getCodeGenOpts(), Extensions,
        /*AllowASTWithErrors=*/true);
    Clang->getASTContext().setASTMutationListener(
        Generator->GetASTMutationListener());
    Clang->setASTConsumer(std::move(Generator));
    Clang->createSema(TU_Prefix, nullptr);

    if (Idx == 0) {
      // First link of the chain: nothing to load, just set up the builtins.
      Preprocessor &PP = Clang->getPreprocessor();
      PP.getBuiltinInfo().initializeBuiltins(PP.getIdentifierTable(),
                                             PP.getLangOpts());
    } else {
      assert(!PCHBuffers.empty());
      SmallVector<std::unique_ptr<llvm::MemoryBuffer>, 4> BufferViews;
      // TODO: Pass through the existing MemoryBuffer instances instead of
      // allocating new ones.
      for (auto &Serialized : PCHBuffers)
        BufferViews.push_back(
            llvm::MemoryBuffer::getMemBuffer(Serialized->getBuffer()));

      // Name of the PCH produced by the previous link:
      // "<previous header>.pch<previous index>".
      std::string PrevPCHName = ChainedHeaders[Idx - 1];
      llvm::raw_string_ostream NameStream(PrevPCHName);
      NameStream << ".pch" << Idx - 1;
      PCHNames.push_back(PrevPCHName);

      IntrusiveRefCntPtr<ASTReader> Reader = createASTReader(
          *Clang, PrevPCHName, BufferViews, PCHNames,
          Clang->getASTConsumer().GetASTDeserializationListener());
      if (!Reader)
        return nullptr;
      Clang->setASTReader(Reader);
      Clang->getASTContext().setExternalSource(Reader);
    }

    if (!Clang->InitializeSourceManager(InputFile))
      return nullptr;

    ParseAST(Clang->getSema());
    Clang->getDiagnosticClient().EndSourceFile();
    assert(Buffer->IsComplete && "serialization did not complete");

    // Keep a private copy of the serialized AST, then empty the generator's
    // buffer.
    auto &Serialized = Buffer->Data;
    PCHBuffers.push_back(llvm::MemoryBuffer::getMemBufferCopy(
        StringRef(Serialized.data(), Serialized.size())));
    Serialized.clear();
    Instances.push_back(std::move(Clang));
  }

  // Hand the complete chain to the outer compiler instance.
  assert(!PCHBuffers.empty());
  std::string FinalPCHName = ChainedHeaders.back() + ".pch-final";
  PCHNames.push_back(FinalPCHName);
  OutReader = createASTReader(CI, FinalPCHName, PCHBuffers, PCHNames);
  if (!OutReader)
    return nullptr;

  auto ChainOwner =
      llvm::makeIntrusiveRefCnt<ChainedIncludesSource>(std::move(Instances));
  return llvm::makeIntrusiveRefCnt<MultiplexExternalSemaSource>(
      std::move(ChainOwner), OutReader);
}
|