//===-- SymbolFileNativePDB.cpp ---------------------------------*- C++ -*-===// // // The LLVM Compiler Infrastructure // // This file is distributed under the University of Illinois Open Source // License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// #include "SymbolFileNativePDB.h" #include "clang/AST/Attr.h" #include "clang/AST/CharUnits.h" #include "clang/AST/Decl.h" #include "clang/AST/DeclCXX.h" #include "lldb/Core/Module.h" #include "lldb/Core/PluginManager.h" #include "lldb/Symbol/ClangASTContext.h" #include "lldb/Symbol/ClangASTImporter.h" #include "lldb/Symbol/ClangExternalASTSourceCommon.h" #include "lldb/Symbol/CompileUnit.h" #include "lldb/Symbol/LineTable.h" #include "lldb/Symbol/ObjectFile.h" #include "lldb/Symbol/SymbolContext.h" #include "lldb/Symbol/SymbolVendor.h" #include "llvm/DebugInfo/CodeView/CVRecord.h" #include "llvm/DebugInfo/CodeView/CVTypeVisitor.h" #include "llvm/DebugInfo/CodeView/DebugLinesSubsection.h" #include "llvm/DebugInfo/CodeView/LazyRandomTypeCollection.h" #include "llvm/DebugInfo/CodeView/RecordName.h" #include "llvm/DebugInfo/CodeView/SymbolDeserializer.h" #include "llvm/DebugInfo/CodeView/TypeDeserializer.h" #include "llvm/DebugInfo/PDB/Native/DbiStream.h" #include "llvm/DebugInfo/PDB/Native/GlobalsStream.h" #include "llvm/DebugInfo/PDB/Native/InfoStream.h" #include "llvm/DebugInfo/PDB/Native/ModuleDebugStream.h" #include "llvm/DebugInfo/PDB/Native/PDBFile.h" #include "llvm/DebugInfo/PDB/Native/SymbolStream.h" #include "llvm/DebugInfo/PDB/Native/TpiStream.h" #include "llvm/DebugInfo/PDB/PDBTypes.h" #include "llvm/Object/COFF.h" #include "llvm/Support/Allocator.h" #include "llvm/Support/BinaryStreamReader.h" #include "llvm/Support/ErrorOr.h" #include "llvm/Support/MemoryBuffer.h" #include "PdbSymUid.h" #include "PdbUtil.h" #include "UdtRecordCompleter.h" using namespace lldb; using namespace lldb_private; using namespace npdb; using namespace llvm::codeview; using namespace llvm::pdb; static lldb::LanguageType TranslateLanguage(PDB_Lang lang) { switch (lang) { case PDB_Lang::Cpp: return lldb::LanguageType::eLanguageTypeC_plus_plus; case PDB_Lang::C: return lldb::LanguageType::eLanguageTypeC; default: return lldb::LanguageType::eLanguageTypeUnknown; } } static std::unique_ptr loadPDBFile(std::string PdbPath, llvm::BumpPtrAllocator &Allocator) { llvm::ErrorOr> ErrorOrBuffer = llvm::MemoryBuffer::getFile(PdbPath, /*FileSize=*/-1, /*RequiresNullTerminator=*/false); if (!ErrorOrBuffer) return nullptr; std::unique_ptr Buffer = std::move(*ErrorOrBuffer); llvm::StringRef Path = Buffer->getBufferIdentifier(); auto Stream = llvm::make_unique( std::move(Buffer), llvm::support::little); auto File = llvm::make_unique(Path, std::move(Stream), Allocator); if (auto EC = File->parseFileHeaders()) { llvm::consumeError(std::move(EC)); return nullptr; } if (auto EC = File->parseStreamData()) { llvm::consumeError(std::move(EC)); return nullptr; } return File; } static std::unique_ptr loadMatchingPDBFile(std::string exe_path, llvm::BumpPtrAllocator &allocator) { // Try to find a matching PDB for an EXE. using namespace llvm::object; auto expected_binary = createBinary(exe_path); // If the file isn't a PE/COFF executable, fail. if (!expected_binary) { llvm::consumeError(expected_binary.takeError()); return nullptr; } OwningBinary binary = std::move(*expected_binary); auto *obj = llvm::dyn_cast(binary.getBinary()); if (!obj) return nullptr; const llvm::codeview::DebugInfo *pdb_info = nullptr; // If it doesn't have a debug directory, fail. llvm::StringRef pdb_file; auto ec = obj->getDebugPDBInfo(pdb_info, pdb_file); if (ec) return nullptr; // if the file doesn't exist, is not a pdb, or doesn't have a matching guid, // fail. llvm::file_magic magic; ec = llvm::identify_magic(pdb_file, magic); if (ec || magic != llvm::file_magic::pdb) return nullptr; std::unique_ptr pdb = loadPDBFile(pdb_file, allocator); if (!pdb) return nullptr; auto expected_info = pdb->getPDBInfoStream(); if (!expected_info) { llvm::consumeError(expected_info.takeError()); return nullptr; } llvm::codeview::GUID guid; memcpy(&guid, pdb_info->PDB70.Signature, 16); if (expected_info->getGuid() != guid) return nullptr; return pdb; } static bool IsFunctionPrologue(const CompilandIndexItem &cci, lldb::addr_t addr) { // FIXME: Implement this. return false; } static bool IsFunctionEpilogue(const CompilandIndexItem &cci, lldb::addr_t addr) { // FIXME: Implement this. return false; } static clang::MSInheritanceAttr::Spelling GetMSInheritance(LazyRandomTypeCollection &tpi, const ClassRecord &record) { if (record.DerivationList == TypeIndex::None()) return clang::MSInheritanceAttr::Spelling::Keyword_single_inheritance; CVType bases = tpi.getType(record.DerivationList); ArgListRecord base_list; cantFail(TypeDeserializer::deserializeAs(bases, base_list)); if (base_list.ArgIndices.empty()) return clang::MSInheritanceAttr::Spelling::Keyword_single_inheritance; int base_count = 0; for (TypeIndex ti : base_list.ArgIndices) { CVType base = tpi.getType(ti); if (base.kind() == LF_VBCLASS || base.kind() == LF_IVBCLASS) return clang::MSInheritanceAttr::Spelling::Keyword_virtual_inheritance; ++base_count; } if (base_count > 1) return clang::MSInheritanceAttr::Keyword_multiple_inheritance; return clang::MSInheritanceAttr::Keyword_single_inheritance; } static lldb::BasicType GetCompilerTypeForSimpleKind(SimpleTypeKind kind) { switch (kind) { case SimpleTypeKind::Boolean128: case SimpleTypeKind::Boolean16: case SimpleTypeKind::Boolean32: case SimpleTypeKind::Boolean64: case SimpleTypeKind::Boolean8: return lldb::eBasicTypeBool; case SimpleTypeKind::Byte: case SimpleTypeKind::UnsignedCharacter: return lldb::eBasicTypeUnsignedChar; case SimpleTypeKind::NarrowCharacter: return lldb::eBasicTypeChar; case SimpleTypeKind::SignedCharacter: case SimpleTypeKind::SByte: return lldb::eBasicTypeSignedChar; case SimpleTypeKind::Character16: return lldb::eBasicTypeChar16; case SimpleTypeKind::Character32: return lldb::eBasicTypeChar32; case SimpleTypeKind::Complex80: return lldb::eBasicTypeLongDoubleComplex; case SimpleTypeKind::Complex64: return lldb::eBasicTypeDoubleComplex; case SimpleTypeKind::Complex32: return lldb::eBasicTypeFloatComplex; case SimpleTypeKind::Float128: case SimpleTypeKind::Float80: return lldb::eBasicTypeLongDouble; case SimpleTypeKind::Float64: return lldb::eBasicTypeDouble; case SimpleTypeKind::Float32: return lldb::eBasicTypeFloat; case SimpleTypeKind::Float16: return lldb::eBasicTypeHalf; case SimpleTypeKind::Int128: return lldb::eBasicTypeInt128; case SimpleTypeKind::Int64: case SimpleTypeKind::Int64Quad: return lldb::eBasicTypeLongLong; case SimpleTypeKind::Int32: return lldb::eBasicTypeInt; case SimpleTypeKind::Int16: case SimpleTypeKind::Int16Short: return lldb::eBasicTypeShort; case SimpleTypeKind::UInt128: return lldb::eBasicTypeUnsignedInt128; case SimpleTypeKind::UInt64: case SimpleTypeKind::UInt64Quad: return lldb::eBasicTypeUnsignedLongLong; case SimpleTypeKind::HResult: case SimpleTypeKind::UInt32: return lldb::eBasicTypeUnsignedInt; case SimpleTypeKind::UInt16: case SimpleTypeKind::UInt16Short: return lldb::eBasicTypeUnsignedShort; case SimpleTypeKind::Int32Long: return lldb::eBasicTypeLong; case SimpleTypeKind::UInt32Long: return lldb::eBasicTypeUnsignedLong; case SimpleTypeKind::Void: return lldb::eBasicTypeVoid; case SimpleTypeKind::WideCharacter: return lldb::eBasicTypeWChar; default: return lldb::eBasicTypeInvalid; } } static size_t GetTypeSizeForSimpleKind(SimpleTypeKind kind) { switch (kind) { case SimpleTypeKind::Boolean128: case SimpleTypeKind::Int128: case SimpleTypeKind::UInt128: case SimpleTypeKind::Float128: return 16; case SimpleTypeKind::Complex80: case SimpleTypeKind::Float80: return 10; case SimpleTypeKind::Boolean64: case SimpleTypeKind::Complex64: case SimpleTypeKind::UInt64: case SimpleTypeKind::UInt64Quad: case SimpleTypeKind::Float64: case SimpleTypeKind::Int64: case SimpleTypeKind::Int64Quad: return 8; case SimpleTypeKind::Boolean32: case SimpleTypeKind::Character32: case SimpleTypeKind::Complex32: case SimpleTypeKind::Float32: case SimpleTypeKind::Int32: case SimpleTypeKind::Int32Long: case SimpleTypeKind::UInt32Long: case SimpleTypeKind::HResult: case SimpleTypeKind::UInt32: return 4; case SimpleTypeKind::Boolean16: case SimpleTypeKind::Character16: case SimpleTypeKind::Float16: case SimpleTypeKind::Int16: case SimpleTypeKind::Int16Short: case SimpleTypeKind::UInt16: case SimpleTypeKind::UInt16Short: case SimpleTypeKind::WideCharacter: return 2; case SimpleTypeKind::Boolean8: case SimpleTypeKind::Byte: case SimpleTypeKind::UnsignedCharacter: case SimpleTypeKind::NarrowCharacter: case SimpleTypeKind::SignedCharacter: case SimpleTypeKind::SByte: return 1; case SimpleTypeKind::Void: default: return 0; } } static llvm::StringRef GetSimpleTypeName(SimpleTypeKind kind) { switch (kind) { case SimpleTypeKind::Boolean128: case SimpleTypeKind::Boolean16: case SimpleTypeKind::Boolean32: case SimpleTypeKind::Boolean64: case SimpleTypeKind::Boolean8: return "bool"; case SimpleTypeKind::Byte: case SimpleTypeKind::UnsignedCharacter: return "unsigned char"; case SimpleTypeKind::NarrowCharacter: return "char"; case SimpleTypeKind::SignedCharacter: case SimpleTypeKind::SByte: return "signed char"; case SimpleTypeKind::Character16: return "char16_t"; case SimpleTypeKind::Character32: return "char32_t"; case SimpleTypeKind::Complex80: case SimpleTypeKind::Complex64: case SimpleTypeKind::Complex32: return "complex"; case SimpleTypeKind::Float128: case SimpleTypeKind::Float80: return "long double"; case SimpleTypeKind::Float64: return "double"; case SimpleTypeKind::Float32: return "float"; case SimpleTypeKind::Float16: return "single"; case SimpleTypeKind::Int128: return "__int128"; case SimpleTypeKind::Int64: case SimpleTypeKind::Int64Quad: return "int64_t"; case SimpleTypeKind::Int32: return "int"; case SimpleTypeKind::Int16: return "short"; case SimpleTypeKind::UInt128: return "unsigned __int128"; case SimpleTypeKind::UInt64: case SimpleTypeKind::UInt64Quad: return "uint64_t"; case SimpleTypeKind::HResult: return "HRESULT"; case SimpleTypeKind::UInt32: return "unsigned"; case SimpleTypeKind::UInt16: case SimpleTypeKind::UInt16Short: return "unsigned short"; case SimpleTypeKind::Int32Long: return "long"; case SimpleTypeKind::UInt32Long: return "unsigned long"; case SimpleTypeKind::Void: return "void"; case SimpleTypeKind::WideCharacter: return "wchar_t"; default: return ""; } } static bool IsClassRecord(TypeLeafKind kind) { switch (kind) { case LF_STRUCTURE: case LF_CLASS: case LF_INTERFACE: return true; default: return false; } } static PDB_SymType GetPdbSymType(TpiStream &tpi, TypeIndex ti) { if (ti.isSimple()) { if (ti.getSimpleMode() == SimpleTypeMode::Direct) return PDB_SymType::BuiltinType; return PDB_SymType::PointerType; } CVType cvt = tpi.getType(ti); TypeLeafKind kind = cvt.kind(); if (kind != LF_MODIFIER) return CVTypeToPDBType(kind); // If this is an LF_MODIFIER, look through it to get the kind that it // modifies. Note that it's not possible to have an LF_MODIFIER that // modifies another LF_MODIFIER, although this would handle that anyway. ModifierRecord mr; llvm::cantFail(TypeDeserializer::deserializeAs(cvt, mr)); return GetPdbSymType(tpi, mr.ModifiedType); } static clang::TagTypeKind TranslateUdtKind(const TagRecord &cr) { switch (cr.Kind) { case TypeRecordKind::Class: return clang::TTK_Class; case TypeRecordKind::Struct: return clang::TTK_Struct; case TypeRecordKind::Union: return clang::TTK_Union; case TypeRecordKind::Interface: return clang::TTK_Interface; case TypeRecordKind::Enum: return clang::TTK_Enum; default: lldbassert(false && "Invalid tag record kind!"); return clang::TTK_Struct; } } void SymbolFileNativePDB::Initialize() { PluginManager::RegisterPlugin(GetPluginNameStatic(), GetPluginDescriptionStatic(), CreateInstance, DebuggerInitialize); } void SymbolFileNativePDB::Terminate() { PluginManager::UnregisterPlugin(CreateInstance); } void SymbolFileNativePDB::DebuggerInitialize(Debugger &debugger) {} ConstString SymbolFileNativePDB::GetPluginNameStatic() { static ConstString g_name("native-pdb"); return g_name; } const char *SymbolFileNativePDB::GetPluginDescriptionStatic() { return "Microsoft PDB debug symbol cross-platform file reader."; } SymbolFile *SymbolFileNativePDB::CreateInstance(ObjectFile *obj_file) { return new SymbolFileNativePDB(obj_file); } SymbolFileNativePDB::SymbolFileNativePDB(ObjectFile *object_file) : SymbolFile(object_file) {} SymbolFileNativePDB::~SymbolFileNativePDB() {} uint32_t SymbolFileNativePDB::CalculateAbilities() { uint32_t abilities = 0; if (!m_obj_file) return 0; if (!m_index) { // Lazily load and match the PDB file, but only do this once. std::unique_ptr file_up = loadMatchingPDBFile(m_obj_file->GetFileSpec().GetPath(), m_allocator); if (!file_up) { auto module_sp = m_obj_file->GetModule(); if (!module_sp) return 0; // See if any symbol file is specified through `--symfile` option. FileSpec symfile = module_sp->GetSymbolFileFileSpec(); if (!symfile) return 0; file_up = loadPDBFile(symfile.GetPath(), m_allocator); } if (!file_up) return 0; auto expected_index = PdbIndex::create(std::move(file_up)); if (!expected_index) { llvm::consumeError(expected_index.takeError()); return 0; } m_index = std::move(*expected_index); } if (!m_index) return 0; // We don't especially have to be precise here. We only distinguish between // stripped and not stripped. abilities = kAllAbilities; if (m_index->dbi().isStripped()) abilities &= ~(Blocks | LocalVariables); return abilities; } void SymbolFileNativePDB::InitializeObject() { m_obj_load_address = m_obj_file->GetFileOffset(); m_index->SetLoadAddress(m_obj_load_address); m_index->ParseSectionContribs(); TypeSystem *ts = GetTypeSystemForLanguage(eLanguageTypeC_plus_plus); m_clang = llvm::dyn_cast_or_null(ts); m_importer = llvm::make_unique(); lldbassert(m_clang); } uint32_t SymbolFileNativePDB::GetNumCompileUnits() { const DbiModuleList &modules = m_index->dbi().modules(); uint32_t count = modules.getModuleCount(); if (count == 0) return count; // The linker can inject an additional "dummy" compilation unit into the // PDB. Ignore this special compile unit for our purposes, if it is there. // It is always the last one. DbiModuleDescriptor last = modules.getModuleDescriptor(count - 1); if (last.getModuleName() == "* Linker *") --count; return count; } lldb::FunctionSP SymbolFileNativePDB::CreateFunction(PdbSymUid func_uid, const SymbolContext &sc) { lldbassert(func_uid.tag() == PDB_SymType::Function); PdbSymUid cuid = PdbSymUid::makeCompilandId(func_uid.asCuSym().modi); const CompilandIndexItem *cci = m_index->compilands().GetCompiland(cuid); lldbassert(cci); CVSymbol sym_record = cci->m_debug_stream.readSymbolAtOffset(func_uid.asCuSym().offset); lldbassert(sym_record.kind() == S_LPROC32 || sym_record.kind() == S_GPROC32); SegmentOffsetLength sol = GetSegmentOffsetAndLength(sym_record); auto file_vm_addr = m_index->MakeVirtualAddress(sol.so); if (file_vm_addr == LLDB_INVALID_ADDRESS || file_vm_addr == 0) return nullptr; AddressRange func_range(file_vm_addr, sol.length, sc.module_sp->GetSectionList()); if (!func_range.GetBaseAddress().IsValid()) return nullptr; Type *func_type = nullptr; // FIXME: Resolve types and mangled names. PdbSymUid sig_uid = PdbSymUid::makeTypeSymId(PDB_SymType::FunctionSig, TypeIndex{0}, false); Mangled mangled(getSymbolName(sym_record)); FunctionSP func_sp = std::make_shared( sc.comp_unit, func_uid.toOpaqueId(), sig_uid.toOpaqueId(), mangled, func_type, func_range); sc.comp_unit->AddFunction(func_sp); return func_sp; } CompUnitSP SymbolFileNativePDB::CreateCompileUnit(const CompilandIndexItem &cci) { lldb::LanguageType lang = cci.m_compile_opts ? TranslateLanguage(cci.m_compile_opts->getLanguage()) : lldb::eLanguageTypeUnknown; LazyBool optimized = eLazyBoolNo; if (cci.m_compile_opts && cci.m_compile_opts->hasOptimizations()) optimized = eLazyBoolYes; llvm::StringRef source_file_name = m_index->compilands().GetMainSourceFile(cci); FileSpec fs(source_file_name, false); CompUnitSP cu_sp = std::make_shared(m_obj_file->GetModule(), nullptr, fs, cci.m_uid.toOpaqueId(), lang, optimized); const PdbCompilandId &cuid = cci.m_uid.asCompiland(); m_obj_file->GetModule()->GetSymbolVendor()->SetCompileUnitAtIndex(cuid.modi, cu_sp); return cu_sp; } lldb::TypeSP SymbolFileNativePDB::CreateModifierType(PdbSymUid type_uid, const ModifierRecord &mr) { TpiStream &stream = m_index->tpi(); TypeSP t = GetOrCreateType(mr.ModifiedType); CompilerType ct = t->GetForwardCompilerType(); if ((mr.Modifiers & ModifierOptions::Const) != ModifierOptions::None) ct = ct.AddConstModifier(); if ((mr.Modifiers & ModifierOptions::Volatile) != ModifierOptions::None) ct = ct.AddVolatileModifier(); std::string name; if (mr.ModifiedType.isSimple()) name = GetSimpleTypeName(mr.ModifiedType.getSimpleKind()); else name = computeTypeName(stream.typeCollection(), mr.ModifiedType); Declaration decl; return std::make_shared(type_uid.toOpaqueId(), m_clang->GetSymbolFile(), ConstString(name), t->GetByteSize(), nullptr, LLDB_INVALID_UID, Type::eEncodingIsUID, decl, ct, Type::eResolveStateFull); } lldb::TypeSP SymbolFileNativePDB::CreatePointerType( PdbSymUid type_uid, const llvm::codeview::PointerRecord &pr) { TypeSP pointee = GetOrCreateType(pr.ReferentType); CompilerType pointee_ct = pointee->GetForwardCompilerType(); lldbassert(pointee_ct); Declaration decl; if (pr.isPointerToMember()) { MemberPointerInfo mpi = pr.getMemberInfo(); TypeSP class_type = GetOrCreateType(mpi.ContainingType); CompilerType ct = ClangASTContext::CreateMemberPointerType( class_type->GetLayoutCompilerType(), pointee_ct); return std::make_shared( type_uid.toOpaqueId(), m_clang->GetSymbolFile(), ConstString(), pr.getSize(), nullptr, LLDB_INVALID_UID, Type::eEncodingIsUID, decl, ct, Type::eResolveStateFull); } CompilerType pointer_ct = pointee_ct; if (pr.getMode() == PointerMode::LValueReference) pointer_ct = pointer_ct.GetLValueReferenceType(); else if (pr.getMode() == PointerMode::RValueReference) pointer_ct = pointer_ct.GetRValueReferenceType(); else pointer_ct = pointer_ct.GetPointerType(); if ((pr.getOptions() & PointerOptions::Const) != PointerOptions::None) pointer_ct = pointer_ct.AddConstModifier(); if ((pr.getOptions() & PointerOptions::Volatile) != PointerOptions::None) pointer_ct = pointer_ct.AddVolatileModifier(); if ((pr.getOptions() & PointerOptions::Restrict) != PointerOptions::None) pointer_ct = pointer_ct.AddRestrictModifier(); return std::make_shared(type_uid.toOpaqueId(), m_clang->GetSymbolFile(), ConstString(), pr.getSize(), nullptr, LLDB_INVALID_UID, Type::eEncodingIsUID, decl, pointer_ct, Type::eResolveStateFull); } lldb::TypeSP SymbolFileNativePDB::CreateSimpleType(TypeIndex ti) { if (ti.getSimpleMode() != SimpleTypeMode::Direct) { PdbSymUid uid = PdbSymUid::makeTypeSymId(PDB_SymType::PointerType, ti, false); TypeSP direct_sp = GetOrCreateType(ti.makeDirect()); CompilerType ct = direct_sp->GetFullCompilerType(); ct = ct.GetPointerType(); uint32_t pointer_size = 0; switch (ti.getSimpleMode()) { case SimpleTypeMode::FarPointer32: case SimpleTypeMode::NearPointer32: pointer_size = 4; break; case SimpleTypeMode::NearPointer64: pointer_size = 8; break; default: // 128-bit and 16-bit pointers unsupported. return nullptr; } Declaration decl; return std::make_shared(uid.toOpaqueId(), m_clang->GetSymbolFile(), ConstString(), pointer_size, nullptr, LLDB_INVALID_UID, Type::eEncodingIsUID, decl, ct, Type::eResolveStateFull); } PdbSymUid uid = PdbSymUid::makeTypeSymId(PDB_SymType::BuiltinType, ti, false); if (ti.getSimpleKind() == SimpleTypeKind::NotTranslated) return nullptr; lldb::BasicType bt = GetCompilerTypeForSimpleKind(ti.getSimpleKind()); lldbassert(bt != lldb::eBasicTypeInvalid); CompilerType ct = m_clang->GetBasicType(bt); size_t size = GetTypeSizeForSimpleKind(ti.getSimpleKind()); llvm::StringRef type_name = GetSimpleTypeName(ti.getSimpleKind()); Declaration decl; return std::make_shared(uid.toOpaqueId(), m_clang->GetSymbolFile(), ConstString(type_name), size, nullptr, LLDB_INVALID_UID, Type::eEncodingIsUID, decl, ct, Type::eResolveStateFull); } lldb::TypeSP SymbolFileNativePDB::CreateClassStructUnion( PdbSymUid type_uid, llvm::StringRef name, size_t size, clang::TagTypeKind ttk, clang::MSInheritanceAttr::Spelling inheritance) { // Some UDT with trival ctor has zero length. Just ignore. if (size == 0) return nullptr; // Ignore unnamed-tag UDTs. name = DropNameScope(name); if (name.empty()) return nullptr; clang::DeclContext *decl_context = m_clang->GetTranslationUnitDecl(); lldb::AccessType access = (ttk == clang::TTK_Class) ? lldb::eAccessPrivate : lldb::eAccessPublic; ClangASTMetadata metadata; metadata.SetUserID(type_uid.toOpaqueId()); metadata.SetIsDynamicCXXType(false); CompilerType ct = m_clang->CreateRecordType(decl_context, access, name.str().c_str(), ttk, lldb::eLanguageTypeC_plus_plus, &metadata); lldbassert(ct.IsValid()); clang::CXXRecordDecl *record_decl = m_clang->GetAsCXXRecordDecl(ct.GetOpaqueQualType()); lldbassert(record_decl); clang::MSInheritanceAttr *attr = clang::MSInheritanceAttr::CreateImplicit( *m_clang->getASTContext(), inheritance); record_decl->addAttr(attr); ClangASTContext::StartTagDeclarationDefinition(ct); // Even if it's possible, don't complete it at this point. Just mark it // forward resolved, and if/when LLDB needs the full definition, it can // ask us. ClangASTContext::SetHasExternalStorage(ct.GetOpaqueQualType(), true); // FIXME: Search IPI stream for LF_UDT_MOD_SRC_LINE. Declaration decl; return std::make_shared(type_uid.toOpaqueId(), m_clang->GetSymbolFile(), ConstString(name), size, nullptr, LLDB_INVALID_UID, Type::eEncodingIsUID, decl, ct, Type::eResolveStateForward); } lldb::TypeSP SymbolFileNativePDB::CreateTagType(PdbSymUid type_uid, const ClassRecord &cr) { clang::TagTypeKind ttk = TranslateUdtKind(cr); clang::MSInheritanceAttr::Spelling inheritance = GetMSInheritance(m_index->tpi().typeCollection(), cr); return CreateClassStructUnion(type_uid, cr.getName(), cr.getSize(), ttk, inheritance); } lldb::TypeSP SymbolFileNativePDB::CreateTagType(PdbSymUid type_uid, const UnionRecord &ur) { return CreateClassStructUnion( type_uid, ur.getName(), ur.getSize(), clang::TTK_Union, clang::MSInheritanceAttr::Spelling::Keyword_single_inheritance); } lldb::TypeSP SymbolFileNativePDB::CreateTagType(PdbSymUid type_uid, const EnumRecord &er) { llvm::StringRef name = DropNameScope(er.getName()); clang::DeclContext *decl_context = m_clang->GetTranslationUnitDecl(); Declaration decl; TypeSP underlying_type = GetOrCreateType(er.UnderlyingType); CompilerType enum_ct = m_clang->CreateEnumerationType( name.str().c_str(), decl_context, decl, underlying_type->GetFullCompilerType(), er.isScoped()); ClangASTContext::StartTagDeclarationDefinition(enum_ct); // We're just going to forward resolve this for now. We'll complete // it only if the user requests. return std::make_shared( type_uid.toOpaqueId(), m_clang->GetSymbolFile(), ConstString(name), underlying_type->GetByteSize(), nullptr, LLDB_INVALID_UID, lldb_private::Type::eEncodingIsUID, decl, enum_ct, lldb_private::Type::eResolveStateForward); } TypeSP SymbolFileNativePDB::CreateType(PdbSymUid type_uid) { const PdbTypeSymId &tsid = type_uid.asTypeSym(); TypeIndex index(tsid.index); if (index.getIndex() < TypeIndex::FirstNonSimpleIndex) return CreateSimpleType(index); TpiStream &stream = tsid.is_ipi ? m_index->ipi() : m_index->tpi(); CVType cvt = stream.getType(index); if (cvt.kind() == LF_MODIFIER) { ModifierRecord modifier; llvm::cantFail( TypeDeserializer::deserializeAs(cvt, modifier)); return CreateModifierType(type_uid, modifier); } if (cvt.kind() == LF_POINTER) { PointerRecord pointer; llvm::cantFail( TypeDeserializer::deserializeAs(cvt, pointer)); return CreatePointerType(type_uid, pointer); } if (IsClassRecord(cvt.kind())) { ClassRecord cr; llvm::cantFail(TypeDeserializer::deserializeAs(cvt, cr)); return CreateTagType(type_uid, cr); } if (cvt.kind() == LF_ENUM) { EnumRecord er; llvm::cantFail(TypeDeserializer::deserializeAs(cvt, er)); return CreateTagType(type_uid, er); } if (cvt.kind() == LF_UNION) { UnionRecord ur; llvm::cantFail(TypeDeserializer::deserializeAs(cvt, ur)); return CreateTagType(type_uid, ur); } return nullptr; } TypeSP SymbolFileNativePDB::CreateAndCacheType(PdbSymUid type_uid) { // If they search for a UDT which is a forward ref, try and resolve the full // decl and just map the forward ref uid to the full decl record. llvm::Optional full_decl_uid; if (type_uid.tag() == PDB_SymType::UDT || type_uid.tag() == PDB_SymType::Enum) { const PdbTypeSymId &type_id = type_uid.asTypeSym(); TypeIndex ti(type_id.index); lldbassert(!ti.isSimple()); CVType cvt = m_index->tpi().getType(ti); if (IsForwardRefUdt(cvt)) { auto expected_full_ti = m_index->tpi().findFullDeclForForwardRef(ti); if (!expected_full_ti) llvm::consumeError(expected_full_ti.takeError()); else { full_decl_uid = PdbSymUid::makeTypeSymId( type_uid.tag(), *expected_full_ti, type_id.is_ipi); // It's possible that a lookup would occur for the full decl causing it // to be cached, then a second lookup would occur for the forward decl. // We don't want to create a second full decl, so make sure the full // decl hasn't already been cached. auto full_iter = m_types.find(full_decl_uid->toOpaqueId()); if (full_iter != m_types.end()) { TypeSP result = full_iter->second; // Map the forward decl to the TypeSP for the full decl so we can take // the fast path next time. m_types[type_uid.toOpaqueId()] = result; return result; } } } } PdbSymUid best_uid = full_decl_uid ? *full_decl_uid : type_uid; TypeSP result = CreateType(best_uid); m_types[best_uid.toOpaqueId()] = result; // If we had both a forward decl and a full decl, make both point to the new // type. if (full_decl_uid) m_types[type_uid.toOpaqueId()] = result; const PdbTypeSymId &type_id = best_uid.asTypeSym(); if (best_uid.tag() == PDB_SymType::UDT || best_uid.tag() == PDB_SymType::Enum) { clang::TagDecl *record_decl = m_clang->GetAsTagDecl(result->GetForwardCompilerType()); lldbassert(record_decl); TypeIndex ti(type_id.index); m_uid_to_decl[best_uid.toOpaqueId()] = record_decl; m_decl_to_status[record_decl] = DeclStatus(best_uid.toOpaqueId(), Type::eResolveStateForward); } return result; } TypeSP SymbolFileNativePDB::GetOrCreateType(PdbSymUid type_uid) { lldbassert(PdbSymUid::isTypeSym(type_uid.tag())); // We can't use try_emplace / overwrite here because the process of creating // a type could create nested types, which could invalidate iterators. So // we have to do a 2-phase lookup / insert. auto iter = m_types.find(type_uid.toOpaqueId()); if (iter != m_types.end()) return iter->second; return CreateAndCacheType(type_uid); } lldb::TypeSP SymbolFileNativePDB::GetOrCreateType(llvm::codeview::TypeIndex ti) { PDB_SymType pdbst = GetPdbSymType(m_index->tpi(), ti); PdbSymUid tuid = PdbSymUid::makeTypeSymId(pdbst, ti, false); return GetOrCreateType(tuid); } FunctionSP SymbolFileNativePDB::GetOrCreateFunction(PdbSymUid func_uid, const SymbolContext &sc) { lldbassert(func_uid.tag() == PDB_SymType::Function); auto emplace_result = m_functions.try_emplace(func_uid.toOpaqueId(), nullptr); if (emplace_result.second) emplace_result.first->second = CreateFunction(func_uid, sc); lldbassert(emplace_result.first->second); return emplace_result.first->second; } CompUnitSP SymbolFileNativePDB::GetOrCreateCompileUnit(const CompilandIndexItem &cci) { auto emplace_result = m_compilands.try_emplace(cci.m_uid.toOpaqueId(), nullptr); if (emplace_result.second) emplace_result.first->second = CreateCompileUnit(cci); lldbassert(emplace_result.first->second); return emplace_result.first->second; } lldb::CompUnitSP SymbolFileNativePDB::ParseCompileUnitAtIndex(uint32_t index) { if (index >= GetNumCompileUnits()) return CompUnitSP(); lldbassert(index < UINT16_MAX); if (index >= UINT16_MAX) return nullptr; CompilandIndexItem &item = m_index->compilands().GetOrCreateCompiland(index); return GetOrCreateCompileUnit(item); } lldb::LanguageType SymbolFileNativePDB::ParseCompileUnitLanguage(const SymbolContext &sc) { // What fields should I expect to be filled out on the SymbolContext? Is it // safe to assume that `sc.comp_unit` is valid? if (!sc.comp_unit) return lldb::eLanguageTypeUnknown; PdbSymUid uid = PdbSymUid::fromOpaqueId(sc.comp_unit->GetID()); lldbassert(uid.tag() == PDB_SymType::Compiland); CompilandIndexItem *item = m_index->compilands().GetCompiland(uid); lldbassert(item); if (!item->m_compile_opts) return lldb::eLanguageTypeUnknown; return TranslateLanguage(item->m_compile_opts->getLanguage()); } size_t SymbolFileNativePDB::ParseCompileUnitFunctions(const SymbolContext &sc) { lldbassert(sc.comp_unit); return false; } static bool NeedsResolvedCompileUnit(uint32_t resolve_scope) { // If any of these flags are set, we need to resolve the compile unit. uint32_t flags = eSymbolContextCompUnit; flags |= eSymbolContextVariable; flags |= eSymbolContextFunction; flags |= eSymbolContextBlock; flags |= eSymbolContextLineEntry; return (resolve_scope & flags) != 0; } uint32_t SymbolFileNativePDB::ResolveSymbolContext(const Address &addr, uint32_t resolve_scope, SymbolContext &sc) { uint32_t resolved_flags = 0; lldb::addr_t file_addr = addr.GetFileAddress(); if (NeedsResolvedCompileUnit(resolve_scope)) { llvm::Optional modi = m_index->GetModuleIndexForVa(file_addr); if (!modi) return 0; PdbSymUid cuid = PdbSymUid::makeCompilandId(*modi); CompilandIndexItem *cci = m_index->compilands().GetCompiland(cuid); if (!cci) return 0; sc.comp_unit = GetOrCreateCompileUnit(*cci).get(); resolved_flags |= eSymbolContextCompUnit; } if (resolve_scope & eSymbolContextFunction) { lldbassert(sc.comp_unit); std::vector matches = m_index->FindSymbolsByVa(file_addr); for (const auto &match : matches) { if (match.uid.tag() != PDB_SymType::Function) continue; sc.function = GetOrCreateFunction(match.uid, sc).get(); } resolved_flags |= eSymbolContextFunction; } if (resolve_scope & eSymbolContextLineEntry) { lldbassert(sc.comp_unit); if (auto *line_table = sc.comp_unit->GetLineTable()) { if (line_table->FindLineEntryByAddress(addr, sc.line_entry)) resolved_flags |= eSymbolContextLineEntry; } } return resolved_flags; } static void AppendLineEntryToSequence(LineTable &table, LineSequence &sequence, const CompilandIndexItem &cci, lldb::addr_t base_addr, uint32_t file_number, const LineFragmentHeader &block, const LineNumberEntry &cur) { LineInfo cur_info(cur.Flags); if (cur_info.isAlwaysStepInto() || cur_info.isNeverStepInto()) return; uint64_t addr = base_addr + cur.Offset; bool is_statement = cur_info.isStatement(); bool is_prologue = IsFunctionPrologue(cci, addr); bool is_epilogue = IsFunctionEpilogue(cci, addr); uint32_t lno = cur_info.getStartLine(); table.AppendLineEntryToSequence(&sequence, addr, lno, 0, file_number, is_statement, false, is_prologue, is_epilogue, false); } static void TerminateLineSequence(LineTable &table, const LineFragmentHeader &block, lldb::addr_t base_addr, uint32_t file_number, uint32_t last_line, std::unique_ptr seq) { // The end is always a terminal entry, so insert it regardless. table.AppendLineEntryToSequence(seq.get(), base_addr + block.CodeSize, last_line, 0, file_number, false, false, false, false, true); table.InsertSequence(seq.release()); } bool SymbolFileNativePDB::ParseCompileUnitLineTable(const SymbolContext &sc) { // Unfortunately LLDB is set up to parse the entire compile unit line table // all at once, even if all it really needs is line info for a specific // function. In the future it would be nice if it could set the sc.m_function // member, and we could only get the line info for the function in question. lldbassert(sc.comp_unit); PdbSymUid cu_id = PdbSymUid::fromOpaqueId(sc.comp_unit->GetID()); lldbassert(cu_id.isCompiland()); CompilandIndexItem *cci = m_index->compilands().GetCompiland(cu_id); lldbassert(cci); auto line_table = llvm::make_unique(sc.comp_unit); // This is basically a copy of the .debug$S subsections from all original COFF // object files merged together with address relocations applied. We are // looking for all DEBUG_S_LINES subsections. for (const DebugSubsectionRecord &dssr : cci->m_debug_stream.getSubsectionsArray()) { if (dssr.kind() != DebugSubsectionKind::Lines) continue; DebugLinesSubsectionRef lines; llvm::BinaryStreamReader reader(dssr.getRecordData()); if (auto EC = lines.initialize(reader)) { llvm::consumeError(std::move(EC)); return false; } const LineFragmentHeader *lfh = lines.header(); uint64_t virtual_addr = m_index->MakeVirtualAddress(lfh->RelocSegment, lfh->RelocOffset); const auto &checksums = cci->m_strings.checksums().getArray(); const auto &strings = cci->m_strings.strings(); for (const LineColumnEntry &group : lines) { // Indices in this structure are actually offsets of records in the // DEBUG_S_FILECHECKSUMS subsection. Those entries then have an index // into the global PDB string table. auto iter = checksums.at(group.NameIndex); if (iter == checksums.end()) continue; llvm::Expected efn = strings.getString(iter->FileNameOffset); if (!efn) { llvm::consumeError(efn.takeError()); continue; } // LLDB wants the index of the file in the list of support files. auto fn_iter = llvm::find(cci->m_file_list, *efn); lldbassert(fn_iter != cci->m_file_list.end()); uint32_t file_index = std::distance(cci->m_file_list.begin(), fn_iter); std::unique_ptr sequence( line_table->CreateLineSequenceContainer()); lldbassert(!group.LineNumbers.empty()); for (const LineNumberEntry &entry : group.LineNumbers) { AppendLineEntryToSequence(*line_table, *sequence, *cci, virtual_addr, file_index, *lfh, entry); } LineInfo last_line(group.LineNumbers.back().Flags); TerminateLineSequence(*line_table, *lfh, virtual_addr, file_index, last_line.getEndLine(), std::move(sequence)); } } if (line_table->GetSize() == 0) return false; sc.comp_unit->SetLineTable(line_table.release()); return true; } bool SymbolFileNativePDB::ParseCompileUnitDebugMacros(const SymbolContext &sc) { // PDB doesn't contain information about macros return false; } bool SymbolFileNativePDB::ParseCompileUnitSupportFiles( const SymbolContext &sc, FileSpecList &support_files) { lldbassert(sc.comp_unit); PdbSymUid comp_uid = PdbSymUid::fromOpaqueId(sc.comp_unit->GetID()); lldbassert(comp_uid.tag() == PDB_SymType::Compiland); const CompilandIndexItem *cci = m_index->compilands().GetCompiland(comp_uid); lldbassert(cci); for (llvm::StringRef f : cci->m_file_list) { FileSpec::Style style = f.startswith("/") ? FileSpec::Style::posix : FileSpec::Style::windows; FileSpec spec(f, false, style); support_files.Append(spec); } return true; } bool SymbolFileNativePDB::ParseImportedModules( const SymbolContext &sc, std::vector &imported_modules) { // PDB does not yet support module debug info return false; } size_t SymbolFileNativePDB::ParseFunctionBlocks(const SymbolContext &sc) { lldbassert(sc.comp_unit && sc.function); return 0; } uint32_t SymbolFileNativePDB::FindFunctions( const ConstString &name, const CompilerDeclContext *parent_decl_ctx, uint32_t name_type_mask, bool include_inlines, bool append, SymbolContextList &sc_list) { // For now we only support lookup by method name. if (!(name_type_mask & eFunctionNameTypeMethod)) return 0; using SymbolAndOffset = std::pair; std::vector matches = m_index->globals().findRecordsByName( name.GetStringRef(), m_index->symrecords()); for (const SymbolAndOffset &match : matches) { if (match.second.kind() != S_PROCREF && match.second.kind() != S_LPROCREF) continue; ProcRefSym proc(match.second.kind()); cantFail(SymbolDeserializer::deserializeAs(match.second, proc)); if (!IsValidRecord(proc)) continue; PdbSymUid cuid = PdbSymUid::makeCompilandId(proc); CompilandIndexItem &cci = m_index->compilands().GetOrCreateCompiland(cuid); SymbolContext sc; sc.comp_unit = GetOrCreateCompileUnit(cci).get(); sc.module_sp = sc.comp_unit->GetModule(); PdbSymUid func_uid = PdbSymUid::makeCuSymId(proc); sc.function = GetOrCreateFunction(func_uid, sc).get(); sc_list.Append(sc); } return sc_list.GetSize(); } uint32_t SymbolFileNativePDB::FindFunctions(const RegularExpression ®ex, bool include_inlines, bool append, SymbolContextList &sc_list) { return 0; } uint32_t SymbolFileNativePDB::FindTypes( const SymbolContext &sc, const ConstString &name, const CompilerDeclContext *parent_decl_ctx, bool append, uint32_t max_matches, llvm::DenseSet &searched_symbol_files, TypeMap &types) { if (!append) types.Clear(); if (!name) return 0; searched_symbol_files.clear(); searched_symbol_files.insert(this); // There is an assumption 'name' is not a regex size_t match_count = FindTypesByName(name.GetStringRef(), max_matches, types); return match_count; } size_t SymbolFileNativePDB::FindTypes(const std::vector &context, bool append, TypeMap &types) { return 0; } size_t SymbolFileNativePDB::FindTypesByName(llvm::StringRef name, uint32_t max_matches, TypeMap &types) { size_t match_count = 0; std::vector matches = m_index->tpi().findRecordsByName(name); if (max_matches > 0 && max_matches < matches.size()) matches.resize(max_matches); for (TypeIndex ti : matches) { TypeSP type = GetOrCreateType(ti); if (!type) continue; types.Insert(type); ++match_count; } return match_count; } size_t SymbolFileNativePDB::ParseTypes(const SymbolContext &sc) { return 0; } Type *SymbolFileNativePDB::ResolveTypeUID(lldb::user_id_t type_uid) { auto iter = m_types.find(type_uid); // lldb should not be passing us non-sensical type uids. the only way it // could have a type uid in the first place is if we handed it out, in which // case we should know about the type. So this is not a get-or-create type // operation, it is strictly a get, and the type is guaranteed to exist. // // However, since the implementation is not yet complete, we don't currently // support all possible use cases. For example, we currently create all // functions with indices of 0 for the signature type simply because this is // not yet implemented. At the time the function object is created we should // be creating an lldb::TypeSP for this, adding it to the m_types, and // returning a valid Type object for it and putting it in this map. Once all // cases like this are handled, we can promote this to an assert. if (iter == m_types.end()) return nullptr; return &*iter->second; } bool SymbolFileNativePDB::CompleteType(CompilerType &compiler_type) { // If this is not in our map, it's an error. clang::TagDecl *tag_decl = m_clang->GetAsTagDecl(compiler_type); lldbassert(tag_decl); auto status_iter = m_decl_to_status.find(tag_decl); lldbassert(status_iter != m_decl_to_status.end()); // If it's already complete, just return. DeclStatus &status = status_iter->second; if (status.status == Type::eResolveStateFull) return true; PdbSymUid uid = PdbSymUid::fromOpaqueId(status.uid); lldbassert(uid.tag() == PDB_SymType::UDT || uid.tag() == PDB_SymType::Enum); const PdbTypeSymId &type_id = uid.asTypeSym(); ClangASTContext::SetHasExternalStorage(compiler_type.GetOpaqueQualType(), false); // In CreateAndCacheType, we already go out of our way to resolve forward // ref UDTs to full decls, and the uids we vend out always refer to full // decls if a full decl exists in the debug info. So if we don't have a full // decl here, it means one doesn't exist in the debug info, and we can't // complete the type. CVType cvt = m_index->tpi().getType(TypeIndex(type_id.index)); if (IsForwardRefUdt(cvt)) return false; auto types_iter = m_types.find(uid.toOpaqueId()); lldbassert(types_iter != m_types.end()); TypeIndex field_list_ti = GetFieldListIndex(cvt); CVType field_list_cvt = m_index->tpi().getType(field_list_ti); if (field_list_cvt.kind() != LF_FIELDLIST) return false; // Visit all members of this class, then perform any finalization necessary // to complete the class. UdtRecordCompleter completer(uid, compiler_type, *tag_decl, *this); auto error = llvm::codeview::visitMemberRecordStream(field_list_cvt.data(), completer); completer.complete(); status.status = Type::eResolveStateFull; if (!error) return true; llvm::consumeError(std::move(error)); return false; } size_t SymbolFileNativePDB::GetTypes(lldb_private::SymbolContextScope *sc_scope, uint32_t type_mask, lldb_private::TypeList &type_list) { return 0; } CompilerDeclContext SymbolFileNativePDB::FindNamespace(const SymbolContext &sc, const ConstString &name, const CompilerDeclContext *parent_decl_ctx) { return {}; } TypeSystem * SymbolFileNativePDB::GetTypeSystemForLanguage(lldb::LanguageType language) { auto type_system = m_obj_file->GetModule()->GetTypeSystemForLanguage(language); if (type_system) type_system->SetSymbolFile(this); return type_system; } ConstString SymbolFileNativePDB::GetPluginName() { static ConstString g_name("pdb"); return g_name; } uint32_t SymbolFileNativePDB::GetPluginVersion() { return 1; }