#include #include #include #include #include "imgui.h" #include "TracyCharUtil.hpp" #include "TracyColor.hpp" #include "TracyFilesystem.hpp" #include "TracyImGui.hpp" #include "TracyMicroArchitecture.hpp" #include "TracyPrint.hpp" #include "TracySort.hpp" #include "TracySourceView.hpp" #include "TracyView.hpp" #include "TracyWorker.hpp" #include "IconsFontAwesome5.h" #ifndef TRACY_NO_FILESELECTOR # include "../nfd/nfd.h" #endif namespace tracy { struct MicroArchUx { const char* uArch; const char* cpuName; const char* moniker; }; static constexpr MicroArchUx s_uArchUx[] = { { "Conroe", "Core 2 Duo E6750", "CON" }, { "Wolfdale", "Core 2 Duo E8400", "WOL" }, { "Nehalem", "Core i5-750", "NHM" }, { "Westmere", "Core i5-650", "WSM" }, { "Sandy Bridge", "Core i7-2600", "SNB" }, { "Ivy Bridge", "Core i5-3470", "IVB" }, { "Haswell", "Xeon E3-1225 v3", "HSW" }, { "Broadwell", "Core i5-5200U", "BDW" }, { "Skylake", "Core i7-6500U", "SKL" }, { "Skylake-X", "Core i9-7900X", "SKX" }, { "Kaby Lake", "Core i7-7700", "KBL" }, { "Coffee Lake", "Core i7-8700K", "CFL" }, { "Cannon Lake", "Core i3-8121U", "CNL" }, { "Ice Lake", "Core i5-1035G1", "ICL" }, { "Cascade Lake", "Core i9-10980XE", "CLX" }, { "Tiger Lake", "Core i7-1165G7", "TGL" }, { "Rocket Lake", "Core i9-11900", "RKL" }, { "AMD Zen+", "Ryzen 5 2600", "ZEN+" }, { "AMD Zen 2", "Ryzen 7 3700X", "ZEN2" }, { "AMD Zen 3", "Ryzen 5 5600X", "ZEN3" }, }; static constexpr const char* s_regNameX86[] = { "invalid", "rflags", "rax", "rbx", "rcx", "rdx", "rsi", "rdi", "rbp", "rsp", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15", "mm0", "mm1", "mm2", "mm3", "mm4", "mm5", "mm6", "mm7", "xmm0", "xmm1", "xmm2", "xmm3", "xmm4", "xmm5", "xmm6", "xmm7", "xmm8", "xmm9", "xmm10", "xmm11", "xmm12", "xmm13", "xmm14", "xmm15", "xmm16", "xmm17", "xmm18", "xmm19", "xmm20", "xmm21", "xmm22", "xmm23", "xmm24", "xmm25", "xmm26", "xmm27", "xmm28", "xmm29", "xmm30", "xmm31", "k0", "k1", "k2", "k3", "k4", "k5", "k6", "k7" }; static_assert( sizeof( s_regNameX86 ) / sizeof( *s_regNameX86 ) == (size_t)SourceView::RegsX86::NUMBER_OF_ENTRIES, "Invalid x86 register name table" ); static SourceView::RegsX86 s_regMapX86[X86_REG_ENDING]; static constexpr const char* s_CostName[] = { "Sample count", "Cycles", "Slow branches", "Slow cache", "Retirements", "Branches taken", "Branch miss", "Cache access", "Cache miss" }; static constexpr SourceView::CostType s_costSeparateAfter = SourceView::CostType::SlowCache; static size_t CountHwSamples( const SortedVector& vec, const Range& range ) { if( vec.empty() ) return 0; auto it = std::lower_bound( vec.begin(), vec.end(), range.min, [] ( const auto& lhs, const auto& rhs ) { return lhs.Val() < rhs; } ); if( it == vec.end() ) return 0; auto end = std::lower_bound( it, vec.end(), range.max, [] ( const auto& lhs, const auto& rhs ) { return lhs.Val() < rhs; } ); return std::distance( it, end ); } static void PrintHwSampleTooltip( size_t cycles, size_t retired, size_t cacheRef, size_t cacheMiss, size_t branchRetired, size_t branchMiss, bool hideFirstSeparator ) { if( cycles || retired ) { if( hideFirstSeparator ) { hideFirstSeparator = false; } else { ImGui::Separator(); } if( cycles && retired ) { char buf[32]; auto end = PrintFloat( buf, buf+32, float( retired ) / cycles, 2 ); *end = '\0'; TextFocused( "IPC:", buf ); } if( cycles ) TextFocused( "Cycles:", RealToString( cycles ) ); if( retired ) TextFocused( "Retirements:", RealToString( retired ) ); } if( cacheRef || cacheMiss ) { if( hideFirstSeparator ) { hideFirstSeparator = false; } else { ImGui::Separator(); } if( cacheRef ) { char buf[32]; auto end = PrintFloat( buf, buf+32, float( 100 * cacheMiss ) / cacheRef, 2 ); memcpy( end, "%", 2 ); TextFocused( "Cache miss rate:", buf ); TextFocused( "Cache references:", RealToString( cacheRef ) ); } if( cacheMiss ) TextFocused( "Cache misses:", RealToString( cacheMiss ) ); } if( branchRetired || branchMiss ) { if( hideFirstSeparator ) { hideFirstSeparator = false; } else { ImGui::Separator(); } if( branchRetired ) { char buf[32]; auto end = PrintFloat( buf, buf+32, float( 100 * branchMiss ) / branchRetired, 2 ); memcpy( end, "%", 2 ); TextFocused( "Branch mispredictions rate:", buf ); TextFocused( "Retired branches:", RealToString( branchRetired ) ); } if( branchMiss ) TextFocused( "Branch mispredictions:", RealToString( branchMiss ) ); } } enum { JumpSeparation = 6 }; enum { JumpArrowBase = 9 }; SourceView::SourceView( ImFont* font, GetWindowCallback gwcb ) : m_font( font ) , m_symAddr( 0 ) , m_targetAddr( 0 ) , m_targetLine( 0 ) , m_selectedLine( 0 ) , m_asmSelected( -1 ) , m_hoveredLine( 0 ) , m_hoveredSource( 0 ) , m_codeLen( 0 ) , m_highlightAddr( 0 ) , m_asmCountBase( -1 ) , m_asmRelative( false ) , m_asmBytes( false ) , m_asmShowSourceLocation( true ) , m_calcInlineStats( true ) , m_atnt( false ) , m_childCalls( false ) , m_hwSamples( true ) , m_cost( CostType::SampleCount ) , m_showJumps( true ) , m_cpuArch( CpuArchUnknown ) , m_showLatency( false ) , m_gwcb( gwcb ) { m_microArchOpMap.reserve( OpsNum ); for( int i=0; i> 4 ); } struct CpuIdMap { uint32_t cpuInfo; const char* moniker; }; // http://instlatx64.atw.hu/ seems to be a good resource // // .------ extended family id // |.----- extended model id // || .--- family id // || |.-- model // || ||.- stepping // || ||| static constexpr CpuIdMap s_cpuIdMap[] = { { PackCpuInfo( 0x810F81 ), "ZEN+" }, { PackCpuInfo( 0x800F82 ), "ZEN+" }, { PackCpuInfo( 0x830F10 ), "ZEN2" }, { PackCpuInfo( 0x840F70 ), "ZEN2" }, { PackCpuInfo( 0x860F01 ), "ZEN2" }, { PackCpuInfo( 0x860F81 ), "ZEN2" }, { PackCpuInfo( 0x870F10 ), "ZEN2" }, { PackCpuInfo( 0x890F00 ), "ZEN2" }, { PackCpuInfo( 0x890F80 ), "ZEN2" }, { PackCpuInfo( 0xA00F11 ), "ZEN3" }, { PackCpuInfo( 0xA00F80 ), "ZEN3" }, { PackCpuInfo( 0xA20F10 ), "ZEN3" }, { PackCpuInfo( 0xA30F00 ), "ZEN3" }, { PackCpuInfo( 0xA50F00 ), "ZEN3" }, { PackCpuInfo( 0x0A0671 ), "RKL" }, { PackCpuInfo( 0x0806C1 ), "TGL" }, { PackCpuInfo( 0x0806D1 ), "TGL" }, { PackCpuInfo( 0x0706E5 ), "ICL" }, { PackCpuInfo( 0x050656 ), "CLX" }, { PackCpuInfo( 0x050657 ), "CLX" }, { PackCpuInfo( 0x060663 ), "CNL" }, { PackCpuInfo( 0x0906EA ), "CFL" }, { PackCpuInfo( 0x0906EB ), "CFL" }, { PackCpuInfo( 0x0906EC ), "CFL" }, { PackCpuInfo( 0x0906ED ), "CFL" }, { PackCpuInfo( 0x0806E9 ), "KBL" }, { PackCpuInfo( 0x0806EA ), "KBL" }, { PackCpuInfo( 0x0906E9 ), "KBL" }, { PackCpuInfo( 0x050654 ), "SKX" }, { PackCpuInfo( 0x0406E3 ), "SKL" }, { PackCpuInfo( 0x0506E0 ), "SKL" }, { PackCpuInfo( 0x0506E3 ), "SKL" }, { PackCpuInfo( 0x0306D4 ), "BDW" }, { PackCpuInfo( 0x040671 ), "BDW" }, { PackCpuInfo( 0x0406F1 ), "BDW" }, { PackCpuInfo( 0x0306C3 ), "HSW" }, { PackCpuInfo( 0x0306F2 ), "HSW" }, { PackCpuInfo( 0x040651 ), "HSW" }, { PackCpuInfo( 0x0306A9 ), "IVB" }, { PackCpuInfo( 0x0306E3 ), "IVB" }, { PackCpuInfo( 0x0306E4 ), "IVB" }, { PackCpuInfo( 0x0206A2 ), "SNB" }, { PackCpuInfo( 0x0206A7 ), "SNB" }, { PackCpuInfo( 0x0206D5 ), "SNB" }, { PackCpuInfo( 0x0206D6 ), "SNB" }, { PackCpuInfo( 0x0206D7 ), "SNB" }, { PackCpuInfo( 0x0206F2 ), "WSM" }, { PackCpuInfo( 0x0206C0 ), "WSM" }, { PackCpuInfo( 0x0206C1 ), "WSM" }, { PackCpuInfo( 0x0206C2 ), "WSM" }, { PackCpuInfo( 0x020652 ), "WSM" }, { PackCpuInfo( 0x020655 ), "WSM" }, { PackCpuInfo( 0x0206E6 ), "NHM" }, { PackCpuInfo( 0x0106A1 ), "NHM" }, { PackCpuInfo( 0x0106A2 ), "NHM" }, { PackCpuInfo( 0x0106A4 ), "NHM" }, { PackCpuInfo( 0x0106A5 ), "NHM" }, { PackCpuInfo( 0x0106E4 ), "NHM" }, { PackCpuInfo( 0x0106E5 ), "NHM" }, { PackCpuInfo( 0x010676 ), "WOL" }, { PackCpuInfo( 0x01067A ), "WOL" }, { PackCpuInfo( 0x0006F2 ), "CON" }, { PackCpuInfo( 0x0006F4 ), "CON" }, { PackCpuInfo( 0x0006F6 ), "CON" }, { PackCpuInfo( 0x0006FB ), "CON" }, { PackCpuInfo( 0x0006FD ), "CON" }, { 0, 0 } }; void SourceView::SetCpuId( uint32_t cpuId ) { auto ptr = s_cpuIdMap; while( ptr->cpuInfo ) { if( cpuId == ptr->cpuInfo ) { SelectMicroArchitecture( ptr->moniker ); m_profileMicroArch = m_selMicroArch; return; } ptr++; } SelectMicroArchitecture( "ZEN2" ); m_profileMicroArch = -1; } void SourceView::OpenSource( const char* fileName, int line, const View& view, const Worker& worker ) { m_targetLine = line; m_selectedLine = line; m_targetAddr = 0; m_baseAddr = 0; m_symAddr = 0; m_sourceFiles.clear(); m_asm.clear(); ParseSource( fileName, worker, view ); assert( !m_source.empty() ); } void SourceView::OpenSymbol( const char* fileName, int line, uint64_t baseAddr, uint64_t symAddr, const Worker& worker, const View& view ) { m_targetLine = line; m_targetAddr = symAddr; m_baseAddr = baseAddr; m_symAddr = symAddr; m_sourceFiles.clear(); m_selectedAddresses.clear(); m_selectedAddresses.emplace( symAddr ); ParseSource( fileName, worker, view ); Disassemble( baseAddr, worker ); SelectLine( line, &worker, true, symAddr ); SelectViewMode(); if( !worker.GetInlineSymbolList( baseAddr, m_codeLen ) ) m_calcInlineStats = false; } void SourceView::SelectViewMode() { if( !m_source.empty() ) { if( !m_asm.empty() ) { m_displayMode = DisplayMixed; } else { m_displayMode = DisplaySource; } } else { assert( !m_asm.empty() ); m_displayMode = DisplayAsm; } } void SourceView::ParseSource( const char* fileName, const Worker& worker, const View& view ) { if( m_source.filename() != fileName ) { m_srcWidth = 0; m_source.Parse( fileName, worker, view ); } } static bool IsJumpConditionalX86( const char* op ) { static constexpr const char* branchX86[] = { "je", "jne", "jg", "jge", "ja", "jae", "jl", "jle", "jb", "jbe", "jo", "jno", "jz", "jnz", "js", "jns", "jcxz", "jecxz", "jrcxz", "loop", "loope", "loopne", "loopnz", "loopz", "jnle", "jnl", "jnge", "jng", "jnbe", "jnb", "jnae", "jna", "jc", "jnc", "jp", "jpe", "jnp", "jpo", nullptr }; auto ptr = branchX86; while( *ptr ) if( strcmp( *ptr++, op ) == 0 ) return true; return false; } bool SourceView::Disassemble( uint64_t symAddr, const Worker& worker ) { m_asm.clear(); m_locMap.clear(); m_jumpTable.clear(); m_jumpOut.clear(); m_maxJumpLevel = 0; m_asmSelected = -1; m_asmCountBase = -1; m_asmWidth = 0; if( symAddr == 0 ) return false; m_cpuArch = worker.GetCpuArch(); if( m_cpuArch == CpuArchUnknown ) return false; uint32_t len; auto code = worker.GetSymbolCode( symAddr, len ); if( !code ) return false; m_disasmFail = -1; csh handle; cs_err rval = CS_ERR_ARCH; switch( m_cpuArch ) { case CpuArchX86: rval = cs_open( CS_ARCH_X86, CS_MODE_32, &handle ); break; case CpuArchX64: rval = cs_open( CS_ARCH_X86, CS_MODE_64, &handle ); break; case CpuArchArm32: rval = cs_open( CS_ARCH_ARM, CS_MODE_ARM, &handle ); break; case CpuArchArm64: rval = cs_open( CS_ARCH_ARM64, CS_MODE_ARM, &handle ); break; default: assert( false ); break; } if( rval != CS_ERR_OK ) return false; cs_option( handle, CS_OPT_DETAIL, CS_OPT_ON ); cs_option( handle, CS_OPT_SYNTAX, m_atnt ? CS_OPT_SYNTAX_ATT : CS_OPT_SYNTAX_INTEL ); cs_insn* insn; size_t cnt = cs_disasm( handle, (const uint8_t*)code, len, symAddr, 0, &insn ); if( cnt > 0 ) { if( insn[cnt-1].address - symAddr + insn[cnt-1].size < len ) m_disasmFail = insn[cnt-1].address - symAddr; int bytesMax = 0; int mLenMax = 0; m_asm.reserve( cnt ); for( size_t i=0; i= symAddr && jumpAddr < symAddr + len ) { auto fit = std::lower_bound( insn, insn+cnt, jumpAddr, []( const auto& l, const auto& r ) { return l.address < r; } ); if( fit != insn+cnt && fit->address == jumpAddr ) { const auto min = std::min( jumpAddr, op.address ); const auto max = std::max( jumpAddr, op.address ); auto it = m_jumpTable.find( jumpAddr ); if( it == m_jumpTable.end() ) { m_jumpTable.emplace( jumpAddr, JumpData { min, max, 0, { op.address } } ); } else { if( it->second.min > min ) it->second.min = min; else if( it->second.max < max ) it->second.max = max; it->second.source.emplace_back( op.address ); } } else { jumpAddr = 0; } } else { m_jumpOut.emplace( op.address ); } } std::vector params; switch( m_cpuArch ) { case CpuArchX86: case CpuArchX64: for( uint8_t i=0; ix86.op_count == 2 ); const auto opidx = m_atnt ? 0 : 1; assert( op.detail->x86.operands[opidx].type == X86_OP_MEM ); auto& mem = op.detail->x86.operands[opidx].mem; if( mem.base == X86_REG_INVALID ) { if( mem.index == X86_REG_INVALID ) { leaData = LeaData::d; } else { leaData = mem.disp == 0 ? LeaData::i : LeaData::id; } } else if( mem.base == X86_REG_RIP ) { leaData = mem.disp == 0 ? LeaData::r : LeaData::rd; } else { if( mem.index == X86_REG_INVALID ) { leaData = mem.disp == 0 ? LeaData::b : LeaData::bd; } else { leaData = mem.disp == 0 ? LeaData::bi : LeaData::bid; } } } m_asm.emplace_back( AsmLine { op.address, jumpAddr, op.mnemonic, op.op_str, (uint8_t)op.size, leaData, jumpConditional, std::move( params ) } ); #if CS_API_MAJOR >= 4 auto& entry = m_asm.back(); cs_regs read, write; uint8_t rcnt, wcnt; cs_regs_access( handle, &op, read, &rcnt, write, &wcnt ); int idx; switch( m_cpuArch ) { case CpuArchX86: case CpuArchX64: assert( rcnt < sizeof( entry.readX86 ) ); assert( wcnt < sizeof( entry.writeX86 ) ); idx = 0; for( int i=0; i mLenMax ) mLenMax = mLen; if( op.size > bytesMax ) bytesMax = op.size; uint32_t mLineMax = 0; uint32_t srcline; const auto srcidx = worker.GetLocationForAddress( op.address, srcline ); if( srcline != 0 ) { if( srcline > mLineMax ) mLineMax = srcline; const auto idx = srcidx.Idx(); auto sit = m_sourceFiles.find( idx ); if( sit == m_sourceFiles.end() ) { m_sourceFiles.emplace( idx, srcline ); } } char tmp[16]; sprintf( tmp, "%" PRIu32, mLineMax ); m_maxLine = strlen( tmp ) + 1; } cs_free( insn, cnt ); m_maxMnemonicLen = mLenMax + 2; m_maxAsmBytes = bytesMax; if( !m_jumpTable.empty() ) { struct JumpRange { uint64_t target; uint64_t len; }; std::vector jumpRange; jumpRange.reserve( m_jumpTable.size() ); for( auto& v : m_jumpTable ) { pdqsort_branchless( v.second.source.begin(), v.second.source.end() ); jumpRange.emplace_back( JumpRange { v.first, v.second.max - v.second.min } ); } pdqsort_branchless( jumpRange.begin(), jumpRange.end(), []( const auto& l, const auto& r ) { return l.len < r.len; } ); std::vector>> levelRanges; for( auto& v : jumpRange ) { auto it = m_jumpTable.find( v.target ); assert( it != m_jumpTable.end() ); size_t level = 0; for(;;) { assert( levelRanges.size() >= level ); if( levelRanges.size() == level ) { it->second.level = level; levelRanges.push_back( { { it->second.min, it->second.max } } ); break; } else { bool validFit = true; auto& lr = levelRanges[level]; for( auto& range : lr ) { assert( !( it->second.min >= range.first && it->second.max <= range.second ) ); if( it->second.min <= range.second && it->second.max >= range.first ) { validFit = false; break; } } if( validFit ) { it->second.level = level; lr.emplace_back( it->second.min, it->second.max ); break; } level++; } } if( level > m_maxJumpLevel ) m_maxJumpLevel = level; } uint32_t locNum = 0; for( auto& v : m_asm ) { if( m_jumpTable.find( v.addr ) != m_jumpTable.end() ) { m_locMap.emplace( v.addr, locNum++ ); } } } } cs_close( &handle ); m_codeLen = len; ResetAsm(); return true; } void SourceView::Render( Worker& worker, View& view ) { m_highlightAddr.Decay( 0 ); m_hoveredLine.Decay( 0 ); m_hoveredSource.Decay( 0 ); if( m_symAddr == 0 ) { if( m_source.filename() ) TextFocused( ICON_FA_FILE " File:", m_source.filename() ); if( m_source.is_cached() ) { TextColoredUnformatted( ImVec4( 0.4f, 0.8f, 0.4f, 1.f ), ICON_FA_DATABASE ); ImGui::SameLine(); ImGui::TextUnformatted( "Source file cached during profiling run" ); } else { TextColoredUnformatted( ImVec4( 1.f, 1.f, 0.2f, 1.f ), ICON_FA_EXCLAMATION_TRIANGLE ); ImGui::SameLine(); TextColoredUnformatted( ImVec4( 1.f, 0.3f, 0.3f, 1.f ), "The source file contents might not reflect the actual profiled code!" ); ImGui::SameLine(); TextColoredUnformatted( ImVec4( 1.f, 1.f, 0.2f, 1.f ), ICON_FA_EXCLAMATION_TRIANGLE ); } RenderSimpleSourceView(); } else { RenderSymbolView( worker, view ); } } void SourceView::RenderSimpleSourceView() { ImGui::SetNextWindowContentSize( ImVec2( m_srcWidth, 0 ) ); ImGui::BeginChild( "##sourceView", ImVec2( 0, 0 ), true, ImGuiWindowFlags_HorizontalScrollbar ); if( m_font ) ImGui::PushFont( m_font ); auto& lines = m_source.get(); auto draw = ImGui::GetWindowDrawList(); const auto wpos = ImGui::GetWindowPos(); const auto dpos = wpos + ImVec2( 0.5f, 0.5f ); const auto wh = ImGui::GetWindowHeight(); const auto ty = ImGui::GetFontSize(); const auto ts = ImGui::CalcTextSize( " " ).x; const auto lineCount = lines.size(); const auto tmp = RealToString( lineCount ); const auto maxLine = strlen( tmp ); const auto lx = ts * maxLine + ty + round( ts*0.4f ); DrawLine( draw, dpos + ImVec2( lx, 0 ), dpos + ImVec2( lx, wh ), 0x08FFFFFF ); const AddrStat zero = {}; if( m_targetLine != 0 ) { int lineNum = 1; for( auto& line : lines ) { if( m_targetLine == lineNum ) { m_targetLine = 0; ImGui::SetScrollHereY(); } RenderLine( line, lineNum++, zero, zero, zero, nullptr, nullptr ); } const auto win = ImGui::GetCurrentWindowRead(); m_srcWidth = win->DC.CursorMaxPos.x - win->DC.CursorStartPos.x; } else { ImGuiListClipper clipper; clipper.Begin( (int)lines.size() ); while( clipper.Step() ) { for( auto i=clipper.DisplayStart; iisInline ) { auto parent = worker.GetSymbolData( m_baseAddr ); if( parent ) { TextFocused( ICON_FA_PUZZLE_PIECE " Symbol:", worker.GetString( parent->name ) ); } else { char tmp[16]; sprintf( tmp, "0x%" PRIx64, m_baseAddr ); TextFocused( ICON_FA_PUZZLE_PIECE " Symbol:", tmp ); } } else { TextFocused( ICON_FA_PUZZLE_PIECE " Symbol:", worker.GetString( sym->name ) ); } ImGui::SameLine(); TextDisabledUnformatted( worker.GetString( sym->imageName ) ); ImGui::SameLine(); ImGui::TextDisabled( "0x%" PRIx64, m_baseAddr ); const bool limitView = view.m_statRange.active; auto inlineList = worker.GetInlineSymbolList( m_baseAddr, m_codeLen ); if( inlineList ) { SmallCheckbox( ICON_FA_SITEMAP " Function:", &m_calcInlineStats ); ImGui::SameLine(); ImGui::SetNextItemWidth( -1 ); ImGui::PushStyleVar( ImGuiStyleVar_FramePadding, ImVec2( 0, 0 ) ); const auto currSymName = m_symAddr == m_baseAddr ? "[ - self - ]" : worker.GetString( sym->name ); if( ImGui::BeginCombo( "##functionList", currSymName, ImGuiComboFlags_HeightLarge ) ) { const auto symEnd = m_baseAddr + m_codeLen; unordered_flat_map symStat; if( limitView ) { symStat.emplace( m_baseAddr, CountAsmIpStats( m_baseAddr, worker, true, view ) ); auto ptr = inlineList; while( *ptr < symEnd ) { symStat.emplace( *ptr, CountAsmIpStats( *ptr, worker, true, view ) ); ptr++; } } else { const auto& ss = worker.GetSymbolStats(); for( auto& v : ss ) symStat.emplace( v.first, v.second.excl ); } uint32_t totalSamples = 0; Vector> symInline; auto baseStatIt = symStat.find( m_baseAddr ); if( baseStatIt == symStat.end() || baseStatIt->second == 0 ) { symInline.push_back( std::make_pair( m_baseAddr, 0 ) ); } else { symInline.push_back( std::make_pair( m_baseAddr, baseStatIt->second ) ); totalSamples += baseStatIt->second; } while( *inlineList < symEnd ) { if( *inlineList != m_baseAddr ) { auto statIt = symStat.find( *inlineList ); if( statIt == symStat.end() || statIt->second == 0 ) { symInline.push_back_non_empty( std::make_pair( *inlineList, 0 ) ); } else { symInline.push_back_non_empty( std::make_pair( *inlineList, statIt->second ) ); totalSamples += statIt->second; } } inlineList++; } pdqsort_branchless( symInline.begin(), symInline.end(), []( const auto& l, const auto& r ) { return l.second == r.second ? l.first < r.first : l.second > r.second; } ); if( totalSamples == 0 ) { ImGui::Columns( 2 ); static bool widthSet = false; if( !widthSet ) { widthSet = true; const auto w = ImGui::GetWindowWidth(); const auto c1 = ImGui::CalcTextSize( "0xeeeeeeeeeeeeee" ).x; ImGui::SetColumnWidth( 0, w - c1 ); ImGui::SetColumnWidth( 1, c1 ); } } else { ImGui::Columns( 3 ); static bool widthSet = false; if( !widthSet ) { widthSet = true; const auto w = ImGui::GetWindowWidth(); const auto c0 = ImGui::CalcTextSize( "12345678901234567890" ).x; const auto c2 = ImGui::CalcTextSize( "0xeeeeeeeeeeeeee" ).x; ImGui::SetColumnWidth( 0, c0 ); ImGui::SetColumnWidth( 1, w - c0 - c2 ); ImGui::SetColumnWidth( 2, c2 ); } } for( auto& v : symInline ) { if( totalSamples != 0 ) { if( v.second != 0 ) { ImGui::TextUnformatted( TimeToString( v.second * worker.GetSamplingPeriod() ) ); ImGui::SameLine(); ImGui::TextDisabled( "(%.2f%%)", 100.f * v.second / totalSamples ); if( ImGui::IsItemHovered() ) { ImGui::BeginTooltip(); TextFocused( "Sample count:", RealToString( v.second ) ); ImGui::EndTooltip(); } } ImGui::NextColumn(); } auto isym = worker.GetSymbolData( v.first ); assert( isym ); ImGui::PushID( v.first ); const auto symName = v.first == m_baseAddr ? "[ - self - ]" : worker.GetString( isym->name ); if( ImGui::Selectable( symName, v.first == m_symAddr, ImGuiSelectableFlags_SpanAllColumns ) ) { m_symAddr = v.first; const auto sym = worker.GetSymbolData( v.first ); const char* file; uint32_t line; if( sym->isInline ) { file = worker.GetString( sym->callFile ); line = sym->callLine; } else { file = worker.GetString( sym->file ); line = sym->line; } ParseSource( file, worker, view ); m_targetLine = line; SelectLine( line, &worker, true ); SelectViewMode(); } ImGui::PopID(); ImGui::NextColumn(); ImGui::TextDisabled( "0x%" PRIx64, v.first ); ImGui::NextColumn(); } ImGui::EndColumns(); ImGui::EndCombo(); } ImGui::PopStyleVar(); } TextDisabledUnformatted( "Mode:" ); ImGui::SameLine(); ImGui::PushStyleVar( ImGuiStyleVar_FramePadding, ImVec2( 0, 0 ) ); if( !m_source.empty() ) { ImGui::RadioButton( "Source", &m_displayMode, DisplaySource ); if( !m_asm.empty() ) { ImGui::SameLine(); ImGui::RadioButton( "Assembly", &m_displayMode, DisplayAsm ); ImGui::SameLine(); ImGui::RadioButton( "Combined", &m_displayMode, DisplayMixed ); } } else { ImGui::RadioButton( "Assembly", &m_displayMode, DisplayAsm ); } if( !m_asm.empty() ) { ImGui::SameLine(); ImGui::Spacing(); ImGui::SameLine(); TextFocused( ICON_FA_WEIGHT_HANGING " Code:", MemSizeToString( m_codeLen ) ); } AddrStat iptotalSrc = {}, iptotalAsm = {}; AddrStat ipmaxSrc = {}, ipmaxAsm = {}; unordered_flat_map ipcountSrc, ipcountAsm; if( m_cost == CostType::SampleCount ) { if( m_calcInlineStats ) { GatherIpStats( m_symAddr, iptotalSrc, iptotalAsm, ipcountSrc, ipcountAsm, ipmaxSrc, ipmaxAsm, worker, limitView, view ); GatherAdditionalIpStats( m_symAddr, iptotalSrc, iptotalAsm, ipcountSrc, ipcountAsm, ipmaxSrc, ipmaxAsm, worker, limitView, view ); } else { GatherIpStats( m_baseAddr, iptotalSrc, iptotalAsm, ipcountSrc, ipcountAsm, ipmaxSrc, ipmaxAsm, worker, limitView, view ); auto iptr = worker.GetInlineSymbolList( m_baseAddr, m_codeLen ); if( iptr ) { const auto symEnd = m_baseAddr + m_codeLen; while( *iptr < symEnd ) { GatherIpStats( *iptr, iptotalSrc, iptotalAsm, ipcountSrc, ipcountAsm, ipmaxSrc, ipmaxAsm, worker, limitView, view ); iptr++; } } GatherAdditionalIpStats( m_symAddr, iptotalSrc, iptotalAsm, ipcountSrc, ipcountAsm, ipmaxSrc, ipmaxAsm, worker, limitView, view ); } } else { GatherIpHwStats( iptotalSrc, iptotalAsm, ipcountSrc, ipcountAsm, ipmaxSrc, ipmaxAsm, worker, limitView, view ); } if( !m_calcInlineStats ) { iptotalSrc = iptotalAsm; } const auto slzReady = worker.AreSourceLocationZonesReady(); if( ( iptotalAsm.local + iptotalAsm.ext ) > 0 || ( view.m_statRange.active && worker.GetSamplesForSymbol( m_baseAddr ) ) ) { ImGui::SameLine(); ImGui::Spacing(); ImGui::SameLine(); if( worker.GetHwSampleCountAddress() != 0 ) { SmallCheckbox( ICON_FA_HAMMER " Hw samples", &m_hwSamples ); ImGui::SameLine(); ImGui::Spacing(); ImGui::SameLine(); ImGui::TextUnformatted( ICON_FA_HIGHLIGHTER " Cost" ); ImGui::SameLine(); float mw = 0; for( auto& v : s_CostName ) { const auto w = ImGui::CalcTextSize( v ).x; if( w > mw ) mw = w; } ImGui::SetNextItemWidth( mw + ImGui::GetFontSize() ); ImGui::PushStyleVar( ImGuiStyleVar_FramePadding, ImVec2( 0, 0 ) ); if( ImGui::BeginCombo( "##cost", s_CostName[(int)m_cost], ImGuiComboFlags_HeightLarge ) ) { int idx = 0; for( auto& v : s_CostName ) { if( ImGui::Selectable( v, idx == (int)m_cost ) ) m_cost = (CostType)idx; if( (CostType)idx == s_costSeparateAfter ) ImGui::Separator(); idx++; } ImGui::EndCombo(); } ImGui::PopStyleVar(); ImGui::SameLine(); ImGui::Spacing(); ImGui::SameLine(); } if( m_cost == CostType::SampleCount ) { if( !slzReady ) { ImGui::PushItemFlag( ImGuiItemFlags_Disabled, true ); ImGui::PushStyleVar( ImGuiStyleVar_Alpha, ImGui::GetStyle().Alpha * 0.5f ); m_childCalls = false; } else if( ImGui::IsKeyDown( 'Z' ) ) { m_childCalls = !m_childCalls; } SmallCheckbox( ICON_FA_SIGN_OUT_ALT " Child calls", &m_childCalls ); if( !slzReady ) { ImGui::PopStyleVar(); ImGui::PopItemFlag(); if( ImGui::IsItemHovered() ) { ImGui::BeginTooltip(); ImGui::TextUnformatted( "Please wait, processing data..." ); ImGui::EndTooltip(); } } else { if( ImGui::IsItemHovered() ) { ImGui::BeginTooltip(); ImGui::TextUnformatted( "Press Z key to temporarily reverse selection." ); ImGui::EndTooltip(); } } ImGui::SameLine(); ImGui::Spacing(); ImGui::SameLine(); if( m_childCalls ) { TextFocused( ICON_FA_STOPWATCH " Time:", TimeToString( ( iptotalAsm.local + iptotalAsm.ext ) * worker.GetSamplingPeriod() ) ); } else { TextFocused( ICON_FA_STOPWATCH " Time:", TimeToString( iptotalAsm.local * worker.GetSamplingPeriod() ) ); } if( iptotalAsm.ext ) { ImGui::SameLine(); ImGui::TextDisabled( "(%c%s)", m_childCalls ? '-' : '+', TimeToString( iptotalAsm.ext * worker.GetSamplingPeriod() ) ); if( ImGui::IsItemHovered() ) { ImGui::BeginTooltip(); ImGui::TextUnformatted( "Child call samples" ); ImGui::EndTooltip(); } } ImGui::SameLine(); ImGui::Spacing(); ImGui::SameLine(); if( m_childCalls ) { TextFocused( ICON_FA_EYE_DROPPER " Samples:", RealToString( iptotalAsm.local + iptotalAsm.ext ) ); } else { TextFocused( ICON_FA_EYE_DROPPER " Samples:", RealToString( iptotalAsm.local ) ); } if( iptotalAsm.ext ) { ImGui::SameLine(); ImGui::Text( "(%c%s)", m_childCalls ? '-' : '+', RealToString( iptotalAsm.ext ) ); if( ImGui::IsItemHovered() ) { ImGui::BeginTooltip(); ImGui::TextUnformatted( "Child call samples" ); ImGui::EndTooltip(); } } } else { TextFocused( "Events:", RealToString( iptotalAsm.local ) ); } ImGui::SameLine(); ImGui::Spacing(); ImGui::SameLine(); if( !worker.AreSymbolSamplesReady() ) { view.m_statRange.active = false; bool val = false; ImGui::PushItemFlag( ImGuiItemFlags_Disabled, true ); ImGui::PushStyleVar( ImGuiStyleVar_Alpha, ImGui::GetStyle().Alpha * 0.5f ); ImGui::Checkbox( "Limit range", &val ); ImGui::PopItemFlag(); ImGui::PopStyleVar(); if( ImGui::IsItemHovered() ) { ImGui::BeginTooltip(); ImGui::TextUnformatted( "Please wait, processing data..." ); ImGui::EndTooltip(); } } else { if( ImGui::Checkbox( "Limit range", &view.m_statRange.active ) ) { if( view.m_statRange.active && view.m_statRange.min == 0 && view.m_statRange.max == 0 ) { const auto& vd = view.GetViewData(); view.m_statRange.min = vd.zvStart; view.m_statRange.max = vd.zvEnd; } } if( view.m_statRange.active ) { ImGui::SameLine(); TextColoredUnformatted( 0xFF00FFFF, ICON_FA_EXCLAMATION_TRIANGLE ); ImGui::SameLine(); ToggleButton( ICON_FA_RULER " Limits", view.m_showRanges ); } } } else { m_cost = CostType::SampleCount; } ImGui::PopStyleVar(); ImGui::Separator(); uint64_t jumpOut = 0; switch( m_displayMode ) { case DisplaySource: RenderSymbolSourceView( iptotalSrc, ipcountSrc, ipcountAsm, ipmaxSrc, worker, view ); break; case DisplayAsm: jumpOut = RenderSymbolAsmView( iptotalAsm, ipcountAsm, ipmaxAsm, worker, view ); break; case DisplayMixed: ImGui::Columns( 2 ); RenderSymbolSourceView( iptotalSrc, ipcountSrc, ipcountAsm, ipmaxSrc, worker, view ); ImGui::NextColumn(); jumpOut = RenderSymbolAsmView( iptotalAsm, ipcountAsm, ipmaxAsm, worker, view ); ImGui::EndColumns(); break; default: assert( false ); break; } if( slzReady && ImGui::IsKeyDown( 'Z' ) ) m_childCalls = !m_childCalls; if( jumpOut != 0 ) { auto sym = worker.GetSymbolData( jumpOut ); if( sym ) { auto line = sym->line; auto file = line == 0 ? nullptr : worker.GetString( sym->file ); if( file && !SourceFileValid( file, worker.GetCaptureTime(), view, worker ) ) { file = nullptr; line = 0; } if( line > 0 || sym->size.Val() > 0 ) { OpenSymbol( file, line, jumpOut, jumpOut, worker, view ); } } } } static uint32_t GetHotnessColor( uint32_t count, uint32_t maxCount ) { const auto ratio = float( 2 * count ) / maxCount; if( ratio <= 0.5f ) { const auto a = int( ( ratio * 1.5f + 0.25f ) * 255 ); return 0x000000FF | ( a << 24 ); } else if( ratio <= 1.f ) { const auto g = int( ( ratio - 0.5f ) * 511 ); return 0xFF0000FF | ( g << 8 ); } else if( ratio <= 2.f ) { const auto b = int( ( ratio - 1.f ) * 255 ); return 0xFF00FFFF | ( b << 16 ); } else { return 0xFFFFFFFF; } } static uint32_t GetHotnessGlow( uint32_t count, uint32_t maxCount ) { const auto ratio = float( 2 * count ) / maxCount; if( ratio <= 0.5f ) { return 0; } else if( ratio <= 1.f ) { const auto a = int( ( ratio * 2.f - 1.f ) * 102 ); return 0x000000FF | ( a << 24 ); } else if( ratio <= 2.f ) { const auto g = int( ( ratio - 1.f ) * 192 ); return 0x660000FF | ( g << 8 ); } else { return 0x6600C0FF; } } static constexpr uint32_t GoodnessColor[256] = { 0xFF3232FF, 0xFF3235FE, 0xFF3238FE, 0xFF323AFD, 0xFF323DFD, 0xFF323FFC, 0xFF3242FC, 0xFF3244FB, 0xFF3246FB, 0xFF3248FB, 0xFF324AFA, 0xFF324CFA, 0xFF324EF9, 0xFF3250F9, 0xFF3252F8, 0xFF3254F8, 0xFF3255F8, 0xFF3257F7, 0xFF3259F7, 0xFF325AF6, 0xFF325CF6, 0xFF325EF5, 0xFF325FF5, 0xFF3260F4, 0xFF3262F4, 0xFF3263F3, 0xFF3265F3, 0xFF3266F3, 0xFF3268F2, 0xFF3269F2, 0xFF326AF1, 0xFF326BF1, 0xFF326DF0, 0xFF326EF0, 0xFF326FEF, 0xFF3270EF, 0xFF3272EE, 0xFF3273EE, 0xFF3274EE, 0xFF3275ED, 0xFF3276ED, 0xFF3277EC, 0xFF3279EC, 0xFF327AEB, 0xFF327BEB, 0xFF327CEA, 0xFF327DEA, 0xFF327EE9, 0xFF327FE9, 0xFF3280E8, 0xFF3281E8, 0xFF3282E7, 0xFF3283E7, 0xFF3284E6, 0xFF3285E6, 0xFF3286E5, 0xFF3287E5, 0xFF3288E4, 0xFF3289E4, 0xFF328AE3, 0xFF328BE3, 0xFF328CE2, 0xFF328DE2, 0xFF328EE1, 0xFF328EE1, 0xFF328FE0, 0xFF3290E0, 0xFF3291DF, 0xFF3292DF, 0xFF3293DE, 0xFF3294DE, 0xFF3295DD, 0xFF3295DD, 0xFF3296DC, 0xFF3297DC, 0xFF3298DB, 0xFF3299DB, 0xFF329ADA, 0xFF329ADA, 0xFF329BD9, 0xFF329CD9, 0xFF329DD8, 0xFF329ED8, 0xFF329ED7, 0xFF329FD7, 0xFF32A0D6, 0xFF32A1D5, 0xFF32A2D5, 0xFF32A2D4, 0xFF32A3D4, 0xFF32A4D3, 0xFF32A5D3, 0xFF32A5D2, 0xFF32A6D2, 0xFF32A7D1, 0xFF32A8D1, 0xFF32A8D0, 0xFF32A9CF, 0xFF32AACF, 0xFF32AACE, 0xFF32ABCE, 0xFF32ACCD, 0xFF32ADCD, 0xFF32ADCC, 0xFF32AECC, 0xFF32AFCB, 0xFF32AFCA, 0xFF32B0CA, 0xFF32B1C9, 0xFF32B1C9, 0xFF32B2C8, 0xFF32B3C7, 0xFF32B3C7, 0xFF32B4C6, 0xFF32B5C6, 0xFF32B5C5, 0xFF32B6C5, 0xFF32B7C4, 0xFF32B7C3, 0xFF32B8C3, 0xFF32B9C2, 0xFF32B9C2, 0xFF32BAC1, 0xFF32BBC0, 0xFF32BBC0, 0xFF32BCBF, 0xFF32BDBE, 0xFF32BDBE, 0xFF32BEBD, 0xFF32BEBD, 0xFF32BFBC, 0xFF32C0BB, 0xFF32C0BB, 0xFF32C1BA, 0xFF32C2B9, 0xFF32C2B9, 0xFF32C3B8, 0xFF32C3B7, 0xFF32C4B7, 0xFF32C5B6, 0xFF32C5B5, 0xFF32C6B5, 0xFF32C6B4, 0xFF32C7B3, 0xFF32C7B3, 0xFF32C8B2, 0xFF32C9B1, 0xFF32C9B1, 0xFF32CAB0, 0xFF32CAAF, 0xFF32CBAF, 0xFF32CCAE, 0xFF32CCAD, 0xFF32CDAD, 0xFF32CDAC, 0xFF32CEAB, 0xFF32CEAA, 0xFF32CFAA, 0xFF32CFA9, 0xFF32D0A8, 0xFF32D1A8, 0xFF32D1A7, 0xFF32D2A6, 0xFF32D2A5, 0xFF32D3A5, 0xFF32D3A4, 0xFF32D4A3, 0xFF32D4A2, 0xFF32D5A2, 0xFF32D5A1, 0xFF32D6A0, 0xFF32D79F, 0xFF32D79E, 0xFF32D89E, 0xFF32D89D, 0xFF32D99C, 0xFF32D99B, 0xFF32DA9A, 0xFF32DA9A, 0xFF32DB99, 0xFF32DB98, 0xFF32DC97, 0xFF32DC96, 0xFF32DD95, 0xFF32DD95, 0xFF32DE94, 0xFF32DE93, 0xFF32DF92, 0xFF32DF91, 0xFF32E090, 0xFF32E08F, 0xFF32E18E, 0xFF32E18E, 0xFF32E28D, 0xFF32E28C, 0xFF32E38B, 0xFF32E38A, 0xFF32E489, 0xFF32E488, 0xFF32E587, 0xFF32E586, 0xFF32E685, 0xFF32E684, 0xFF32E783, 0xFF32E782, 0xFF32E881, 0xFF32E880, 0xFF32E97F, 0xFF32E97E, 0xFF32EA7D, 0xFF32EA7C, 0xFF32EB7B, 0xFF32EB7A, 0xFF32EC79, 0xFF32EC77, 0xFF32ED76, 0xFF32ED75, 0xFF32EE74, 0xFF32EE73, 0xFF32EE72, 0xFF32EF70, 0xFF32EF6F, 0xFF32F06E, 0xFF32F06D, 0xFF32F16B, 0xFF32F16A, 0xFF32F269, 0xFF32F268, 0xFF32F366, 0xFF32F365, 0xFF32F363, 0xFF32F462, 0xFF32F460, 0xFF32F55F, 0xFF32F55E, 0xFF32F65C, 0xFF32F65A, 0xFF32F759, 0xFF32F757, 0xFF32F855, 0xFF32F854, 0xFF32F852, 0xFF32F950, 0xFF32F94E, 0xFF32FA4C, 0xFF32FA4A, 0xFF32FB48, 0xFF32FB46, 0xFF32FB44, 0xFF32FC42, 0xFF32FC3F, 0xFF32FD3D, 0xFF32FD3A, 0xFF32FE38, 0xFF32FE35, 0xFF32FF32, }; static uint32_t GetGoodnessColor( float inRatio ) { const auto ratio = std::clamp( int( inRatio * 255.f ), 0, 255 ); return GoodnessColor[ratio]; } void SourceView::RenderSymbolSourceView( const AddrStat& iptotal, const unordered_flat_map& ipcount, const unordered_flat_map& ipcountAsm, const AddrStat& ipmax, Worker& worker, const View& view ) { if( m_sourceFiles.empty() ) { if( m_source.is_cached() ) { TextColoredUnformatted( ImVec4( 0.4f, 0.8f, 0.4f, 1.f ), ICON_FA_DATABASE ); ImGui::SameLine(); ImGui::TextUnformatted( "Source file cached during profiling run" ); } else { TextColoredUnformatted( ImVec4( 1.f, 1.f, 0.2f, 1.f ), ICON_FA_EXCLAMATION_TRIANGLE ); ImGui::SameLine(); TextColoredUnformatted( ImVec4( 1.f, 0.3f, 0.3f, 1.f ), "The source file contents might not reflect the actual profiled code!" ); ImGui::SameLine(); TextColoredUnformatted( ImVec4( 1.f, 1.f, 0.2f, 1.f ), ICON_FA_EXCLAMATION_TRIANGLE ); } } else { if( m_source.is_cached() ) { TextColoredUnformatted( ImVec4( 0.4f, 0.8f, 0.4f, 1.f ), ICON_FA_DATABASE ); if( ImGui::IsItemHovered() ) { ImGui::BeginTooltip(); ImGui::TextUnformatted( "Source file cached during profiling run" ); ImGui::EndTooltip(); } } else { TextColoredUnformatted( ImVec4( 1.f, 1.f, 0.2f, 1.f ), ICON_FA_EXCLAMATION_TRIANGLE ); if( ImGui::IsItemHovered() ) { ImGui::BeginTooltip(); TextColoredUnformatted( ImVec4( 1.f, 1.f, 0.2f, 1.f ), ICON_FA_EXCLAMATION_TRIANGLE ); ImGui::SameLine(); TextColoredUnformatted( ImVec4( 1.f, 0.3f, 0.3f, 1.f ), "The source file contents might not reflect the actual profiled code!" ); ImGui::SameLine(); TextColoredUnformatted( ImVec4( 1.f, 1.f, 0.2f, 1.f ), ICON_FA_EXCLAMATION_TRIANGLE ); ImGui::EndTooltip(); } } ImGui::SameLine(); TextDisabledUnformatted( ICON_FA_FILE " File:" ); ImGui::SameLine(); const auto fileColor = GetHsvColor( m_source.idx(), 0 ); SmallColorBox( fileColor ); ImGui::SameLine(); ImGui::SetNextItemWidth( -1 ); ImGui::PushStyleVar( ImGuiStyleVar_FramePadding, ImVec2( 0, 0 ) ); if( ImGui::BeginCombo( "##fileList", m_source.filename(), ImGuiComboFlags_HeightLarge ) ) { if( m_asm.empty() ) { for( auto& v : m_sourceFiles ) { const auto color = GetHsvColor( v.first, 0 ); SmallColorBox( color ); ImGui::SameLine(); auto fstr = worker.GetString( StringIdx( v.first ) ); if( SourceFileValid( fstr, worker.GetCaptureTime(), view, worker ) ) { ImGui::PushID( v.first ); if( ImGui::Selectable( fstr, fstr == m_source.filename() ) ) { ParseSource( fstr, worker, view ); m_targetLine = v.second; SelectLine( v.second, &worker ); } ImGui::PopID(); } else { TextDisabledUnformatted( fstr ); } } } else { AddrStat totalSamples = {}; unordered_flat_map fileCounts; for( auto& v : m_asm ) { uint32_t srcline; const auto srcidx = worker.GetLocationForAddress( v.addr, srcline ); if( srcline != 0 ) { AddrStat cnt = {}; auto ait = ipcountAsm.find( v.addr ); if( ait != ipcountAsm.end() ) cnt = ait->second; auto fit = fileCounts.find( srcidx.Idx() ); if( fit == fileCounts.end() ) { fileCounts.emplace( srcidx.Idx(), cnt ); } else { fit->second += cnt; } totalSamples += cnt; } } std::vector> fileCountsVec; fileCountsVec.reserve( fileCounts.size() ); for( auto& v : fileCounts ) fileCountsVec.emplace_back( v.first, v.second ); if( m_childCalls ) { pdqsort_branchless( fileCountsVec.begin(), fileCountsVec.end(), [&worker] (const auto& l, const auto& r ) { return ( l.second.local + l.second.ext == r.second.local + r.second.ext ) ? strcmp( worker.GetString( l.first ), worker.GetString( r.first ) ) < 0 : ( l.second.local + l.second.ext > r.second.local + r.second.ext ); } ); } else { pdqsort_branchless( fileCountsVec.begin(), fileCountsVec.end(), [&worker] (const auto& l, const auto& r ) { return l.second.local == r.second.local ? strcmp( worker.GetString( l.first ), worker.GetString( r.first ) ) < 0 : l.second.local > r.second.local; } ); } const auto hasSamples = totalSamples.local + totalSamples.ext != 0; if( hasSamples ) { ImGui::Columns( 2 ); static bool widthSet = false; if( !widthSet ) { widthSet = true; const auto w = ImGui::GetWindowWidth(); const auto c0 = ImGui::CalcTextSize( "12345678901234567890" ).x; ImGui::SetColumnWidth( 0, c0 ); ImGui::SetColumnWidth( 1, w - c0 ); } } for( auto& v : fileCountsVec ) { if( hasSamples ) { auto fit = fileCounts.find( v.first ); assert( fit != fileCounts.end() ); if( fit->second.local + fit->second.ext != 0 ) { if( m_cost == CostType::SampleCount ) { if( m_childCalls ) { ImGui::TextUnformatted( TimeToString( ( fit->second.local + fit->second.ext ) * worker.GetSamplingPeriod() ) ); } else { ImGui::TextUnformatted( TimeToString( fit->second.local * worker.GetSamplingPeriod() ) ); } if( ImGui::IsItemHovered() ) { ImGui::BeginTooltip(); if( fit->second.local ) { TextFocused( "Local time:", TimeToString( fit->second.local * worker.GetSamplingPeriod() ) ); TextFocused( "Local samples:", RealToString( fit->second.local ) ); } if( fit->second.ext ) { TextFocused( "Child time:", TimeToString( fit->second.ext * worker.GetSamplingPeriod() ) ); TextFocused( "Child samples:", RealToString( fit->second.ext ) ); } ImGui::EndTooltip(); } } else { ImGui::TextUnformatted( RealToString( fit->second.local ) ); } ImGui::SameLine(); if( m_childCalls ) { ImGui::TextDisabled( "(%.2f%%)", 100.f * ( fit->second.local + fit->second.ext ) / ( totalSamples.local + totalSamples.ext ) ); } else if( totalSamples.local != 0 ) { ImGui::TextDisabled( "(%.2f%%)", 100.f * fit->second.local / totalSamples.local ); } else { TextDisabledUnformatted( "(0.00%%)" ); } } ImGui::NextColumn(); } const auto color = GetHsvColor( v.first, 0 ); SmallColorBox( color ); ImGui::SameLine(); auto fstr = worker.GetString( StringIdx( v.first ) ); if( SourceFileValid( fstr, worker.GetCaptureTime(), view, worker ) ) { ImGui::PushID( v.first ); if( ImGui::Selectable( fstr, fstr == m_source.filename(), ImGuiSelectableFlags_SpanAllColumns ) ) { uint32_t line = 0; for( auto& file : m_sourceFiles ) { if( file.first == v.first ) { line = file.second; break; } } ParseSource( fstr, worker, view ); m_targetLine = line; SelectLine( line, &worker ); } ImGui::PopID(); } else { TextDisabledUnformatted( fstr ); } if( hasSamples ) ImGui::NextColumn(); } if( hasSamples ) ImGui::EndColumns(); } ImGui::EndCombo(); } ImGui::PopStyleVar(); } const float bottom = m_srcSampleSelect.empty() ? 0 : ImGui::GetFrameHeight(); ImGui::SetNextWindowContentSize( ImVec2( m_srcWidth, 0 ) ); ImGui::BeginChild( "##sourceView", ImVec2( 0, -bottom ), true, ImGuiWindowFlags_NoMove | ImGuiWindowFlags_HorizontalScrollbar ); if( m_font ) ImGui::PushFont( m_font ); auto& lines = m_source.get(); auto draw = ImGui::GetWindowDrawList(); const auto wpos = ImGui::GetWindowPos() - ImVec2( ImGui::GetCurrentWindowRead()->Scroll.x, 0 ); const auto dpos = wpos + ImVec2( 0.5f, 0.5f ); const auto wh = ImGui::GetWindowHeight(); const auto ty = ImGui::GetFontSize(); const auto ts = ImGui::CalcTextSize( " " ).x; const auto lineCount = lines.size(); const auto tmp = RealToString( lineCount ); const auto maxLine = strlen( tmp ); auto lx = ts * maxLine + ty + round( ts*0.4f ); if( iptotal.local + iptotal.ext != 0 ) lx += ts * 7 + ty; if( !m_asm.empty() ) { const auto tmp = RealToString( m_asm.size() ); const auto maxAsm = strlen( tmp ) + 1; lx += ts * maxAsm + ty; } if( m_hwSamples && worker.GetHwSampleCountAddress() != 0 ) lx += 19 * ts + ty; DrawLine( draw, dpos + ImVec2( lx, 0 ), dpos + ImVec2( lx, wh ), 0x08FFFFFF ); const AddrStat zero = {}; m_selectedAddressesHover.clear(); if( m_targetLine != 0 ) { int lineNum = 1; for( auto& line : lines ) { if( m_targetLine == lineNum ) { m_targetLine = 0; ImGui::SetScrollHereY(); } RenderLine( line, lineNum++, zero, iptotal, ipmax, &worker, &view ); } const auto win = ImGui::GetCurrentWindowRead(); m_srcWidth = win->DC.CursorMaxPos.x - win->DC.CursorStartPos.x; } else { ImGuiListClipper clipper; clipper.Begin( (int)lines.size() ); while( clipper.Step() ) { if( iptotal.local + iptotal.ext == 0 ) { for( auto i=clipper.DisplayStart; isecond; RenderLine( lines[i], i+1, ipcnt, iptotal, ipmax, &worker, &view ); } } } } const auto win = ImGui::GetCurrentWindowRead(); if( win->ScrollbarY ) { auto draw = ImGui::GetWindowDrawList(); auto rect = ImGui::GetWindowScrollbarRect( win, ImGuiAxis_Y ); ImGui::PushClipRect( rect.Min, rect.Max, false ); if( m_selectedLine != 0 ) { const auto ly = round( rect.Min.y + ( m_selectedLine - 0.5f ) / lines.size() * rect.GetHeight() ); DrawLine( draw, ImVec2( rect.Min.x + 0.5f, ly + 0.5f ), ImVec2( rect.Max.x + 0.5f, ly + 0.5f ), 0x8899994C, 3 ); } if( m_source.idx() == m_hoveredSource && m_hoveredLine != 0 ) { const auto ly = round( rect.Min.y + ( m_hoveredLine - 0.5f ) / lines.size() * rect.GetHeight() ); DrawLine( draw, ImVec2( rect.Min.x + 0.5f, ly + 0.5f ), ImVec2( rect.Max.x + 0.5f, ly + 0.5f ), 0x88888888, 3 ); } std::vector> ipData; ipData.reserve( ipcount.size() ); for( auto& v : ipcount ) ipData.emplace_back( v.first, v.second ); for( uint32_t lineNum = 1; lineNum <= lines.size(); lineNum++ ) { if( ipcount.find( lineNum ) == ipcount.end() ) { auto addresses = worker.GetAddressesForLocation( m_source.idx(), lineNum ); if( addresses ) { for( auto& addr : *addresses ) { if( addr >= m_baseAddr && addr < m_baseAddr + m_codeLen ) { ipData.emplace_back( lineNum, AddrStat {} ); break; } } } } } pdqsort_branchless( ipData.begin(), ipData.end(), []( const auto& l, const auto& r ) { return l.first < r.first; } ); const auto step = uint32_t( lines.size() * 2 / rect.GetHeight() ); const auto x14 = round( rect.Min.x + rect.GetWidth() * 0.4f ); const auto x34 = round( rect.Min.x + rect.GetWidth() * 0.6f ); auto it = ipData.begin(); while( it != ipData.end() ) { const auto firstLine = it->first; AddrStat ipSum = {}; while( it != ipData.end() && it->first <= firstLine + step ) { ipSum += it->second; ++it; } const auto ly = round( rect.Min.y + float( firstLine ) / lines.size() * rect.GetHeight() ); if( m_childCalls ) { const auto color = ( ipSum.local + ipSum.ext == 0 ) ? 0x22FFFFFF : GetHotnessColor( ipSum.local + ipSum.ext, ipmax.local + ipmax.ext ); draw->AddRectFilled( ImVec2( x14, ly ), ImVec2( x34, ly+3 ), color ); } else { const auto color = ipSum.local == 0 ? 0x22FFFFFF : GetHotnessColor( ipSum.local, ipmax.local ); draw->AddRectFilled( ImVec2( x14, ly ), ImVec2( x34, ly+3 ), color ); } } ImGui::PopClipRect(); } if( m_font ) ImGui::PopFont(); ImGui::EndChild(); if( !m_srcSampleSelect.empty() ) { AddrStat count = {}; uint32_t numLines = 0; for( auto& idx : m_srcSampleSelect ) { auto it = ipcount.find( idx ); if( it != ipcount.end() ) { count += it->second; numLines++; } } ImGui::BeginChild( "##srcSelect" ); if( ImGui::SmallButton( ICON_FA_TIMES ) ) { m_srcSampleSelect.clear(); m_srcGroupSelect = -1; } ImGui::SameLine(); char buf[16]; char* end; if( m_childCalls ) { end = PrintFloat( buf, buf+16, 100.f * ( count.local + count.ext ) / ( iptotal.local + iptotal.ext ), 2 ); } else if( iptotal.local != 0 ) { end = PrintFloat( buf, buf+16, 100.f * count.local / iptotal.local, 2 ); } else { end = PrintFloat( buf, buf+16, 0.f, 2 ); } memcpy( end, "%", 2 ); TextFocused( "Selected:", buf ); ImGui::SameLine(); ImGui::Spacing(); ImGui::SameLine(); if( m_cost == CostType::SampleCount ) { if( m_childCalls ) { TextFocused( "Time:", TimeToString( ( count.local + count.ext ) * worker.GetSamplingPeriod() ) ); } else { TextFocused( "Time:", TimeToString( count.local * worker.GetSamplingPeriod() ) ); } ImGui::SameLine(); ImGui::Spacing(); ImGui::SameLine(); if( m_childCalls ) { TextFocused( "Sample count:", RealToString( count.local + count.ext ) ); } else { TextFocused( "Sample count:", RealToString( count.local ) ); } } else { TextFocused( "Events:", RealToString( count.local ) ); } ImGui::SameLine(); ImGui::Spacing(); ImGui::SameLine(); TextFocused( "Lines:", RealToString( numLines ) ); ImGui::EndChild(); } } static constexpr char HexPrint[] = { '0', '1', '2', '3', '4', '5', '6', '7', '8', '9', 'A', 'B', 'C', 'D', 'E', 'F' }; static int PrintHexBytesRaw( char* buf, const uint8_t* bytes, size_t len ) { const auto start = buf; for( size_t i=0; i> 4]; *buf++ = HexPrint[byte & 0xF]; *buf++ = ' '; } *--buf = '\0'; return buf - start; } static int PrintHexBytesArm( char* buf, const uint8_t* bytes ) { const auto start = buf; for( int i=3; i>=0; i-- ) { const auto byte = bytes[i]; *buf++ = HexPrint[byte >> 4]; *buf++ = HexPrint[byte & 0xF]; *buf++ = ' '; } *--buf = '\0'; return buf - start; } static int PrintHexBytes( char* buf, const uint8_t* bytes, size_t len, CpuArchitecture arch ) { switch( arch ) { case CpuArchX86: case CpuArchX64: return PrintHexBytesRaw( buf, bytes, len ); case CpuArchArm32: case CpuArchArm64: assert( len == 4 ); return PrintHexBytesArm( buf, bytes ); default: assert( false ); return 0; } } uint64_t SourceView::RenderSymbolAsmView( const AddrStat& iptotal, const unordered_flat_map& ipcount, const AddrStat& ipmax, Worker& worker, View& view ) { if( m_disasmFail >= 0 ) { TextColoredUnformatted( ImVec4( 1.f, 1.f, 0.2f, 1.f ), ICON_FA_EXCLAMATION_TRIANGLE ); if( ImGui::IsItemHovered() ) { const bool clicked = ImGui::IsItemClicked(); ImGui::BeginTooltip(); TextColoredUnformatted( ImVec4( 1, 0, 0, 1 ), "Disassembly failure." ); ImGui::TextUnformatted( "Some instructions weren't properly decoded. Possible reasons:" ); ImGui::TextUnformatted( " 1. Old version of capstone library doesn't support some instructions." ); ImGui::TextUnformatted( " 2. Trying to decode data part of the symbol (e.g. jump arrays, etc.)" ); TextFocused( "Code size:", RealToString( m_codeLen ) ); TextFocused( "Disassembled bytes:", RealToString( m_disasmFail ) ); char tmp[64]; auto bytesLeft = std::min( 16u, m_codeLen - m_disasmFail ); auto code = worker.GetSymbolCode( m_baseAddr, m_codeLen ); assert( code ); PrintHexBytesRaw( tmp, (const uint8_t*)code, bytesLeft ); TextFocused( "Failure bytes:", tmp ); TextDisabledUnformatted( "Click to copy to clipboard." ); ImGui::EndTooltip(); if( clicked ) ImGui::SetClipboardText( tmp ); } ImGui::SameLine(); } SmallCheckbox( ICON_FA_SEARCH_LOCATION " Relative loc.", &m_asmRelative ); if( !m_sourceFiles.empty() ) { ImGui::SameLine(); ImGui::Spacing(); ImGui::SameLine(); SmallCheckbox( ICON_FA_FILE_IMPORT " Source loc.", &m_asmShowSourceLocation ); } ImGui::SameLine(); ImGui::Spacing(); ImGui::SameLine(); SmallCheckbox( ICON_FA_COGS " Machine code", &m_asmBytes ); ImGui::SameLine(); ImGui::Spacing(); ImGui::SameLine(); SmallCheckbox( ICON_FA_SHARE " Jumps", &m_showJumps ); if( m_cpuArch == CpuArchX64 || m_cpuArch == CpuArchX86 ) { ImGui::SameLine(); ImGui::Spacing(); ImGui::SameLine(); if( SmallCheckbox( "AT&T", &m_atnt ) ) Disassemble( m_baseAddr, worker ); if( !m_atnt ) { ImGui::SameLine(); ImGui::Spacing(); ImGui::SameLine(); float mw = 0; for( auto& v : s_uArchUx ) { const auto w = ImGui::CalcTextSize( v.uArch ).x; if( w > mw ) mw = w; } if( m_selMicroArch == m_profileMicroArch ) { TextColoredUnformatted( ImVec4( 0.4f, 0.8f, 0.4f, 1.f ), ICON_FA_MICROCHIP ); if( ImGui::IsItemHovered() ) { ImGui::BeginTooltip(); ImGui::TextUnformatted( "Selected microarchitecture is the same as the profiled application was running on" ); ImGui::EndTooltip(); } } else { TextColoredUnformatted( ImVec4( 1.f, 0.3f, 0.3f, 1.f ), ICON_FA_MICROCHIP ); if( ImGui::IsItemHovered() ) { ImGui::BeginTooltip(); ImGui::TextUnformatted( "Selected microarchitecture does not match the one profiled application was running on" ); if( m_profileMicroArch >= 0 ) { ImGui::Text( "Measurements were performed on the %s microarchitecture", s_uArchUx[m_profileMicroArch].uArch ); } else { ImGui::TextUnformatted( "Measurements were performed on an unknown microarchitecture" ); } ImGui::EndTooltip(); } } ImGui::SameLine( 0, 0 ); ImGui::TextUnformatted( " \xce\xbc""arch:" ); ImGui::SameLine(); ImGui::SetNextItemWidth( mw + ImGui::GetFontSize() ); ImGui::PushStyleVar( ImGuiStyleVar_FramePadding, ImVec2( 0, 0 ) ); if( ImGui::BeginCombo( "##uarch", s_uArchUx[m_selMicroArch].uArch, ImGuiComboFlags_HeightLarge ) ) { int idx = 0; for( auto& v : s_uArchUx ) { if( ImGui::Selectable( v.uArch, idx == m_selMicroArch ) ) SelectMicroArchitecture( v.moniker ); ImGui::SameLine(); TextDisabledUnformatted( v.cpuName ); idx++; } ImGui::EndCombo(); } ImGui::PopStyleVar(); ImGui::SameLine(); ImGui::Spacing(); ImGui::SameLine(); SmallCheckbox( ICON_FA_TRUCK_LOADING " Latency", &m_showLatency ); } } #ifndef TRACY_NO_FILESELECTOR ImGui::SameLine(); ImGui::Spacing(); ImGui::SameLine(); if( ImGui::SmallButton( ICON_FA_FILE_IMPORT " Save" ) ) { Save( worker ); } #endif const float bottom = m_asmSampleSelect.empty() ? 0 : ImGui::GetFrameHeight(); ImGui::SetNextWindowContentSize( ImVec2( m_asmWidth, 0 ) ); ImGui::BeginChild( "##asmView", ImVec2( 0, -bottom ), true, ImGuiWindowFlags_NoMove | ImGuiWindowFlags_HorizontalScrollbar ); if( m_font ) ImGui::PushFont( m_font ); int maxAddrLen; { char tmp[32]; sprintf( tmp, "%" PRIx64, m_baseAddr + m_codeLen ); maxAddrLen = strlen( tmp ); } uint64_t selJumpStart = 0; uint64_t selJumpEnd; uint64_t selJumpTarget; uint64_t jumpOut = 0; const AddrStat zero = {}; if( m_targetAddr != 0 ) { for( auto& line : m_asm ) { if( m_targetAddr == line.addr ) { m_targetAddr = 0; ImGui::SetScrollHereY(); } RenderAsmLine( line, zero, iptotal, ipmax, worker, jumpOut, maxAddrLen, view ); } const auto win = ImGui::GetCurrentWindowRead(); m_asmWidth = win->DC.CursorMaxPos.x - win->DC.CursorStartPos.x; } else { const auto th = (int)ImGui::GetTextLineHeightWithSpacing(); ImGuiListClipper clipper; clipper.Begin( (int)m_asm.size(), th ); while( clipper.Step() ) { assert( clipper.StepNo == 3 ); const auto wpos = ImGui::GetCursorScreenPos(); const auto dpos = wpos + ImVec2( 0.5f, 0.5f ); static std::vector insList; insList.clear(); if( iptotal.local + iptotal.ext == 0 ) { for( auto i=clipper.DisplayStart; isecond; RenderAsmLine( line, ipcnt, iptotal, ipmax, worker, jumpOut, maxAddrLen, view ); insList.emplace_back( line.addr ); } } if( m_showJumps && !m_jumpTable.empty() ) { auto draw = ImGui::GetWindowDrawList(); const auto ts = ImGui::CalcTextSize( " " ); const auto th2 = floor( ts.y / 2 ); const auto th4 = floor( ts.y / 4 ); const auto xoff = ( ( iptotal.local + iptotal.ext ) == 0 ? 0 : ( 7 * ts.x + ts.y ) ) + (3+maxAddrLen) * ts.x + ( ( m_asmShowSourceLocation && !m_sourceFiles.empty() ) ? 36 * ts.x : 0 ) + ( m_asmBytes ? m_maxAsmBytes*3 * ts.x : 0 ) + ( ( m_hwSamples && worker.GetHwSampleCountAddress() != 0 ) ? ( 19 * ts.x + ts.y ) : 0 ); const auto minAddr = m_asm[clipper.DisplayStart].addr; const auto maxAddr = m_asm[clipper.DisplayEnd-1].addr; const auto mjl = m_maxJumpLevel; const auto JumpArrow = JumpArrowBase * ts.y / 15; int i = -1; for( auto& v : m_jumpTable ) { i++; if( v.second.min > maxAddr || v.second.max < minAddr ) continue; const auto col = GetHsvColor( i, 0 ); auto it0 = std::lower_bound( insList.begin(), insList.end(), v.second.min ); auto it1 = std::lower_bound( insList.begin(), insList.end(), v.second.max ); const auto y0 = ( it0 == insList.end() || *it0 != v.second.min ) ? -th : ( it0 - insList.begin() ) * th; const auto y1 = it1 == insList.end() ? ( insList.size() + 1 ) * th : ( it1 - insList.begin() ) * th; float thickness = 1; if( ImGui::IsWindowHovered() && ImGui::IsMouseHoveringRect( wpos + ImVec2( xoff + JumpSeparation * ( mjl - v.second.level ) - JumpSeparation / 2, y0 + th2 ), wpos + ImVec2( xoff + JumpSeparation * ( mjl - v.second.level ) + JumpSeparation / 2, y1 + th2 ) ) ) { thickness = 2; if( m_font ) ImGui::PopFont(); ImGui::BeginTooltip(); char tmp[32]; sprintf( tmp, "+%" PRIu64, v.first - m_baseAddr ); TextFocused( "Jump target:", tmp ); ImGui::SameLine(); sprintf( tmp, "(0x%" PRIx64 ")", v.first ); TextDisabledUnformatted( tmp ); auto lit = m_locMap.find( v.first ); assert( lit != m_locMap.end() ); sprintf( tmp, ".L%" PRIu32, lit->second ); TextFocused( "Jump label:", tmp ); uint32_t srcline; const auto srcidx = worker.GetLocationForAddress( v.first, srcline ); if( srcline != 0 ) { const auto fileName = worker.GetString( srcidx ); const auto fileColor = GetHsvColor( srcidx.Idx(), 0 ); TextDisabledUnformatted( "Target location:" ); ImGui::SameLine(); SmallColorBox( fileColor ); ImGui::SameLine(); ImGui::Text( "%s:%i", fileName, srcline ); } TextFocused( "Jump range:", MemSizeToString( v.second.max - v.second.min ) ); TextFocused( "Jump sources:", RealToString( v.second.source.size() ) ); ImGui::EndTooltip(); if( m_font ) ImGui::PushFont( m_font ); if( ImGui::IsMouseClicked( 0 ) ) { m_targetAddr = v.first; m_selectedAddresses.clear(); m_selectedAddresses.emplace( v.first ); } #ifndef TRACY_NO_FILESELECTOR else if( ImGui::IsMouseClicked( 1 ) ) { ImGui::OpenPopup( "jumpPopup" ); m_jumpPopupAddr = v.first; } #endif selJumpStart = v.second.min; selJumpEnd = v.second.max; selJumpTarget = v.first; } DrawLine( draw, dpos + ImVec2( xoff + JumpSeparation * ( mjl - v.second.level ), y0 + th2 ), dpos + ImVec2( xoff + JumpSeparation * ( mjl - v.second.level ), y1 + th2 ), col, thickness ); if( v.first >= minAddr && v.first <= maxAddr ) { auto iit = std::lower_bound( insList.begin(), insList.end(), v.first ); assert( iit != insList.end() ); const auto y = ( iit - insList.begin() ) * th; DrawLine( draw, dpos + ImVec2( xoff + JumpSeparation * ( mjl - v.second.level ), y + th2 ), dpos + ImVec2( xoff + JumpSeparation * mjl + JumpArrow + 1, y + th2 ), col, thickness ); DrawLine( draw, dpos + ImVec2( xoff + JumpSeparation * mjl + JumpArrow, y + th2 ), dpos + ImVec2( xoff + JumpSeparation * mjl + JumpArrow - th4, y + th2 - th4 ), col, thickness ); DrawLine( draw, dpos + ImVec2( xoff + JumpSeparation * mjl + JumpArrow, y + th2 ), dpos + ImVec2( xoff + JumpSeparation * mjl + JumpArrow - th4, y + th2 + th4 ), col, thickness ); } for( auto& s : v.second.source ) { if( s >= minAddr && s <= maxAddr ) { auto iit = std::lower_bound( insList.begin(), insList.end(), s ); assert( iit != insList.end() ); const auto y = ( iit - insList.begin() ) * th; DrawLine( draw, dpos + ImVec2( xoff + JumpSeparation * ( mjl - v.second.level ), y + th2 ), dpos + ImVec2( xoff + JumpSeparation * mjl + JumpArrow, y + th2 ), col, thickness ); } } } } } #ifndef TRACY_NO_FILESELECTOR if( m_font ) ImGui::PopFont(); if( ImGui::BeginPopup( "jumpPopup" ) ) { if( ImGui::Button( ICON_FA_FILE_IMPORT " Save jump range" ) ) { auto it = m_jumpTable.find( m_jumpPopupAddr ); assert( it != m_jumpTable.end() ); size_t minIdx = 0, maxIdx = 0; size_t i; for( i=0; isecond.min ) { minIdx = i++; break; } } assert( i != m_asm.size() ); for( ; isecond.max ) { maxIdx = i+1; break; } } assert( i != m_asm.size() ); Save( worker, minIdx, maxIdx ); ImGui::CloseCurrentPopup(); } ImGui::EndPopup(); } if( m_font ) ImGui::PushFont( m_font ); #endif } const auto win = ImGui::GetCurrentWindowRead(); if( win->ScrollbarY ) { auto draw = ImGui::GetWindowDrawList(); auto rect = ImGui::GetWindowScrollbarRect( win, ImGuiAxis_Y ); ImGui::PushClipRect( rect.Min, rect.Max, false ); std::vector lineOff; lineOff.reserve( std::max( m_selectedAddresses.size(), m_selectedAddressesHover.size() ) ); if( !m_selectedAddresses.empty() ) { for( size_t i=0; i lastLine ) { lastLine = ly; DrawLine( draw, ImVec2( rect.Min.x + 0.5f, ly + 0.5f ), ImVec2( rect.Max.x + 0.5f, ly + 0.5f ), 0x8899994C, 1 ); } } } if( !m_selectedAddressesHover.empty() ) { lineOff.clear(); for( size_t i=0; i lastLine ) { lastLine = ly; DrawLine( draw, ImVec2( rect.Min.x + 0.5f, ly + 0.5f ), ImVec2( rect.Max.x + 0.5f, ly + 0.5f ), 0x88888888, 1 ); } } } uint32_t selJumpLineStart, selJumpLineEnd, selJumpLineTarget; std::vector> ipData; ipData.reserve( ipcount.size() ); if( selJumpStart == 0 ) { for( size_t i=0; isecond ); } } else { for( size_t i=0; isecond ); } } pdqsort_branchless( ipData.begin(), ipData.end(), []( const auto& l, const auto& r ) { return l.first < r.first; } ); const auto step = uint32_t( m_asm.size() * 2 / rect.GetHeight() ); const auto x40 = round( rect.Min.x + rect.GetWidth() * 0.4f ); const auto x60 = round( rect.Min.x + rect.GetWidth() * 0.6f ); auto it = ipData.begin(); while( it != ipData.end() ) { const auto firstLine = it->first; AddrStat ipSum = {}; while( it != ipData.end() && it->first <= firstLine + step ) { ipSum += it->second; ++it; } const auto ly = round( rect.Min.y + float( firstLine ) / m_asm.size() * rect.GetHeight() ); if( m_childCalls ) { const auto color = GetHotnessColor( ipSum.local + ipSum.ext, ipmax.local + ipmax.ext ); draw->AddRectFilled( ImVec2( x40, ly ), ImVec2( x60, ly+3 ), color ); } else if( ipmax.local != 0 ) { const auto color = GetHotnessColor( ipSum.local, ipmax.local ); draw->AddRectFilled( ImVec2( x40, ly ), ImVec2( x60, ly+3 ), color ); } } if( selJumpStart != 0 ) { const auto yStart = 0.5f + rect.Min.y + float( selJumpLineStart ) / m_asm.size() * rect.GetHeight(); const auto yEnd = 0.5f + rect.Min.y + float( selJumpLineEnd ) / m_asm.size() * rect.GetHeight(); const auto yTarget = 0.5f + rect.Min.y + float( selJumpLineTarget ) / m_asm.size() * rect.GetHeight(); const auto x50 = 0.5f + round( rect.Min.x + rect.GetWidth() * 0.5f ) - 1; const auto x25 = 0.5f + round( rect.Min.x + rect.GetWidth() * 0.25f ); const auto x75 = 0.5f + round( rect.Min.x + rect.GetWidth() * 0.75f ); DrawLine( draw, ImVec2( x50, yStart ), ImVec2( x50, yEnd ), 0xFF00FF00 ); DrawLine( draw, ImVec2( x25, yTarget ), ImVec2( x75, yTarget ), 0xFF00FF00 ); } if( m_asmSelected >= 0 ) { const auto x0 = rect.Min.x; const auto x1 = rect.Min.x + rect.GetWidth() * 0.2f; float sy; for( int i=0; i<(int)m_asm.size(); i++ ) { if( i == m_asmSelected ) { sy = round( rect.Min.y + ( i - 0.5f ) / m_asm.size() * rect.GetHeight() ); } else if( m_asm[i].regData[0] != 0 ) { int flags = 0; int idx = 0; for(;;) { const auto& v = m_asm[i].regData[idx++]; if( v == 0 ) break; flags |= v & FlagMask; } uint32_t col = 0; if( ( flags & ( WriteBit | ReadBit ) ) == ( WriteBit | ReadBit ) ) col = 0xFF00FFFF; else if( flags & WriteBit ) col = 0xFF0000FF; else if( flags & ReadBit ) col = 0xFF00FF00; if( col != 0 ) { const auto ly = round( rect.Min.y + ( i - 0.5f ) / m_asm.size() * rect.GetHeight() ); DrawLine( draw, ImVec2( x0 + 0.5f, ly + 0.5f ), ImVec2( x1 + 0.5f, ly + 0.5f ), col, 3 ); } } } DrawLine( draw, ImVec2( x0 + 0.5f, sy + 0.5f ), ImVec2( x1 + 0.5f, sy + 0.5f ), 0xFFFF9900, 3 ); } } if( m_font ) ImGui::PopFont(); ImGui::EndChild(); if( !m_asmSampleSelect.empty() ) { AddrStat count = {}; uint32_t numLines = 0; for( auto& idx : m_asmSampleSelect ) { auto it = ipcount.find( m_asm[idx].addr ); if( it != ipcount.end() ) { count += it->second; numLines++; } } ImGui::BeginChild( "##asmSelect" ); if( ImGui::SmallButton( ICON_FA_TIMES ) ) { m_asmSampleSelect.clear(); m_asmGroupSelect = -1; } ImGui::SameLine(); char buf[16]; char* end; if( m_childCalls ) { end = PrintFloat( buf, buf+16, 100.f * ( count.local + count.ext ) / ( iptotal.local + iptotal.ext ), 2 ); } else if( iptotal.local != 0 ) { end = PrintFloat( buf, buf+16, 100.f * count.local / iptotal.local, 2 ); } else { end = PrintFloat( buf, buf+16, 0.f, 2 ); } memcpy( end, "%", 2 ); TextFocused( "Selected:", buf ); ImGui::SameLine(); ImGui::Spacing(); ImGui::SameLine(); if( m_cost == CostType::SampleCount ) { if( m_childCalls ) { TextFocused( "Time:", TimeToString( ( count.local + count.ext ) * worker.GetSamplingPeriod() ) ); } else { TextFocused( "Time:", TimeToString( count.local * worker.GetSamplingPeriod() ) ); } ImGui::SameLine(); ImGui::Spacing(); ImGui::SameLine(); if( m_childCalls ) { TextFocused( "Sample count:", RealToString( count.local + count.ext ) ); } else { TextFocused( "Sample count:", RealToString( count.local ) ); } } else { TextFocused( "Events:", RealToString( count.local ) ); } ImGui::SameLine(); ImGui::Spacing(); ImGui::SameLine(); TextFocused( "Lines:", RealToString( numLines ) ); ImGui::EndChild(); } return jumpOut; } static bool PrintPercentage( float val, uint32_t col = 0xFFFFFFFF ) { const auto ty = ImGui::GetFontSize(); auto draw = ImGui::GetWindowDrawList(); const auto wpos = ImGui::GetCursorScreenPos(); const auto stw = ImGui::CalcTextSize( " " ).x; const auto htw = stw / 2; const auto tw = stw * 8; char tmp[16]; auto end = PrintFloat( tmp, tmp+16, val, 2 ); memcpy( end, "%", 2 ); end++; const auto sz = end - tmp; char buf[16]; memset( buf, ' ', 7-sz ); memcpy( buf + 7 - sz, tmp, sz+1 ); draw->AddRectFilled( wpos, wpos + ImVec2( val * tw / 100, ty+1 ), 0xFF444444 ); DrawTextContrast( draw, wpos + ImVec2( htw, 0 ), col, buf ); ImGui::ItemSize( ImVec2( stw * 7, ty ), 0 ); return ImGui::IsWindowHovered() && ImGui::IsMouseHoveringRect( wpos, wpos + ImVec2( stw * 7, ty ) ); } void SourceView::RenderLine( const Tokenizer::Line& line, int lineNum, const AddrStat& ipcnt, const AddrStat& iptotal, const AddrStat& ipmax, Worker* worker, const View* view ) { const auto ts = ImGui::CalcTextSize( " " ); const auto ty = ImGui::GetFontSize(); auto draw = ImGui::GetWindowDrawList(); const auto w = std::max( m_srcWidth, ImGui::GetWindowWidth() ); const auto wpos = ImGui::GetCursorScreenPos(); const auto dpos = wpos + ImVec2( 0.5f, 0.5f ); if( m_source.idx() == m_hoveredSource && lineNum == m_hoveredLine ) { draw->AddRectFilled( wpos, wpos + ImVec2( w, ty+1 ), 0x22FFFFFF ); } else if( lineNum == m_selectedLine ) { draw->AddRectFilled( wpos, wpos + ImVec2( w, ty+1 ), 0xFF333322 ); } bool hasHwData = false; size_t cycles = 0, retired = 0, cacheRef = 0, cacheMiss = 0, branchRetired = 0, branchMiss = 0; uint32_t match = 0; if( !m_asm.empty() ) { assert( worker && view ); auto addresses = worker->GetAddressesForLocation( m_source.idx(), lineNum ); if( addresses ) { for( auto& addr : *addresses ) { if( addr >= m_baseAddr && addr < m_baseAddr + m_codeLen ) { if( !m_calcInlineStats || worker->GetInlineSymbolForAddress( addr ) == m_symAddr ) { match++; const auto hw = worker->GetHwSampleData( addr ); if( hw ) { hasHwData = true; auto& statRange = view->m_statRange; if( statRange.active ) { hw->sort(); cycles += CountHwSamples( hw->cycles, statRange ); retired += CountHwSamples( hw->retired, statRange ); cacheRef += CountHwSamples( hw->cacheRef, statRange ); cacheMiss += CountHwSamples( hw->cacheMiss, statRange ); branchRetired += CountHwSamples( hw->branchRetired, statRange ); branchMiss += CountHwSamples( hw->branchMiss, statRange ); } else { cycles += hw->cycles.size(); retired += hw->retired.size(); cacheRef += hw->cacheRef.size(); cacheMiss += hw->cacheMiss.size(); branchRetired += hw->branchRetired.size(); branchMiss += hw->branchMiss.size(); } } } } } } } bool mouseHandled = false; if( iptotal.local + iptotal.ext != 0 ) { if( ( m_childCalls && ipcnt.local + ipcnt.ext == 0 ) || ( !m_childCalls && ipcnt.local == 0 ) ) { const auto ts = ImGui::CalcTextSize( " " ); ImGui::ItemSize( ImVec2( 7 * ts.x, ts.y ) ); if( hasHwData && ImGui::IsWindowHovered() && ImGui::IsMouseHoveringRect( wpos, wpos + ImVec2( ts.x * 7, ty ) ) ) { if( m_font ) ImGui::PopFont(); ImGui::BeginTooltip(); PrintHwSampleTooltip( cycles, retired, cacheRef, cacheMiss, branchRetired, branchMiss, true ); ImGui::EndTooltip(); if( m_font ) ImGui::PushFont( m_font ); } } else { auto sit = m_srcSampleSelect.find( lineNum ); bool hover; if( m_childCalls ) { hover = PrintPercentage( 100.f * ( ipcnt.local + ipcnt.ext ) / ( iptotal.local + iptotal.ext ), sit == m_srcSampleSelect.end() ? 0xFFFFFFFF : 0xFF8888FF ); } else { hover = PrintPercentage( 100.f * ipcnt.local / iptotal.local, sit == m_srcSampleSelect.end() ? 0xFFFFFFFF : 0xFF8888FF ); } if( hover ) { if( m_font ) ImGui::PopFont(); ImGui::BeginTooltip(); if( ipcnt.local ) { if( m_cost == CostType::SampleCount ) { if( worker ) TextFocused( "Local time:", TimeToString( ipcnt.local * worker->GetSamplingPeriod() ) ); TextFocused( "Local samples:", RealToString( ipcnt.local ) ); } else { TextFocused( "Events:", RealToString( ipcnt.local ) ); } } if( ipcnt.ext ) { if( worker ) TextFocused( "Child time:", TimeToString( ipcnt.ext * worker->GetSamplingPeriod() ) ); TextFocused( "Child samples:", RealToString( ipcnt.ext ) ); } if( hasHwData ) PrintHwSampleTooltip( cycles, retired, cacheRef, cacheMiss, branchRetired, branchMiss, false ); ImGui::EndTooltip(); if( m_font ) ImGui::PushFont( m_font ); if( ImGui::IsMouseClicked( 0 ) ) { mouseHandled = true; auto& io = ImGui::GetIO(); if( io.KeyCtrl ) { m_srcGroupSelect = lineNum; if( sit == m_srcSampleSelect.end() ) { m_srcSampleSelect.emplace( lineNum ); } else { m_srcSampleSelect.erase( sit ); } } else if( io.KeyShift ) { m_srcSampleSelect.clear(); if( m_srcGroupSelect == -1 ) { m_srcGroupSelect = lineNum; m_srcSampleSelect.insert( lineNum ); } else { if( lineNum < m_srcGroupSelect ) { for( int i=lineNum; i<=m_srcGroupSelect; i++ ) { m_srcSampleSelect.insert( i ); } } else { for( int i=m_srcGroupSelect; i<=lineNum; i++ ) { m_srcSampleSelect.insert( i ); } } } } else { m_srcSampleSelect.clear(); m_srcSampleSelect.insert( lineNum ); m_srcGroupSelect = lineNum; } } else if( ImGui::IsMouseClicked( 1 ) ) { mouseHandled = true; m_srcSampleSelect.clear(); m_srcGroupSelect = -1; } } uint32_t col, glow; if( m_childCalls ) { col = GetHotnessColor( ipcnt.local + ipcnt.ext, ipmax.local + ipmax.ext ); glow = GetHotnessGlow( ipcnt.local + ipcnt.ext, ipmax.local + ipmax.ext ); } else { col = GetHotnessColor( ipcnt.local, ipmax.local ); glow = GetHotnessGlow( ipcnt.local, ipmax.local ); } if( glow ) { DrawLine( draw, dpos + ImVec2( 1, 1 ), dpos + ImVec2( 1, ty-2 ), glow ); DrawLine( draw, dpos + ImVec2( -1, 1 ), dpos + ImVec2( -1, ty-2 ), glow ); } DrawLine( draw, dpos + ImVec2( 0, 1 ), dpos + ImVec2( 0, ty-2 ), col ); } ImGui::SameLine( 0, ty ); } const bool showHwSamples = worker && m_hwSamples && worker->GetHwSampleCountAddress() != 0; if( showHwSamples ) { if( hasHwData ) { RenderHwLinePart( cycles, retired, branchRetired, branchMiss, cacheRef, cacheMiss, ts ); } else { ImGui::ItemSize( ImVec2( 19 * ts.x, ts.y ) ); } ImGui::SameLine( 0, ty ); } const auto lineCount = m_source.get().size(); const auto tmp = RealToString( lineCount ); const auto maxLine = strlen( tmp ); const auto lineString = RealToString( lineNum ); const auto linesz = strlen( lineString ); char buf[16]; memset( buf, ' ', maxLine - linesz ); memcpy( buf + maxLine - linesz, lineString, linesz+1 ); TextDisabledUnformatted( buf ); ImGui::SameLine( 0, ty ); if( !m_asm.empty() ) { const auto tmp = RealToString( m_asm.size() ); const auto maxAsm = strlen( tmp ) + 1; if( match > 0 ) { const auto asmString = RealToString( match ); sprintf( buf, "@%s", asmString ); const auto asmsz = strlen( buf ); TextDisabledUnformatted( buf ); ImGui::SameLine( 0, 0 ); ImGui::ItemSize( ImVec2( ts.x * ( maxAsm - asmsz ), ty ), 0 ); } else { ImGui::ItemSize( ImVec2( ts.x * maxAsm, ty ), 0 ); } } ImGui::SameLine( 0, ty ); auto ptr = line.begin; auto it = line.tokens.begin(); while( ptr < line.end ) { if( it == line.tokens.end() ) { ImGui::TextUnformatted( ptr, line.end ); ImGui::SameLine( 0, 0 ); break; } if( ptr < it->begin ) { ImGui::TextUnformatted( ptr, it->begin ); ImGui::SameLine( 0, 0 ); } TextColoredUnformatted( SyntaxColors[(int)it->color], it->begin, it->end ); ImGui::SameLine( 0, 0 ); ptr = it->end; ++it; } ImGui::ItemSize( ImVec2( 0, 0 ), 0 ); if( match > 0 && ImGui::IsWindowHovered() && ImGui::IsMouseHoveringRect( wpos, wpos + ImVec2( w, ty+1 ) ) ) { draw->AddRectFilled( wpos, wpos + ImVec2( w, ty+1 ), 0x11FFFFFF ); if( !mouseHandled && ( ImGui::IsMouseClicked( 0 ) || ImGui::IsMouseClicked( 1 ) ) ) { m_displayMode = DisplayMixed; SelectLine( lineNum, worker, ImGui::IsMouseClicked( 1 ) ); } else { SelectAsmLinesHover( m_source.idx(), lineNum, *worker ); } } DrawLine( draw, dpos + ImVec2( 0, ty+2 ), dpos + ImVec2( w, ty+2 ), 0x08FFFFFF ); } void SourceView::RenderAsmLine( AsmLine& line, const AddrStat& ipcnt, const AddrStat& iptotal, const AddrStat& ipmax, Worker& worker, uint64_t& jumpOut, int maxAddrLen, View& view ) { const auto ty = ImGui::GetFontSize(); auto draw = ImGui::GetWindowDrawList(); const auto w = std::max( m_asmWidth, ImGui::GetWindowWidth() ); const auto wpos = ImGui::GetCursorScreenPos(); const auto dpos = wpos + ImVec2( 0.5f, 0.5f ); if( m_selectedAddressesHover.find( line.addr ) != m_selectedAddressesHover.end() ) { draw->AddRectFilled( wpos, wpos + ImVec2( w, ty+1 ), 0x22FFFFFF ); } else if( m_selectedAddresses.find( line.addr ) != m_selectedAddresses.end() ) { draw->AddRectFilled( wpos, wpos + ImVec2( w, ty+1 ), 0xFF333322 ); } if( line.addr == m_highlightAddr ) { draw->AddRectFilled( wpos, wpos + ImVec2( w, ty+1 ), 0xFF222233 ); } const auto asmIdx = &line - m_asm.data(); const auto hw = worker.GetHwSampleData( line.addr ); size_t cycles = 0, retired = 0, cacheRef = 0, cacheMiss = 0, branchRetired = 0, branchMiss = 0; if( hw && ( !m_calcInlineStats || worker.GetInlineSymbolForAddress( line.addr ) == m_symAddr ) ) { if( view.m_statRange.active ) { hw->sort(); cycles = CountHwSamples( hw->cycles, view.m_statRange ); retired = CountHwSamples( hw->retired, view.m_statRange ); cacheRef = CountHwSamples( hw->cacheRef, view.m_statRange ); cacheMiss = CountHwSamples( hw->cacheMiss, view.m_statRange ); branchRetired = CountHwSamples( hw->branchRetired, view.m_statRange ); branchMiss = CountHwSamples( hw->branchMiss, view.m_statRange ); } else { cycles = hw->cycles.size(); retired = hw->retired.size(); cacheRef = hw->cacheRef.size(); cacheMiss = hw->cacheMiss.size(); branchRetired = hw->branchRetired.size(); branchMiss = hw->branchMiss.size(); } } const auto ts = ImGui::CalcTextSize( " " ); if( iptotal.local + iptotal.ext != 0 ) { if( ( m_childCalls && ipcnt.local + ipcnt.ext == 0 ) || ( !m_childCalls && ipcnt.local == 0 ) ) { ImGui::ItemSize( ImVec2( 7 * ts.x, ts.y ) ); if( hw && ImGui::IsWindowHovered() && ImGui::IsMouseHoveringRect( wpos, wpos + ImVec2( ts.x * 7, ty ) ) ) { if( m_font ) ImGui::PopFont(); ImGui::BeginTooltip(); PrintHwSampleTooltip( cycles, retired, cacheRef, cacheMiss, branchRetired, branchMiss, true ); ImGui::EndTooltip(); if( m_font ) ImGui::PushFont( m_font ); } } else { const auto idx = &line - m_asm.data(); auto sit = m_asmSampleSelect.find( idx ); bool hover; if( m_childCalls ) { hover = PrintPercentage( 100.f * ( ipcnt.local + ipcnt.ext ) / ( iptotal.local + iptotal.ext ), sit == m_asmSampleSelect.end() ? 0xFFFFFFFF : 0xFF8888FF ); } else { hover = PrintPercentage( 100.f * ipcnt.local / iptotal.local, sit == m_asmSampleSelect.end() ? 0xFFFFFFFF : 0xFF8888FF ); } if( hover ) { uint64_t symAddrParents = m_baseAddr; auto inlineList = worker.GetInlineSymbolList( m_baseAddr, m_codeLen ); if( inlineList ) { const auto cfi = worker.PackPointer( line.addr ); const auto symEnd = m_baseAddr + m_codeLen; while( *inlineList < symEnd ) { auto ipmap = worker.GetSymbolInstructionPointers( *inlineList ); if( ipmap ) { if( ipmap->find( cfi ) != ipmap->end() ) { symAddrParents = *inlineList; break; } } inlineList++; } } if( m_font ) ImGui::PopFont(); ImGui::BeginTooltip(); if( ipcnt.local ) { if( m_cost == CostType::SampleCount ) { TextFocused( "Local time:", TimeToString( ipcnt.local * worker.GetSamplingPeriod() ) ); TextFocused( "Local samples:", RealToString( ipcnt.local ) ); } else { TextFocused( "Events:", RealToString( ipcnt.local ) ); } } if( ipcnt.ext ) { TextFocused( "Child time:", TimeToString( ipcnt.ext * worker.GetSamplingPeriod() ) ); TextFocused( "Child samples:", RealToString( ipcnt.ext ) ); } if( hw ) PrintHwSampleTooltip( cycles, retired, cacheRef, cacheMiss, branchRetired, branchMiss, false ); const auto& stats = *worker.GetSymbolStats( symAddrParents ); if( !stats.parents.empty() ) { ImGui::Separator(); TextFocused( "Entry call stacks:", RealToString( stats.parents.size() ) ); ImGui::SameLine(); TextDisabledUnformatted( "(middle click to view)" ); } ImGui::EndTooltip(); if( m_font ) ImGui::PushFont( m_font ); if( ImGui::IsMouseClicked( 0 ) ) { auto& io = ImGui::GetIO(); if( io.KeyCtrl ) { m_asmGroupSelect = idx; if( sit == m_asmSampleSelect.end() ) { m_asmSampleSelect.emplace( idx ); } else { m_asmSampleSelect.erase( sit ); } } else if( io.KeyShift ) { m_asmSampleSelect.clear(); if( m_asmGroupSelect == -1 ) { m_asmGroupSelect = idx; m_asmSampleSelect.insert( idx ); } else { if( idx < m_asmGroupSelect ) { for( int i=idx; i<=m_asmGroupSelect; i++ ) { m_asmSampleSelect.insert( i ); } } else { for( int i=m_asmGroupSelect; i<=idx; i++ ) { m_asmSampleSelect.insert( i ); } } } } else { m_asmSampleSelect.clear(); m_asmSampleSelect.insert( idx ); m_asmGroupSelect = idx; } } else if( ImGui::IsMouseClicked( 1 ) ) { m_asmSampleSelect.clear(); m_asmGroupSelect = -1; } else if( !stats.parents.empty() && ImGui::IsMouseClicked( 2 ) ) { view.ShowSampleParents( symAddrParents ); } } uint32_t col, glow; if( m_childCalls ) { col = GetHotnessColor( ipcnt.local + ipcnt.ext, ipmax.local + ipmax.ext ); glow = GetHotnessGlow( ipcnt.local + ipcnt.ext, ipmax.local + ipmax.ext ); } else { col = GetHotnessColor( ipcnt.local, ipmax.local ); glow = GetHotnessGlow( ipcnt.local, ipmax.local ); } if( glow ) { DrawLine( draw, dpos + ImVec2( 1, 1 ), dpos + ImVec2( 1, ty-2 ), glow ); DrawLine( draw, dpos + ImVec2( -1, 1 ), dpos + ImVec2( -1, ty-2 ), glow ); } DrawLine( draw, dpos + ImVec2( 0, 1 ), dpos + ImVec2( 0, ty-2 ), col ); } ImGui::SameLine( 0, ty ); } const bool showHwSamples = m_hwSamples && worker.GetHwSampleCountAddress() != 0; if( showHwSamples ) { if( hw ) { RenderHwLinePart( cycles, retired, branchRetired, branchMiss, cacheRef, cacheMiss, ts ); } else { ImGui::ItemSize( ImVec2( 19 * ts.x, ts.y ) ); } ImGui::SameLine( 0, ty ); } char buf[256]; if( m_asmCountBase >= 0 ) { sprintf( buf, "[%i]", int( asmIdx - m_asmCountBase ) ); } else if( m_asmRelative ) { sprintf( buf, "+%" PRIu64, line.addr - m_baseAddr ); } else { sprintf( buf, "%" PRIx64, line.addr ); } const auto asz = strlen( buf ); memset( buf+asz, ' ', maxAddrLen-asz ); buf[maxAddrLen] = '\0'; if( m_asmCountBase >= 0 ) { TextColoredUnformatted( asmIdx - m_asmCountBase < 0 ? 0xFFBB6666 : 0xFF66BBBB, buf ); } else { TextDisabledUnformatted( buf ); } if( ImGui::IsItemHovered() ) { if( m_font ) ImGui::PopFont(); ImGui::BeginTooltip(); if( m_asmCountBase >= 0 ) { TextDisabledUnformatted( "Absolute address:" ); ImGui::SameLine(); ImGui::Text( "%" PRIx64, line.addr ); TextDisabledUnformatted( "Relative address:" ); ImGui::SameLine(); ImGui::Text( "+%" PRIx64, line.addr - m_baseAddr ); } else if( m_asmRelative ) { TextDisabledUnformatted( "Absolute address:" ); ImGui::SameLine(); ImGui::Text( "%" PRIx64, line.addr ); } else { TextDisabledUnformatted( "Relative address:" ); ImGui::SameLine(); ImGui::Text( "+%" PRIx64, line.addr - m_baseAddr ); } ImGui::EndTooltip(); if( m_font ) ImGui::PushFont( m_font ); if( ImGui::IsItemClicked( 0 ) ) { m_asmCountBase = asmIdx; } else if( ImGui::IsItemClicked( 1 ) ) { m_asmCountBase = -1; } } const auto stw = ImGui::CalcTextSize( " " ).x; bool lineHovered = false; if( m_asmShowSourceLocation && !m_sourceFiles.empty() ) { ImGui::SameLine(); uint32_t srcline; const auto srcidx = worker.GetLocationForAddress( line.addr, srcline ); if( srcline != 0 ) { const auto fileName = worker.GetString( srcidx ); const auto fileColor = GetHsvColor( srcidx.Idx(), 0 ); SmallColorBox( fileColor ); ImGui::SameLine(); char buf[64]; const auto fnsz = strlen( fileName ); if( fnsz < 30 - m_maxLine ) { sprintf( buf, "%s:%i", fileName, srcline ); } else { sprintf( buf, "...%s:%i", fileName+fnsz-(30-3-1-m_maxLine), srcline ); } const auto bufsz = strlen( buf ); TextDisabledUnformatted( buf ); if( ImGui::IsItemHovered() ) { lineHovered = true; if( m_font ) ImGui::PopFont(); ImGui::BeginTooltip(); if( worker.HasInlineSymbolAddresses() ) { const auto symAddr = worker.GetInlineSymbolForAddress( line.addr ); if( symAddr != 0 ) { const auto symData = worker.GetSymbolData( symAddr ); if( symData ) { TextFocused( "Function:", worker.GetString( symData->name ) ); ImGui::SameLine(); ImGui::TextDisabled( "(0x%" PRIx64 ")", symAddr ); } } } TextFocused( "File:", fileName ); TextFocused( "Line:", RealToString( srcline ) ); if( SourceFileValid( fileName, worker.GetCaptureTime(), view, worker ) ) { m_sourceTooltip.Parse( fileName, worker, view ); if( !m_sourceTooltip.empty() ) { ImGui::Separator(); if( m_font ) ImGui::PushFont( m_font ); auto& lines = m_sourceTooltip.get(); const int start = std::max( 0, (int)srcline - 4 ); const int end = std::min( m_sourceTooltip.get().size(), srcline + 3 ); bool first = true; int bottomEmpty = 0; for( int i=start; i 0 ) { ImGui::TextUnformatted( "" ); bottomEmpty--; } auto ptr = line.begin; auto it = line.tokens.begin(); while( ptr < line.end ) { if( it == line.tokens.end() ) { ImGui::TextUnformatted( ptr, line.end ); ImGui::SameLine( 0, 0 ); break; } if( ptr < it->begin ) { ImGui::TextUnformatted( ptr, it->begin ); ImGui::SameLine( 0, 0 ); } TextColoredUnformatted( i == srcline-1 ? SyntaxColors[(int)it->color] : SyntaxColorsDimmed[(int)it->color], it->begin, it->end ); ImGui::SameLine( 0, 0 ); ptr = it->end; ++it; } ImGui::ItemSize( ImVec2( 0, 0 ), 0 ); } } if( m_font ) ImGui::PopFont(); } } ImGui::EndTooltip(); if( m_font ) ImGui::PushFont( m_font ); if( ImGui::IsItemClicked( 0 ) || ImGui::IsItemClicked( 1 ) ) { if( m_source.filename() == fileName ) { if( ImGui::IsMouseClicked( 1 ) ) m_targetLine = srcline; SelectLine( srcline, &worker, false ); m_displayMode = DisplayMixed; } else if( SourceFileValid( fileName, worker.GetCaptureTime(), view, worker ) ) { ParseSource( fileName, worker, view ); m_targetLine = srcline; SelectLine( srcline, &worker, false ); SelectViewMode(); } else { SelectAsmLines( srcidx.Idx(), srcline, worker, false ); } } else { m_hoveredLine = srcline; m_hoveredSource = srcidx.Idx(); } } ImGui::SameLine( 0, 0 ); ImGui::ItemSize( ImVec2( stw * ( 32 - bufsz ), ty ), 0 ); } else { SmallColorBox( 0 ); ImGui::SameLine(); TextDisabledUnformatted( "[unknown]" ); ImGui::SameLine( 0, 0 ); ImGui::ItemSize( ImVec2( stw * 23, ty ), 0 ); } } if( m_asmBytes ) { auto code = (const uint8_t*)worker.GetSymbolCode( m_baseAddr, m_codeLen ); assert( code ); char tmp[64]; const auto len = PrintHexBytes( tmp, code + line.addr - m_baseAddr, line.len, worker.GetCpuArch() ); ImGui::SameLine(); TextColoredUnformatted( ImVec4( 0.5, 0.5, 1, 1 ), tmp ); ImGui::SameLine( 0, 0 ); ImGui::ItemSize( ImVec2( stw * ( m_maxAsmBytes*3 - len ), ty ), 0 ); } if( m_showJumps ) { const auto JumpArrow = JumpArrowBase * ty / 15; ImGui::SameLine( 0, 2*ty + JumpArrow + m_maxJumpLevel * JumpSeparation ); auto jit = m_jumpOut.find( line.addr ); if( jit != m_jumpOut.end() ) { const auto th2 = floor( ts.y / 2 ); const auto th4 = floor( ts.y / 4 ); const auto& mjl = m_maxJumpLevel; const auto col = GetHsvColor( line.jumpAddr, 6 ); const auto xoff = ( ( iptotal.local + iptotal.ext == 0 ) ? 0 : ( 7 * ts.x + ts.y ) ) + (3+maxAddrLen) * ts.x + ( ( m_asmShowSourceLocation && !m_sourceFiles.empty() ) ? 36 * ts.x : 0 ) + ( m_asmBytes ? m_maxAsmBytes*3 * ts.x : 0 ) + ( showHwSamples ? ( 19 * ts.x + ts.y ) : 0 ); DrawLine( draw, dpos + ImVec2( xoff + JumpSeparation * mjl + th2, th2 ), dpos + ImVec2( xoff + JumpSeparation * mjl + th2 + JumpArrow / 2, th2 ), col ); DrawLine( draw, dpos + ImVec2( xoff + JumpSeparation * mjl + th2, th2 ), dpos + ImVec2( xoff + JumpSeparation * mjl + th2 + th4, th2 - th4 ), col ); DrawLine( draw, dpos + ImVec2( xoff + JumpSeparation * mjl + th2, th2 ), dpos + ImVec2( xoff + JumpSeparation * mjl + th2 + th4, th2 + th4 ), col ); } } else { ImGui::SameLine( 0, ty ); } int opdesc = 0; const AsmVar* asmVar = nullptr; if( !m_atnt && ( m_cpuArch == CpuArchX64 || m_cpuArch == CpuArchX86 ) ) { auto uarch = MicroArchitectureData[m_idxMicroArch]; char tmp[32]; for( size_t i=0; i= 'a' && c <= 'z' ) c = c - 'a' + 'A'; tmp[i] = c; } tmp[line.mnemonic.size()] = '\0'; const char* mnemonic = tmp; if( strcmp( mnemonic, "LEA" ) == 0 ) { static constexpr const char* LeaTable[] = { "LEA", "LEA_B", "LEA_BD", "LEA_BI", "LEA_BID", "LEA_D", "LEA_I", "LEA_ID", "LEA_R", "LEA_RD" }; mnemonic = LeaTable[(int)line.leaData]; } auto it = m_microArchOpMap.find( mnemonic ); if( it != m_microArchOpMap.end() ) { const auto opid = it->second; auto oit = std::lower_bound( uarch->ops, uarch->ops + uarch->numOps, opid, []( const auto& l, const auto& r ) { return l->id < r; } ); if( oit != uarch->ops + uarch->numOps && (*oit)->id == opid ) { const auto& op = *oit; opdesc = op->descId; std::vector> res; res.reserve( op->numVariants ); for( int i=0; inumVariants; i++ ) { const auto& var = *op->variant[i]; if( var.descNum == (int)line.params.size() ) { int penalty = 0; bool match = true; for( int j=0; jvariant[res[0].first]; } } } } if( m_showLatency && asmVar && asmVar->minlat >= 0 ) { const auto pos = ImVec2( (int)ImGui::GetCursorScreenPos().x, (int)ImGui::GetCursorScreenPos().y ); const auto ty = ImGui::GetFontSize(); if( asmVar->minlat == 0 ) { DrawLine( draw, pos + ImVec2( 0.5f, -0.5f ), pos + ImVec2( 0.5f, ty + 0.5f ), 0x660000FF ); } else { draw->AddRectFilled( pos, pos + ImVec2( ty * asmVar->minlat + 1, ty + 1 ), 0x660000FF ); } if( asmVar->minlat != asmVar->maxlat ) { draw->AddRectFilled( pos + ImVec2( ty * asmVar->minlat + 1, 0 ), pos + ImVec2( ty * asmVar->maxlat + 1, ty + 1 ), 0x5500FFFF ); } } const auto msz = line.mnemonic.size(); memcpy( buf, line.mnemonic.c_str(), msz ); memset( buf+msz, ' ', m_maxMnemonicLen-msz ); bool hasJump = false; if( line.jumpAddr != 0 ) { auto lit = m_locMap.find( line.jumpAddr ); if( lit != m_locMap.end() ) { char tmp[64]; sprintf( tmp, ".L%" PRIu32, lit->second ); strcpy( buf+m_maxMnemonicLen, tmp ); hasJump = true; } } if( !hasJump ) { memcpy( buf+m_maxMnemonicLen, line.operands.c_str(), line.operands.size() + 1 ); } const bool isInContext = !m_calcInlineStats || !worker.HasInlineSymbolAddresses() || worker.GetInlineSymbolForAddress( line.addr ) == m_symAddr; if( asmIdx == m_asmSelected ) { TextColoredUnformatted( ImVec4( 1, 0.25f, 0.25f, isInContext ? 1.f : 0.5f ), buf ); } else if( line.regData[0] != 0 ) { bool hasDepencency = false; int idx = 0; for(;;) { if( line.regData[idx] == 0 ) break; if( line.regData[idx] & ( WriteBit | ReadBit ) ) { hasDepencency = true; break; } idx++; } if( hasDepencency ) { TextColoredUnformatted( ImVec4( 1, 0.5f, 1, isInContext ? 1.f : 0.5f ), buf ); } else { if( isInContext ) { ImGui::TextUnformatted( buf ); } else { TextDisabledUnformatted( buf ); } } } else { if( isInContext ) { ImGui::TextUnformatted( buf ); } else { TextDisabledUnformatted( buf ); } } uint32_t jumpOffset; uint64_t jumpBase; const char* jumpName = nullptr; if( line.jumpAddr != 0 ) { jumpOffset = 0; jumpBase = worker.GetSymbolForAddress( line.jumpAddr, jumpOffset ); auto jumpSym = jumpBase == 0 ? worker.GetSymbolData( line.jumpAddr ) : worker.GetSymbolData( jumpBase ); if( jumpSym ) jumpName = worker.GetString( jumpSym->name ); } if( ImGui::IsItemHovered() ) { if( asmVar ) { const auto& var = *asmVar; if( m_font ) ImGui::PopFont(); ImGui::BeginTooltip(); if( jumpName || opdesc != 0 ) { if( opdesc != 0 ) ImGui::TextUnformatted( OpDescList[opdesc] ); if( jumpName ) { if( jumpBase == m_baseAddr ) { TextDisabledUnformatted( "Local target:" ); } else { TextDisabledUnformatted( "External target:" ); } ImGui::SameLine(); ImGui::Text( "%s+%" PRIu32, jumpName, jumpOffset ); } ImGui::Separator(); } TextFocused( "Throughput:", RealToString( var.tp ) ); ImGui::SameLine(); TextDisabledUnformatted( "(cycles per instruction, lower is better)" ); if( var.maxlat >= 0 ) { bool exact = false; TextDisabledUnformatted( "Latency:" ); ImGui::SameLine(); if( var.minlat == var.maxlat && var.minbound == var.maxbound ) { if( var.minbound ) { ImGui::Text( "\xe2\x89\xa4%s", RealToString( var.minlat ) ); } else { ImGui::TextUnformatted( RealToString( var.minlat ) ); exact = true; } } else { if( var.minbound ) { ImGui::Text( "[\xe2\x89\xa4%s", RealToString( var.minlat ) ); } else { ImGui::Text( "[%s", RealToString( var.minlat ) ); } ImGui::SameLine( 0, 0 ); if( var.maxbound ) { ImGui::Text( " \xE2\x80\x93 \xe2\x89\xa4%s]", RealToString( var.maxlat ) ); } else { ImGui::Text( " \xE2\x80\x93 %s]", RealToString( var.maxlat ) ); } } ImGui::SameLine(); if( exact ) { TextDisabledUnformatted( "(cycles in execution)" ); } else { TextDisabledUnformatted( "(cycles in execution, may vary by used output)" ); } } TextFocused( "\xce\xbcops:", RealToString( var.uops ) ); if( var.port != -1 ) TextFocused( "Ports:", PortList[var.port] ); ImGui::Separator(); TextFocused( "ISA set:", IsaList[var.isaSet] ); if( var.descNum > 0 ) { TextDisabledUnformatted( "Operands:" ); ImGui::SameLine(); bool first = true; for( int i=0; isecond ); } if( line.regData[0] != 0 ) { if( !line.params.empty() ) { ImGui::SameLine(); ImGui::Spacing(); ImGui::SameLine(); } else { ImGui::SameLine( 0, 0 ); } TextColoredUnformatted( ImVec4( 0.5f, 0.5, 1, 1 ), "{" ); ImGui::SameLine( 0, 0 ); int idx = 0; for(;;) { ImVec4 col; if( line.regData[idx] == 0 ) break; if( ( line.regData[idx] & ( WriteBit | ReadBit ) ) == ( WriteBit | ReadBit ) ) col = ImVec4( 1, 1, 0.5f, 1 ); else if( line.regData[idx] & WriteBit ) col = ImVec4( 1, 0.5f, 0.5f, 1 ); else if( line.regData[idx] & ReadBit ) col = ImVec4( 0.5f, 1, 0.5f, 1 ); else col = ImVec4( 0.5f, 0.5f, 0.5f, 1 ); if( idx > 0 ) { ImGui::SameLine( 0, 0 ); TextColoredUnformatted( ImVec4( 0.5f, 0.5, 1, 1 ), ", " ); ImGui::SameLine( 0, 0 ); } TextColoredUnformatted( col, s_regNameX86[line.regData[idx] & RegMask] ); if( ImGui::IsItemHovered() ) { ImGui::BeginTooltip(); if( ( line.regData[idx] & ( WriteBit | ReadBit ) ) == ( WriteBit | ReadBit ) ) ImGui::TextUnformatted( "Read and write" ); else if( line.regData[idx] & WriteBit ) ImGui::TextUnformatted( "Write" ); else if( line.regData[idx] & ReadBit ) ImGui::TextUnformatted( "Read" ); else ImGui::TextUnformatted( "Previous read" ); ImGui::EndTooltip(); } idx++; } ImGui::SameLine( 0, 0 ); TextColoredUnformatted( ImVec4( 0.5f, 0.5, 1, 1 ), "}" ); } if( jumpName ) { ImGui::SameLine(); ImGui::Spacing(); ImGui::SameLine(); if( jumpBase == m_baseAddr ) { ImGui::TextDisabled( "-> [%s+%" PRIu32"]", jumpName, jumpOffset ); if( ImGui::IsItemHovered() ) { m_highlightAddr = line.jumpAddr; if( ImGui::IsItemClicked() ) { m_targetAddr = line.jumpAddr; m_selectedAddresses.clear(); m_selectedAddresses.emplace( line.jumpAddr ); } } } else { ImGui::TextDisabled( "[%s+%" PRIu32"]", jumpName, jumpOffset ); if( ImGui::IsItemClicked() ) jumpOut = line.jumpAddr; } } if( lineHovered ) { draw->AddRectFilled( wpos, wpos + ImVec2( w, ty+1 ), 0x11FFFFFF ); } DrawLine( draw, dpos + ImVec2( 0, ty+2 ), dpos + ImVec2( w, ty+2 ), 0x08FFFFFF ); } void SourceView::RenderHwLinePart( size_t cycles, size_t retired, size_t branchRetired, size_t branchMiss, size_t cacheRef, size_t cacheMiss, const ImVec2& ts ) { if( cycles ) { const bool unreliable = cycles < 10 || retired < 10; const float ipc = float( retired ) / cycles; uint32_t col = unreliable ? 0x44FFFFFF : GetGoodnessColor( ipc * 0.25f ); if( ipc >= 10 ) { TextColoredUnformatted( col, " 10+ " ); } else { char buf[16]; *buf = ' '; const auto end = PrintFloat( buf+1, buf+16, ipc, 2 ); assert( end == buf + 5 ); memcpy( end, " ", 3 ); TextColoredUnformatted( col, buf ); } if( ImGui::IsItemHovered() ) { if( m_font ) ImGui::PopFont(); ImGui::BeginTooltip(); ImGui::TextUnformatted( "Instructions Per Cycle (IPC)" ); ImGui::SameLine(); TextDisabledUnformatted( "Higher is better" ); ImGui::Separator(); TextFocused( "Cycles:", RealToString( cycles ) ); TextFocused( "Retirements:", RealToString( retired ) ); if( unreliable ) TextColoredUnformatted( 0xFF4444FF, "Not enough samples for reliable data!" ); ImGui::EndTooltip(); if( m_font ) ImGui::PushFont( m_font ); } } else { ImGui::ItemSize( ImVec2( 7 * ts.x, ts.y ) ); } ImGui::SameLine( 0, 0 ); if( branchRetired ) { const bool unreliable = branchRetired < 10; const float rate = float( branchMiss ) / branchRetired; uint32_t col = unreliable ? 0x44FFFFFF : GetGoodnessColor( 1.f - rate * 3.f ); if( branchMiss == 0 ) { TextColoredUnformatted( col, " 0% " ); } else if( rate >= 1.f ) { TextColoredUnformatted( col, " 100% " ); } else { char buf[16]; if( rate >= 0.1f ) { const auto end = PrintFloat( buf, buf+16, rate * 100, 1 ); assert( end == buf+4 ); } else { *buf = ' '; const auto end = PrintFloat( buf+1, buf+16, rate * 100, 1 ); assert( end == buf+4 ); } memcpy( buf+4, "% ", 4 ); TextColoredUnformatted( col, buf ); } if( ImGui::IsItemHovered() ) { if( m_font ) ImGui::PopFont(); ImGui::BeginTooltip(); ImGui::TextUnformatted( "Branch mispredictions rate" ); ImGui::SameLine(); TextDisabledUnformatted( "Lower is better" ); ImGui::Separator(); TextFocused( "Retired branches:", RealToString( branchRetired ) ); TextFocused( "Branch mispredictions:", RealToString( branchMiss ) ); if( unreliable ) TextColoredUnformatted( 0xFF4444FF, "Not enough samples for reliable data!" ); ImGui::EndTooltip(); if( m_font ) ImGui::PushFont( m_font ); } } else { ImGui::ItemSize( ImVec2( 7 * ts.x, ts.y ) ); } ImGui::SameLine( 0, 0 ); if( cacheRef ) { const bool unreliable = cacheRef < 10; const float rate = float( cacheMiss ) / cacheRef; uint32_t col = unreliable ? 0x44FFFFFF : GetGoodnessColor( 1.f - rate * 3.f ); if( cacheMiss == 0 ) { TextColoredUnformatted( col, " 0%" ); } else if( rate >= 1.f ) { TextColoredUnformatted( col, " 100%" ); } else { char buf[16]; if( rate >= 0.1f ) { const auto end = PrintFloat( buf, buf+16, rate * 100, 1 ); assert( end == buf+4 ); } else { *buf = ' '; const auto end = PrintFloat( buf+1, buf+16, rate * 100, 1 ); assert( end == buf+4 ); } memcpy( buf+4, "%", 2 ); TextColoredUnformatted( col, buf ); } if( ImGui::IsItemHovered() ) { if( m_font ) ImGui::PopFont(); ImGui::BeginTooltip(); ImGui::TextUnformatted( "Cache miss rate" ); ImGui::SameLine(); TextDisabledUnformatted( "Lower is better" ); ImGui::Separator(); TextFocused( "Cache references:", RealToString( cacheRef ) ); TextFocused( "Cache misses:", RealToString( cacheMiss ) ); if( unreliable ) TextColoredUnformatted( 0xFF4444FF, "Not enough samples for reliable data!" ); ImGui::EndTooltip(); if( m_font ) ImGui::PushFont( m_font ); } } else { ImGui::ItemSize( ImVec2( 5 * ts.x, ts.y ) ); } } void SourceView::SelectLine( uint32_t line, const Worker* worker, bool changeAsmLine, uint64_t targetAddr ) { m_selectedLine = line; if( m_symAddr == 0 ) return; assert( worker ); SelectAsmLines( m_source.idx(), line, *worker, changeAsmLine, targetAddr ); } void SourceView::SelectAsmLines( uint32_t file, uint32_t line, const Worker& worker, bool changeAsmLine, uint64_t targetAddr ) { m_selectedAddresses.clear(); auto addresses = worker.GetAddressesForLocation( file, line ); if( addresses ) { const auto& addr = *addresses; if( changeAsmLine ) { if( targetAddr != 0 ) { m_targetAddr = targetAddr; } else { for( auto& v : addr ) { if( v >= m_baseAddr && v < m_baseAddr + m_codeLen ) { m_targetAddr = v; break; } } } } for( auto& v : addr ) { if( v >= m_baseAddr && v < m_baseAddr + m_codeLen ) { m_selectedAddresses.emplace( v ); } } } } void SourceView::SelectAsmLinesHover( uint32_t file, uint32_t line, const Worker& worker ) { assert( m_selectedAddressesHover.empty() ); auto addresses = worker.GetAddressesForLocation( file, line ); if( addresses ) { for( auto& v : *addresses ) { if( v >= m_baseAddr && v < m_baseAddr + m_codeLen ) { m_selectedAddressesHover.emplace( v ); } } } } void SourceView::GatherIpHwStats( AddrStat& iptotalSrc, AddrStat& iptotalAsm, unordered_flat_map& ipcountSrc, unordered_flat_map& ipcountAsm, AddrStat& ipmaxSrc, AddrStat& ipmaxAsm, Worker& worker, bool limitView, const View& view ) { auto filename = m_source.filename(); for( auto& v : m_asm ) { const auto& addr = v.addr; if( m_calcInlineStats && worker.GetInlineSymbolForAddress( addr ) != m_symAddr ) continue; const auto hw = worker.GetHwSampleData( addr ); if( !hw ) continue; uint64_t stat; if( view.m_statRange.active ) { switch( m_cost ) { case CostType::Cycles: stat = CountHwSamples( hw->cycles, view.m_statRange ); break; case CostType::Retirements: stat = CountHwSamples( hw->retired, view.m_statRange ); break; case CostType::BranchesTaken: stat = CountHwSamples( hw->branchRetired, view.m_statRange ); break; case CostType::BranchMiss: stat = CountHwSamples( hw->branchMiss, view.m_statRange ); break; case CostType::SlowBranches: stat = sqrt( CountHwSamples( hw->branchMiss, view.m_statRange ) * CountHwSamples( hw->branchRetired, view.m_statRange ) ); break; case CostType::CacheAccess: stat = CountHwSamples( hw->cacheRef, view.m_statRange ); break; case CostType::CacheMiss: stat = CountHwSamples( hw->cacheMiss, view.m_statRange ); break; case CostType::SlowCache: stat = sqrt( CountHwSamples( hw->cacheMiss, view.m_statRange ) * CountHwSamples( hw->cacheRef, view.m_statRange ) ); break; default: assert( false ); return; } } else { switch( m_cost ) { case CostType::Cycles: stat = hw->cycles.size(); break; case CostType::Retirements: stat = hw->retired.size(); break; case CostType::BranchesTaken: stat = hw->branchRetired.size(); break; case CostType::BranchMiss: stat = hw->branchMiss.size(); break; case CostType::SlowBranches: stat = sqrt( hw->branchMiss.size() * hw->branchRetired.size() ); break; case CostType::CacheAccess: stat = hw->cacheRef.size(); break; case CostType::CacheMiss: stat = hw->cacheMiss.size(); break; case CostType::SlowCache: stat = sqrt( hw->cacheMiss.size() * hw->cacheRef.size() ); break; default: assert( false ); return; } } assert( ipcountAsm.find( addr ) == ipcountAsm.end() ); ipcountAsm.emplace( addr, AddrStat { stat, 0 } ); iptotalAsm.local += stat; if( ipmaxAsm.local < stat ) ipmaxAsm.local = stat; if( filename ) { uint32_t line; const auto fref = worker.GetLocationForAddress( addr, line ); if( line != 0 ) { auto ffn = worker.GetString( fref ); if( strcmp( ffn, filename ) == 0 ) { auto it = ipcountSrc.find( line ); if( it == ipcountSrc.end() ) { ipcountSrc.emplace( line, AddrStat{ stat, 0 } ); if( ipmaxSrc.local < stat ) ipmaxSrc.local = stat; } else { const auto sum = it->second.local + stat; it->second.local = sum; if( ipmaxSrc.local < sum ) ipmaxSrc.local = sum; } iptotalSrc.local += stat; } } } } } void SourceView::GatherIpStats( uint64_t baseAddr, AddrStat& iptotalSrc, AddrStat& iptotalAsm, unordered_flat_map& ipcountSrc, unordered_flat_map& ipcountAsm, AddrStat& ipmaxSrc, AddrStat& ipmaxAsm, const Worker& worker, bool limitView, const View& view ) { const auto slzReady = worker.AreSourceLocationZonesReady(); auto filename = m_source.filename(); if( limitView ) { auto vec = worker.GetSamplesForSymbol( baseAddr ); if( !vec ) return; auto it = std::lower_bound( vec->begin(), vec->end(), view.m_statRange.min, [] ( const auto& lhs, const auto& rhs ) { return lhs.time.Val() < rhs; } ); if( it == vec->end() ) return; auto end = std::lower_bound( it, vec->end(), view.m_statRange.max, [] ( const auto& lhs, const auto& rhs ) { return lhs.time.Val() < rhs; } ); iptotalAsm.local += end - it; while( it != end ) { if( filename ) { auto frame = worker.GetCallstackFrame( it->ip ); if( frame ) { auto ffn = worker.GetString( frame->data[0].file ); if( strcmp( ffn, filename ) == 0 ) { const auto line = frame->data[0].line; if( line != 0 ) { auto sit = ipcountSrc.find( line ); if( sit == ipcountSrc.end() ) { ipcountSrc.emplace( line, AddrStat { 1, 0 } ); if( ipmaxSrc.local < 1 ) ipmaxSrc.local = 1; } else { const auto sum = sit->second.local + 1; sit->second.local = sum; if( ipmaxSrc.local < sum ) ipmaxSrc.local = sum; } iptotalSrc.local++; } } } } auto addr = worker.GetCanonicalPointer( it->ip ); auto sit = ipcountAsm.find( addr ); if( sit == ipcountAsm.end() ) { ipcountAsm.emplace( addr, AddrStat{ 1, 0 } ); if( ipmaxAsm.local < 1 ) ipmaxAsm.local = 1; } else { const auto sum = sit->second.local + 1; sit->second.local = sum; if( ipmaxAsm.local < sum ) ipmaxAsm.local = sum; } ++it; } } else { auto ipmap = worker.GetSymbolInstructionPointers( baseAddr ); if( !ipmap ) return; for( auto& ip : *ipmap ) { auto addr = worker.GetCanonicalPointer( ip.first ); assert( ipcountAsm.find( addr ) == ipcountAsm.end() ); auto cp = slzReady ? worker.GetChildSamples( addr ) : nullptr; const auto ccnt = cp ? cp->size() : 0; ipcountAsm.emplace( addr, AddrStat { ip.second, ccnt } ); iptotalAsm.local += ip.second; iptotalAsm.ext += ccnt; if( ipmaxAsm.local < ip.second ) ipmaxAsm.local = ip.second; if( ipmaxAsm.ext < ccnt ) ipmaxAsm.ext = ccnt; if( filename ) { auto frame = worker.GetCallstackFrame( ip.first ); if( frame ) { auto ffn = worker.GetString( frame->data[0].file ); if( strcmp( ffn, filename ) == 0 ) { const auto line = frame->data[0].line; if( line != 0 ) { auto it = ipcountSrc.find( line ); if( it == ipcountSrc.end() ) { ipcountSrc.emplace( line, AddrStat{ ip.second, ccnt } ); if( ipmaxSrc.local < ip.second ) ipmaxSrc.local = ip.second; if( ipmaxSrc.ext < ccnt ) ipmaxSrc.ext = ccnt; } else { const auto sum = it->second.local + ip.second; const auto csum = it->second.ext + ccnt; it->second.local = sum; it->second.ext = csum; if( ipmaxSrc.local < sum ) ipmaxSrc.local = sum; if( ipmaxSrc.ext < csum ) ipmaxSrc.ext = csum; } iptotalSrc.local += ip.second; iptotalSrc.ext += ccnt; } } } } } } } void SourceView::GatherAdditionalIpStats( uint64_t baseAddr, AddrStat& iptotalSrc, AddrStat& iptotalAsm, unordered_flat_map& ipcountSrc, unordered_flat_map& ipcountAsm, AddrStat& ipmaxSrc, AddrStat& ipmaxAsm, const Worker& worker, bool limitView, const View& view ) { if( !worker.AreSourceLocationZonesReady() ) return; auto sym = worker.GetSymbolData( baseAddr ); if( !sym ) return; auto filename = m_source.filename(); if( limitView ) { for( uint64_t ip = baseAddr; ip < baseAddr + sym->size.Val(); ip++ ) { if( ipcountAsm.find( ip ) != ipcountAsm.end() ) continue; auto cp = worker.GetChildSamples( ip ); if( !cp ) continue; auto it = std::lower_bound( cp->begin(), cp->end(), view.m_statRange.min, [] ( const auto& lhs, const auto& rhs ) { return lhs.Val() < rhs; } ); if( it == cp->end() ) continue; auto end = std::lower_bound( it, cp->end(), view.m_statRange.max, [] ( const auto& lhs, const auto& rhs ) { return lhs.Val() < rhs; } ); const auto ccnt = uint64_t( end - it ); ipcountAsm.emplace( ip, AddrStat { 0, ccnt } ); iptotalAsm.ext += ccnt; if( ipmaxAsm.ext < ccnt ) ipmaxAsm.ext = ccnt; if( filename ) { auto frame = worker.GetCallstackFrame( worker.PackPointer( ip ) ); if( frame ) { auto ffn = worker.GetString( frame->data[0].file ); if( strcmp( ffn, filename ) == 0 ) { const auto line = frame->data[0].line; if( line != 0 ) { auto it = ipcountSrc.find( line ); if( it == ipcountSrc.end() ) { ipcountSrc.emplace( line, AddrStat{ 0, ccnt } ); if( ipmaxSrc.ext < ccnt ) ipmaxSrc.ext = ccnt; } else { const auto csum = it->second.ext + ccnt; it->second.ext = csum; if( ipmaxSrc.ext < csum ) ipmaxSrc.ext = csum; } iptotalSrc.ext += ccnt; } } } } } } else { for( uint64_t ip = baseAddr; ip < baseAddr + sym->size.Val(); ip++ ) { if( ipcountAsm.find( ip ) != ipcountAsm.end() ) continue; auto cp = worker.GetChildSamples( ip ); if( !cp ) continue; const auto ccnt = cp->size(); ipcountAsm.emplace( ip, AddrStat { 0, ccnt } ); iptotalAsm.ext += ccnt; if( ipmaxAsm.ext < ccnt ) ipmaxAsm.ext = ccnt; if( filename ) { auto frame = worker.GetCallstackFrame( worker.PackPointer( ip ) ); if( frame ) { auto ffn = worker.GetString( frame->data[0].file ); if( strcmp( ffn, filename ) == 0 ) { const auto line = frame->data[0].line; if( line != 0 ) { auto it = ipcountSrc.find( line ); if( it == ipcountSrc.end() ) { ipcountSrc.emplace( line, AddrStat{ 0, ccnt } ); if( ipmaxSrc.ext < ccnt ) ipmaxSrc.ext = ccnt; } else { const auto csum = it->second.ext + ccnt; it->second.ext = csum; if( ipmaxSrc.ext < csum ) ipmaxSrc.ext = csum; } iptotalSrc.ext += ccnt; } } } } } } } uint32_t SourceView::CountAsmIpStats( uint64_t baseAddr, const Worker& worker, bool limitView, const View& view ) { if( limitView ) { auto vec = worker.GetSamplesForSymbol( baseAddr ); if( !vec ) return 0; auto it = std::lower_bound( vec->begin(), vec->end(), view.m_statRange.min, [] ( const auto& lhs, const auto& rhs ) { return lhs.time.Val() < rhs; } ); if( it == vec->end() ) return 0; auto end = std::lower_bound( it, vec->end(), view.m_statRange.max, [] ( const auto& lhs, const auto& rhs ) { return lhs.time.Val() < rhs; } ); return end - it; } else { uint32_t cnt = 0; auto ipmap = worker.GetSymbolInstructionPointers( baseAddr ); if( !ipmap ) return 0; for( auto& ip : *ipmap ) cnt += ip.second; return cnt; } } void SourceView::SelectMicroArchitecture( const char* moniker ) { int idx = 0; for( auto& v : s_uArchUx ) { if( strcmp( v.moniker, moniker ) == 0 ) { m_selMicroArch = idx; break; } idx++; } for( idx=0; idxaddr == data.jumpAddr ) { CheckRead( fit - m_asm.begin(), reg, limit ); } if( !data.jumpConditional ) return; } if( line+1 < m_asm.size() ) { CheckRead( line+1, reg, limit ); } } void SourceView::FollowWrite( size_t line, RegsX86 reg, size_t limit ) { if( limit == 0 ) return; const auto& data = m_asm[line]; if( m_jumpOut.find( data.addr ) != m_jumpOut.end() && !data.jumpConditional ) return; auto it = m_jumpTable.find( data.addr ); if( it != m_jumpTable.end() ) { for( auto& v : it->second.source ) { auto fit = std::lower_bound( m_asm.begin(), m_asm.end(), v, []( const auto& l, const auto& r ) { return l.addr < r; } ); assert( fit != m_asm.end() && fit->addr == v ); CheckWrite( fit - m_asm.begin(), reg, limit ); } } if( line > 0 ) { CheckWrite( line-1, reg, limit ); } } void SourceView::CheckRead( size_t line, RegsX86 reg, size_t limit ) { assert( limit > 0 ); auto& data = m_asm[line]; int idx = 0; for(;;) { if( data.readX86[idx] == RegsX86::invalid ) { idx = 0; for(;;) { if( data.writeX86[idx] == RegsX86::invalid ) { FollowRead( line, reg, limit - 1 ); return; } if( data.writeX86[idx] == reg ) { idx = 0; for(;;) { if( data.regData[idx] == 0 ) { data.regData[idx] = ReuseBit | (int)reg; return; } if( ( data.regData[idx] & RegMask ) == (int)reg ) { data.regData[idx] |= ReuseBit; return; } idx++; } } idx++; } } if( data.readX86[idx] == reg ) { idx = 0; for(;;) { if( data.regData[idx] == 0 ) { data.regData[idx] = ReadBit | (int)reg; return; } if( ( data.regData[idx] & RegMask ) == (int)reg ) { data.regData[idx] |= ReadBit; return; } idx++; } } idx++; } } void SourceView::CheckWrite( size_t line, RegsX86 reg, size_t limit ) { assert( limit > 0 ); auto& data = m_asm[line]; int idx = 0; for(;;) { if( data.writeX86[idx] == RegsX86::invalid ) { idx = 0; for(;;) { if( data.readX86[idx] == RegsX86::invalid ) { FollowWrite( line, reg, limit - 1 ); return; } if( data.readX86[idx] == reg ) { idx = 0; for(;;) { if( data.regData[idx] == 0 ) { data.regData[idx] = ReuseBit | (int)reg; return; } if( ( data.regData[idx] & RegMask ) == (int)reg ) { data.regData[idx] |= ReuseBit; return; } idx++; } } idx++; } } if( data.writeX86[idx] == reg ) { idx = 0; for(;;) { if( data.regData[idx] == 0 ) { data.regData[idx] = WriteBit | (int)reg; return; } else if( ( data.regData[idx] & RegMask ) == (int)reg ) { data.regData[idx] |= WriteBit; return; } idx++; } } idx++; } } #ifndef TRACY_NO_FILESELECTOR void SourceView::Save( const Worker& worker, size_t start, size_t stop ) { assert( start < m_asm.size() ); assert( start < stop ); nfdchar_t* fn; auto res = NFD_SaveDialog( "asm", nullptr, &fn, m_gwcb ? m_gwcb() : nullptr ); if( res == NFD_OKAY ) { FILE* f = nullptr; const auto sz = strlen( fn ); if( sz < 5 || memcmp( fn + sz - 4, ".asm", 4 ) != 0 ) { char tmp[1024]; sprintf( tmp, "%s.asm", fn ); f = fopen( tmp, "wb" ); } else { f = fopen( fn, "wb" ); } if( f ) { char tmp[16]; auto sym = worker.GetSymbolData( m_symAddr ); assert( sym ); const char* symName; if( sym->isInline ) { auto parent = worker.GetSymbolData( m_baseAddr ); if( parent ) { symName = worker.GetString( parent->name ); } else { sprintf( tmp, "0x%" PRIx64, m_baseAddr ); symName = tmp; } } else { symName = worker.GetString( sym->name ); } fprintf( f, "; Tracy Profiler disassembly of symbol %s [%s]\n\n", symName, worker.GetCaptureProgram().c_str() ); if( !m_atnt ) fprintf( f, ".intel_syntax\n\n" ); const auto end = m_asm.size() < stop ? m_asm.size() : stop; for( size_t i=start; isecond ); } bool hasJump = false; if( v.jumpAddr != 0 ) { auto lit = m_locMap.find( v.jumpAddr ); if( lit != m_locMap.end() ) { fprintf( f, "\t%-*s.L%" PRIu32 "\n", m_maxMnemonicLen, v.mnemonic.c_str(), lit->second ); hasJump = true; } } if( !hasJump ) { if( v.operands.empty() ) { fprintf( f, "\t%s\n", v.mnemonic.c_str() ); } else { fprintf( f, "\t%-*s%s\n", m_maxMnemonicLen, v.mnemonic.c_str(), v.operands.c_str() ); } } } fclose( f ); } } } #endif }