#ifndef __TRACYEVENT_HPP__ #define __TRACYEVENT_HPP__ #include #include #include #include #include #include "TracyCharUtil.hpp" #include "TracyShortPtr.hpp" #include "TracyVector.hpp" #include "tracy_flat_hash_map.hpp" #include "../common/TracyForceInline.hpp" namespace tracy { #pragma pack( 1 ) struct StringRef { enum Type { Ptr, Idx }; tracy_force_inline StringRef() : str( 0 ), __data( 0 ) {} tracy_force_inline StringRef( Type t, uint64_t data ) : str( data ) , __data( 0 ) { isidx = t == Idx; active = 1; } uint64_t str; union { struct { uint8_t isidx : 1; uint8_t active : 1; }; uint8_t __data; }; }; class StringIdx { public: tracy_force_inline StringIdx() { memset( m_idx, 0, sizeof( m_idx ) ); } tracy_force_inline StringIdx( uint32_t idx ) { SetIdx( idx ); } tracy_force_inline void SetIdx( uint32_t idx ) { idx++; memcpy( m_idx, &idx, 3 ); } tracy_force_inline uint32_t Idx() const { uint32_t idx = 0; memcpy( &idx, m_idx, 3 ); assert( idx != 0 ); return idx - 1; } tracy_force_inline bool Active() const { uint32_t zero = 0; return memcmp( m_idx, &zero, 3 ) != 0; } private: uint8_t m_idx[3]; }; struct __StringIdxOld { uint32_t idx : 31; uint32_t active : 1; }; class Int24 { public: tracy_force_inline Int24() { memset( m_val, 0, sizeof( m_val ) ); } tracy_force_inline Int24( uint32_t val ) { SetVal( val ); } tracy_force_inline void SetVal( uint32_t val ) { memcpy( m_val, &val, 3 ); } tracy_force_inline uint32_t Val() const { uint32_t val = 0; memcpy( &val, m_val, 3 ); return val; } private: uint8_t m_val[3]; }; class Int48 { public: tracy_force_inline Int48() {} tracy_force_inline Int48( int64_t val ) { SetVal( val ); } tracy_force_inline void SetVal( int64_t val ) { memcpy( m_val, &val, 6 ); } tracy_force_inline int64_t Val() const { int64_t val = 0; memcpy( ((char*)&val)+2, m_val, 6 ); val >>= 16; return val; } private: uint8_t m_val[6]; }; struct SourceLocationBase { StringRef name; StringRef function; StringRef file; uint32_t line; uint32_t color; }; struct SourceLocation : public SourceLocationBase { mutable uint32_t namehash; }; enum { SourceLocationSize = sizeof( SourceLocation ) }; struct ZoneEvent { tracy_force_inline ZoneEvent() {}; tracy_force_inline int64_t Start() const { return int64_t( _start_srcloc ) >> 16; } tracy_force_inline void SetStart( int64_t start ) { assert( start < (int64_t)( 1ull << 47 ) ); memcpy( ((char*)&_start_srcloc)+2, &start, 4 ); memcpy( ((char*)&_start_srcloc)+6, ((char*)&start)+4, 2 ); } tracy_force_inline int64_t End() const { return int64_t( _end_child1 ) >> 16; } tracy_force_inline void SetEnd( int64_t end ) { assert( end < (int64_t)( 1ull << 47 ) ); memcpy( ((char*)&_end_child1)+2, &end, 4 ); memcpy( ((char*)&_end_child1)+6, ((char*)&end)+4, 2 ); } tracy_force_inline int16_t SrcLoc() const { return int16_t( _start_srcloc & 0xFFFF ); } tracy_force_inline void SetSrcLoc( int16_t srcloc ) { memcpy( &_start_srcloc, &srcloc, 2 ); } tracy_force_inline int32_t Child() const { return int32_t( uint32_t( _end_child1 & 0xFFFF ) | ( uint32_t( _child2 ) << 16 ) ); } tracy_force_inline void SetChild( int32_t child ) { memcpy( &_end_child1, &child, 2 ); _child2 = uint32_t( child ) >> 16; } uint64_t _start_srcloc; uint64_t _end_child1; StringIdx text; Int24 callstack; StringIdx name; uint16_t _child2; }; enum { ZoneEventSize = sizeof( ZoneEvent ) }; static_assert( std::is_standard_layout::value, "ZoneEvent is not standard layout" ); struct LockEvent { enum class Type : uint8_t { Wait, Obtain, Release, WaitShared, ObtainShared, ReleaseShared }; tracy_force_inline int64_t Time() const { return int64_t( _time_srcloc ) >> 16; } tracy_force_inline void SetTime( int64_t time ) { assert( time < (int64_t)( 1ull << 47 ) ); memcpy( ((char*)&_time_srcloc)+2, &time, 4 ); memcpy( ((char*)&_time_srcloc)+6, ((char*)&time)+4, 2 ); } tracy_force_inline int16_t SrcLoc() const { return int16_t( _time_srcloc & 0xFFFF ); } tracy_force_inline void SetSrcLoc( int16_t srcloc ) { memcpy( &_time_srcloc, &srcloc, 2 ); } uint64_t _time_srcloc; uint8_t thread; Type type; }; struct LockEventShared : public LockEvent { uint64_t waitShared; uint64_t sharedList; }; struct LockEventPtr { short_ptr ptr; uint8_t lockingThread; uint8_t lockCount; uint64_t waitList; }; enum { LockEventSize = sizeof( LockEvent ) }; enum { LockEventSharedSize = sizeof( LockEventShared ) }; enum { LockEventPtrSize = sizeof( LockEventPtr ) }; enum { MaxLockThreads = sizeof( LockEventPtr::waitList ) * 8 }; static_assert( std::numeric_limits::max() >= MaxLockThreads, "Not enough space for lock count." ); struct GpuEvent { tracy_force_inline int64_t CpuStart() const { return int64_t( _cpuStart_srcloc ) >> 16; } tracy_force_inline void SetCpuStart( int64_t cpuStart ) { assert( cpuStart < (int64_t)( 1ull << 47 ) ); memcpy( ((char*)&_cpuStart_srcloc)+2, &cpuStart, 4 ); memcpy( ((char*)&_cpuStart_srcloc)+6, ((char*)&cpuStart)+4, 2 ); } tracy_force_inline int64_t CpuEnd() const { return int64_t( _cpuEnd_thread ) >> 16; } tracy_force_inline void SetCpuEnd( int64_t cpuEnd ) { assert( cpuEnd < (int64_t)( 1ull << 47 ) ); memcpy( ((char*)&_cpuEnd_thread)+2, &cpuEnd, 4 ); memcpy( ((char*)&_cpuEnd_thread)+6, ((char*)&cpuEnd)+4, 2 ); } tracy_force_inline int64_t GpuStart() const { return int64_t( _gpuStart_child1 ) >> 16; } tracy_force_inline void SetGpuStart( int64_t gpuStart ) { /*assert( gpuStart < (int64_t)( 1ull << 47 ) );*/ memcpy( ((char*)&_gpuStart_child1)+2, &gpuStart, 4 ); memcpy( ((char*)&_gpuStart_child1)+6, ((char*)&gpuStart)+4, 2 ); } tracy_force_inline int64_t GpuEnd() const { return int64_t( _gpuEnd_child2 ) >> 16; } tracy_force_inline void SetGpuEnd( int64_t gpuEnd ) { assert( gpuEnd < (int64_t)( 1ull << 47 ) ); memcpy( ((char*)&_gpuEnd_child2)+2, &gpuEnd, 4 ); memcpy( ((char*)&_gpuEnd_child2)+6, ((char*)&gpuEnd)+4, 2 ); } tracy_force_inline int16_t SrcLoc() const { return int16_t( _cpuStart_srcloc & 0xFFFF ); } tracy_force_inline void SetSrcLoc( int16_t srcloc ) { memcpy( &_cpuStart_srcloc, &srcloc, 2 ); } tracy_force_inline uint16_t Thread() const { return uint16_t( _cpuEnd_thread & 0xFFFF ); } tracy_force_inline void SetThread( uint16_t thread ) { memcpy( &_cpuEnd_thread, &thread, 2 ); } tracy_force_inline int32_t Child() const { return int32_t( uint32_t( _gpuStart_child1 & 0xFFFF ) | ( uint32_t( _gpuEnd_child2 & 0xFFFF ) << 16 ) ); } tracy_force_inline void SetChild( int32_t child ) { memcpy( &_gpuStart_child1, &child, 2 ); memcpy( &_gpuEnd_child2, ((char*)&child)+2, 2 ); } uint64_t _cpuStart_srcloc; uint64_t _cpuEnd_thread; uint64_t _gpuStart_child1; uint64_t _gpuEnd_child2; Int24 callstack; }; enum { GpuEventSize = sizeof( GpuEvent ) }; static_assert( std::is_standard_layout::value, "GpuEvent is not standard layout" ); struct MemEvent { tracy_force_inline uint64_t Ptr() const { return uint64_t( int64_t( _ptr_csalloc1 ) >> 8 ); } tracy_force_inline void SetPtr( uint64_t ptr ) { memcpy( ((char*)&_ptr_csalloc1)+1, &ptr, 4 ); memcpy( ((char*)&_ptr_csalloc1)+5, ((char*)&ptr)+4, 2 ); memcpy( ((char*)&_ptr_csalloc1)+7, ((char*)&ptr)+6, 1 ); } tracy_force_inline uint64_t Size() const { return _size_csalloc2 >> 16; } tracy_force_inline void SetSize( uint64_t size ) { assert( size < ( 1ull << 47 ) ); memcpy( ((char*)&_size_csalloc2)+2, &size, 4 ); memcpy( ((char*)&_size_csalloc2)+6, ((char*)&size)+4, 2 ); } tracy_force_inline uint32_t CsAlloc() const { return uint8_t( _ptr_csalloc1 ) | ( uint16_t( _size_csalloc2 ) << 8 ); } tracy_force_inline void SetCsAlloc( uint32_t csAlloc ) { memcpy( &_ptr_csalloc1, &csAlloc, 1 ); memcpy( &_size_csalloc2, ((char*)&csAlloc)+1, 2 ); } tracy_force_inline int64_t TimeAlloc() const { return int64_t( _time_thread_alloc ) >> 16; } tracy_force_inline void SetTimeAlloc( int64_t time ) { assert( time < (int64_t)( 1ull << 47 ) ); memcpy( ((char*)&_time_thread_alloc)+2, &time, 4 ); memcpy( ((char*)&_time_thread_alloc)+6, ((char*)&time)+4, 2 ); } tracy_force_inline int64_t TimeFree() const { return int64_t( _time_thread_free ) >> 16; } tracy_force_inline void SetTimeFree( int64_t time ) { assert( time < (int64_t)( 1ull << 47 ) ); memcpy( ((char*)&_time_thread_free)+2, &time, 4 ); memcpy( ((char*)&_time_thread_free)+6, ((char*)&time)+4, 2 ); } tracy_force_inline uint16_t ThreadAlloc() const { return uint16_t( _time_thread_alloc ); } tracy_force_inline void SetThreadAlloc( uint16_t thread ) { memcpy( &_time_thread_alloc, &thread, 2 ); } tracy_force_inline uint16_t ThreadFree() const { return uint16_t( _time_thread_free ); } tracy_force_inline void SetThreadFree( uint16_t thread ) { memcpy( &_time_thread_free, &thread, 2 ); } uint64_t _ptr_csalloc1; uint64_t _size_csalloc2; Int24 csFree; uint64_t _time_thread_alloc; uint64_t _time_thread_free; }; enum { MemEventSize = sizeof( MemEvent ) }; static_assert( std::is_standard_layout::value, "MemEvent is not standard layout" ); struct CallstackFrame { StringIdx name; StringIdx file; uint32_t line; }; enum { CallstackFrameSize = sizeof( CallstackFrame ) }; struct CallstackFrameData { short_ptr data; uint8_t size; }; enum { CallstackFrameDataSize = sizeof( CallstackFrameData ) }; // This union exploits the fact that the current implementations of x64 and arm64 do not provide // full 64 bit address space. The high bits must be bit-extended, so 0x80... is an invalid pointer. // This allows using the highest bit as a selector between a native pointer and a table index here. union CallstackFrameId { struct { uint64_t idx : 63; uint64_t sel : 1; }; uint64_t data; }; enum { CallstackFrameIdSize = sizeof( CallstackFrameId ) }; struct CallstackFrameTree { CallstackFrameId frame; uint64_t alloc; uint32_t count; flat_hash_map> children; flat_hash_set> callstacks; }; enum { CallstackFrameTreeSize = sizeof( CallstackFrameTree ) }; struct CrashEvent { uint64_t thread = 0; int64_t time = 0; uint64_t message = 0; uint32_t callstack = 0; }; enum { CrashEventSize = sizeof( CrashEvent ) }; struct ContextSwitchData { enum : int8_t { NoState = 100 }; enum : int8_t { Wakeup = -2 }; tracy_force_inline int64_t Start() const { return int64_t( _start_cpu ) >> 16; } tracy_force_inline void SetStart( int64_t start ) { assert( start < (int64_t)( 1ull << 47 ) ); memcpy( ((char*)&_start_cpu)+2, &start, 4 ); memcpy( ((char*)&_start_cpu)+6, ((char*)&start)+4, 2 ); } tracy_force_inline int64_t End() const { return int64_t( _end_reason_state ) >> 16; } tracy_force_inline void SetEnd( int64_t end ) { assert( end < (int64_t)( 1ull << 47 ) ); memcpy( ((char*)&_end_reason_state)+2, &end, 4 ); memcpy( ((char*)&_end_reason_state)+6, ((char*)&end)+4, 2 ); } tracy_force_inline uint8_t Cpu() const { return uint8_t( _start_cpu & 0xFF ); } tracy_force_inline void SetCpu( uint8_t cpu ) { memcpy( &_start_cpu, &cpu, 1 ); } tracy_force_inline int8_t Reason() const { return int8_t( (_end_reason_state >> 8) & 0xFF ); } tracy_force_inline void SetReason( int8_t reason ) { memcpy( ((char*)&_end_reason_state)+1, &reason, 1 ); } tracy_force_inline int8_t State() const { return int8_t( _end_reason_state & 0xFF ); } tracy_force_inline void SetState( int8_t state ) { memcpy( &_end_reason_state, &state, 1 ); } tracy_force_inline int64_t WakeupVal() const { return _wakeup.Val(); } tracy_force_inline void SetWakeup( int64_t wakeup ) { assert( wakeup < (int64_t)( 1ull << 47 ) ); _wakeup.SetVal( wakeup ); } uint64_t _start_cpu; uint64_t _end_reason_state; Int48 _wakeup; }; enum { ContextSwitchDataSize = sizeof( ContextSwitchData ) }; struct ContextSwitchCpu { tracy_force_inline int64_t Start() const { return int64_t( _start_thread ) >> 16; } tracy_force_inline void SetStart( int64_t start ) { assert( start < (int64_t)( 1ull << 47 ) ); memcpy( ((char*)&_start_thread)+2, &start, 4 ); memcpy( ((char*)&_start_thread)+6, ((char*)&start)+4, 2 ); } tracy_force_inline int64_t End() const { return _end.Val(); } tracy_force_inline void SetEnd( int64_t end ) { assert( end < (int64_t)( 1ull << 47 ) ); _end.SetVal( end ); } tracy_force_inline uint16_t Thread() const { return uint16_t( _start_thread ); } tracy_force_inline void SetThread( uint16_t thread ) { memcpy( &_start_thread, &thread, 2 ); } uint64_t _start_thread; Int48 _end; }; enum { ContextSwitchCpuSize = sizeof( ContextSwitchCpu ) }; struct ContextSwitchUsage { ContextSwitchUsage() {} ContextSwitchUsage( int64_t time, uint8_t other, uint8_t own ) { SetTime( time ); SetOther( other ); SetOwn( own ); } tracy_force_inline int64_t Time() const { return int64_t( _time_other_own ) >> 16; } tracy_force_inline void SetTime( int64_t time ) { assert( time < (int64_t)( 1ull << 47 ) ); memcpy( ((char*)&_time_other_own)+2, &time, 4 ); memcpy( ((char*)&_time_other_own)+6, ((char*)&time)+4, 2 ); } tracy_force_inline uint8_t Other() const { return uint8_t( _time_other_own ); } tracy_force_inline void SetOther( uint8_t other ) { memcpy( &_time_other_own, &other, 1 ); } tracy_force_inline uint8_t Own() const { return uint8_t( _time_other_own >> 8 ); } tracy_force_inline void SetOwn( uint8_t own ) { memcpy( ((char*)&_time_other_own)+1, &own, 1 ); } uint64_t _time_other_own; }; enum { ContextSwitchUsageSize = sizeof( ContextSwitchUsage ) }; struct MessageData { int64_t time; StringRef ref; uint16_t thread; uint32_t color; Int24 callstack; }; enum { MessageDataSize = sizeof( MessageData ) }; struct PlotItem { Int48 time; double val; }; enum { PlotItemSize = sizeof( PlotItem ) }; struct FrameEvent { int64_t start; int64_t end; int32_t frameImage; }; enum { FrameEventSize = sizeof( FrameEvent ) }; #pragma pack() struct ThreadData { uint64_t id; uint64_t count; Vector> timeline; Vector> stack; Vector> messages; uint32_t nextZoneId; Vector zoneIdStack; #ifndef TRACY_NO_STATISTICS Vector childTimeStack; #endif }; struct GpuCtxThreadData { Vector> timeline; Vector> stack; }; struct GpuCtxData { int64_t timeDiff; uint64_t thread; uint64_t count; uint8_t accuracyBits; float period; flat_hash_map> threadData; short_ptr query[64*1024]; }; enum { GpuCtxDataSize = sizeof( GpuCtxData ) }; struct LockMap { struct TimeRange { int64_t start = std::numeric_limits::max(); int64_t end = std::numeric_limits::min(); }; int16_t srcloc; Vector timeline; flat_hash_map> threadMap; std::vector threadList; LockType type; int64_t timeAnnounce; int64_t timeTerminate; bool valid; bool isContended; TimeRange range[64]; }; struct LockHighlight { int64_t id; int64_t begin; int64_t end; uint8_t thread; bool blocked; }; enum class PlotType : uint8_t { User, Memory, SysTime }; enum class PlotValueFormatting : uint8_t { Number, Memory, Percentage }; struct PlotData { uint64_t name; double min; double max; Vector data; Vector postpone; uint64_t postponeTime; PlotType type; PlotValueFormatting format; }; struct MemData { Vector data; Vector frees; flat_hash_map> active; uint64_t high = std::numeric_limits::min(); uint64_t low = std::numeric_limits::max(); uint64_t usage = 0; PlotData* plot = nullptr; }; struct FrameData { uint64_t name; Vector frames; uint8_t continuous; int64_t min = std::numeric_limits::max(); int64_t max = std::numeric_limits::min(); int64_t total = 0; double sumSq = 0; }; struct StringLocation { const char* ptr; uint32_t idx; }; struct SourceLocationHasher { size_t operator()( const SourceLocation* ptr ) const { return charutil::hash( (const char*)ptr, sizeof( SourceLocationBase ) ); } typedef tracy::power_of_two_hash_policy hash_policy; }; struct SourceLocationComparator { bool operator()( const SourceLocation* lhs, const SourceLocation* rhs ) const { return memcmp( lhs, rhs, sizeof( SourceLocationBase ) ) == 0; } }; struct FrameImage { short_ptr ptr; uint32_t csz; uint16_t w, h; uint32_t frameRef; uint8_t flip; }; enum { FrameImageSize = sizeof( FrameImage ) }; struct ContextSwitch { Vector v; int64_t runningTime = 0; }; struct CpuData { Vector cs; }; struct CpuThreadData { int64_t runningTime = 0; uint32_t runningRegions = 0; uint32_t migrations = 0; }; enum { CpuThreadDataSize = sizeof( CpuThreadData ) }; } #endif