/*BEGIN_LEGAL Intel Open Source License Copyright (c) 2002-2005 Intel Corporation All rights reserved. Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met: Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer. Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or other materials provided with the distribution. Neither the name of the Intel Corporation nor the names of its contributors may be used to endorse or promote products derived from this software without specific prior written permission. THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE INTEL OR ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. END_LEGAL */ /* ===================================================================== */ /* @ORIGINAL_AUTHOR: Robert Muth and Artur Klauser */ /* ===================================================================== */ /*! @file * This file contains a real time opcode mix profiler */ #include "pin.H" #include "portability.H" #include #include #include #include #include // for sort #include /* ===================================================================== */ /* Commandline Switches */ /* ===================================================================== */ KNOB KnobOutputFile(KNOB_MODE_WRITEONCE, "pintool", "o", "opcodetop.out", "specify output file name"); KNOB KnobThreshold(KNOB_MODE_WRITEONCE, "pintool", "t", "10000", "print histogram after every n BBLs"); KNOB KnobCutoff(KNOB_MODE_WRITEONCE, "pintool", "c", "100", "minimum count for opcode to show"); KNOB KnobMaxLines(KNOB_MODE_WRITEONCE, "pintool", "l", "24", "max number of output lines"); KNOB KnobDetachUpdates(KNOB_MODE_WRITEONCE, "pintool", "d", "0", "detach after n screen updates"); KNOB KnobDecayFactor(KNOB_MODE_WRITEONCE, "pintool", "f", "0.0", "x"); /* ===================================================================== */ INT32 Usage() { cerr << "This pin tool provides a real time opcode mix profile\n" "\n"; cerr << KNOB_BASE::StringKnobSummary(); cerr << endl; return -1; } /* ===================================================================== */ /* INDEX HELPERS */ /* ===================================================================== */ const UINT32 MAX_INDEX = 4096; // enough even for IPF const UINT32 INDEX_SPECIAL = 3000; const UINT32 MAX_MEM_SIZE = 512; const UINT32 INDEX_TOTAL = INDEX_SPECIAL + 0; const UINT32 INDEX_MEM_ATOMIC = INDEX_SPECIAL + 1; const UINT32 INDEX_STACK_READ = INDEX_SPECIAL + 2; const UINT32 INDEX_STACK_WRITE = INDEX_SPECIAL + 3; const UINT32 INDEX_IPREL_READ = INDEX_SPECIAL + 4; const UINT32 INDEX_IPREL_WRITE = INDEX_SPECIAL + 5; const UINT32 INDEX_MEM_READ_VARIABLE = INDEX_SPECIAL + 6; const UINT32 INDEX_MEM_WRITE_VARIABLE = INDEX_SPECIAL + 7; const UINT32 INDEX_MEM_READ_SIZE = INDEX_SPECIAL + 8; const UINT32 INDEX_MEM_WRITE_SIZE = INDEX_SPECIAL + 8 + MAX_MEM_SIZE; const UINT32 INDEX_SPECIAL_END = INDEX_SPECIAL + 8 + MAX_MEM_SIZE + MAX_MEM_SIZE; BOOL IsMemReadIndex(UINT32 i) { return (INDEX_MEM_READ_SIZE <= i && i < INDEX_MEM_READ_SIZE + MAX_MEM_SIZE ); } BOOL IsMemWriteIndex(UINT32 i) { return (INDEX_MEM_WRITE_SIZE <= i && i < INDEX_MEM_WRITE_SIZE + MAX_MEM_SIZE ); } /* ===================================================================== */ LOCALFUN UINT32 INS_GetIndex(INS ins) { return INS_Opcode(ins); } /* ===================================================================== */ LOCALFUN UINT32 IndexStringLength(BBL bbl, BOOL memory_acess_profile) { UINT32 count = 0; for (INS ins = BBL_InsHead(bbl); INS_Valid(ins); ins = INS_Next(ins)) { count++; if( memory_acess_profile ) { if( INS_IsMemoryRead(ins) ) count++; // for size if( INS_IsStackRead(ins) ) count++; if( INS_IsIpRelRead(ins) ) count++; if( INS_IsMemoryWrite(ins) ) count++; // for size if( INS_IsStackWrite(ins) ) count++; if( INS_IsIpRelWrite(ins) ) count++; if( INS_IsAtomicUpdate(ins) ) count++; } } return count; } /* ===================================================================== */ LOCALFUN UINT32 MemsizeToIndex(UINT32 size, BOOL write) { if( size == VARIABLE_MEMORY_REFERENCE_SIZE ) { return write ? INDEX_MEM_WRITE_VARIABLE : INDEX_MEM_READ_VARIABLE; } else { return (write ? INDEX_MEM_WRITE_SIZE : INDEX_MEM_READ_SIZE ) + size; } } /* ===================================================================== */ LOCALFUN UINT16 *INS_GenerateIndexString(INS ins, UINT16 *stats, BOOL memory_acess_profile) { *stats++ = INS_GetIndex(ins); if( memory_acess_profile ) { if( INS_IsMemoryRead(ins) ) *stats++ = MemsizeToIndex( INS_MemoryReadSize(ins), 0 ); if( INS_IsMemoryWrite(ins) ) *stats++ = MemsizeToIndex( INS_MemoryWriteSize(ins), 1 ); if( INS_IsAtomicUpdate(ins) ) *stats++ = INDEX_MEM_ATOMIC; if( INS_IsStackRead(ins) ) *stats++ = INDEX_STACK_READ; if( INS_IsStackWrite(ins) ) *stats++ = INDEX_STACK_WRITE; if( INS_IsIpRelRead(ins) ) *stats++ = INDEX_IPREL_READ; if( INS_IsIpRelWrite(ins) ) *stats++ = INDEX_IPREL_WRITE; } return stats; } /* ===================================================================== */ LOCALFUN string IndexToOpcodeString( UINT32 index ) { if( INDEX_SPECIAL <= index && index < INDEX_SPECIAL_END) { if( index == INDEX_TOTAL ) return "*total"; else if( IsMemReadIndex(index) ) return "*mem-read-" + decstr( index - INDEX_MEM_READ_SIZE ); else if( IsMemWriteIndex(index)) return "*mem-write-" + decstr( index - INDEX_MEM_WRITE_SIZE ); else if( index == INDEX_MEM_READ_VARIABLE ) return "*mem-read-variable"; else if( index == INDEX_MEM_WRITE_VARIABLE ) return "*mem-write-variable"; else if( index == INDEX_MEM_ATOMIC ) return "*mem-atomic"; else if( index == INDEX_STACK_READ ) return "*stack-read"; else if( index == INDEX_STACK_WRITE ) return "*stack-write"; else if( index == INDEX_IPREL_READ ) return "*iprel-read"; else if( index == INDEX_IPREL_WRITE ) return "*iprel-write"; else { ASSERTX(0); return ""; } } else { return OPCODE_StringShort(index); } } /* ===================================================================== */ /* ===================================================================== */ typedef UINT64 COUNTER; /* zero initialized */ class STATS { public: COUNTER unpredicated[MAX_INDEX]; VOID Clear(FLT64 factor) { for ( UINT32 i = 0; i < MAX_INDEX; i++) { unpredicated[i] = COUNTER(unpredicated[i] * factor); } } }; STATS GlobalStats; class BBLSTATS { public: COUNTER _counter; const UINT16 * const _stats; public: BBLSTATS(UINT16 * stats) : _counter(0), _stats(stats) {}; }; LOCALVAR vector statsList; /* ===================================================================== */ LOCALVAR UINT64 bbl_counter = 0; LOCALVAR UINT64 updates = 0; /* ===================================================================== */ typedef pair PAIR; typedef vector VEC; /* ===================================================================== */ LOCALFUN BOOL CompareLess(PAIR s1 , PAIR s2) { return s1.second > s2.second; } /* ===================================================================== */ VOID DumpHistogram(std::ostream& out) { const UINT64 cutoff = KnobCutoff.Value(); const UINT64 maxlines = KnobMaxLines.Value(); out << "\033[0;0H"; out << "\033[2J"; out << "\033[44m"; out << ljstr("OPCODE",15) << " " << setw(16) << "COUNT"; out << "\033[0m"; out << endl; for (vector::iterator bi = statsList.begin(); bi != statsList.end(); bi++) { BBLSTATS *b = (*bi); for (const UINT16 * stats = b->_stats; *stats; stats++) { GlobalStats.unpredicated[*stats] += b->_counter; } b->_counter = 0; } COUNTER total = 0; VEC CountMap; for (UINT32 index = 0; index <= INDEX_SPECIAL_END; index++) { total += GlobalStats.unpredicated[index]; if( GlobalStats.unpredicated[index] < cutoff ) continue; CountMap.push_back(PAIR(index,GlobalStats.unpredicated[index])); } CountMap.push_back(PAIR(INDEX_TOTAL,total)); sort( CountMap.begin(), CountMap.end(), CompareLess ); UINT32 lines = 0; for (VEC::iterator bi = CountMap.begin(); bi != CountMap.end(); bi++) { UINT32 i = bi->first; // out << setw(4) << i << " " << ljstr(IndexToOpcodeString(i),15) << " " << out << ljstr(IndexToOpcodeString(i),15) << " " << setw(16) << bi->second << endl; lines++; if (lines >= maxlines) break; } } /* ===================================================================== */ std::ofstream Out; /* ===================================================================== */ VOID docount(COUNTER * counter) { (*counter)++; if( bbl_counter == 0 ) { #if defined(TARGET_IA32) || defined(TARGET_IA32E) static char buffer[512+16]; static char* aligned_bufp =reinterpret_cast(((reinterpret_cast(buffer) + 16) >> 4)<<4); #if defined(PIN_GNU_COMPATIBLE) asm("fxsave %0" : "=m"(*aligned_bufp)); #else __asm { push eax mov eax, aligned_bufp fxsave [eax] pop eax } #endif #endif DumpHistogram(Out); Out << flush; FLT64 factor = KnobDecayFactor.Value(); GlobalStats.Clear(factor); bbl_counter = KnobThreshold.Value(); updates++; if ( updates == KnobDetachUpdates.Value() ) { PIN_Detach(); } #if defined(TARGET_IA32) || defined(TARGET_IA32E) #if defined(PIN_GNU_COMPATIBLE) asm("fxrstor %0" :: "m"(*aligned_bufp)); #else __asm { push eax mov eax, aligned_bufp fxrstor [eax] pop eax } #endif #endif } bbl_counter--; } /* ===================================================================== */ VOID Trace(TRACE trace, VOID *v) { for (BBL bbl = TRACE_BblHead(trace); BBL_Valid(bbl); bbl = BBL_Next(bbl)) { const INS head = BBL_InsHead(bbl); if (! INS_Valid(head)) continue; // Summarize the stats for the bbl in a 0 terminated list // This is done at instrumentation time const UINT32 n = IndexStringLength(bbl, 1); UINT16 *const stats = new UINT16[ n + 1]; UINT16 *const stats_end = stats + (n + 1); UINT16 *curr = stats; for (INS ins = head; INS_Valid(ins); ins = INS_Next(ins)) { curr = INS_GenerateIndexString(ins,curr,1); } // string terminator *curr++ = 0; ASSERTX( curr == stats_end ); // Insert instrumentation to count the number of times the bbl is executed BBLSTATS * bblstats = new BBLSTATS(stats); INS_InsertCall(head, IPOINT_BEFORE, AFUNPTR(docount), IARG_PTR, &(bblstats->_counter), IARG_END); // Remember the counter and stats so we can compute a summary at the end statsList.push_back(bblstats); } } /* ===================================================================== */ int main(int argc, CHAR *argv[]) { PIN_InitSymbols(); if( PIN_Init(argc,argv) ) { return Usage(); } Out.open(KnobOutputFile.Value().c_str()); TRACE_AddInstrumentFunction(Trace, 0); // Never returns PIN_StartProgram(); return 0; } /* ===================================================================== */ /* eof */ /* ===================================================================== */