/************************************************************************** * * Copyright 2008 Tungsten Graphics, Inc., Cedar Park, Texas. * All Rights Reserved. * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the * "Software"), to deal in the Software without restriction, including * without limitation the rights to use, copy, modify, merge, publish, * distribute, sub license, and/or sell copies of the Software, and to * permit persons to whom the Software is furnished to do so, subject to * the following conditions: * * The above copyright notice and this permission notice (including the * next paragraph) shall be included in all copies or substantial portions * of the Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. * **************************************************************************/ /** * @file * Poor-man profiling. * * @author José Fonseca * * @sa http://blogs.msdn.com/joshpoley/archive/2008/03/12/poor-man-s-profiler.aspx * @sa http://www.johnpanzer.com/aci_cuj/index.html */ #include "pipe/p_config.h" #if defined(PROFILE) && defined(PIPE_SUBSYSTEM_WINDOWS_DISPLAY) #include #include #include "pipe/p_debug.h" #include "util/u_string.h" #define PROFILE_TABLE_SIZE (1024*1024) #define FILE_NAME_SIZE 256 struct debug_profile_entry { uintptr_t caller; uintptr_t callee; uint64_t samples; }; static unsigned long enabled = 0; static WCHAR wFileName[FILE_NAME_SIZE] = L"\\??\\c:\\00000000.prof"; static ULONG_PTR iFile = 0; static struct debug_profile_entry *table = NULL; static unsigned long free_table_entries = 0; static unsigned long max_table_entries = 0; uint64_t start_stamp = 0; uint64_t end_stamp = 0; static void debug_profile_entry(uintptr_t caller, uintptr_t callee, uint64_t samples) { unsigned hash = ( caller + callee ) & PROFILE_TABLE_SIZE - 1; while(1) { if(table[hash].caller == 0 && table[hash].callee == 0) { table[hash].caller = caller; table[hash].callee = callee; table[hash].samples = samples; --free_table_entries; break; } else if(table[hash].caller == caller && table[hash].callee == callee) { table[hash].samples += samples; break; } else { ++hash; } } } static uintptr_t caller_stack[1024]; static unsigned last_caller = 0; static int64_t delta(void) { int64_t result = end_stamp - start_stamp; if(result > UINT64_C(0xffffffff)) result = 0; return result; } static void __cdecl debug_profile_enter(uintptr_t callee) { uintptr_t caller = last_caller ? caller_stack[last_caller - 1] : 0; if (caller) debug_profile_entry(caller, 0, delta()); debug_profile_entry(caller, callee, 1); caller_stack[last_caller++] = callee; } static void __cdecl debug_profile_exit(uintptr_t callee) { debug_profile_entry(callee, 0, delta()); if(last_caller) --last_caller; } /** * Called at the start of every method or function. * * @sa http://msdn.microsoft.com/en-us/library/c63a9b7h.aspx */ void __declspec(naked) __cdecl _penter(void) { _asm { push eax mov eax, [enabled] test eax, eax jz skip push edx rdtsc mov dword ptr [end_stamp], eax mov dword ptr [end_stamp+4], edx xor eax, eax mov [enabled], eax mov eax, [esp+8] push ebx push ecx push ebp push edi push esi push eax call debug_profile_enter add esp, 4 pop esi pop edi pop ebp pop ecx pop ebx mov eax, 1 mov [enabled], eax rdtsc mov dword ptr [start_stamp], eax mov dword ptr [start_stamp+4], edx pop edx skip: pop eax ret } } /** * Called at the end of Calls the end of every method or function. * * @sa http://msdn.microsoft.com/en-us/library/xc11y76y.aspx */ void __declspec(naked) __cdecl _pexit(void) { _asm { push eax mov eax, [enabled] test eax, eax jz skip push edx rdtsc mov dword ptr [end_stamp], eax mov dword ptr [end_stamp+4], edx xor eax, eax mov [enabled], eax mov eax, [esp+8] push ebx push ecx push ebp push edi push esi push eax call debug_profile_exit add esp, 4 pop esi pop edi pop ebp pop ecx pop ebx mov eax, 1 mov [enabled], eax rdtsc mov dword ptr [start_stamp], eax mov dword ptr [start_stamp+4], edx pop edx skip: pop eax ret } } /** * Reference function for calibration. */ void __declspec(naked) __debug_profile_reference(void) { _asm { call _penter call _pexit ret } } void debug_profile_start(void) { WCHAR *p; // increment starting from the less significant digit p = &wFileName[14]; while(1) { if(*p == '9') { *p-- = '0'; } else { *p += 1; break; } } table = EngMapFile(wFileName, PROFILE_TABLE_SIZE*sizeof(struct debug_profile_entry), &iFile); if(table) { unsigned i; free_table_entries = max_table_entries = PROFILE_TABLE_SIZE; memset(table, 0, PROFILE_TABLE_SIZE*sizeof(struct debug_profile_entry)); table[0].caller = (uintptr_t)&__debug_profile_reference; table[0].callee = 0; table[0].samples = 0; --free_table_entries; _asm { push edx push eax rdtsc mov dword ptr [start_stamp], eax mov dword ptr [start_stamp+4], edx pop edx pop eax } last_caller = 0; enabled = 1; for(i = 0; i < 8; ++i) { _asm { call __debug_profile_reference } } } } void debug_profile_stop(void) { enabled = 0; if(iFile) EngUnmapFile(iFile); iFile = 0; table = NULL; free_table_entries = max_table_entries = 0; } #endif /* PROFILE */