rockbox/firmware/profile.c

344 lines
12 KiB
C

/***************************************************************************
* __________ __ ___.
* Open \______ \ ____ ____ | | _\_ |__ _______ ___
* Source | _// _ \_/ ___\| |/ /| __ \ / _ \ \/ /
* Jukebox | | ( <_> ) \___| < | \_\ ( <_> > < <
* Firmware |____|_ /\____/ \___ >__|_ \|___ /\____/__/\_ \
* \/ \/ \/ \/ \/
* $Id$
*
* Profiling routines counts ticks and calls to each profiled function.
*
* Copyright (C) 2005 by Brandon Low
*
* This program is free software; you can redistribute it and/or
* modify it under the terms of the GNU General Public License
* as published by the Free Software Foundation; either version 2
* of the License, or (at your option) any later version.
*
* This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY
* KIND, either express or implied.
*
****************************************************************************
*
* profile_func_enter() based on mcount found in gmon.c:
*
***************************************************************************
* Copyright (c) 1991, 1998 The Regents of the University of California.
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
* 3. [rescinded 22 July 1999]
* 4. Neither the name of the University nor the names of its contributors
* may be used to endorse or promote products derived from this software
* without specific prior written permission.
*
* THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
* @(#)gmon.c 5.3 (Berkeley) 5/22/91
*/
#include <file.h>
#include <system.h>
#include <string.h>
#include <timer.h>
#include "inttypes.h"
#include "profile.h"
/* PFD is Profiled Function Data */
/* Indices are shorts which means that we use 4k of RAM */
#define INDEX_BITS 11 /* What is a reasonable size for this? */
#define INDEX_SIZE 2048 /* 2 ^ INDEX_BITS */
#define INDEX_MASK 0x7FF /* lower INDEX_BITS 1 */
/*
* In the current setup (pfd has 4 longs and 2 shorts) this uses 20k of RAM
* for profiling, and allows for profiling sections of code with up-to
* 1024 function caller->callee pairs
*/
#define NUMPFDS 512
struct pfd_struct {
void *self_pc;
unsigned long count;
unsigned long time;
unsigned short link;
struct pfd_struct *caller;
};
/* Possible states of profiling */
#define PROF_ON 0x00
#define PROF_BUSY 0x01
#define PROF_ERROR 0x02
#define PROF_OFF 0x03
/* Masks for thread switches */
#define PROF_OFF_THREAD 0x10
#define PROF_ON_THREAD 0x0F
static unsigned short profiling = PROF_OFF;
static size_t recursion_level;
static unsigned short indices[INDEX_SIZE];
static struct pfd_struct pfds[NUMPFDS];
/* This holds a pointer to the last pfd effected for time tracking */
static struct pfd_struct *last_pfd;
/* These are used to track the time when we've lost the CPU so it doesn't count
* against any of the profiled functions */
static int profiling_thread = -1;
/* internal function prototypes */
static void profile_timer_tick(void);
static void profile_timer_unregister(void);
static void write_function_recursive(int fd, struct pfd_struct *pfd, int depth);
/* Be careful to use the right one for the size of your variable */
#ifdef CPU_COLDFIRE
#define ADDQI_L(_var,_value) \
asm ("addq.l %[value],%[var];" \
: [var] "+g" (_var) \
: [value] "I" (_value) )
#else
#define ADDQI_L(var, value) var += value
#endif
void profile_thread_stopped(int current_thread) {
if (current_thread == profiling_thread) {
/* If profiling is busy or idle */
if (profiling < PROF_ERROR) {
/* Unregister the timer so that other threads aren't interrupted */
timer_unregister();
}
/* Make sure we don't waste time profiling when we're running the
* wrong thread */
profiling |= PROF_OFF_THREAD;
}
}
void profile_thread_started(int current_thread) {
if (current_thread == profiling_thread) {
/* Now we are allowed to profile again */
profiling &= PROF_ON_THREAD;
/* if profiling was busy or idle */
if (profiling < PROF_ERROR) {
/* After we de-mask, if profiling is active, reactivate the timer */
timer_register(0, profile_timer_unregister,
TIMER_FREQ/10000, profile_timer_tick IF_COP(, 0 ) );
}
}
}
static void profile_timer_tick(void) {
if (!profiling) {
register struct pfd_struct *my_last_pfd = last_pfd;
if (my_last_pfd) {
ADDQI_L(my_last_pfd->time,1);
}
}
}
static void profile_timer_unregister(void) {
profiling = PROF_ERROR;
profstop();
}
/* This function clears the links on top level linkers, and clears the needed
* parts of memory in the index array */
void profstart(int current_thread) {
recursion_level = 0;
profiling_thread = current_thread;
last_pfd = (struct pfd_struct*)0;
pfds[0].link = 0;
pfds[0].self_pc = 0;
memset(indices,0,INDEX_SIZE * sizeof(unsigned short));
timer_register(
0, profile_timer_unregister, TIMER_FREQ/10000, profile_timer_tick IF_COP(, 0 ) );
profiling = PROF_ON;
}
static void write_function_recursive(int fd, struct pfd_struct *pfd, int depth){
unsigned short link = pfd->link;
fdprintf(fd,"0x%08lX\t%08ld\t%08ld\t%04d\n", (size_t)pfd->self_pc,
pfd->count, pfd->time, depth);
if (link > 0 && link < NUMPFDS) {
write_function_recursive(fd, &pfds[link], ++depth);
}
}
void profstop() {
int profiling_exit = profiling;
int fd = 0;
int i;
unsigned short current_index;
timer_unregister();
profiling = PROF_OFF;
fd = open("/profile.out", O_WRONLY|O_CREAT|O_TRUNC, 0666);
if (profiling_exit == PROF_ERROR) {
fdprintf(fd,"Profiling exited with an error.\n");
fdprintf(fd,"Overflow or timer stolen most likely.\n");
}
fdprintf(fd,"PROFILE_THREAD\tPFDS_USED\n");
fdprintf(fd,"%08d\t%08d\n", profiling_thread,
pfds[0].link);
fdprintf(fd,"FUNCTION_PC\tCALL_COUNT\tTICKS\t\tDEPTH\n");
for (i = 0; i < INDEX_SIZE; i++) {
current_index = indices[i];
if (current_index != 0) {
write_function_recursive(fd, &pfds[current_index], 0);
}
}
fdprintf(fd,"DEBUG PROFILE DATA FOLLOWS\n");
fdprintf(fd,"INDEX\tLOCATION\tSELF_PC\t\tCOUNT\t\tTIME\t\tLINK\tCALLER_IDX\n");
for (i = 0; i < NUMPFDS; i++) {
struct pfd_struct *my_last_pfd = &pfds[i];
if (my_last_pfd->self_pc != 0) {
fdprintf(fd,
"%04d\t0x%08lX\t0x%08lX\t0x%08lX\t0x%08lX\t%04d\t0x%08lX\n",
i, (size_t)my_last_pfd, (size_t)my_last_pfd->self_pc,
my_last_pfd->count, my_last_pfd->time, my_last_pfd->link,
(size_t)my_last_pfd->caller );
}
}
fdprintf(fd,"INDEX_ADDRESS=INDEX\n");
for (i=0; i < INDEX_SIZE; i++) {
fdprintf(fd,"%08lX=%04d\n",(size_t)&indices[i],indices[i]);
}
close(fd);
}
void __cyg_profile_func_exit(void *self_pc, void *call_site) {
(void)call_site;
(void)self_pc;
/* When we started timing, we set the time to the tick at that time
* less the time already used in function */
if (profiling) {
return;
}
profiling = PROF_BUSY;
{
register unsigned short my_recursion_level = recursion_level;
if (my_recursion_level) {
my_recursion_level--;
recursion_level = my_recursion_level;
} else {
/* This shouldn't be necessary, maybe exit could be called first */
register struct pfd_struct *my_last_pfd = last_pfd;
if (my_last_pfd) {
last_pfd = my_last_pfd->caller;
}
}
}
profiling = PROF_ON;
}
#define ALLOCATE_PFD(temp) \
temp = ++pfds[0].link;\
if (temp >= NUMPFDS) goto overflow; \
pfd = &pfds[temp];\
pfd->self_pc = self_pc; pfd->count = 1; pfd->time = 0
void __cyg_profile_func_enter(void *self_pc, void *from_pc) {
struct pfd_struct *pfd;
struct pfd_struct *prev_pfd;
unsigned short *pfd_index_pointer;
unsigned short pfd_index;
/* check that we are profiling and that we aren't recursively invoked
* this is equivalent to 'if (profiling != PROF_ON)' but it's faster */
if (profiling) {
return;
}
profiling = PROF_BUSY;
/* A check that the PC is in the code range here wouldn't hurt, but this is
* logically guaranteed to be a valid address unless the constants are
* breaking the rules. */
pfd_index_pointer = &indices[((size_t)from_pc)&INDEX_MASK];
pfd_index = *pfd_index_pointer;
if (pfd_index == 0) {
/* new caller, allocate new storage */
ALLOCATE_PFD(pfd_index);
pfd->link = 0;
*pfd_index_pointer = pfd_index;
goto done;
}
pfd = &pfds[pfd_index];
if (pfd->self_pc == self_pc) {
/* only / most recent function called by this caller, usual case */
/* increment count, start timing and exit */
goto found;
}
/* collision, bad for performance, look down the list of functions called by
* colliding PCs */
for (; /* goto done */; ) {
pfd_index = pfd->link;
if (pfd_index == 0) {
/* no more previously called functions, allocate a new one */
ALLOCATE_PFD(pfd_index);
/* this function becomes the new head, link to the old head */
pfd->link = *pfd_index_pointer;
/* and set the index to point to this function */
*pfd_index_pointer = pfd_index;
/* start timing and exit */
goto done;
}
/* move along the chain */
prev_pfd = pfd;
pfd = &pfds[pfd_index];
if (pfd->self_pc == self_pc) {
/* found ourself */
/* Remove me from my old spot */
prev_pfd->link = pfd->link;
/* Link to the old head */
pfd->link = *pfd_index_pointer;
/* Make me head */
*pfd_index_pointer = pfd_index;
/* increment count, start timing and exit */
goto found;
}
}
/* We've found a pfd, increment it */
found:
ADDQI_L(pfd->count,1);
/* We've (found or created) and updated our pfd, save it and start timing */
done:
{
register struct pfd_struct *my_last_pfd = last_pfd;
if (pfd != my_last_pfd) {
/* If we are not recursing */
pfd->caller = my_last_pfd;
last_pfd = pfd;
} else {
ADDQI_L(recursion_level,1);
}
}
/* Start timing this function */
profiling = PROF_ON;
return; /* normal return restores saved registers */
overflow:
/* this is the same as 'profiling = PROF_ERROR' */
profiling = PROF_ERROR;
return;
}