#include "gprof.h"
int valcmp(const void *, const void *);
static struct gmonhdr gmonhdr;
extern char *__progname;
long hz;
char *a_outname;
char *gmonname;
nltype *nl;
nltype *npe;
int nname;
arctype *archead;
cltype *cyclehead;
int cyclecnt;
nltype *cyclenl;
int ncycle;
int debug;
UNIT *samples;
unsigned long s_lowpc;
unsigned long s_highpc;
unsigned long lowpc, highpc;
unsigned sampbytes;
int nsamples;
double actime;
double totime;
double printtime;
double scale;
unsigned char *textspace;
int cyclethreshold;
bool aflag;
bool bflag;
bool cflag;
bool Cflag;
bool dflag;
bool eflag;
bool Eflag;
bool fflag;
bool Fflag;
bool kflag;
bool sflag;
bool zflag;
int
main(int argc, char *argv[])
{
char **sp;
nltype **timesortnlp;
char **defaultEs;
if (pledge("stdio rpath wpath cpath", NULL) == -1)
err(1, NULL);
--argc;
argv++;
debug = 0;
bflag = TRUE;
while ( *argv != 0 && **argv == '-' ) {
(*argv)++;
switch ( **argv ) {
case 'a':
aflag = TRUE;
break;
case 'b':
bflag = FALSE;
break;
case 'C':
Cflag = TRUE;
cyclethreshold = atoi( *++argv );
break;
case 'c':
#if defined(__i386__) || defined(__mips64__)
cflag = TRUE;
#else
fprintf(stderr, "%s: -c isn't supported on this architecture yet\n", __progname);
exit(1);
#endif
break;
case 'd':
dflag = TRUE;
setvbuf(stdout, NULL, _IOLBF, 0);
debug |= atoi( *++argv );
debug |= ANYDEBUG;
# ifdef DEBUG
printf("[main] debug = %d\n", debug);
# else
warnx("-d ignored");
# endif
break;
case 'E':
++argv;
addlist( Elist , *argv );
Eflag = TRUE;
addlist( elist , *argv );
eflag = TRUE;
break;
case 'e':
addlist( elist , *++argv );
eflag = TRUE;
break;
case 'F':
++argv;
addlist( Flist , *argv );
Fflag = TRUE;
addlist( flist , *argv );
fflag = TRUE;
break;
case 'f':
addlist( flist , *++argv );
fflag = TRUE;
break;
case 'k':
addlist( kfromlist , *++argv );
addlist( ktolist , *++argv );
kflag = TRUE;
break;
case 's':
sflag = TRUE;
break;
case 'z':
zflag = TRUE;
break;
}
argv++;
}
if ( *argv != 0 ) {
a_outname = *argv;
argv++;
} else {
a_outname = A_OUTNAME;
}
if ( *argv != 0 ) {
gmonname = *argv;
argv++;
} else {
gmonname = GMONNAME;
}
if ( sflag == FALSE ) {
if (pledge("stdio rpath", NULL) == -1)
err(1, "pledge");
}
if (getnfile(a_outname, &defaultEs) == -1)
errx(1, "%s: bad format", a_outname);
qsort(nl, nname, sizeof(nltype), valcmp);
for ( sp = &defaultEs[0] ; *sp ; sp++ ) {
Eflag = TRUE;
addlist( Elist , *sp );
eflag = TRUE;
addlist( elist , *sp );
}
do {
getpfile( gmonname );
if ( *argv != 0 ) {
gmonname = *argv;
}
} while ( *argv++ != 0 );
if (hz == 0) {
hz = 1;
warnx("time is in ticks, not seconds");
}
if ( sflag ) {
dumpsum( GMONSUM );
}
asgnsamples();
timesortnlp = doarcs();
printgprof( timesortnlp );
printprof();
printindex();
return (0);
}
void
getpfile(const char *filename)
{
FILE *pfile;
struct rawarc arc;
pfile = openpfile(filename);
readsamples(pfile);
while ( fread( &arc , sizeof arc , 1 , pfile ) == 1 ) {
# ifdef DEBUG
if ( debug & SAMPLEDEBUG ) {
printf( "[getpfile] frompc 0x%lx selfpc 0x%lx count %ld\n" ,
arc.raw_frompc , arc.raw_selfpc , arc.raw_count );
}
# endif
tally( &arc );
}
fclose(pfile);
}
FILE *
openpfile(const char *filename)
{
struct gmonhdr tmp;
FILE *pfile;
int size;
int rate;
if((pfile = fopen(filename, "r")) == NULL)
err(1, "fopen: %s", filename);
if (fread(&tmp, sizeof(struct gmonhdr), 1, pfile) != 1)
errx(1, "%s: bad gmon header", filename);
if ( s_highpc != 0 && ( tmp.lpc != gmonhdr.lpc ||
tmp.hpc != gmonhdr.hpc || tmp.ncnt != gmonhdr.ncnt))
errx(1, "%s: incompatible with first gmon file", filename);
gmonhdr = tmp;
if ( gmonhdr.version == GMONVERSION ) {
rate = gmonhdr.profrate;
size = sizeof(struct gmonhdr);
} else {
fseek(pfile, sizeof(struct ophdr), SEEK_SET);
size = sizeof(struct ophdr);
gmonhdr.profrate = rate = hertz();
gmonhdr.version = GMONVERSION;
}
if (hz == 0) {
hz = rate;
} else if (hz != rate)
errx(1, "%s: profile clock rate (%d) incompatible with clock rate "
"(%ld) in first gmon file", filename, rate, hz);
s_lowpc = (unsigned long) gmonhdr.lpc;
s_highpc = (unsigned long) gmonhdr.hpc;
lowpc = (unsigned long)gmonhdr.lpc / sizeof(UNIT);
highpc = (unsigned long)gmonhdr.hpc / sizeof(UNIT);
sampbytes = gmonhdr.ncnt - size;
nsamples = sampbytes / sizeof (UNIT);
# ifdef DEBUG
if ( debug & SAMPLEDEBUG ) {
printf( "[openpfile] hdr.lpc 0x%lx hdr.hpc 0x%lx hdr.ncnt %d\n",
gmonhdr.lpc , gmonhdr.hpc , gmonhdr.ncnt );
printf( "[openpfile] s_lowpc 0x%lx s_highpc 0x%lx\n" ,
s_lowpc , s_highpc );
printf( "[openpfile] lowpc 0x%lx highpc 0x%lx\n" ,
lowpc , highpc );
printf( "[openpfile] sampbytes %d nsamples %d\n" ,
sampbytes , nsamples );
printf( "[openpfile] sample rate %ld\n" , hz );
}
# endif
return(pfile);
}
void
tally(struct rawarc *rawp)
{
nltype *parentp;
nltype *childp;
parentp = nllookup( rawp -> raw_frompc );
childp = nllookup( rawp -> raw_selfpc );
if ( parentp == 0 || childp == 0 )
return;
if ( kflag
&& onlist( kfromlist , parentp -> name )
&& onlist( ktolist , childp -> name ) ) {
return;
}
childp -> ncall += rawp -> raw_count;
# ifdef DEBUG
if ( debug & TALLYDEBUG ) {
printf( "[tally] arc from %s to %s traversed %ld times\n" ,
parentp -> name , childp -> name , rawp -> raw_count );
}
# endif
addarc( parentp , childp , rawp -> raw_count );
}
void
dumpsum(const char *sumfile)
{
nltype *nlp;
arctype *arcp;
struct rawarc arc;
FILE *sfile;
if ( ( sfile = fopen ( sumfile , "w" ) ) == NULL )
err(1, "fopen: %s", sumfile);
if ( fwrite( &gmonhdr , sizeof gmonhdr , 1 , sfile ) != 1 )
err(1, "fwrite: %s", sumfile);
if (fwrite(samples, sizeof (UNIT), nsamples, sfile) != nsamples)
err(1, "fwrite: %s", sumfile);
for ( nlp = nl ; nlp < npe ; nlp++ ) {
for ( arcp = nlp -> children ; arcp ; arcp = arcp -> arc_childlist ) {
arc.raw_frompc = arcp -> arc_parentp -> value;
arc.raw_selfpc = arcp -> arc_childp -> value;
arc.raw_count = arcp -> arc_count;
if (fwrite ( &arc , sizeof arc , 1 , sfile ) != 1)
err(1, "fwrite: %s", sumfile);
# ifdef DEBUG
if ( debug & SAMPLEDEBUG ) {
printf( "[dumpsum] frompc 0x%lx selfpc 0x%lx count %ld\n" ,
arc.raw_frompc , arc.raw_selfpc , arc.raw_count );
}
# endif
}
}
fclose( sfile );
}
int
valcmp(const void *vp1, const void *vp2)
{
const nltype *p1 = vp1;
const nltype *p2 = vp2;
if ( p1 -> value < p2 -> value ) {
return LESSTHAN;
}
if ( p1 -> value > p2 -> value ) {
return GREATERTHAN;
}
return EQUALTO;
}
void
readsamples(FILE *pfile)
{
UNIT sample;
int i;
if (samples == 0) {
samples = calloc(sampbytes, sizeof (UNIT));
if (samples == 0)
errx(1, "No room for %ld sample pc's", sampbytes / sizeof (UNIT));
}
for (i = 0; i < nsamples; i++) {
fread(&sample, sizeof (UNIT), 1, pfile);
if (feof(pfile))
break;
samples[i] += sample;
}
if (i != nsamples)
errx(1, "unexpected EOF after reading %d/%d samples", i, nsamples );
}
void
asgnsamples(void)
{
int j;
UNIT ccnt;
double time;
unsigned long pcl, pch;
unsigned long i;
unsigned long overlap;
unsigned long svalue0, svalue1;
scale = highpc - lowpc;
scale /= nsamples;
alignentries();
for (i = 0, j = 1; i < nsamples; i++) {
ccnt = samples[i];
if (ccnt == 0)
continue;
pcl = lowpc + (unsigned long)(scale * i);
pch = lowpc + (unsigned long)(scale * (i + 1));
time = ccnt;
# ifdef DEBUG
if ( debug & SAMPLEDEBUG ) {
printf( "[asgnsamples] pcl 0x%lx pch 0x%lx ccnt %d\n" ,
pcl , pch , ccnt );
}
# endif
totime += time;
for (j = j - 1; j < nname; j++) {
svalue0 = nl[j].svalue;
svalue1 = nl[j+1].svalue;
if (pch < svalue0)
break;
if (pcl >= svalue1)
continue;
overlap = min(pch, svalue1) - max(pcl, svalue0);
if (overlap > 0) {
# ifdef DEBUG
if (debug & SAMPLEDEBUG) {
printf("[asgnsamples] (0x%lx->0x%lx-0x%lx) %s gets %f ticks %ld overlap\n",
nl[j].value/sizeof(UNIT), svalue0, svalue1,
nl[j].name,
overlap * time / scale, overlap);
}
# endif
nl[j].time += overlap * time / scale;
}
}
}
# ifdef DEBUG
if (debug & SAMPLEDEBUG) {
printf("[asgnsamples] totime %f\n", totime);
}
# endif
}
unsigned long
min(unsigned long a, unsigned long b)
{
if (a<b)
return(a);
return(b);
}
unsigned long
max(unsigned long a, unsigned long b)
{
if (a>b)
return(a);
return(b);
}
void
alignentries(void)
{
struct nl *nlp;
unsigned long bucket_of_entry;
unsigned long bucket_of_code;
for (nlp = nl; nlp < npe; nlp++) {
nlp -> svalue = nlp -> value / sizeof(UNIT);
bucket_of_entry = (nlp->svalue - lowpc) / scale;
bucket_of_code = (nlp->svalue + UNITS_TO_CODE - lowpc) / scale;
if (bucket_of_entry < bucket_of_code) {
# ifdef DEBUG
if (debug & SAMPLEDEBUG) {
printf("[alignentries] pushing svalue 0x%lx to 0x%lx\n",
nlp->svalue, nlp->svalue + UNITS_TO_CODE);
}
# endif
nlp->svalue += UNITS_TO_CODE;
}
}
}