xref: /original-bsd/usr.bin/gprof/gprof.c (revision 4ec22e22)
1 /*
2  * Copyright (c) 1983 Regents of the University of California.
3  * All rights reserved.
4  *
5  * %sccs.include.redist.c%
6  */
7 
8 #ifndef lint
9 char copyright[] =
10 "@(#) Copyright (c) 1983 Regents of the University of California.\n\
11  All rights reserved.\n";
12 #endif /* not lint */
13 
14 #ifndef lint
15 static char sccsid[] = "@(#)gprof.c	5.6 (Berkeley) 06/01/90";
16 #endif /* not lint */
17 
18 #include "gprof.h"
19 
20 char	*whoami = "gprof";
21 
22     /*
23      *	things which get -E excluded by default.
24      */
25 char	*defaultEs[] = { "mcount" , "__mcleanup" , 0 };
26 
27 main(argc, argv)
28     int argc;
29     char **argv;
30 {
31     char	**sp;
32     nltype	**timesortnlp;
33 
34     --argc;
35     argv++;
36     debug = 0;
37     bflag = TRUE;
38     while ( *argv != 0 && **argv == '-' ) {
39 	(*argv)++;
40 	switch ( **argv ) {
41 	case 'a':
42 	    aflag = TRUE;
43 	    break;
44 	case 'b':
45 	    bflag = FALSE;
46 	    break;
47 	case 'c':
48 	    cflag = TRUE;
49 	    break;
50 	case 'd':
51 	    dflag = TRUE;
52 	    (*argv)++;
53 	    debug |= atoi( *argv );
54 	    debug |= ANYDEBUG;
55 #	    ifdef DEBUG
56 		printf("[main] debug = %d\n", debug);
57 #	    else not DEBUG
58 		printf("%s: -d ignored\n", whoami);
59 #	    endif DEBUG
60 	    break;
61 	case 'E':
62 	    ++argv;
63 	    addlist( Elist , *argv );
64 	    Eflag = TRUE;
65 	    addlist( elist , *argv );
66 	    eflag = TRUE;
67 	    break;
68 	case 'e':
69 	    addlist( elist , *++argv );
70 	    eflag = TRUE;
71 	    break;
72 	case 'F':
73 	    ++argv;
74 	    addlist( Flist , *argv );
75 	    Fflag = TRUE;
76 	    addlist( flist , *argv );
77 	    fflag = TRUE;
78 	    break;
79 	case 'f':
80 	    addlist( flist , *++argv );
81 	    fflag = TRUE;
82 	    break;
83 	case 'k':
84 	    addlist( kfromlist , *++argv );
85 	    addlist( ktolist , *++argv );
86 	    kflag = TRUE;
87 	    break;
88 	case 's':
89 	    sflag = TRUE;
90 	    break;
91 	case 'z':
92 	    zflag = TRUE;
93 	    break;
94 	}
95 	argv++;
96     }
97     if ( *argv != 0 ) {
98 	a_outname  = *argv;
99 	argv++;
100     } else {
101 	a_outname  = A_OUTNAME;
102     }
103     if ( *argv != 0 ) {
104 	gmonname = *argv;
105 	argv++;
106     } else {
107 	gmonname = GMONNAME;
108     }
109 	/*
110 	 *	turn off default functions
111 	 */
112     for ( sp = &defaultEs[0] ; *sp ; sp++ ) {
113 	Eflag = TRUE;
114 	addlist( Elist , *sp );
115 	eflag = TRUE;
116 	addlist( elist , *sp );
117     }
118 	/*
119 	 *	how many ticks per second?
120 	 *	if we can't tell, report time in ticks.
121 	 */
122     hz = hertz();
123     if (hz == 0) {
124 	hz = 1;
125 	fprintf(stderr, "time is in ticks, not seconds\n");
126     }
127 	/*
128 	 *	get information about a.out file.
129 	 */
130     getnfile();
131 	/*
132 	 *	get information about mon.out file(s).
133 	 */
134     do	{
135 	getpfile( gmonname );
136 	if ( *argv != 0 ) {
137 	    gmonname = *argv;
138 	}
139     } while ( *argv++ != 0 );
140 	/*
141 	 *	dump out a gmon.sum file if requested
142 	 */
143     if ( sflag ) {
144 	dumpsum( GMONSUM );
145     }
146 	/*
147 	 *	assign samples to procedures
148 	 */
149     asgnsamples();
150 	/*
151 	 *	assemble the dynamic profile
152 	 */
153     timesortnlp = doarcs();
154 	/*
155 	 *	print the dynamic profile
156 	 */
157     printgprof( timesortnlp );
158 	/*
159 	 *	print the flat profile
160 	 */
161     printprof();
162 	/*
163 	 *	print the index
164 	 */
165     printindex();
166     done();
167 }
168 
169     /*
170      * Set up string and symbol tables from a.out.
171      *	and optionally the text space.
172      * On return symbol table is sorted by value.
173      */
174 getnfile()
175 {
176     FILE	*nfile;
177     int		valcmp();
178 
179     nfile = fopen( a_outname ,"r");
180     if (nfile == NULL) {
181 	perror( a_outname );
182 	done();
183     }
184     fread(&xbuf, 1, sizeof(xbuf), nfile);
185     if (N_BADMAG(xbuf)) {
186 	fprintf(stderr, "%s: %s: bad format\n", whoami , a_outname );
187 	done();
188     }
189     getstrtab(nfile);
190     getsymtab(nfile);
191     gettextspace( nfile );
192     qsort(nl, nname, sizeof(nltype), valcmp);
193     fclose(nfile);
194 #   ifdef DEBUG
195 	if ( debug & AOUTDEBUG ) {
196 	    register int j;
197 
198 	    for (j = 0; j < nname; j++){
199 		printf("[getnfile] 0X%08x\t%s\n", nl[j].value, nl[j].name);
200 	    }
201 	}
202 #   endif DEBUG
203 }
204 
205 getstrtab(nfile)
206     FILE	*nfile;
207 {
208 
209     fseek(nfile, (long)(N_SYMOFF(xbuf) + xbuf.a_syms), 0);
210     if (fread(&ssiz, sizeof (ssiz), 1, nfile) == 0) {
211 	fprintf(stderr, "%s: %s: no string table (old format?)\n" ,
212 		whoami , a_outname );
213 	done();
214     }
215     strtab = (char *)calloc(ssiz, 1);
216     if (strtab == NULL) {
217 	fprintf(stderr, "%s: %s: no room for %d bytes of string table",
218 		whoami , a_outname , ssiz);
219 	done();
220     }
221     if (fread(strtab+sizeof(ssiz), ssiz-sizeof(ssiz), 1, nfile) != 1) {
222 	fprintf(stderr, "%s: %s: error reading string table\n",
223 		whoami , a_outname );
224 	done();
225     }
226 }
227 
228     /*
229      * Read in symbol table
230      */
231 getsymtab(nfile)
232     FILE	*nfile;
233 {
234     register long	i;
235     int			askfor;
236     struct nlist	nbuf;
237 
238     /* pass1 - count symbols */
239     fseek(nfile, (long)N_SYMOFF(xbuf), 0);
240     nname = 0;
241     for (i = xbuf.a_syms; i > 0; i -= sizeof(struct nlist)) {
242 	fread(&nbuf, sizeof(nbuf), 1, nfile);
243 	if ( ! funcsymbol( &nbuf ) ) {
244 	    continue;
245 	}
246 	nname++;
247     }
248     if (nname == 0) {
249 	fprintf(stderr, "%s: %s: no symbols\n", whoami , a_outname );
250 	done();
251     }
252     askfor = nname + 1;
253     nl = (nltype *) calloc( askfor , sizeof(nltype) );
254     if (nl == 0) {
255 	fprintf(stderr, "%s: No room for %d bytes of symbol table\n",
256 		whoami, askfor * sizeof(nltype) );
257 	done();
258     }
259 
260     /* pass2 - read symbols */
261     fseek(nfile, (long)N_SYMOFF(xbuf), 0);
262     npe = nl;
263     nname = 0;
264     for (i = xbuf.a_syms; i > 0; i -= sizeof(struct nlist)) {
265 	fread(&nbuf, sizeof(nbuf), 1, nfile);
266 	if ( ! funcsymbol( &nbuf ) ) {
267 #	    ifdef DEBUG
268 		if ( debug & AOUTDEBUG ) {
269 		    printf( "[getsymtab] rejecting: 0x%x %s\n" ,
270 			    nbuf.n_type , strtab + nbuf.n_un.n_strx );
271 		}
272 #	    endif DEBUG
273 	    continue;
274 	}
275 	npe->value = nbuf.n_value;
276 	npe->name = strtab+nbuf.n_un.n_strx;
277 #	ifdef DEBUG
278 	    if ( debug & AOUTDEBUG ) {
279 		printf( "[getsymtab] %d %s 0x%08x\n" ,
280 			nname , npe -> name , npe -> value );
281 	    }
282 #	endif DEBUG
283 	npe++;
284 	nname++;
285     }
286     npe->value = -1;
287 }
288 
289     /*
290      *	read in the text space of an a.out file
291      */
292 gettextspace( nfile )
293     FILE	*nfile;
294 {
295     char	*malloc();
296 
297     if ( cflag == 0 ) {
298 	return;
299     }
300     textspace = (u_char *) malloc( xbuf.a_text );
301     if ( textspace == 0 ) {
302 	fprintf( stderr , "%s: ran out room for %d bytes of text space:  " ,
303 			whoami , xbuf.a_text );
304 	fprintf( stderr , "can't do -c\n" );
305 	return;
306     }
307     (void) fseek( nfile , N_TXTOFF( xbuf ) , 0 );
308     if ( fread( textspace , 1 , xbuf.a_text , nfile ) != xbuf.a_text ) {
309 	fprintf( stderr , "%s: couldn't read text space:  " , whoami );
310 	fprintf( stderr , "can't do -c\n" );
311 	free( textspace );
312 	textspace = 0;
313 	return;
314     }
315 }
316     /*
317      *	information from a gmon.out file is in two parts:
318      *	an array of sampling hits within pc ranges,
319      *	and the arcs.
320      */
321 getpfile(filename)
322     char *filename;
323 {
324     FILE		*pfile;
325     FILE		*openpfile();
326     struct rawarc	arc;
327 
328     pfile = openpfile(filename);
329     readsamples(pfile);
330 	/*
331 	 *	the rest of the file consists of
332 	 *	a bunch of <from,self,count> tuples.
333 	 */
334     while ( fread( &arc , sizeof arc , 1 , pfile ) == 1 ) {
335 #	ifdef DEBUG
336 	    if ( debug & SAMPLEDEBUG ) {
337 		printf( "[getpfile] frompc 0x%x selfpc 0x%x count %d\n" ,
338 			arc.raw_frompc , arc.raw_selfpc , arc.raw_count );
339 	    }
340 #	endif DEBUG
341 	    /*
342 	     *	add this arc
343 	     */
344 	tally( &arc );
345     }
346     fclose(pfile);
347 }
348 
349 FILE *
350 openpfile(filename)
351     char *filename;
352 {
353     struct hdr	tmp;
354     FILE	*pfile;
355 
356     if((pfile = fopen(filename, "r")) == NULL) {
357 	perror(filename);
358 	done();
359     }
360     fread(&tmp, sizeof(struct hdr), 1, pfile);
361     if ( s_highpc != 0 && ( tmp.lowpc != h.lowpc ||
362 	 tmp.highpc != h.highpc || tmp.ncnt != h.ncnt ) ) {
363 	fprintf(stderr, "%s: incompatible with first gmon file\n", filename);
364 	done();
365     }
366     h = tmp;
367     s_lowpc = (unsigned long) h.lowpc;
368     s_highpc = (unsigned long) h.highpc;
369     lowpc = (unsigned long)h.lowpc / sizeof(UNIT);
370     highpc = (unsigned long)h.highpc / sizeof(UNIT);
371     sampbytes = h.ncnt - sizeof(struct hdr);
372     nsamples = sampbytes / sizeof (UNIT);
373 #   ifdef DEBUG
374 	if ( debug & SAMPLEDEBUG ) {
375 	    printf( "[openpfile] hdr.lowpc 0x%x hdr.highpc 0x%x hdr.ncnt %d\n",
376 		h.lowpc , h.highpc , h.ncnt );
377 	    printf( "[openpfile]   s_lowpc 0x%x   s_highpc 0x%x\n" ,
378 		s_lowpc , s_highpc );
379 	    printf( "[openpfile]     lowpc 0x%x     highpc 0x%x\n" ,
380 		lowpc , highpc );
381 	    printf( "[openpfile] sampbytes %d nsamples %d\n" ,
382 		sampbytes , nsamples );
383 	}
384 #   endif DEBUG
385     return(pfile);
386 }
387 
388 tally( rawp )
389     struct rawarc	*rawp;
390 {
391     nltype		*parentp;
392     nltype		*childp;
393 
394     parentp = nllookup( rawp -> raw_frompc );
395     childp = nllookup( rawp -> raw_selfpc );
396     if ( kflag
397 	 && onlist( kfromlist , parentp -> name )
398 	 && onlist( ktolist , childp -> name ) ) {
399 	return;
400     }
401     childp -> ncall += rawp -> raw_count;
402 #   ifdef DEBUG
403 	if ( debug & TALLYDEBUG ) {
404 	    printf( "[tally] arc from %s to %s traversed %d times\n" ,
405 		    parentp -> name , childp -> name , rawp -> raw_count );
406 	}
407 #   endif DEBUG
408     addarc( parentp , childp , rawp -> raw_count );
409 }
410 
411 /*
412  * dump out the gmon.sum file
413  */
414 dumpsum( sumfile )
415     char *sumfile;
416 {
417     register nltype *nlp;
418     register arctype *arcp;
419     struct rawarc arc;
420     FILE *sfile;
421 
422     if ( ( sfile = fopen ( sumfile , "w" ) ) == NULL ) {
423 	perror( sumfile );
424 	done();
425     }
426     /*
427      * dump the header; use the last header read in
428      */
429     if ( fwrite( &h , sizeof h , 1 , sfile ) != 1 ) {
430 	perror( sumfile );
431 	done();
432     }
433     /*
434      * dump the samples
435      */
436     if (fwrite(samples, sizeof (UNIT), nsamples, sfile) != nsamples) {
437 	perror( sumfile );
438 	done();
439     }
440     /*
441      * dump the normalized raw arc information
442      */
443     for ( nlp = nl ; nlp < npe ; nlp++ ) {
444 	for ( arcp = nlp -> children ; arcp ; arcp = arcp -> arc_childlist ) {
445 	    arc.raw_frompc = arcp -> arc_parentp -> value;
446 	    arc.raw_selfpc = arcp -> arc_childp -> value;
447 	    arc.raw_count = arcp -> arc_count;
448 	    if ( fwrite ( &arc , sizeof arc , 1 , sfile ) != 1 ) {
449 		perror( sumfile );
450 		done();
451 	    }
452 #	    ifdef DEBUG
453 		if ( debug & SAMPLEDEBUG ) {
454 		    printf( "[dumpsum] frompc 0x%x selfpc 0x%x count %d\n" ,
455 			    arc.raw_frompc , arc.raw_selfpc , arc.raw_count );
456 		}
457 #	    endif DEBUG
458 	}
459     }
460     fclose( sfile );
461 }
462 
463 valcmp(p1, p2)
464     nltype *p1, *p2;
465 {
466     if ( p1 -> value < p2 -> value ) {
467 	return LESSTHAN;
468     }
469     if ( p1 -> value > p2 -> value ) {
470 	return GREATERTHAN;
471     }
472     return EQUALTO;
473 }
474 
475 readsamples(pfile)
476     FILE	*pfile;
477 {
478     register i;
479     UNIT	sample;
480 
481     if (samples == 0) {
482 	samples = (UNIT *) calloc(sampbytes, sizeof (UNIT));
483 	if (samples == 0) {
484 	    fprintf( stderr , "%s: No room for %d sample pc's\n",
485 		whoami , sampbytes / sizeof (UNIT));
486 	    done();
487 	}
488     }
489     for (i = 0; i < nsamples; i++) {
490 	fread(&sample, sizeof (UNIT), 1, pfile);
491 	if (feof(pfile))
492 		break;
493 	samples[i] += sample;
494     }
495     if (i != nsamples) {
496 	fprintf(stderr,
497 	    "%s: unexpected EOF after reading %d/%d samples\n",
498 		whoami , --i , nsamples );
499 	done();
500     }
501 }
502 
503 /*
504  *	Assign samples to the procedures to which they belong.
505  *
506  *	There are three cases as to where pcl and pch can be
507  *	with respect to the routine entry addresses svalue0 and svalue1
508  *	as shown in the following diagram.  overlap computes the
509  *	distance between the arrows, the fraction of the sample
510  *	that is to be credited to the routine which starts at svalue0.
511  *
512  *	    svalue0                                         svalue1
513  *	       |                                               |
514  *	       v                                               v
515  *
516  *	       +-----------------------------------------------+
517  *	       |					       |
518  *	  |  ->|    |<-		->|         |<-		->|    |<-  |
519  *	  |         |		  |         |		  |         |
520  *	  +---------+		  +---------+		  +---------+
521  *
522  *	  ^         ^		  ^         ^		  ^         ^
523  *	  |         |		  |         |		  |         |
524  *	 pcl       pch		 pcl       pch		 pcl       pch
525  *
526  *	For the vax we assert that samples will never fall in the first
527  *	two bytes of any routine, since that is the entry mask,
528  *	thus we give call alignentries() to adjust the entry points if
529  *	the entry mask falls in one bucket but the code for the routine
530  *	doesn't start until the next bucket.  In conjunction with the
531  *	alignment of routine addresses, this should allow us to have
532  *	only one sample for every four bytes of text space and never
533  *	have any overlap (the two end cases, above).
534  */
535 asgnsamples()
536 {
537     register int	j;
538     UNIT		ccnt;
539     double		time;
540     unsigned long	pcl, pch;
541     register int	i;
542     unsigned long	overlap;
543     unsigned long	svalue0, svalue1;
544 
545     /* read samples and assign to namelist symbols */
546     scale = highpc - lowpc;
547     scale /= nsamples;
548     alignentries();
549     for (i = 0, j = 1; i < nsamples; i++) {
550 	ccnt = samples[i];
551 	if (ccnt == 0)
552 		continue;
553 	pcl = lowpc + scale * i;
554 	pch = lowpc + scale * (i + 1);
555 	time = ccnt;
556 #	ifdef DEBUG
557 	    if ( debug & SAMPLEDEBUG ) {
558 		printf( "[asgnsamples] pcl 0x%x pch 0x%x ccnt %d\n" ,
559 			pcl , pch , ccnt );
560 	    }
561 #	endif DEBUG
562 	totime += time;
563 	for (j = j - 1; j < nname; j++) {
564 	    svalue0 = nl[j].svalue;
565 	    svalue1 = nl[j+1].svalue;
566 		/*
567 		 *	if high end of tick is below entry address,
568 		 *	go for next tick.
569 		 */
570 	    if (pch < svalue0)
571 		    break;
572 		/*
573 		 *	if low end of tick into next routine,
574 		 *	go for next routine.
575 		 */
576 	    if (pcl >= svalue1)
577 		    continue;
578 	    overlap = min(pch, svalue1) - max(pcl, svalue0);
579 	    if (overlap > 0) {
580 #		ifdef DEBUG
581 		    if (debug & SAMPLEDEBUG) {
582 			printf("[asgnsamples] (0x%x->0x%x-0x%x) %s gets %f ticks %d overlap\n",
583 				nl[j].value/sizeof(UNIT), svalue0, svalue1,
584 				nl[j].name,
585 				overlap * time / scale, overlap);
586 		    }
587 #		endif DEBUG
588 		nl[j].time += overlap * time / scale;
589 	    }
590 	}
591     }
592 #   ifdef DEBUG
593 	if (debug & SAMPLEDEBUG) {
594 	    printf("[asgnsamples] totime %f\n", totime);
595 	}
596 #   endif DEBUG
597 }
598 
599 
600 unsigned long
601 min(a, b)
602     unsigned long a,b;
603 {
604     if (a<b)
605 	return(a);
606     return(b);
607 }
608 
609 unsigned long
610 max(a, b)
611     unsigned long a,b;
612 {
613     if (a>b)
614 	return(a);
615     return(b);
616 }
617 
618     /*
619      *	calculate scaled entry point addresses (to save time in asgnsamples),
620      *	and possibly push the scaled entry points over the entry mask,
621      *	if it turns out that the entry point is in one bucket and the code
622      *	for a routine is in the next bucket.
623      */
624 alignentries()
625 {
626     register struct nl	*nlp;
627     unsigned long	bucket_of_entry;
628     unsigned long	bucket_of_code;
629 
630     for (nlp = nl; nlp < npe; nlp++) {
631 	nlp -> svalue = nlp -> value / sizeof(UNIT);
632 	bucket_of_entry = (nlp->svalue - lowpc) / scale;
633 	bucket_of_code = (nlp->svalue + UNITS_TO_CODE - lowpc) / scale;
634 	if (bucket_of_entry < bucket_of_code) {
635 #	    ifdef DEBUG
636 		if (debug & SAMPLEDEBUG) {
637 		    printf("[alignentries] pushing svalue 0x%x to 0x%x\n",
638 			    nlp->svalue, nlp->svalue + UNITS_TO_CODE);
639 		}
640 #	    endif DEBUG
641 	    nlp->svalue += UNITS_TO_CODE;
642 	}
643     }
644 }
645 
646 bool
647 funcsymbol( nlistp )
648     struct nlist	*nlistp;
649 {
650     extern char	*strtab;	/* string table from a.out */
651     extern int	aflag;		/* if static functions aren't desired */
652     char	*name;
653 
654 	/*
655 	 *	must be a text symbol,
656 	 *	and static text symbols don't qualify if aflag set.
657 	 */
658     if ( ! (  ( nlistp -> n_type == ( N_TEXT | N_EXT ) )
659 	   || ( ( nlistp -> n_type == N_TEXT ) && ( aflag == 0 ) ) ) ) {
660 	return FALSE;
661     }
662 	/*
663 	 *	can't have any `funny' characters in name,
664 	 *	where `funny' includes	`.', .o file names
665 	 *			and	`$', pascal labels.
666 	 */
667     for ( name = strtab + nlistp -> n_un.n_strx ; *name ; name += 1 ) {
668 	if ( *name == '.' || *name == '$' ) {
669 	    return FALSE;
670 	}
671     }
672     return TRUE;
673 }
674 
675 done()
676 {
677 
678     exit(0);
679 }
680