xref: /freebsd-src/cddl/contrib/opensolaris/cmd/lockstat/lockstat.c (revision f4f5e69c84df74e8834aed173af1127b1ff50970)
17e1e3d94SStacey Son /*
27e1e3d94SStacey Son  * CDDL HEADER START
37e1e3d94SStacey Son  *
47e1e3d94SStacey Son  * The contents of this file are subject to the terms of the
57e1e3d94SStacey Son  * Common Development and Distribution License (the "License").
67e1e3d94SStacey Son  * You may not use this file except in compliance with the License.
77e1e3d94SStacey Son  *
87e1e3d94SStacey Son  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
97e1e3d94SStacey Son  * or http://www.opensolaris.org/os/licensing.
107e1e3d94SStacey Son  * See the License for the specific language governing permissions
117e1e3d94SStacey Son  * and limitations under the License.
127e1e3d94SStacey Son  *
137e1e3d94SStacey Son  * When distributing Covered Code, include this CDDL HEADER in each
147e1e3d94SStacey Son  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
157e1e3d94SStacey Son  * If applicable, add the following below this CDDL HEADER, with the
167e1e3d94SStacey Son  * fields enclosed by brackets "[]" replaced with your own identifying
177e1e3d94SStacey Son  * information: Portions Copyright [yyyy] [name of copyright owner]
187e1e3d94SStacey Son  *
197e1e3d94SStacey Son  * CDDL HEADER END
207e1e3d94SStacey Son  */
217e1e3d94SStacey Son /*
227e1e3d94SStacey Son  * Copyright 2008 Sun Microsystems, Inc.  All rights reserved.
237e1e3d94SStacey Son  * Use is subject to license terms.
247e1e3d94SStacey Son  */
257e1e3d94SStacey Son 
267e1e3d94SStacey Son #pragma ident	"%Z%%M%	%I%	%E% SMI"
277e1e3d94SStacey Son 
287e1e3d94SStacey Son #include <stdio.h>
297e1e3d94SStacey Son #include <stddef.h>
307e1e3d94SStacey Son #include <stdlib.h>
317e1e3d94SStacey Son #include <stdarg.h>
327e1e3d94SStacey Son #include <string.h>
337e1e3d94SStacey Son #include <strings.h>
347e1e3d94SStacey Son #include <ctype.h>
357e1e3d94SStacey Son #include <fcntl.h>
367e1e3d94SStacey Son #include <unistd.h>
377e1e3d94SStacey Son #include <errno.h>
387e1e3d94SStacey Son #include <limits.h>
397e1e3d94SStacey Son #include <sys/types.h>
407e1e3d94SStacey Son #include <sys/modctl.h>
417e1e3d94SStacey Son #include <sys/stat.h>
427e1e3d94SStacey Son #include <sys/wait.h>
437e1e3d94SStacey Son #include <dtrace.h>
447e1e3d94SStacey Son #include <sys/lockstat.h>
457e1e3d94SStacey Son #include <alloca.h>
467e1e3d94SStacey Son #include <signal.h>
477e1e3d94SStacey Son #include <assert.h>
487e1e3d94SStacey Son 
/*
 * Platform shims.  illumos builds take getopt's end marker from EOF; every
 * other platform uses -1 and additionally gets the resource headers, a
 * mergesort() -> lsmergesort() redirection (presumably to avoid clashing
 * with a libc routine of the same name), and a local pc_t type.
 */
#ifndef illumos
#include <sys/time.h>
#include <sys/resource.h>

#define	mergesort(a, b, c, d)	lsmergesort(a, b, c, d)
#define	GETOPT_EOF		(-1)

typedef	uintptr_t	pc_t;
#else
#define	GETOPT_EOF	EOF
#endif
607e1e3d94SStacey Son 
/* Command-line option letters (presumably handed to getopt()). */
#define	LOCKSTAT_OPTSTR	"x:bths:n:d:i:l:f:e:ckwWgCHEATID:RpPo:V"

/* Capacity of lsrec_t.ls_stack[] and of the per-event tables, respectively. */
#define	LS_MAX_STACK_DEPTH	50
#define	LS_MAX_EVENTS		64
657e1e3d94SStacey Son 
667e1e3d94SStacey Son typedef struct lsrec {
677e1e3d94SStacey Son 	struct lsrec	*ls_next;	/* next in hash chain */
683142b376SMark Johnston #ifdef illumos
697e1e3d94SStacey Son 	uintptr_t	ls_lock;	/* lock address */
703142b376SMark Johnston #else
713142b376SMark Johnston 	char		*ls_lock;	/* lock name */
723142b376SMark Johnston #endif
737e1e3d94SStacey Son 	uintptr_t	ls_caller;	/* caller address */
747e1e3d94SStacey Son 	uint32_t	ls_count;	/* cumulative event count */
757e1e3d94SStacey Son 	uint32_t	ls_event;	/* type of event */
767e1e3d94SStacey Son 	uintptr_t	ls_refcnt;	/* cumulative reference count */
777e1e3d94SStacey Son 	uint64_t	ls_time;	/* cumulative event duration */
787e1e3d94SStacey Son 	uint32_t	ls_hist[64];	/* log2(duration) histogram */
797e1e3d94SStacey Son 	uintptr_t	ls_stack[LS_MAX_STACK_DEPTH];
807e1e3d94SStacey Son } lsrec_t;
817e1e3d94SStacey Son 
/* Cursor over a pool of lsrec_t records plus a running record count. */
typedef struct lsdata {
	struct lsrec	*lsd_next;	/* next free record */
	int		lsd_count;	/* how many records so far */
} lsdata_t;
867e1e3d94SStacey Son 
/*
 * Experiment types, cheapest first (in both memory and processing time).
 * Each macro evaluates to the number of bytes of lsrec_t that the experiment
 * needs, i.e. the offset of the first field it does NOT record:
 *
 *	LS_BASIC	everything before ls_time
 *	LS_TIME		... plus ls_time
 *	LS_HIST		... plus the whole ls_hist[] array
 *	LS_STACK(d)	... plus the first d entries of ls_stack[]
 */
#define	LS_BASIC	offsetof(lsrec_t, ls_time)
#define	LS_TIME		offsetof(lsrec_t, ls_hist[0])
#define	LS_HIST		offsetof(lsrec_t, ls_stack[0])
#define	LS_STACK(depth)	offsetof(lsrec_t, ls_stack[depth])
967e1e3d94SStacey Son 
977e1e3d94SStacey Son static void report_stats(FILE *, lsrec_t **, size_t, uint64_t, uint64_t);
987e1e3d94SStacey Son static void report_trace(FILE *, lsrec_t **);
997e1e3d94SStacey Son 
1007e1e3d94SStacey Son extern int symtab_init(void);
1017e1e3d94SStacey Son extern char *addr_to_sym(uintptr_t, uintptr_t *, size_t *);
1027e1e3d94SStacey Son extern uintptr_t sym_to_addr(char *name);
1037e1e3d94SStacey Son extern size_t sym_size(char *name);
1047e1e3d94SStacey Son extern char *strtok_r(char *, const char *, char **);
1057e1e3d94SStacey Son 
/* Defaults advertised by usage(): record limit and profiling rate in Hz. */
#define	DEFAULT_NRECS	10000
#define	DEFAULT_HZ	97

/* Upper bound on the profiling rate and bounds on the aggregation size. */
#define	MAX_HZ		1000
#define	MIN_AGGSIZE	(16 * 1024)
#define	MAX_AGGSIZE	(32 * 1024 * 1024)
1117e1e3d94SStacey Son 
1127e1e3d94SStacey Son static int g_stkdepth;
1137e1e3d94SStacey Son static int g_topn = INT_MAX;
1147e1e3d94SStacey Son static hrtime_t g_elapsed;
1157e1e3d94SStacey Son static int g_rates = 0;
1167e1e3d94SStacey Son static int g_pflag = 0;
1177e1e3d94SStacey Son static int g_Pflag = 0;
1187e1e3d94SStacey Son static int g_wflag = 0;
1197e1e3d94SStacey Son static int g_Wflag = 0;
1207e1e3d94SStacey Son static int g_cflag = 0;
1217e1e3d94SStacey Son static int g_kflag = 0;
1227e1e3d94SStacey Son static int g_gflag = 0;
1237e1e3d94SStacey Son static int g_Vflag = 0;
1247e1e3d94SStacey Son static int g_tracing = 0;
1257e1e3d94SStacey Son static size_t g_recsize;
1267e1e3d94SStacey Son static size_t g_nrecs;
1277e1e3d94SStacey Son static int g_nrecs_used;
1287e1e3d94SStacey Son static uchar_t g_enabled[LS_MAX_EVENTS];
1297e1e3d94SStacey Son static hrtime_t g_min_duration[LS_MAX_EVENTS];
1307e1e3d94SStacey Son static dtrace_hdl_t *g_dtp;
1317e1e3d94SStacey Son static char *g_predicate;
1327e1e3d94SStacey Son static char *g_ipredicate;
1337e1e3d94SStacey Son static char *g_prog;
1347e1e3d94SStacey Son static int g_proglen;
1357e1e3d94SStacey Son static int g_dropped;
1367e1e3d94SStacey Son 
1377e1e3d94SStacey Son typedef struct ls_event_info {
1387e1e3d94SStacey Son 	char	ev_type;
1397e1e3d94SStacey Son 	char	ev_lhdr[20];
1407e1e3d94SStacey Son 	char	ev_desc[80];
1417e1e3d94SStacey Son 	char	ev_units[10];
1427e1e3d94SStacey Son 	char	ev_name[DTRACE_NAMELEN];
1437e1e3d94SStacey Son 	char	*ev_predicate;
1447e1e3d94SStacey Son 	char	*ev_acquire;
1457e1e3d94SStacey Son } ls_event_info_t;
1467e1e3d94SStacey Son 
1477e1e3d94SStacey Son static ls_event_info_t g_event_info[LS_MAX_EVENTS] = {
1487e1e3d94SStacey Son 	{ 'C',	"Lock",	"Adaptive mutex spin",			"nsec",
1497e1e3d94SStacey Son 	    "lockstat:::adaptive-spin" },
1507e1e3d94SStacey Son 	{ 'C',	"Lock",	"Adaptive mutex block",			"nsec",
1517e1e3d94SStacey Son 	    "lockstat:::adaptive-block" },
1527e1e3d94SStacey Son 	{ 'C',	"Lock",	"Spin lock spin",			"nsec",
1537e1e3d94SStacey Son 	    "lockstat:::spin-spin" },
1547e1e3d94SStacey Son 	{ 'C',	"Lock",	"Thread lock spin",			"nsec",
1557e1e3d94SStacey Son 	    "lockstat:::thread-spin" },
1567e1e3d94SStacey Son 	{ 'C',	"Lock",	"R/W writer blocked by writer",		"nsec",
1577e1e3d94SStacey Son 	    "lockstat:::rw-block", "arg2 == 0 && arg3 == 1" },
1587e1e3d94SStacey Son 	{ 'C',	"Lock",	"R/W writer blocked by readers",	"nsec",
1597e1e3d94SStacey Son 	    "lockstat:::rw-block", "arg2 == 0 && arg3 == 0 && arg4" },
1607e1e3d94SStacey Son 	{ 'C',	"Lock",	"R/W reader blocked by writer",		"nsec",
1615b699f16SMark Johnston 	    "lockstat:::rw-block", "arg2 == 1 && arg3 == 1" },
1627e1e3d94SStacey Son 	{ 'C',	"Lock",	"R/W reader blocked by write wanted",	"nsec",
1635b699f16SMark Johnston 	    "lockstat:::rw-block", "arg2 == 1 && arg3 == 0 && arg4" },
164076dd8ebSAndriy Gapon 	{ 'C',	"Lock",	"R/W writer spin on writer",		"nsec",
165076dd8ebSAndriy Gapon 	    "lockstat:::rw-spin", "arg2 == 0 && arg3 == 1" },
166076dd8ebSAndriy Gapon 	{ 'C',	"Lock",	"R/W writer spin on readers",		"nsec",
167076dd8ebSAndriy Gapon 	    "lockstat:::rw-spin", "arg2 == 0 && arg3 == 0 && arg4" },
168076dd8ebSAndriy Gapon 	{ 'C',	"Lock",	"R/W reader spin on writer",		"nsec",
1695b699f16SMark Johnston 	    "lockstat:::rw-spin", "arg2 == 1 && arg3 == 1" },
170076dd8ebSAndriy Gapon 	{ 'C',	"Lock",	"R/W reader spin on write wanted",	"nsec",
1715b699f16SMark Johnston 	    "lockstat:::rw-spin", "arg2 == 1 && arg3 == 0 && arg4" },
172076dd8ebSAndriy Gapon 	{ 'C',	"Lock",	"SX exclusive block",			"nsec",
173076dd8ebSAndriy Gapon 	    "lockstat:::sx-block", "arg2 == 0" },
174076dd8ebSAndriy Gapon 	{ 'C',	"Lock",	"SX shared block",			"nsec",
1755b699f16SMark Johnston 	    "lockstat:::sx-block", "arg2 == 1" },
176076dd8ebSAndriy Gapon 	{ 'C',	"Lock",	"SX exclusive spin",			"nsec",
177076dd8ebSAndriy Gapon 	    "lockstat:::sx-spin", "arg2 == 0" },
178076dd8ebSAndriy Gapon 	{ 'C',	"Lock",	"SX shared spin",			"nsec",
1795b699f16SMark Johnston 	    "lockstat:::sx-spin", "arg2 == 1" },
1805b699f16SMark Johnston 	{ 'C',	"Lock",	"lockmgr writer blocked by writer",	"nsec",
1815b699f16SMark Johnston 	    "lockstat:::lockmgr-block", "arg2 == 0 && arg3 == 1" },
1825b699f16SMark Johnston 	{ 'C',	"Lock",	"lockmgr writer blocked by readers",	"nsec",
1835b699f16SMark Johnston 	    "lockstat:::lockmgr-block", "arg2 == 0 && arg3 == 0 && arg4" },
1845b699f16SMark Johnston 	{ 'C',	"Lock",	"lockmgr reader blocked by writer",	"nsec",
1855b699f16SMark Johnston 	    "lockstat:::lockmgr-block", "arg2 == 1 && arg3 == 1" },
1865b699f16SMark Johnston 	{ 'C',	"Lock",	"lockmgr reader blocked by write wanted", "nsec",
1875b699f16SMark Johnston 	    "lockstat:::lockmgr-block", "arg2 == 1 && arg3 == 0 && arg4" },
1887e1e3d94SStacey Son 	{ 'C',	"Lock",	"Unknown event (type 20)",		"units"	},
1897e1e3d94SStacey Son 	{ 'C',	"Lock",	"Unknown event (type 21)",		"units"	},
1907e1e3d94SStacey Son 	{ 'C',	"Lock",	"Unknown event (type 22)",		"units"	},
1917e1e3d94SStacey Son 	{ 'C',	"Lock",	"Unknown event (type 23)",		"units"	},
1927e1e3d94SStacey Son 	{ 'C',	"Lock",	"Unknown event (type 24)",		"units"	},
1937e1e3d94SStacey Son 	{ 'C',	"Lock",	"Unknown event (type 25)",		"units"	},
1947e1e3d94SStacey Son 	{ 'C',	"Lock",	"Unknown event (type 26)",		"units"	},
1957e1e3d94SStacey Son 	{ 'C',	"Lock",	"Unknown event (type 27)",		"units"	},
1967e1e3d94SStacey Son 	{ 'C',	"Lock",	"Unknown event (type 28)",		"units"	},
1977e1e3d94SStacey Son 	{ 'C',	"Lock",	"Unknown event (type 29)",		"units"	},
1987e1e3d94SStacey Son 	{ 'C',	"Lock",	"Unknown event (type 30)",		"units"	},
1997e1e3d94SStacey Son 	{ 'C',	"Lock",	"Unknown event (type 31)",		"units"	},
2007e1e3d94SStacey Son 	{ 'H',	"Lock",	"Adaptive mutex hold",			"nsec",
2017e1e3d94SStacey Son 	    "lockstat:::adaptive-release", NULL,
2027e1e3d94SStacey Son 	    "lockstat:::adaptive-acquire" },
2037e1e3d94SStacey Son 	{ 'H',	"Lock",	"Spin lock hold",			"nsec",
2047e1e3d94SStacey Son 	    "lockstat:::spin-release", NULL,
2057e1e3d94SStacey Son 	    "lockstat:::spin-acquire" },
2067e1e3d94SStacey Son 	{ 'H',	"Lock",	"R/W writer hold",			"nsec",
207de2c95ccSMark Johnston 	    "lockstat:::rw-release", "arg1 == 0",
208de2c95ccSMark Johnston 	    "lockstat:::rw-acquire" },
2097e1e3d94SStacey Son 	{ 'H',	"Lock",	"R/W reader hold",			"nsec",
210de2c95ccSMark Johnston 	    "lockstat:::rw-release", "arg1 == 1",
211de2c95ccSMark Johnston 	    "lockstat:::rw-acquire" },
212076dd8ebSAndriy Gapon 	{ 'H',	"Lock",	"SX shared hold",			"nsec",
2136ad06a5eSMark Johnston 	    "lockstat:::sx-release", "arg1 == 1",
214de2c95ccSMark Johnston 	    "lockstat:::sx-acquire" },
215076dd8ebSAndriy Gapon 	{ 'H',	"Lock",	"SX exclusive hold",			"nsec",
2166ad06a5eSMark Johnston 	    "lockstat:::sx-release", "arg1 == 0",
217de2c95ccSMark Johnston 	    "lockstat:::sx-acquire" },
218e1a29d8cSMark Johnston 	{ 'H',	"Lock",	"lockmgr shared hold",			"nsec",
219e1a29d8cSMark Johnston 	    "lockstat:::lockmgr-release", "arg1 == 1",
220e1a29d8cSMark Johnston 	    "lockstat:::lockmgr-acquire" },
221e1a29d8cSMark Johnston 	{ 'H',	"Lock",	"lockmgr exclusive hold",		"nsec",
222e1a29d8cSMark Johnston 	    "lockstat:::lockmgr-release,lockstat:::lockmgr-disown", "arg1 == 0",
223e1a29d8cSMark Johnston 	    "lockstat:::lockmgr-acquire" },
2247e1e3d94SStacey Son 	{ 'H',	"Lock",	"Unknown event (type 40)",		"units"	},
2257e1e3d94SStacey Son 	{ 'H',	"Lock",	"Unknown event (type 41)",		"units"	},
2267e1e3d94SStacey Son 	{ 'H',	"Lock",	"Unknown event (type 42)",		"units"	},
2277e1e3d94SStacey Son 	{ 'H',	"Lock",	"Unknown event (type 43)",		"units"	},
2287e1e3d94SStacey Son 	{ 'H',	"Lock",	"Unknown event (type 44)",		"units"	},
2297e1e3d94SStacey Son 	{ 'H',	"Lock",	"Unknown event (type 45)",		"units"	},
2307e1e3d94SStacey Son 	{ 'H',	"Lock",	"Unknown event (type 46)",		"units"	},
2317e1e3d94SStacey Son 	{ 'H',	"Lock",	"Unknown event (type 47)",		"units"	},
2327e1e3d94SStacey Son 	{ 'H',	"Lock",	"Unknown event (type 48)",		"units"	},
2337e1e3d94SStacey Son 	{ 'H',	"Lock",	"Unknown event (type 49)",		"units"	},
2347e1e3d94SStacey Son 	{ 'H',	"Lock",	"Unknown event (type 50)",		"units"	},
2357e1e3d94SStacey Son 	{ 'H',	"Lock",	"Unknown event (type 51)",		"units"	},
2367e1e3d94SStacey Son 	{ 'H',	"Lock",	"Unknown event (type 52)",		"units"	},
2377e1e3d94SStacey Son 	{ 'H',	"Lock",	"Unknown event (type 53)",		"units"	},
2387e1e3d94SStacey Son 	{ 'H',	"Lock",	"Unknown event (type 54)",		"units"	},
2397e1e3d94SStacey Son 	{ 'H',	"Lock",	"Unknown event (type 55)",		"units"	},
240bc96366cSSteven Hartland #ifdef illumos
2417e1e3d94SStacey Son 	{ 'I',	"CPU+PIL", "Profiling interrupt",		"nsec",
2427e1e3d94SStacey Son #else
2437e1e3d94SStacey Son 	{ 'I',	"CPU+Pri_Class", "Profiling interrupt",		"nsec",
2447e1e3d94SStacey Son #endif
2457e1e3d94SStacey Son 	    "profile:::profile-97", NULL },
2467e1e3d94SStacey Son 	{ 'I',	"Lock",	"Unknown event (type 57)",		"units"	},
2477e1e3d94SStacey Son 	{ 'I',	"Lock",	"Unknown event (type 58)",		"units"	},
2487e1e3d94SStacey Son 	{ 'I',	"Lock",	"Unknown event (type 59)",		"units"	},
2497e1e3d94SStacey Son 	{ 'E',	"Lock",	"Recursive lock entry detected",	"(N/A)",
2507e1e3d94SStacey Son 	    "lockstat:::rw-release", NULL, "lockstat:::rw-acquire" },
2517e1e3d94SStacey Son 	{ 'E',	"Lock",	"Lockstat enter failure",		"(N/A)"	},
2527e1e3d94SStacey Son 	{ 'E',	"Lock",	"Lockstat exit failure",		"nsec"	},
2537e1e3d94SStacey Son 	{ 'E',	"Lock",	"Lockstat record failure",		"(N/A)"	},
2547e1e3d94SStacey Son };
2557e1e3d94SStacey Son 
#ifndef illumos
/*
 * Short labels for priority classes on non-illumos builds; slot 0 is the
 * empty string.  (How the index is derived is not visible here.)
 */
static char *g_pri_class[] = {
	"",		/* 0 */
	"Intr",		/* 1 */
	"RealT",	/* 2 */
	"TShar",	/* 3 */
	"Idle"		/* 4 */
};
#endif
2657e1e3d94SStacey Son 
/*
 * Report a fatal error and terminate with exit status 2.
 *
 * Writes "lockstat: " followed by the printf-style message to stderr.  When
 * do_perror is nonzero the text for the errno value that was current on
 * entry is appended after ": ".  A newline ends the line.  Never returns.
 */
static void
fail(int do_perror, const char *message, ...)
{
	/* Snapshot errno first: the stdio calls below may overwrite it. */
	const int entry_errno = errno;
	va_list ap;

	va_start(ap, message);
	(void) fprintf(stderr, "lockstat: ");
	(void) vfprintf(stderr, message, ap);
	va_end(ap);

	if (do_perror != 0)
		(void) fprintf(stderr, ": %s", strerror(entry_errno));

	(void) fprintf(stderr, "\n");
	exit(2);
}
2817e1e3d94SStacey Son 
2827e1e3d94SStacey Son static void
dfail(const char * message,...)2837e1e3d94SStacey Son dfail(const char *message, ...)
2847e1e3d94SStacey Son {
2857e1e3d94SStacey Son 	va_list args;
2867e1e3d94SStacey Son 
2877e1e3d94SStacey Son 	va_start(args, message);
2887e1e3d94SStacey Son 	(void) fprintf(stderr, "lockstat: ");
2897e1e3d94SStacey Son 	(void) vfprintf(stderr, message, args);
2907e1e3d94SStacey Son 	va_end(args);
2917e1e3d94SStacey Son 	(void) fprintf(stderr, ": %s\n",
2927e1e3d94SStacey Son 	    dtrace_errmsg(g_dtp, dtrace_errno(g_dtp)));
2937e1e3d94SStacey Son 
2947e1e3d94SStacey Son 	exit(2);
2957e1e3d94SStacey Son }
2967e1e3d94SStacey Son 
2977e1e3d94SStacey Son static void
show_events(char event_type,char * desc)2987e1e3d94SStacey Son show_events(char event_type, char *desc)
2997e1e3d94SStacey Son {
3007e1e3d94SStacey Son 	int i, first = -1, last;
3017e1e3d94SStacey Son 
3027e1e3d94SStacey Son 	for (i = 0; i < LS_MAX_EVENTS; i++) {
3037e1e3d94SStacey Son 		ls_event_info_t *evp = &g_event_info[i];
3047e1e3d94SStacey Son 		if (evp->ev_type != event_type ||
3057e1e3d94SStacey Son 		    strncmp(evp->ev_desc, "Unknown event", 13) == 0)
3067e1e3d94SStacey Son 			continue;
3077e1e3d94SStacey Son 		if (first == -1)
3087e1e3d94SStacey Son 			first = i;
3097e1e3d94SStacey Son 		last = i;
3107e1e3d94SStacey Son 	}
3117e1e3d94SStacey Son 
3127e1e3d94SStacey Son 	(void) fprintf(stderr,
3137e1e3d94SStacey Son 	    "\n%s events (lockstat -%c or lockstat -e %d-%d):\n\n",
3147e1e3d94SStacey Son 	    desc, event_type, first, last);
3157e1e3d94SStacey Son 
3167e1e3d94SStacey Son 	for (i = first; i <= last; i++)
3177e1e3d94SStacey Son 		(void) fprintf(stderr,
3187e1e3d94SStacey Son 		    "%4d = %s\n", i, g_event_info[i].ev_desc);
3197e1e3d94SStacey Son }
3207e1e3d94SStacey Son 
3217e1e3d94SStacey Son static void
usage(void)3227e1e3d94SStacey Son usage(void)
3237e1e3d94SStacey Son {
3247e1e3d94SStacey Son 	(void) fprintf(stderr,
3257e1e3d94SStacey Son 	    "Usage: lockstat [options] command [args]\n"
3269b055b74SMark Johnston 	    "\nGeneral options:\n\n"
3279b055b74SMark Johnston 	    "  -V              print the corresponding D program\n"
3287e1e3d94SStacey Son 	    "\nEvent selection options:\n\n"
3297e1e3d94SStacey Son 	    "  -C              watch contention events [on by default]\n"
3307e1e3d94SStacey Son 	    "  -E              watch error events [off by default]\n"
3317e1e3d94SStacey Son 	    "  -H              watch hold events [off by default]\n"
3327e1e3d94SStacey Son 	    "  -I              watch interrupt events [off by default]\n"
3337e1e3d94SStacey Son 	    "  -A              watch all lock events [equivalent to -CH]\n"
3347e1e3d94SStacey Son 	    "  -e event_list   only watch the specified events (shown below);\n"
3357e1e3d94SStacey Son 	    "                  <event_list> is a comma-separated list of\n"
3367e1e3d94SStacey Son 	    "                  events or ranges of events, e.g. 1,4-7,35\n"
3377e1e3d94SStacey Son 	    "  -i rate         interrupt rate for -I [default: %d Hz]\n"
3387e1e3d94SStacey Son 	    "\nData gathering options:\n\n"
3397e1e3d94SStacey Son 	    "  -b              basic statistics (lock, caller, event count)\n"
3407e1e3d94SStacey Son 	    "  -t              timing for all events [default]\n"
3417e1e3d94SStacey Son 	    "  -h              histograms for event times\n"
3427e1e3d94SStacey Son 	    "  -s depth        stack traces <depth> deep\n"
3437e1e3d94SStacey Son 	    "  -x opt[=val]    enable or modify DTrace options\n"
3447e1e3d94SStacey Son 	    "\nData filtering options:\n\n"
3457e1e3d94SStacey Son 	    "  -n nrecords     maximum number of data records [default: %d]\n"
3467e1e3d94SStacey Son 	    "  -l lock[,size]  only watch <lock>, which can be specified as a\n"
3477e1e3d94SStacey Son 	    "                  symbolic name or hex address; <size> defaults\n"
3487e1e3d94SStacey Son 	    "                  to the ELF symbol size if available, 1 if not\n"
3497e1e3d94SStacey Son 	    "  -f func[,size]  only watch events generated by <func>\n"
3507e1e3d94SStacey Son 	    "  -d duration     only watch events longer than <duration>\n"
3517e1e3d94SStacey Son 	    "  -T              trace (rather than sample) events\n"
3527e1e3d94SStacey Son 	    "\nData reporting options:\n\n"
3533142b376SMark Johnston #ifdef illumos
3547e1e3d94SStacey Son 	    "  -c              coalesce lock data for arrays like pse_mutex[]\n"
3553142b376SMark Johnston #endif
3567e1e3d94SStacey Son 	    "  -k              coalesce PCs within functions\n"
3577e1e3d94SStacey Son 	    "  -g              show total events generated by function\n"
3587e1e3d94SStacey Son 	    "  -w              wherever: don't distinguish events by caller\n"
3597e1e3d94SStacey Son 	    "  -W              whichever: don't distinguish events by lock\n"
3607e1e3d94SStacey Son 	    "  -R              display rates rather than counts\n"
3617e1e3d94SStacey Son 	    "  -p              parsable output format (awk(1)-friendly)\n"
3627e1e3d94SStacey Son 	    "  -P              sort lock data by (count * avg_time) product\n"
3637e1e3d94SStacey Son 	    "  -D n            only display top <n> events of each type\n"
3647e1e3d94SStacey Son 	    "  -o filename     send output to <filename>\n",
3657e1e3d94SStacey Son 	    DEFAULT_HZ, DEFAULT_NRECS);
3667e1e3d94SStacey Son 
3677e1e3d94SStacey Son 	show_events('C', "Contention");
3687e1e3d94SStacey Son 	show_events('H', "Hold-time");
3697e1e3d94SStacey Son 	show_events('I', "Interrupt");
3707e1e3d94SStacey Son 	show_events('E', "Error");
3717e1e3d94SStacey Son 	(void) fprintf(stderr, "\n");
3727e1e3d94SStacey Son 
3737e1e3d94SStacey Son 	exit(1);
3747e1e3d94SStacey Son }
3757e1e3d94SStacey Son 
3767e1e3d94SStacey Son static int
lockcmp(lsrec_t * a,lsrec_t * b)3777e1e3d94SStacey Son lockcmp(lsrec_t *a, lsrec_t *b)
3787e1e3d94SStacey Son {
3797e1e3d94SStacey Son 	int i;
3807e1e3d94SStacey Son 
3817e1e3d94SStacey Son 	if (a->ls_event < b->ls_event)
3827e1e3d94SStacey Son 		return (-1);
3837e1e3d94SStacey Son 	if (a->ls_event > b->ls_event)
3847e1e3d94SStacey Son 		return (1);
3857e1e3d94SStacey Son 
3867e1e3d94SStacey Son 	for (i = g_stkdepth - 1; i >= 0; i--) {
3877e1e3d94SStacey Son 		if (a->ls_stack[i] < b->ls_stack[i])
3887e1e3d94SStacey Son 			return (-1);
3897e1e3d94SStacey Son 		if (a->ls_stack[i] > b->ls_stack[i])
3907e1e3d94SStacey Son 			return (1);
3917e1e3d94SStacey Son 	}
3927e1e3d94SStacey Son 
3937e1e3d94SStacey Son 	if (a->ls_caller < b->ls_caller)
3947e1e3d94SStacey Son 		return (-1);
3957e1e3d94SStacey Son 	if (a->ls_caller > b->ls_caller)
3967e1e3d94SStacey Son 		return (1);
3977e1e3d94SStacey Son 
3983142b376SMark Johnston #ifdef illumos
3997e1e3d94SStacey Son 	if (a->ls_lock < b->ls_lock)
4007e1e3d94SStacey Son 		return (-1);
4017e1e3d94SStacey Son 	if (a->ls_lock > b->ls_lock)
4027e1e3d94SStacey Son 		return (1);
4037e1e3d94SStacey Son 
4047e1e3d94SStacey Son 	return (0);
4053142b376SMark Johnston #else
4063142b376SMark Johnston 	return (strcmp(a->ls_lock, b->ls_lock));
4073142b376SMark Johnston #endif
4087e1e3d94SStacey Son }
4097e1e3d94SStacey Son 
4107e1e3d94SStacey Son static int
countcmp(lsrec_t * a,lsrec_t * b)4117e1e3d94SStacey Son countcmp(lsrec_t *a, lsrec_t *b)
4127e1e3d94SStacey Son {
4137e1e3d94SStacey Son 	if (a->ls_event < b->ls_event)
4147e1e3d94SStacey Son 		return (-1);
4157e1e3d94SStacey Son 	if (a->ls_event > b->ls_event)
4167e1e3d94SStacey Son 		return (1);
4177e1e3d94SStacey Son 
4187e1e3d94SStacey Son 	return (b->ls_count - a->ls_count);
4197e1e3d94SStacey Son }
4207e1e3d94SStacey Son 
4217e1e3d94SStacey Son static int
timecmp(lsrec_t * a,lsrec_t * b)4227e1e3d94SStacey Son timecmp(lsrec_t *a, lsrec_t *b)
4237e1e3d94SStacey Son {
4247e1e3d94SStacey Son 	if (a->ls_event < b->ls_event)
4257e1e3d94SStacey Son 		return (-1);
4267e1e3d94SStacey Son 	if (a->ls_event > b->ls_event)
4277e1e3d94SStacey Son 		return (1);
4287e1e3d94SStacey Son 
4297e1e3d94SStacey Son 	if (a->ls_time < b->ls_time)
4307e1e3d94SStacey Son 		return (1);
4317e1e3d94SStacey Son 	if (a->ls_time > b->ls_time)
4327e1e3d94SStacey Son 		return (-1);
4337e1e3d94SStacey Son 
4347e1e3d94SStacey Son 	return (0);
4357e1e3d94SStacey Son }
4367e1e3d94SStacey Son 
4377e1e3d94SStacey Son static int
lockcmp_anywhere(lsrec_t * a,lsrec_t * b)4387e1e3d94SStacey Son lockcmp_anywhere(lsrec_t *a, lsrec_t *b)
4397e1e3d94SStacey Son {
4407e1e3d94SStacey Son 	if (a->ls_event < b->ls_event)
4417e1e3d94SStacey Son 		return (-1);
4427e1e3d94SStacey Son 	if (a->ls_event > b->ls_event)
4437e1e3d94SStacey Son 		return (1);
4447e1e3d94SStacey Son 
4453142b376SMark Johnston #ifdef illumos
4467e1e3d94SStacey Son 	if (a->ls_lock < b->ls_lock)
4477e1e3d94SStacey Son 		return (-1);
4487e1e3d94SStacey Son 	if (a->ls_lock > b->ls_lock)
4497e1e3d94SStacey Son 		return (1);
4507e1e3d94SStacey Son 
4517e1e3d94SStacey Son 	return (0);
4523142b376SMark Johnston #else
4533142b376SMark Johnston 	return (strcmp(a->ls_lock, b->ls_lock));
4543142b376SMark Johnston #endif
4557e1e3d94SStacey Son }
4567e1e3d94SStacey Son 
4577e1e3d94SStacey Son static int
lock_and_count_cmp_anywhere(lsrec_t * a,lsrec_t * b)4587e1e3d94SStacey Son lock_and_count_cmp_anywhere(lsrec_t *a, lsrec_t *b)
4597e1e3d94SStacey Son {
4603142b376SMark Johnston #ifndef illumos
4613142b376SMark Johnston 	int cmp;
4623142b376SMark Johnston #endif
4633142b376SMark Johnston 
4647e1e3d94SStacey Son 	if (a->ls_event < b->ls_event)
4657e1e3d94SStacey Son 		return (-1);
4667e1e3d94SStacey Son 	if (a->ls_event > b->ls_event)
4677e1e3d94SStacey Son 		return (1);
4687e1e3d94SStacey Son 
4693142b376SMark Johnston #ifdef illumos
4707e1e3d94SStacey Son 	if (a->ls_lock < b->ls_lock)
4717e1e3d94SStacey Son 		return (-1);
4727e1e3d94SStacey Son 	if (a->ls_lock > b->ls_lock)
4737e1e3d94SStacey Son 		return (1);
4743142b376SMark Johnston #else
4753142b376SMark Johnston 	cmp = strcmp(a->ls_lock, b->ls_lock);
4763142b376SMark Johnston 	if (cmp != 0)
4773142b376SMark Johnston 		return (cmp);
4783142b376SMark Johnston #endif
4797e1e3d94SStacey Son 
4807e1e3d94SStacey Son 	return (b->ls_count - a->ls_count);
4817e1e3d94SStacey Son }
4827e1e3d94SStacey Son 
4837e1e3d94SStacey Son static int
sitecmp_anylock(lsrec_t * a,lsrec_t * b)4847e1e3d94SStacey Son sitecmp_anylock(lsrec_t *a, lsrec_t *b)
4857e1e3d94SStacey Son {
4867e1e3d94SStacey Son 	int i;
4877e1e3d94SStacey Son 
4887e1e3d94SStacey Son 	if (a->ls_event < b->ls_event)
4897e1e3d94SStacey Son 		return (-1);
4907e1e3d94SStacey Son 	if (a->ls_event > b->ls_event)
4917e1e3d94SStacey Son 		return (1);
4927e1e3d94SStacey Son 
4937e1e3d94SStacey Son 	for (i = g_stkdepth - 1; i >= 0; i--) {
4947e1e3d94SStacey Son 		if (a->ls_stack[i] < b->ls_stack[i])
4957e1e3d94SStacey Son 			return (-1);
4967e1e3d94SStacey Son 		if (a->ls_stack[i] > b->ls_stack[i])
4977e1e3d94SStacey Son 			return (1);
4987e1e3d94SStacey Son 	}
4997e1e3d94SStacey Son 
5007e1e3d94SStacey Son 	if (a->ls_caller < b->ls_caller)
5017e1e3d94SStacey Son 		return (-1);
5027e1e3d94SStacey Son 	if (a->ls_caller > b->ls_caller)
5037e1e3d94SStacey Son 		return (1);
5047e1e3d94SStacey Son 
5057e1e3d94SStacey Son 	return (0);
5067e1e3d94SStacey Son }
5077e1e3d94SStacey Son 
5087e1e3d94SStacey Son static int
site_and_count_cmp_anylock(lsrec_t * a,lsrec_t * b)5097e1e3d94SStacey Son site_and_count_cmp_anylock(lsrec_t *a, lsrec_t *b)
5107e1e3d94SStacey Son {
5117e1e3d94SStacey Son 	int i;
5127e1e3d94SStacey Son 
5137e1e3d94SStacey Son 	if (a->ls_event < b->ls_event)
5147e1e3d94SStacey Son 		return (-1);
5157e1e3d94SStacey Son 	if (a->ls_event > b->ls_event)
5167e1e3d94SStacey Son 		return (1);
5177e1e3d94SStacey Son 
5187e1e3d94SStacey Son 	for (i = g_stkdepth - 1; i >= 0; i--) {
5197e1e3d94SStacey Son 		if (a->ls_stack[i] < b->ls_stack[i])
5207e1e3d94SStacey Son 			return (-1);
5217e1e3d94SStacey Son 		if (a->ls_stack[i] > b->ls_stack[i])
5227e1e3d94SStacey Son 			return (1);
5237e1e3d94SStacey Son 	}
5247e1e3d94SStacey Son 
5257e1e3d94SStacey Son 	if (a->ls_caller < b->ls_caller)
5267e1e3d94SStacey Son 		return (-1);
5277e1e3d94SStacey Son 	if (a->ls_caller > b->ls_caller)
5287e1e3d94SStacey Son 		return (1);
5297e1e3d94SStacey Son 
5307e1e3d94SStacey Son 	return (b->ls_count - a->ls_count);
5317e1e3d94SStacey Son }
5327e1e3d94SStacey Son 
5337e1e3d94SStacey Son static void
lsmergesort(int (* cmp)(lsrec_t *,lsrec_t *),lsrec_t ** a,lsrec_t ** b,int n)5347e1e3d94SStacey Son lsmergesort(int (*cmp)(lsrec_t *, lsrec_t *), lsrec_t **a, lsrec_t **b, int n)
5357e1e3d94SStacey Son {
5367e1e3d94SStacey Son 	int m = n / 2;
5377e1e3d94SStacey Son 	int i, j;
5387e1e3d94SStacey Son 
5397e1e3d94SStacey Son 	if (m > 1)
5407e1e3d94SStacey Son 		lsmergesort(cmp, a, b, m);
5417e1e3d94SStacey Son 	if (n - m > 1)
5427e1e3d94SStacey Son 		lsmergesort(cmp, a + m, b + m, n - m);
5437e1e3d94SStacey Son 	for (i = m; i > 0; i--)
5447e1e3d94SStacey Son 		b[i - 1] = a[i - 1];
5457e1e3d94SStacey Son 	for (j = m - 1; j < n - 1; j++)
5467e1e3d94SStacey Son 		b[n + m - j - 2] = a[j + 1];
5477e1e3d94SStacey Son 	while (i < j)
5487e1e3d94SStacey Son 		*a++ = cmp(b[i], b[j]) < 0 ? b[i++] : b[j--];
5497e1e3d94SStacey Son 	*a = b[i];
5507e1e3d94SStacey Son }
5517e1e3d94SStacey Son 
5527e1e3d94SStacey Son static void
coalesce(int (* cmp)(lsrec_t *,lsrec_t *),lsrec_t ** lock,int n)5537e1e3d94SStacey Son coalesce(int (*cmp)(lsrec_t *, lsrec_t *), lsrec_t **lock, int n)
5547e1e3d94SStacey Son {
5557e1e3d94SStacey Son 	int i, j;
5567e1e3d94SStacey Son 	lsrec_t *target, *current;
5577e1e3d94SStacey Son 
5587e1e3d94SStacey Son 	target = lock[0];
5597e1e3d94SStacey Son 
5607e1e3d94SStacey Son 	for (i = 1; i < n; i++) {
5617e1e3d94SStacey Son 		current = lock[i];
5627e1e3d94SStacey Son 		if (cmp(current, target) != 0) {
5637e1e3d94SStacey Son 			target = current;
5647e1e3d94SStacey Son 			continue;
5657e1e3d94SStacey Son 		}
5667e1e3d94SStacey Son 		current->ls_event = LS_MAX_EVENTS;
5677e1e3d94SStacey Son 		target->ls_count += current->ls_count;
5687e1e3d94SStacey Son 		target->ls_refcnt += current->ls_refcnt;
5697e1e3d94SStacey Son 		if (g_recsize < LS_TIME)
5707e1e3d94SStacey Son 			continue;
5717e1e3d94SStacey Son 		target->ls_time += current->ls_time;
5727e1e3d94SStacey Son 		if (g_recsize < LS_HIST)
5737e1e3d94SStacey Son 			continue;
5747e1e3d94SStacey Son 		for (j = 0; j < 64; j++)
5757e1e3d94SStacey Son 			target->ls_hist[j] += current->ls_hist[j];
5767e1e3d94SStacey Son 	}
5777e1e3d94SStacey Son }
5787e1e3d94SStacey Son 
/*
 * Round *addrp down to the start of the symbol that contains it.  The
 * address is left alone when addr_to_sym() finds no symbol, or when the
 * reported offset is not smaller than the reported symbol size.
 */
static void
coalesce_symbol(uintptr_t *addrp)
{
	uintptr_t offset;
	size_t extent;

	if (addr_to_sym(*addrp, &offset, &extent) == NULL)
		return;

	if (offset < extent)
		*addrp -= offset;
}
5887e1e3d94SStacey Son 
/*
 * AND one more clause onto the heap-allocated predicate string *pred.
 *
 * pred:  address of the predicate; *pred may be NULL or "" for "no predicate
 *        yet".  On return *pred points to a newly allocated string and the
 *        old one has been freed.
 * what:  left-hand side of the clause; NULL makes the call a no-op.
 * cmp:   comparison operator text, or NULL to use "what" alone as the clause.
 * value: right-hand side, formatted with %p; ignored when cmp is NULL.
 *
 * The clause is "what cmp value" (or just "what").  If a predicate already
 * exists the result is "(old) && (clause)", otherwise the bare clause.
 *
 * An allocation failure, or a formatted result that would not fit the
 * buffer, prints a message to stderr and exits with status 2 rather than
 * dereferencing NULL or writing past the end of the allocation.
 */
static void
predicate_add(char **pred, char *what, char *cmp, uintptr_t value)
{
	const char *old;
	char *new;
	size_t newlen;
	int n;

	if (what == NULL)
		return;

	old = (*pred != NULL) ? *pred : "";

	/*
	 * Room for both strings, the operator, the literal punctuation and
	 * a generous allowance for the %p text and the terminating NUL.
	 */
	newlen = strlen(old) + strlen(what) +
	    (cmp != NULL ? strlen(cmp) : 0) + 32 + strlen("( && )");
	new = malloc(newlen);
	if (new == NULL) {
		(void) fprintf(stderr,
		    "lockstat: could not allocate predicate: %s\n",
		    strerror(errno));
		exit(2);
	}

	if (old[0] != '\0') {
		if (cmp != NULL) {
			n = snprintf(new, newlen, "(%s) && (%s %s %p)",
			    old, what, cmp, (void *)value);
		} else {
			n = snprintf(new, newlen, "(%s) && (%s)", old, what);
		}
	} else {
		if (cmp != NULL) {
			n = snprintf(new, newlen, "%s %s %p",
			    what, cmp, (void *)value);
		} else {
			n = snprintf(new, newlen, "%s", what);
		}
	}

	/* %p output is implementation-defined; never accept a cut-off clause. */
	if (n < 0 || (size_t)n >= newlen) {
		(void) fprintf(stderr,
		    "lockstat: predicate could not be formatted\n");
		exit(2);
	}

	free(*pred);
	*pred = new;
}
6267e1e3d94SStacey Son 
/*
 * Release the predicate string held in *pred and reset *pred to NULL so the
 * caller can start building a new predicate.
 */
static void
predicate_destroy(char **pred)
{
	char *old = *pred;

	*pred = NULL;
	free(old);
}
6337e1e3d94SStacey Son 
/*
 * Format of one filter clause: the existing filter text, a separator, then
 * the range test.  The illumos variant spells out the "0x" prefix itself;
 * the other variant relies on %p alone.
 */
#ifdef illumos
#define	FILTER_ADD_FMT	"%s%s(%s >= 0x%p && %s < 0x%p)"
#else
#define	FILTER_ADD_FMT	"%s%s(%s >= %p && %s < %p)"
#endif

/*
 * Or a new address-range clause onto the filter string held in *filt.
 *
 *   filt   in/out; NULL or an empty string means "no filter yet".  The old
 *          string is freed and replaced by a newly malloc()ed one.
 *   what   the D expression to range-check.
 *   base   inclusive lower bound of the range.
 *   size   range length; the exclusive upper bound is base + size.
 *
 * Clauses after the first are joined with " || ".  The result is formatted
 * directly into an exactly sized heap buffer, so the length of 'what' is not
 * limited by any fixed-size scratch buffer.
 */
static void
filter_add(char **filt, char *what, uintptr_t base, size_t size)
{
	const char *old = (*filt != NULL) ? *filt : "";
	const char *sep = (old[0] != '\0') ? " || " : "";
	void *lo = (void *)base;
	void *hi = (void *)(base + size);
	char *new;
	int len;

	/* First pass only measures; nothing is written. */
	len = snprintf(NULL, 0, FILTER_ADD_FMT, old, sep, what, lo, what, hi);

	if (len < 0 || (new = malloc((size_t)len + 1)) == NULL) {
		(void) fprintf(stderr, "lockstat: failed to allocate filter\n");
		exit(EXIT_FAILURE);
	}

	(void) snprintf(new, (size_t)len + 1, FILTER_ADD_FMT,
	    old, sep, what, lo, what, hi);

	free(*filt);
	*filt = new;
}
6607e1e3d94SStacey Son 
/*
 * Release the filter string held in *filt and reset *filt to NULL.
 */
static void
filter_destroy(char **filt)
{
	char *old = *filt;

	*filt = NULL;
	free(old);
}
6677e1e3d94SStacey Son 
6687e1e3d94SStacey Son static void
dprog_add(const char * fmt,...)6697e1e3d94SStacey Son dprog_add(const char *fmt, ...)
6707e1e3d94SStacey Son {
6717e1e3d94SStacey Son 	va_list args;
6727e1e3d94SStacey Son 	int size, offs;
6737e1e3d94SStacey Son 	char c;
6747e1e3d94SStacey Son 
6757e1e3d94SStacey Son 	va_start(args, fmt);
6767e1e3d94SStacey Son 	size = vsnprintf(&c, 1, fmt, args) + 1;
6777e1e3d94SStacey Son 	va_end(args);
6787e1e3d94SStacey Son 
6797e1e3d94SStacey Son 	if (g_proglen == 0) {
6807e1e3d94SStacey Son 		offs = 0;
6817e1e3d94SStacey Son 	} else {
6827e1e3d94SStacey Son 		offs = g_proglen - 1;
6837e1e3d94SStacey Son 	}
6847e1e3d94SStacey Son 
6857e1e3d94SStacey Son 	g_proglen = offs + size;
6867e1e3d94SStacey Son 
6877e1e3d94SStacey Son 	if ((g_prog = realloc(g_prog, g_proglen)) == NULL)
6887e1e3d94SStacey Son 		fail(1, "failed to reallocate program text");
6897e1e3d94SStacey Son 
6907e1e3d94SStacey Son 	va_start(args, fmt);
6917e1e3d94SStacey Son 	(void) vsnprintf(&g_prog[offs], size, fmt, args);
6927e1e3d94SStacey Son 	va_end(args);
6937e1e3d94SStacey Son }
6947e1e3d94SStacey Son 
6957e1e3d94SStacey Son /*
6967e1e3d94SStacey Son  * This function may read like an open sewer, but keep in mind that programs
6977e1e3d94SStacey Son  * that generate other programs are rarely pretty.  If one has the unenviable
6987e1e3d94SStacey Son  * task of maintaining or -- worse -- extending this code, use the -V option
6997e1e3d94SStacey Son  * to examine the D program as generated by this function.
7007e1e3d94SStacey Son  */
7017e1e3d94SStacey Son static void
dprog_addevent(int event)7027e1e3d94SStacey Son dprog_addevent(int event)
7037e1e3d94SStacey Son {
7047e1e3d94SStacey Son 	ls_event_info_t *info = &g_event_info[event];
7057e1e3d94SStacey Son 	char *pred = NULL;
7067e1e3d94SStacey Son 	char stack[20];
7077e1e3d94SStacey Son 	const char *arg0, *caller;
7087e1e3d94SStacey Son 	char *arg1 = "arg1";
7097e1e3d94SStacey Son 	char buf[80];
7107e1e3d94SStacey Son 	hrtime_t dur;
7117e1e3d94SStacey Son 	int depth;
7127e1e3d94SStacey Son 
7137e1e3d94SStacey Son 	if (info->ev_name[0] == '\0')
7147e1e3d94SStacey Son 		return;
7157e1e3d94SStacey Son 
7167e1e3d94SStacey Son 	if (info->ev_type == 'I') {
7177e1e3d94SStacey Son 		/*
7187e1e3d94SStacey Son 		 * For interrupt events, arg0 (normally the lock pointer) is
7197e1e3d94SStacey Son 		 * the CPU address plus the current pil, and arg1 (normally
7207e1e3d94SStacey Son 		 * the number of nanoseconds) is the number of nanoseconds
7217e1e3d94SStacey Son 		 * late -- and it's stored in arg2.
7227e1e3d94SStacey Son 		 */
723bc96366cSSteven Hartland #ifdef illumos
7247e1e3d94SStacey Son 		arg0 = "(uintptr_t)curthread->t_cpu + \n"
7257e1e3d94SStacey Son 		    "\t    curthread->t_cpu->cpu_profile_pil";
7267e1e3d94SStacey Son #else
7277e1e3d94SStacey Son 		arg0 = "(uintptr_t)(curthread->td_oncpu << 16) + \n"
7287e1e3d94SStacey Son 		    "\t    0x01000000 + curthread->td_pri_class";
7297e1e3d94SStacey Son #endif
7307e1e3d94SStacey Son 		caller = "(uintptr_t)arg0";
7317e1e3d94SStacey Son 		arg1 = "arg2";
7327e1e3d94SStacey Son 	} else {
7333142b376SMark Johnston #ifdef illumos
7347e1e3d94SStacey Son 		arg0 = "(uintptr_t)arg0";
7353142b376SMark Johnston #else
7363142b376SMark Johnston 		arg0 = "stringof(args[0]->lock_object.lo_name)";
7373142b376SMark Johnston #endif
7387e1e3d94SStacey Son 		caller = "caller";
7397e1e3d94SStacey Son 	}
7407e1e3d94SStacey Son 
7417e1e3d94SStacey Son 	if (g_recsize > LS_HIST) {
7427e1e3d94SStacey Son 		for (depth = 0; g_recsize > LS_STACK(depth); depth++)
7437e1e3d94SStacey Son 			continue;
7447e1e3d94SStacey Son 
7457e1e3d94SStacey Son 		if (g_tracing) {
7467e1e3d94SStacey Son 			(void) sprintf(stack, "\tstack(%d);\n", depth);
7477e1e3d94SStacey Son 		} else {
7487e1e3d94SStacey Son 			(void) sprintf(stack, ", stack(%d)", depth);
7497e1e3d94SStacey Son 		}
7507e1e3d94SStacey Son 	} else {
7517e1e3d94SStacey Son 		(void) sprintf(stack, "");
7527e1e3d94SStacey Son 	}
7537e1e3d94SStacey Son 
7547e1e3d94SStacey Son 	if (info->ev_acquire != NULL) {
7557e1e3d94SStacey Son 		/*
7567e1e3d94SStacey Son 		 * If this is a hold event, we need to generate an additional
7577e1e3d94SStacey Son 		 * clause for the acquire; the clause for the release will be
7587e1e3d94SStacey Son 		 * generated with the aggregating statement, below.
7597e1e3d94SStacey Son 		 */
7607e1e3d94SStacey Son 		dprog_add("%s\n", info->ev_acquire);
7617e1e3d94SStacey Son 		predicate_add(&pred, info->ev_predicate, NULL, 0);
7627e1e3d94SStacey Son 		predicate_add(&pred, g_predicate, NULL, 0);
7637e1e3d94SStacey Son 		if (pred != NULL)
7647e1e3d94SStacey Son 			dprog_add("/%s/\n", pred);
7657e1e3d94SStacey Son 
7667e1e3d94SStacey Son 		dprog_add("{\n");
7677e1e3d94SStacey Son 		(void) sprintf(buf, "self->ev%d[(uintptr_t)arg0]", event);
7687e1e3d94SStacey Son 
7697e1e3d94SStacey Son 		if (info->ev_type == 'H') {
7707e1e3d94SStacey Son 			dprog_add("\t%s = timestamp;\n", buf);
7717e1e3d94SStacey Son 		} else {
7727e1e3d94SStacey Son 			/*
7737e1e3d94SStacey Son 			 * If this isn't a hold event, it's the recursive
7747e1e3d94SStacey Son 			 * error event.  For this, we simply bump the
7757e1e3d94SStacey Son 			 * thread-local, per-lock count.
7767e1e3d94SStacey Son 			 */
7777e1e3d94SStacey Son 			dprog_add("\t%s++;\n", buf);
7787e1e3d94SStacey Son 		}
7797e1e3d94SStacey Son 
7807e1e3d94SStacey Son 		dprog_add("}\n\n");
7817e1e3d94SStacey Son 		predicate_destroy(&pred);
7827e1e3d94SStacey Son 		pred = NULL;
7837e1e3d94SStacey Son 
7847e1e3d94SStacey Son 		if (info->ev_type == 'E') {
7857e1e3d94SStacey Son 			/*
7867e1e3d94SStacey Son 			 * If this is the recursive lock error event, we need
7877e1e3d94SStacey Son 			 * to generate an additional clause to decrement the
7887e1e3d94SStacey Son 			 * thread-local, per-lock count.  This assures that we
7897e1e3d94SStacey Son 			 * only execute the aggregating clause if we have
7907e1e3d94SStacey Son 			 * recursive entry.
7917e1e3d94SStacey Son 			 */
7927e1e3d94SStacey Son 			dprog_add("%s\n", info->ev_name);
7937e1e3d94SStacey Son 			dprog_add("/%s/\n{\n\t%s--;\n}\n\n", buf, buf);
7947e1e3d94SStacey Son 		}
7957e1e3d94SStacey Son 
7967e1e3d94SStacey Son 		predicate_add(&pred, buf, NULL, 0);
7977e1e3d94SStacey Son 
7987e1e3d94SStacey Son 		if (info->ev_type == 'H') {
7997e1e3d94SStacey Son 			(void) sprintf(buf, "timestamp -\n\t    "
8007e1e3d94SStacey Son 			    "self->ev%d[(uintptr_t)arg0]", event);
8017e1e3d94SStacey Son 		}
8027e1e3d94SStacey Son 
8037e1e3d94SStacey Son 		arg1 = buf;
8047e1e3d94SStacey Son 	} else {
8057e1e3d94SStacey Son 		predicate_add(&pred, info->ev_predicate, NULL, 0);
8067e1e3d94SStacey Son 		if (info->ev_type != 'I')
8077e1e3d94SStacey Son 			predicate_add(&pred, g_predicate, NULL, 0);
8087e1e3d94SStacey Son 		else
8097e1e3d94SStacey Son 			predicate_add(&pred, g_ipredicate, NULL, 0);
8107e1e3d94SStacey Son 	}
8117e1e3d94SStacey Son 
8127e1e3d94SStacey Son 	if ((dur = g_min_duration[event]) != 0)
8137e1e3d94SStacey Son 		predicate_add(&pred, arg1, ">=", dur);
8147e1e3d94SStacey Son 
8157e1e3d94SStacey Son 	dprog_add("%s\n", info->ev_name);
8167e1e3d94SStacey Son 
8177e1e3d94SStacey Son 	if (pred != NULL)
8187e1e3d94SStacey Son 		dprog_add("/%s/\n", pred);
8197e1e3d94SStacey Son 	predicate_destroy(&pred);
8207e1e3d94SStacey Son 
8217e1e3d94SStacey Son 	dprog_add("{\n");
8227e1e3d94SStacey Son 
8237e1e3d94SStacey Son 	if (g_tracing) {
8247e1e3d94SStacey Son 		dprog_add("\ttrace(%dULL);\n", event);
8257e1e3d94SStacey Son 		dprog_add("\ttrace(%s);\n", arg0);
8267e1e3d94SStacey Son 		dprog_add("\ttrace(%s);\n", caller);
8277e1e3d94SStacey Son 		dprog_add(stack);
8287e1e3d94SStacey Son 	} else {
8297e1e3d94SStacey Son 		/*
8307e1e3d94SStacey Son 		 * The ordering here is important:  when we process the
8317e1e3d94SStacey Son 		 * aggregate, we count on the fact that @avg appears before
8327e1e3d94SStacey Son 		 * @hist in program order to assure that @avg is assigned the
8337e1e3d94SStacey Son 		 * first aggregation variable ID and @hist assigned the
8347e1e3d94SStacey Son 		 * second; see the comment in process_aggregate() for details.
8357e1e3d94SStacey Son 		 */
8367e1e3d94SStacey Son 		dprog_add("\t@avg[%dULL, %s, %s%s] = avg(%s);\n",
8377e1e3d94SStacey Son 		    event, arg0, caller, stack, arg1);
8387e1e3d94SStacey Son 
8397e1e3d94SStacey Son 		if (g_recsize >= LS_HIST) {
8407e1e3d94SStacey Son 			dprog_add("\t@hist[%dULL, %s, %s%s] = quantize"
8417e1e3d94SStacey Son 			    "(%s);\n", event, arg0, caller, stack, arg1);
8427e1e3d94SStacey Son 		}
8437e1e3d94SStacey Son 	}
8447e1e3d94SStacey Son 
8457e1e3d94SStacey Son 	if (info->ev_acquire != NULL)
8467e1e3d94SStacey Son 		dprog_add("\tself->ev%d[arg0] = 0;\n", event);
8477e1e3d94SStacey Son 
8487e1e3d94SStacey Son 	dprog_add("}\n\n");
8497e1e3d94SStacey Son }
8507e1e3d94SStacey Son 
8517e1e3d94SStacey Son static void
dprog_compile()8527e1e3d94SStacey Son dprog_compile()
8537e1e3d94SStacey Son {
8547e1e3d94SStacey Son 	dtrace_prog_t *prog;
8557e1e3d94SStacey Son 	dtrace_proginfo_t info;
8567e1e3d94SStacey Son 
8577e1e3d94SStacey Son 	if (g_Vflag) {
8587e1e3d94SStacey Son 		(void) fprintf(stderr, "lockstat: vvvv D program vvvv\n");
8597e1e3d94SStacey Son 		(void) fputs(g_prog, stderr);
8607e1e3d94SStacey Son 		(void) fprintf(stderr, "lockstat: ^^^^ D program ^^^^\n");
8617e1e3d94SStacey Son 	}
8627e1e3d94SStacey Son 
8637e1e3d94SStacey Son 	if ((prog = dtrace_program_strcompile(g_dtp, g_prog,
8647e1e3d94SStacey Son 	    DTRACE_PROBESPEC_NAME, 0, 0, NULL)) == NULL)
8657e1e3d94SStacey Son 		dfail("failed to compile program");
8667e1e3d94SStacey Son 
8677e1e3d94SStacey Son 	if (dtrace_program_exec(g_dtp, prog, &info) == -1)
8687e1e3d94SStacey Son 		dfail("failed to enable probes");
8697e1e3d94SStacey Son 
8707e1e3d94SStacey Son 	if (dtrace_go(g_dtp) != 0)
8717e1e3d94SStacey Son 		dfail("couldn't start tracing");
8727e1e3d94SStacey Son }
8737e1e3d94SStacey Son 
/*
 * Signal handler that status_init() installs for SIGUSR1.  It deliberately
 * does nothing.
 */
static void
#ifdef illumos
status_fire(void)
#else
status_fire(int i)
#endif
{
	/* Intentionally empty. */
}
8817e1e3d94SStacey Son 
8827e1e3d94SStacey Son static void
status_init(void)8837e1e3d94SStacey Son status_init(void)
8847e1e3d94SStacey Son {
8857e1e3d94SStacey Son 	dtrace_optval_t val, status, agg;
8867e1e3d94SStacey Son 	struct sigaction act;
8877e1e3d94SStacey Son 	struct itimerspec ts;
8887e1e3d94SStacey Son 	struct sigevent ev;
8897e1e3d94SStacey Son 	timer_t tid;
8907e1e3d94SStacey Son 
8917e1e3d94SStacey Son 	if (dtrace_getopt(g_dtp, "statusrate", &status) == -1)
8927e1e3d94SStacey Son 		dfail("failed to get 'statusrate'");
8937e1e3d94SStacey Son 
8947e1e3d94SStacey Son 	if (dtrace_getopt(g_dtp, "aggrate", &agg) == -1)
8957e1e3d94SStacey Son 		dfail("failed to get 'statusrate'");
8967e1e3d94SStacey Son 
8977e1e3d94SStacey Son 	/*
8987e1e3d94SStacey Son 	 * We would want to awaken at a rate that is the GCD of the statusrate
8997e1e3d94SStacey Son 	 * and the aggrate -- but that seems a bit absurd.  Instead, we'll
9007e1e3d94SStacey Son 	 * simply awaken at a rate that is the more frequent of the two, which
9017e1e3d94SStacey Son 	 * assures that we're never later than the interval implied by the
9027e1e3d94SStacey Son 	 * more frequent rate.
9037e1e3d94SStacey Son 	 */
9047e1e3d94SStacey Son 	val = status < agg ? status : agg;
9057e1e3d94SStacey Son 
9067e1e3d94SStacey Son 	(void) sigemptyset(&act.sa_mask);
9077e1e3d94SStacey Son 	act.sa_flags = 0;
9087e1e3d94SStacey Son 	act.sa_handler = status_fire;
9097e1e3d94SStacey Son 	(void) sigaction(SIGUSR1, &act, NULL);
9107e1e3d94SStacey Son 
9117e1e3d94SStacey Son 	ev.sigev_notify = SIGEV_SIGNAL;
9127e1e3d94SStacey Son 	ev.sigev_signo = SIGUSR1;
9137e1e3d94SStacey Son 
9147e1e3d94SStacey Son 	if (timer_create(CLOCK_REALTIME, &ev, &tid) == -1)
9157e1e3d94SStacey Son 		dfail("cannot create CLOCK_REALTIME timer");
9167e1e3d94SStacey Son 
9177e1e3d94SStacey Son 	ts.it_value.tv_sec = val / NANOSEC;
9187e1e3d94SStacey Son 	ts.it_value.tv_nsec = val % NANOSEC;
9197e1e3d94SStacey Son 	ts.it_interval = ts.it_value;
9207e1e3d94SStacey Son 
9217e1e3d94SStacey Son 	if (timer_settime(tid, TIMER_RELTIME, &ts, NULL) == -1)
9227e1e3d94SStacey Son 		dfail("cannot set time on CLOCK_REALTIME timer");
9237e1e3d94SStacey Son }
9247e1e3d94SStacey Son 
9257e1e3d94SStacey Son static void
status_check(void)9267e1e3d94SStacey Son status_check(void)
9277e1e3d94SStacey Son {
9287e1e3d94SStacey Son 	if (!g_tracing && dtrace_aggregate_snap(g_dtp) != 0)
9297e1e3d94SStacey Son 		dfail("failed to snap aggregate");
9307e1e3d94SStacey Son 
9317e1e3d94SStacey Son 	if (dtrace_status(g_dtp) == -1)
9327e1e3d94SStacey Son 		dfail("dtrace_status()");
9337e1e3d94SStacey Son }
9347e1e3d94SStacey Son 
9357e1e3d94SStacey Son static void
lsrec_fill(lsrec_t * lsrec,const dtrace_recdesc_t * rec,int nrecs,caddr_t data)9367e1e3d94SStacey Son lsrec_fill(lsrec_t *lsrec, const dtrace_recdesc_t *rec, int nrecs, caddr_t data)
9377e1e3d94SStacey Son {
9387e1e3d94SStacey Son 	bzero(lsrec, g_recsize);
9397e1e3d94SStacey Son 	lsrec->ls_count = 1;
9407e1e3d94SStacey Son 
9417e1e3d94SStacey Son 	if ((g_recsize > LS_HIST && nrecs < 4) || (nrecs < 3))
9427e1e3d94SStacey Son 		fail(0, "truncated DTrace record");
9437e1e3d94SStacey Son 
9447e1e3d94SStacey Son 	if (rec->dtrd_size != sizeof (uint64_t))
9457e1e3d94SStacey Son 		fail(0, "bad event size in first record");
9467e1e3d94SStacey Son 
9477e1e3d94SStacey Son 	/* LINTED - alignment */
9487e1e3d94SStacey Son 	lsrec->ls_event = (uint32_t)*((uint64_t *)(data + rec->dtrd_offset));
9497e1e3d94SStacey Son 	rec++;
9507e1e3d94SStacey Son 
9513142b376SMark Johnston #ifdef illumos
9527e1e3d94SStacey Son 	if (rec->dtrd_size != sizeof (uintptr_t))
9537e1e3d94SStacey Son 		fail(0, "bad lock address size in second record");
9547e1e3d94SStacey Son 
9557e1e3d94SStacey Son 	/* LINTED - alignment */
9567e1e3d94SStacey Son 	lsrec->ls_lock = *((uintptr_t *)(data + rec->dtrd_offset));
9577e1e3d94SStacey Son 	rec++;
9583142b376SMark Johnston #else
9593142b376SMark Johnston 	lsrec->ls_lock = strdup((const char *)(data + rec->dtrd_offset));
9603142b376SMark Johnston 	rec++;
9613142b376SMark Johnston #endif
9627e1e3d94SStacey Son 
9637e1e3d94SStacey Son 	if (rec->dtrd_size != sizeof (uintptr_t))
9647e1e3d94SStacey Son 		fail(0, "bad caller size in third record");
9657e1e3d94SStacey Son 
9667e1e3d94SStacey Son 	/* LINTED - alignment */
9677e1e3d94SStacey Son 	lsrec->ls_caller = *((uintptr_t *)(data + rec->dtrd_offset));
9687e1e3d94SStacey Son 	rec++;
9697e1e3d94SStacey Son 
9707e1e3d94SStacey Son 	if (g_recsize > LS_HIST) {
9717e1e3d94SStacey Son 		int frames, i;
9727e1e3d94SStacey Son 		pc_t *stack;
9737e1e3d94SStacey Son 
9747e1e3d94SStacey Son 		frames = rec->dtrd_size / sizeof (pc_t);
9757e1e3d94SStacey Son 		/* LINTED - alignment */
9767e1e3d94SStacey Son 		stack = (pc_t *)(data + rec->dtrd_offset);
9777e1e3d94SStacey Son 
9787e1e3d94SStacey Son 		for (i = 1; i < frames; i++)
9797e1e3d94SStacey Son 			lsrec->ls_stack[i - 1] = stack[i];
9807e1e3d94SStacey Son 	}
9817e1e3d94SStacey Son }
9827e1e3d94SStacey Son 
9837e1e3d94SStacey Son /*ARGSUSED*/
9847e1e3d94SStacey Son static int
count_aggregate(const dtrace_aggdata_t * agg,void * arg)9857e1e3d94SStacey Son count_aggregate(const dtrace_aggdata_t *agg, void *arg)
9867e1e3d94SStacey Son {
9877e1e3d94SStacey Son 	*((size_t *)arg) += 1;
9887e1e3d94SStacey Son 
9897e1e3d94SStacey Son 	return (DTRACE_AGGWALK_NEXT);
9907e1e3d94SStacey Son }
9917e1e3d94SStacey Son 
9927e1e3d94SStacey Son static int
process_aggregate(const dtrace_aggdata_t * agg,void * arg)9937e1e3d94SStacey Son process_aggregate(const dtrace_aggdata_t *agg, void *arg)
9947e1e3d94SStacey Son {
9957e1e3d94SStacey Son 	const dtrace_aggdesc_t *aggdesc = agg->dtada_desc;
9967e1e3d94SStacey Son 	caddr_t data = agg->dtada_data;
9977e1e3d94SStacey Son 	lsdata_t *lsdata = arg;
9987e1e3d94SStacey Son 	lsrec_t *lsrec = lsdata->lsd_next;
9997e1e3d94SStacey Son 	const dtrace_recdesc_t *rec;
10007e1e3d94SStacey Son 	uint64_t *avg, *quantized;
10017e1e3d94SStacey Son 	int i, j;
10027e1e3d94SStacey Son 
10037e1e3d94SStacey Son 	assert(lsdata->lsd_count < g_nrecs);
10047e1e3d94SStacey Son 
10057e1e3d94SStacey Son 	/*
10067e1e3d94SStacey Son 	 * Aggregation variable IDs are guaranteed to be generated in program
10077e1e3d94SStacey Son 	 * order, and they are guaranteed to start from DTRACE_AGGVARIDNONE
10087e1e3d94SStacey Son 	 * plus one.  As "avg" appears before "hist" in program order, we know
10097e1e3d94SStacey Son 	 * that "avg" will be allocated the first aggregation variable ID, and
10107e1e3d94SStacey Son 	 * "hist" will be allocated the second aggregation variable ID -- and
10117e1e3d94SStacey Son 	 * we therefore use the aggregation variable ID to differentiate the
10127e1e3d94SStacey Son 	 * cases.
10137e1e3d94SStacey Son 	 */
10147e1e3d94SStacey Son 	if (aggdesc->dtagd_varid > DTRACE_AGGVARIDNONE + 1) {
10157e1e3d94SStacey Son 		/*
10167e1e3d94SStacey Son 		 * If this is the histogram entry.  We'll copy the quantized
10177e1e3d94SStacey Son 		 * data into lc_hist, and jump over the rest.
10187e1e3d94SStacey Son 		 */
10197e1e3d94SStacey Son 		rec = &aggdesc->dtagd_rec[aggdesc->dtagd_nrecs - 1];
10207e1e3d94SStacey Son 
10217e1e3d94SStacey Son 		if (aggdesc->dtagd_varid != DTRACE_AGGVARIDNONE + 2)
10227e1e3d94SStacey Son 			fail(0, "bad variable ID in aggregation record");
10237e1e3d94SStacey Son 
10247e1e3d94SStacey Son 		if (rec->dtrd_size !=
10257e1e3d94SStacey Son 		    DTRACE_QUANTIZE_NBUCKETS * sizeof (uint64_t))
10267e1e3d94SStacey Son 			fail(0, "bad quantize size in aggregation record");
10277e1e3d94SStacey Son 
10287e1e3d94SStacey Son 		/* LINTED - alignment */
10297e1e3d94SStacey Son 		quantized = (uint64_t *)(data + rec->dtrd_offset);
10307e1e3d94SStacey Son 
10317e1e3d94SStacey Son 		for (i = DTRACE_QUANTIZE_ZEROBUCKET, j = 0;
10327e1e3d94SStacey Son 		    i < DTRACE_QUANTIZE_NBUCKETS; i++, j++)
10337e1e3d94SStacey Son 			lsrec->ls_hist[j] = quantized[i];
10347e1e3d94SStacey Son 
10357e1e3d94SStacey Son 		goto out;
10367e1e3d94SStacey Son 	}
10377e1e3d94SStacey Son 
10387e1e3d94SStacey Son 	lsrec_fill(lsrec, &aggdesc->dtagd_rec[1],
10397e1e3d94SStacey Son 	    aggdesc->dtagd_nrecs - 1, data);
10407e1e3d94SStacey Son 
10417e1e3d94SStacey Son 	rec = &aggdesc->dtagd_rec[aggdesc->dtagd_nrecs - 1];
10427e1e3d94SStacey Son 
10437e1e3d94SStacey Son 	if (rec->dtrd_size != 2 * sizeof (uint64_t))
10447e1e3d94SStacey Son 		fail(0, "bad avg size in aggregation record");
10457e1e3d94SStacey Son 
10467e1e3d94SStacey Son 	/* LINTED - alignment */
10477e1e3d94SStacey Son 	avg = (uint64_t *)(data + rec->dtrd_offset);
10487e1e3d94SStacey Son 	lsrec->ls_count = (uint32_t)avg[0];
10497e1e3d94SStacey Son 	lsrec->ls_time = (uintptr_t)avg[1];
10507e1e3d94SStacey Son 
10517e1e3d94SStacey Son 	if (g_recsize >= LS_HIST)
10527e1e3d94SStacey Son 		return (DTRACE_AGGWALK_NEXT);
10537e1e3d94SStacey Son 
10547e1e3d94SStacey Son out:
10557e1e3d94SStacey Son 	lsdata->lsd_next = (lsrec_t *)((uintptr_t)lsrec + g_recsize);
10567e1e3d94SStacey Son 	lsdata->lsd_count++;
10577e1e3d94SStacey Son 
10587e1e3d94SStacey Son 	return (DTRACE_AGGWALK_NEXT);
10597e1e3d94SStacey Son }
10607e1e3d94SStacey Son 
10617e1e3d94SStacey Son static int
process_trace(const dtrace_probedata_t * pdata,void * arg)10627e1e3d94SStacey Son process_trace(const dtrace_probedata_t *pdata, void *arg)
10637e1e3d94SStacey Son {
10647e1e3d94SStacey Son 	lsdata_t *lsdata = arg;
10657e1e3d94SStacey Son 	lsrec_t *lsrec = lsdata->lsd_next;
10667e1e3d94SStacey Son 	dtrace_eprobedesc_t *edesc = pdata->dtpda_edesc;
10677e1e3d94SStacey Son 	caddr_t data = pdata->dtpda_data;
10687e1e3d94SStacey Son 
10697e1e3d94SStacey Son 	if (lsdata->lsd_count >= g_nrecs)
10707e1e3d94SStacey Son 		return (DTRACE_CONSUME_NEXT);
10717e1e3d94SStacey Son 
10727e1e3d94SStacey Son 	lsrec_fill(lsrec, edesc->dtepd_rec, edesc->dtepd_nrecs, data);
10737e1e3d94SStacey Son 
10747e1e3d94SStacey Son 	lsdata->lsd_next = (lsrec_t *)((uintptr_t)lsrec + g_recsize);
10757e1e3d94SStacey Son 	lsdata->lsd_count++;
10767e1e3d94SStacey Son 
10777e1e3d94SStacey Son 	return (DTRACE_CONSUME_NEXT);
10787e1e3d94SStacey Son }
10797e1e3d94SStacey Son 
10807e1e3d94SStacey Son static int
process_data(FILE * out,char * data)10817e1e3d94SStacey Son process_data(FILE *out, char *data)
10827e1e3d94SStacey Son {
10837e1e3d94SStacey Son 	lsdata_t lsdata;
10847e1e3d94SStacey Son 
10857e1e3d94SStacey Son 	/* LINTED - alignment */
10867e1e3d94SStacey Son 	lsdata.lsd_next = (lsrec_t *)data;
10877e1e3d94SStacey Son 	lsdata.lsd_count = 0;
10887e1e3d94SStacey Son 
10897e1e3d94SStacey Son 	if (g_tracing) {
10907e1e3d94SStacey Son 		if (dtrace_consume(g_dtp, out,
10917e1e3d94SStacey Son 		    process_trace, NULL, &lsdata) != 0)
10927e1e3d94SStacey Son 			dfail("failed to consume buffer");
10937e1e3d94SStacey Son 
10947e1e3d94SStacey Son 		return (lsdata.lsd_count);
10957e1e3d94SStacey Son 	}
10967e1e3d94SStacey Son 
10977e1e3d94SStacey Son 	if (dtrace_aggregate_walk_keyvarsorted(g_dtp,
10987e1e3d94SStacey Son 	    process_aggregate, &lsdata) != 0)
10997e1e3d94SStacey Son 		dfail("failed to walk aggregate");
11007e1e3d94SStacey Son 
11017e1e3d94SStacey Son 	return (lsdata.lsd_count);
11027e1e3d94SStacey Son }
11037e1e3d94SStacey Son 
11047e1e3d94SStacey Son /*ARGSUSED*/
11057e1e3d94SStacey Son static int
drophandler(const dtrace_dropdata_t * data,void * arg)11067e1e3d94SStacey Son drophandler(const dtrace_dropdata_t *data, void *arg)
11077e1e3d94SStacey Son {
11087e1e3d94SStacey Son 	g_dropped++;
11097e1e3d94SStacey Son 	(void) fprintf(stderr, "lockstat: warning: %s", data->dtdda_msg);
11107e1e3d94SStacey Son 	return (DTRACE_HANDLE_OK);
11117e1e3d94SStacey Son }
11127e1e3d94SStacey Son 
11137e1e3d94SStacey Son int
main(int argc,char ** argv)11147e1e3d94SStacey Son main(int argc, char **argv)
11157e1e3d94SStacey Son {
11167e1e3d94SStacey Son 	char *data_buf;
11177e1e3d94SStacey Son 	lsrec_t *lsp, **current, **first, **sort_buf, **merge_buf;
11187e1e3d94SStacey Son 	FILE *out = stdout;
11194fb6e7b1SStacey Son 	int c;
11207e1e3d94SStacey Son 	pid_t child;
11217e1e3d94SStacey Son 	int status;
11227e1e3d94SStacey Son 	int i, j;
11237e1e3d94SStacey Son 	hrtime_t duration;
11247e1e3d94SStacey Son 	char *addrp, *offp, *sizep, *evp, *lastp, *p;
11257e1e3d94SStacey Son 	uintptr_t addr;
11267e1e3d94SStacey Son 	size_t size, off;
11277e1e3d94SStacey Son 	int events_specified = 0;
11287e1e3d94SStacey Son 	int exec_errno = 0;
11297e1e3d94SStacey Son 	uint32_t event;
11307e1e3d94SStacey Son 	char *filt = NULL, *ifilt = NULL;
11317e1e3d94SStacey Son 	static uint64_t ev_count[LS_MAX_EVENTS + 1];
11327e1e3d94SStacey Son 	static uint64_t ev_time[LS_MAX_EVENTS + 1];
11337e1e3d94SStacey Son 	dtrace_optval_t aggsize;
11347e1e3d94SStacey Son 	char aggstr[10];
11357e1e3d94SStacey Son 	long ncpus;
11367e1e3d94SStacey Son 	int dynvar = 0;
11377e1e3d94SStacey Son 	int err;
11387e1e3d94SStacey Son 
11397e1e3d94SStacey Son 	if ((g_dtp = dtrace_open(DTRACE_VERSION, 0, &err)) == NULL) {
11407e1e3d94SStacey Son 		fail(0, "cannot open dtrace library: %s",
11417e1e3d94SStacey Son 		    dtrace_errmsg(NULL, err));
11427e1e3d94SStacey Son 	}
11437e1e3d94SStacey Son 
11447e1e3d94SStacey Son 	if (dtrace_handle_drop(g_dtp, &drophandler, NULL) == -1)
11457e1e3d94SStacey Son 		dfail("couldn't establish drop handler");
11467e1e3d94SStacey Son 
11477e1e3d94SStacey Son 	if (symtab_init() == -1)
11487e1e3d94SStacey Son 		fail(1, "can't load kernel symbols");
11497e1e3d94SStacey Son 
11507e1e3d94SStacey Son 	g_nrecs = DEFAULT_NRECS;
11517e1e3d94SStacey Son 
11524fb6e7b1SStacey Son 	while ((c = getopt(argc, argv, LOCKSTAT_OPTSTR)) != GETOPT_EOF) {
11537e1e3d94SStacey Son 		switch (c) {
11547e1e3d94SStacey Son 		case 'b':
11557e1e3d94SStacey Son 			g_recsize = LS_BASIC;
11567e1e3d94SStacey Son 			break;
11577e1e3d94SStacey Son 
11587e1e3d94SStacey Son 		case 't':
11597e1e3d94SStacey Son 			g_recsize = LS_TIME;
11607e1e3d94SStacey Son 			break;
11617e1e3d94SStacey Son 
11627e1e3d94SStacey Son 		case 'h':
11637e1e3d94SStacey Son 			g_recsize = LS_HIST;
11647e1e3d94SStacey Son 			break;
11657e1e3d94SStacey Son 
11667e1e3d94SStacey Son 		case 's':
11677e1e3d94SStacey Son 			if (!isdigit(optarg[0]))
11687e1e3d94SStacey Son 				usage();
11697e1e3d94SStacey Son 			g_stkdepth = atoi(optarg);
11707e1e3d94SStacey Son 			if (g_stkdepth > LS_MAX_STACK_DEPTH)
11717e1e3d94SStacey Son 				fail(0, "max stack depth is %d",
11727e1e3d94SStacey Son 				    LS_MAX_STACK_DEPTH);
11737e1e3d94SStacey Son 			g_recsize = LS_STACK(g_stkdepth);
11747e1e3d94SStacey Son 			break;
11757e1e3d94SStacey Son 
11767e1e3d94SStacey Son 		case 'n':
11777e1e3d94SStacey Son 			if (!isdigit(optarg[0]))
11787e1e3d94SStacey Son 				usage();
11797e1e3d94SStacey Son 			g_nrecs = atoi(optarg);
11807e1e3d94SStacey Son 			break;
11817e1e3d94SStacey Son 
11827e1e3d94SStacey Son 		case 'd':
11837e1e3d94SStacey Son 			if (!isdigit(optarg[0]))
11847e1e3d94SStacey Son 				usage();
11857e1e3d94SStacey Son 			duration = atoll(optarg);
11867e1e3d94SStacey Son 
11877e1e3d94SStacey Son 			/*
11887e1e3d94SStacey Son 			 * XXX -- durations really should be per event
11897e1e3d94SStacey Son 			 * since the units are different, but it's hard
11907e1e3d94SStacey Son 			 * to express this nicely in the interface.
11917e1e3d94SStacey Son 			 * Not clear yet what the cleanest solution is.
11927e1e3d94SStacey Son 			 */
11937e1e3d94SStacey Son 			for (i = 0; i < LS_MAX_EVENTS; i++)
11947e1e3d94SStacey Son 				if (g_event_info[i].ev_type != 'E')
11957e1e3d94SStacey Son 					g_min_duration[i] = duration;
11967e1e3d94SStacey Son 
11977e1e3d94SStacey Son 			break;
11987e1e3d94SStacey Son 
11997e1e3d94SStacey Son 		case 'i':
12007e1e3d94SStacey Son 			if (!isdigit(optarg[0]))
12017e1e3d94SStacey Son 				usage();
12027e1e3d94SStacey Son 			i = atoi(optarg);
12037e1e3d94SStacey Son 			if (i <= 0)
12047e1e3d94SStacey Son 				usage();
12057e1e3d94SStacey Son 			if (i > MAX_HZ)
12067e1e3d94SStacey Son 				fail(0, "max interrupt rate is %d Hz", MAX_HZ);
12077e1e3d94SStacey Son 
12087e1e3d94SStacey Son 			for (j = 0; j < LS_MAX_EVENTS; j++)
12097e1e3d94SStacey Son 				if (strcmp(g_event_info[j].ev_desc,
12107e1e3d94SStacey Son 				    "Profiling interrupt") == 0)
12117e1e3d94SStacey Son 					break;
12127e1e3d94SStacey Son 
12137e1e3d94SStacey Son 			(void) sprintf(g_event_info[j].ev_name,
12147e1e3d94SStacey Son 			    "profile:::profile-%d", i);
12157e1e3d94SStacey Son 			break;
12167e1e3d94SStacey Son 
12177e1e3d94SStacey Son 		case 'l':
12187e1e3d94SStacey Son 		case 'f':
12197e1e3d94SStacey Son 			addrp = strtok(optarg, ",");
12207e1e3d94SStacey Son 			sizep = strtok(NULL, ",");
12217e1e3d94SStacey Son 			addrp = strtok(optarg, ",+");
12227e1e3d94SStacey Son 			offp = strtok(NULL, ",");
12237e1e3d94SStacey Son 
12247e1e3d94SStacey Son 			size = sizep ? strtoul(sizep, NULL, 0) : 1;
12257e1e3d94SStacey Son 			off = offp ? strtoul(offp, NULL, 0) : 0;
12267e1e3d94SStacey Son 
12277e1e3d94SStacey Son 			if (addrp[0] == '0') {
12287e1e3d94SStacey Son 				addr = strtoul(addrp, NULL, 16) + off;
12297e1e3d94SStacey Son 			} else {
12307e1e3d94SStacey Son 				addr = sym_to_addr(addrp) + off;
12317e1e3d94SStacey Son 				if (sizep == NULL)
12327e1e3d94SStacey Son 					size = sym_size(addrp) - off;
12337e1e3d94SStacey Son 				if (addr - off == 0)
12347e1e3d94SStacey Son 					fail(0, "symbol '%s' not found", addrp);
12357e1e3d94SStacey Son 				if (size == 0)
12367e1e3d94SStacey Son 					size = 1;
12377e1e3d94SStacey Son 			}
12387e1e3d94SStacey Son 
12397e1e3d94SStacey Son 
12407e1e3d94SStacey Son 			if (c == 'l') {
12417e1e3d94SStacey Son 				filter_add(&filt, "arg0", addr, size);
12427e1e3d94SStacey Son 			} else {
12437e1e3d94SStacey Son 				filter_add(&filt, "caller", addr, size);
12447e1e3d94SStacey Son 				filter_add(&ifilt, "arg0", addr, size);
12457e1e3d94SStacey Son 			}
12467e1e3d94SStacey Son 			break;
12477e1e3d94SStacey Son 
12487e1e3d94SStacey Son 		case 'e':
12497e1e3d94SStacey Son 			evp = strtok_r(optarg, ",", &lastp);
12507e1e3d94SStacey Son 			while (evp) {
12517e1e3d94SStacey Son 				int ev1, ev2;
12527e1e3d94SStacey Son 				char *evp2;
12537e1e3d94SStacey Son 
12547e1e3d94SStacey Son 				(void) strtok(evp, "-");
12557e1e3d94SStacey Son 				evp2 = strtok(NULL, "-");
12567e1e3d94SStacey Son 				ev1 = atoi(evp);
12577e1e3d94SStacey Son 				ev2 = evp2 ? atoi(evp2) : ev1;
12587e1e3d94SStacey Son 				if ((uint_t)ev1 >= LS_MAX_EVENTS ||
12597e1e3d94SStacey Son 				    (uint_t)ev2 >= LS_MAX_EVENTS || ev1 > ev2)
12607e1e3d94SStacey Son 					fail(0, "-e events out of range");
12617e1e3d94SStacey Son 				for (i = ev1; i <= ev2; i++)
12627e1e3d94SStacey Son 					g_enabled[i] = 1;
12637e1e3d94SStacey Son 				evp = strtok_r(NULL, ",", &lastp);
12647e1e3d94SStacey Son 			}
12657e1e3d94SStacey Son 			events_specified = 1;
12667e1e3d94SStacey Son 			break;
12677e1e3d94SStacey Son 
12683142b376SMark Johnston #ifdef illumos
12697e1e3d94SStacey Son 		case 'c':
12707e1e3d94SStacey Son 			g_cflag = 1;
12717e1e3d94SStacey Son 			break;
12723142b376SMark Johnston #endif
12737e1e3d94SStacey Son 
12747e1e3d94SStacey Son 		case 'k':
12757e1e3d94SStacey Son 			g_kflag = 1;
12767e1e3d94SStacey Son 			break;
12777e1e3d94SStacey Son 
12787e1e3d94SStacey Son 		case 'w':
12797e1e3d94SStacey Son 			g_wflag = 1;
12807e1e3d94SStacey Son 			break;
12817e1e3d94SStacey Son 
12827e1e3d94SStacey Son 		case 'W':
12837e1e3d94SStacey Son 			g_Wflag = 1;
12847e1e3d94SStacey Son 			break;
12857e1e3d94SStacey Son 
12867e1e3d94SStacey Son 		case 'g':
12877e1e3d94SStacey Son 			g_gflag = 1;
12887e1e3d94SStacey Son 			break;
12897e1e3d94SStacey Son 
12907e1e3d94SStacey Son 		case 'C':
12917e1e3d94SStacey Son 		case 'E':
12927e1e3d94SStacey Son 		case 'H':
12937e1e3d94SStacey Son 		case 'I':
12947e1e3d94SStacey Son 			for (i = 0; i < LS_MAX_EVENTS; i++)
12957e1e3d94SStacey Son 				if (g_event_info[i].ev_type == c)
12967e1e3d94SStacey Son 					g_enabled[i] = 1;
12977e1e3d94SStacey Son 			events_specified = 1;
12987e1e3d94SStacey Son 			break;
12997e1e3d94SStacey Son 
13007e1e3d94SStacey Son 		case 'A':
13017e1e3d94SStacey Son 			for (i = 0; i < LS_MAX_EVENTS; i++)
13027e1e3d94SStacey Son 				if (strchr("CH", g_event_info[i].ev_type))
13037e1e3d94SStacey Son 					g_enabled[i] = 1;
13047e1e3d94SStacey Son 			events_specified = 1;
13057e1e3d94SStacey Son 			break;
13067e1e3d94SStacey Son 
13077e1e3d94SStacey Son 		case 'T':
13087e1e3d94SStacey Son 			g_tracing = 1;
13097e1e3d94SStacey Son 			break;
13107e1e3d94SStacey Son 
13117e1e3d94SStacey Son 		case 'D':
13127e1e3d94SStacey Son 			if (!isdigit(optarg[0]))
13137e1e3d94SStacey Son 				usage();
13147e1e3d94SStacey Son 			g_topn = atoi(optarg);
13157e1e3d94SStacey Son 			break;
13167e1e3d94SStacey Son 
13177e1e3d94SStacey Son 		case 'R':
13187e1e3d94SStacey Son 			g_rates = 1;
13197e1e3d94SStacey Son 			break;
13207e1e3d94SStacey Son 
13217e1e3d94SStacey Son 		case 'p':
13227e1e3d94SStacey Son 			g_pflag = 1;
13237e1e3d94SStacey Son 			break;
13247e1e3d94SStacey Son 
13257e1e3d94SStacey Son 		case 'P':
13267e1e3d94SStacey Son 			g_Pflag = 1;
13277e1e3d94SStacey Son 			break;
13287e1e3d94SStacey Son 
13297e1e3d94SStacey Son 		case 'o':
13307e1e3d94SStacey Son 			if ((out = fopen(optarg, "w")) == NULL)
13317e1e3d94SStacey Son 				fail(1, "error opening file");
13327e1e3d94SStacey Son 			break;
13337e1e3d94SStacey Son 
13347e1e3d94SStacey Son 		case 'V':
13357e1e3d94SStacey Son 			g_Vflag = 1;
13367e1e3d94SStacey Son 			break;
13377e1e3d94SStacey Son 
13387e1e3d94SStacey Son 		default:
13397e1e3d94SStacey Son 			if (strchr(LOCKSTAT_OPTSTR, c) == NULL)
13407e1e3d94SStacey Son 				usage();
13417e1e3d94SStacey Son 		}
13427e1e3d94SStacey Son 	}
13437e1e3d94SStacey Son 
13447e1e3d94SStacey Son 	if (filt != NULL) {
13457e1e3d94SStacey Son 		predicate_add(&g_predicate, filt, NULL, 0);
13467e1e3d94SStacey Son 		filter_destroy(&filt);
13477e1e3d94SStacey Son 	}
13487e1e3d94SStacey Son 
13497e1e3d94SStacey Son 	if (ifilt != NULL) {
13507e1e3d94SStacey Son 		predicate_add(&g_ipredicate, ifilt, NULL, 0);
13517e1e3d94SStacey Son 		filter_destroy(&ifilt);
13527e1e3d94SStacey Son 	}
13537e1e3d94SStacey Son 
13547e1e3d94SStacey Son 	if (g_recsize == 0) {
13557e1e3d94SStacey Son 		if (g_gflag) {
13567e1e3d94SStacey Son 			g_stkdepth = LS_MAX_STACK_DEPTH;
13577e1e3d94SStacey Son 			g_recsize = LS_STACK(g_stkdepth);
13587e1e3d94SStacey Son 		} else {
13597e1e3d94SStacey Son 			g_recsize = LS_TIME;
13607e1e3d94SStacey Son 		}
13617e1e3d94SStacey Son 	}
13627e1e3d94SStacey Son 
13637e1e3d94SStacey Son 	if (g_gflag && g_recsize <= LS_STACK(0))
13647e1e3d94SStacey Son 		fail(0, "'-g' requires at least '-s 1' data gathering");
13657e1e3d94SStacey Son 
13667e1e3d94SStacey Son 	/*
13677e1e3d94SStacey Son 	 * Make sure the alignment is reasonable
13687e1e3d94SStacey Son 	 */
13697e1e3d94SStacey Son 	g_recsize = -(-g_recsize & -sizeof (uint64_t));
13707e1e3d94SStacey Son 
13717e1e3d94SStacey Son 	for (i = 0; i < LS_MAX_EVENTS; i++) {
13727e1e3d94SStacey Son 		/*
13737e1e3d94SStacey Son 		 * If no events were specified, enable -C.
13747e1e3d94SStacey Son 		 */
13757e1e3d94SStacey Son 		if (!events_specified && g_event_info[i].ev_type == 'C')
13767e1e3d94SStacey Son 			g_enabled[i] = 1;
13777e1e3d94SStacey Son 	}
13787e1e3d94SStacey Son 
13797e1e3d94SStacey Son 	for (i = 0; i < LS_MAX_EVENTS; i++) {
13807e1e3d94SStacey Son 		if (!g_enabled[i])
13817e1e3d94SStacey Son 			continue;
13827e1e3d94SStacey Son 
13837e1e3d94SStacey Son 		if (g_event_info[i].ev_acquire != NULL) {
13847e1e3d94SStacey Son 			/*
13857e1e3d94SStacey Son 			 * If we've enabled a hold event, we must explicitly
13867e1e3d94SStacey Son 			 * allocate dynamic variable space.
13877e1e3d94SStacey Son 			 */
13887e1e3d94SStacey Son 			dynvar = 1;
13897e1e3d94SStacey Son 		}
13907e1e3d94SStacey Son 
13917e1e3d94SStacey Son 		dprog_addevent(i);
13927e1e3d94SStacey Son 	}
13937e1e3d94SStacey Son 
13947e1e3d94SStacey Son 	/*
13957e1e3d94SStacey Son 	 * Make sure there are remaining arguments to specify a child command
13967e1e3d94SStacey Son 	 * to execute.
13977e1e3d94SStacey Son 	 */
13987e1e3d94SStacey Son 	if (argc <= optind)
13997e1e3d94SStacey Son 		usage();
14007e1e3d94SStacey Son 
14017e1e3d94SStacey Son 	if ((ncpus = sysconf(_SC_NPROCESSORS_ONLN)) == -1)
14027e1e3d94SStacey Son 		dfail("couldn't determine number of online CPUs");
14037e1e3d94SStacey Son 
14047e1e3d94SStacey Son 	/*
14057e1e3d94SStacey Son 	 * By default, we set our data buffer size to be the number of records
14067e1e3d94SStacey Son 	 * multiplied by the size of the record, doubled to account for some
14077e1e3d94SStacey Son 	 * DTrace slop and divided by the number of CPUs.  We silently clamp
14087e1e3d94SStacey Son 	 * the aggregation size at both a minimum and a maximum to prevent
14097e1e3d94SStacey Son 	 * absurdly low or high values.
14107e1e3d94SStacey Son 	 */
14117e1e3d94SStacey Son 	if ((aggsize = (g_nrecs * g_recsize * 2) / ncpus) < MIN_AGGSIZE)
14127e1e3d94SStacey Son 		aggsize = MIN_AGGSIZE;
14137e1e3d94SStacey Son 
14147e1e3d94SStacey Son 	if (aggsize > MAX_AGGSIZE)
14157e1e3d94SStacey Son 		aggsize = MAX_AGGSIZE;
14167e1e3d94SStacey Son 
14177e1e3d94SStacey Son 	(void) sprintf(aggstr, "%lld", (long long)aggsize);
14187e1e3d94SStacey Son 
14197e1e3d94SStacey Son 	if (!g_tracing) {
14207e1e3d94SStacey Son 		if (dtrace_setopt(g_dtp, "bufsize", "4k") == -1)
14217e1e3d94SStacey Son 			dfail("failed to set 'bufsize'");
14227e1e3d94SStacey Son 
14237e1e3d94SStacey Son 		if (dtrace_setopt(g_dtp, "aggsize", aggstr) == -1)
14247e1e3d94SStacey Son 			dfail("failed to set 'aggsize'");
14257e1e3d94SStacey Son 
14267e1e3d94SStacey Son 		if (dynvar) {
14277e1e3d94SStacey Son 			/*
14287e1e3d94SStacey Son 			 * If we're using dynamic variables, we set our
14297e1e3d94SStacey Son 			 * dynamic variable size to be one megabyte per CPU,
14307e1e3d94SStacey Son 			 * with a hard-limit of 32 megabytes.  This may still
14317e1e3d94SStacey Son 			 * be too small in some cases, but it can be tuned
14327e1e3d94SStacey Son 			 * manually via -x if need be.
14337e1e3d94SStacey Son 			 */
14347e1e3d94SStacey Son 			(void) sprintf(aggstr, "%ldm", ncpus < 32 ? ncpus : 32);
14357e1e3d94SStacey Son 
14367e1e3d94SStacey Son 			if (dtrace_setopt(g_dtp, "dynvarsize", aggstr) == -1)
14377e1e3d94SStacey Son 				dfail("failed to set 'dynvarsize'");
14387e1e3d94SStacey Son 		}
14397e1e3d94SStacey Son 	} else {
14407e1e3d94SStacey Son 		if (dtrace_setopt(g_dtp, "bufsize", aggstr) == -1)
14417e1e3d94SStacey Son 			dfail("failed to set 'bufsize'");
14427e1e3d94SStacey Son 	}
14437e1e3d94SStacey Son 
14447e1e3d94SStacey Son 	if (dtrace_setopt(g_dtp, "statusrate", "10sec") == -1)
14457e1e3d94SStacey Son 		dfail("failed to set 'statusrate'");
14467e1e3d94SStacey Son 
14477e1e3d94SStacey Son 	optind = 1;
14484fb6e7b1SStacey Son 	while ((c = getopt(argc, argv, LOCKSTAT_OPTSTR)) != GETOPT_EOF) {
14497e1e3d94SStacey Son 		switch (c) {
14507e1e3d94SStacey Son 		case 'x':
14517e1e3d94SStacey Son 			if ((p = strchr(optarg, '=')) != NULL)
14527e1e3d94SStacey Son 				*p++ = '\0';
14537e1e3d94SStacey Son 
14547e1e3d94SStacey Son 			if (dtrace_setopt(g_dtp, optarg, p) != 0)
14557e1e3d94SStacey Son 				dfail("failed to set -x %s", optarg);
14567e1e3d94SStacey Son 			break;
14577e1e3d94SStacey Son 		}
14587e1e3d94SStacey Son 	}
14597e1e3d94SStacey Son 
14607e1e3d94SStacey Son 	argc -= optind;
14617e1e3d94SStacey Son 	argv += optind;
14627e1e3d94SStacey Son 
14637e1e3d94SStacey Son 	dprog_compile();
14647e1e3d94SStacey Son 	status_init();
14657e1e3d94SStacey Son 
14667e1e3d94SStacey Son 	g_elapsed = -gethrtime();
14677e1e3d94SStacey Son 
14687e1e3d94SStacey Son 	/*
14697e1e3d94SStacey Son 	 * Spawn the specified command and wait for it to complete.
14707e1e3d94SStacey Son 	 */
14717e1e3d94SStacey Son 	child = fork();
14727e1e3d94SStacey Son 	if (child == -1)
14737e1e3d94SStacey Son 		fail(1, "cannot fork");
14747e1e3d94SStacey Son 	if (child == 0) {
14757e1e3d94SStacey Son 		(void) dtrace_close(g_dtp);
14767e1e3d94SStacey Son 		(void) execvp(argv[0], &argv[0]);
14777e1e3d94SStacey Son 		exec_errno = errno;
14787e1e3d94SStacey Son 		exit(127);
14797e1e3d94SStacey Son 	}
14807e1e3d94SStacey Son 
1481bc96366cSSteven Hartland #ifdef illumos
14827e1e3d94SStacey Son 	while (waitpid(child, &status, WEXITED) != child)
14837e1e3d94SStacey Son #else
14847e1e3d94SStacey Son 	while (waitpid(child, &status, 0) != child)
14857e1e3d94SStacey Son #endif
14867e1e3d94SStacey Son 		status_check();
14877e1e3d94SStacey Son 
14887e1e3d94SStacey Son 	g_elapsed += gethrtime();
14897e1e3d94SStacey Son 
14907e1e3d94SStacey Son 	if (WIFEXITED(status)) {
14917e1e3d94SStacey Son 		if (WEXITSTATUS(status) != 0) {
14927e1e3d94SStacey Son 			if (exec_errno != 0) {
14937e1e3d94SStacey Son 				errno = exec_errno;
14947e1e3d94SStacey Son 				fail(1, "could not execute %s", argv[0]);
14957e1e3d94SStacey Son 			}
14967e1e3d94SStacey Son 			(void) fprintf(stderr,
14977e1e3d94SStacey Son 			    "lockstat: warning: %s exited with code %d\n",
14987e1e3d94SStacey Son 			    argv[0], WEXITSTATUS(status));
14997e1e3d94SStacey Son 		}
15007e1e3d94SStacey Son 	} else {
15017e1e3d94SStacey Son 		(void) fprintf(stderr,
15027e1e3d94SStacey Son 		    "lockstat: warning: %s died on signal %d\n",
15037e1e3d94SStacey Son 		    argv[0], WTERMSIG(status));
15047e1e3d94SStacey Son 	}
15057e1e3d94SStacey Son 
15067e1e3d94SStacey Son 	if (dtrace_stop(g_dtp) == -1)
15077e1e3d94SStacey Son 		dfail("failed to stop dtrace");
15087e1e3d94SStacey Son 
15097e1e3d94SStacey Son 	/*
15107e1e3d94SStacey Son 	 * Before we read out the results, we need to allocate our buffer.
15117e1e3d94SStacey Son 	 * If we're tracing, then we'll just use the precalculated size.  If
15127e1e3d94SStacey Son 	 * we're not, then we'll take a snapshot of the aggregate, and walk
15137e1e3d94SStacey Son 	 * it to count the number of records.
15147e1e3d94SStacey Son 	 */
15157e1e3d94SStacey Son 	if (!g_tracing) {
15167e1e3d94SStacey Son 		if (dtrace_aggregate_snap(g_dtp) != 0)
15177e1e3d94SStacey Son 			dfail("failed to snap aggregate");
15187e1e3d94SStacey Son 
15197e1e3d94SStacey Son 		g_nrecs = 0;
15207e1e3d94SStacey Son 
15217e1e3d94SStacey Son 		if (dtrace_aggregate_walk(g_dtp,
15227e1e3d94SStacey Son 		    count_aggregate, &g_nrecs) != 0)
15237e1e3d94SStacey Son 			dfail("failed to walk aggregate");
15247e1e3d94SStacey Son 	}
15257e1e3d94SStacey Son 
1526bc96366cSSteven Hartland #ifdef illumos
15277e1e3d94SStacey Son 	if ((data_buf = memalign(sizeof (uint64_t),
15287e1e3d94SStacey Son 	    (g_nrecs + 1) * g_recsize)) == NULL)
15297e1e3d94SStacey Son #else
15307e1e3d94SStacey Son 	if (posix_memalign((void **)&data_buf, sizeof (uint64_t),
15317e1e3d94SStacey Son 	    (g_nrecs + 1) * g_recsize) )
15327e1e3d94SStacey Son #endif
15337e1e3d94SStacey Son 		fail(1, "Memory allocation failed");
15347e1e3d94SStacey Son 
15357e1e3d94SStacey Son 	/*
15367e1e3d94SStacey Son 	 * Read out the DTrace data.
15377e1e3d94SStacey Son 	 */
15387e1e3d94SStacey Son 	g_nrecs_used = process_data(out, data_buf);
15397e1e3d94SStacey Son 
15407e1e3d94SStacey Son 	if (g_nrecs_used > g_nrecs || g_dropped)
15417e1e3d94SStacey Son 		(void) fprintf(stderr, "lockstat: warning: "
15427e1e3d94SStacey Son 		    "ran out of data records (use -n for more)\n");
15437e1e3d94SStacey Son 
15447e1e3d94SStacey Son 	/* LINTED - alignment */
15457e1e3d94SStacey Son 	for (i = 0, lsp = (lsrec_t *)data_buf; i < g_nrecs_used; i++,
15467e1e3d94SStacey Son 	    /* LINTED - alignment */
15477e1e3d94SStacey Son 	    lsp = (lsrec_t *)((char *)lsp + g_recsize)) {
15487e1e3d94SStacey Son 		ev_count[lsp->ls_event] += lsp->ls_count;
15497e1e3d94SStacey Son 		ev_time[lsp->ls_event] += lsp->ls_time;
15507e1e3d94SStacey Son 	}
15517e1e3d94SStacey Son 
15527e1e3d94SStacey Son 	/*
15537e1e3d94SStacey Son 	 * If -g was specified, convert stacks into individual records.
15547e1e3d94SStacey Son 	 */
15557e1e3d94SStacey Son 	if (g_gflag) {
15567e1e3d94SStacey Son 		lsrec_t *newlsp, *oldlsp;
15577e1e3d94SStacey Son 
1558bc96366cSSteven Hartland #ifdef illumos
15597e1e3d94SStacey Son 		newlsp = memalign(sizeof (uint64_t),
15607e1e3d94SStacey Son 		    g_nrecs_used * LS_TIME * (g_stkdepth + 1));
15617e1e3d94SStacey Son #else
15627e1e3d94SStacey Son 		posix_memalign((void **)&newlsp, sizeof (uint64_t),
15637e1e3d94SStacey Son 		    g_nrecs_used * LS_TIME * (g_stkdepth + 1));
15647e1e3d94SStacey Son #endif
15657e1e3d94SStacey Son 		if (newlsp == NULL)
15667e1e3d94SStacey Son 			fail(1, "Cannot allocate space for -g processing");
15677e1e3d94SStacey Son 		lsp = newlsp;
15687e1e3d94SStacey Son 		/* LINTED - alignment */
15697e1e3d94SStacey Son 		for (i = 0, oldlsp = (lsrec_t *)data_buf; i < g_nrecs_used; i++,
15707e1e3d94SStacey Son 		    /* LINTED - alignment */
15717e1e3d94SStacey Son 		    oldlsp = (lsrec_t *)((char *)oldlsp + g_recsize)) {
15727e1e3d94SStacey Son 			int fr;
15737e1e3d94SStacey Son 			int caller_in_stack = 0;
15747e1e3d94SStacey Son 
15757e1e3d94SStacey Son 			if (oldlsp->ls_count == 0)
15767e1e3d94SStacey Son 				continue;
15777e1e3d94SStacey Son 
15787e1e3d94SStacey Son 			for (fr = 0; fr < g_stkdepth; fr++) {
15797e1e3d94SStacey Son 				if (oldlsp->ls_stack[fr] == 0)
15807e1e3d94SStacey Son 					break;
15817e1e3d94SStacey Son 				if (oldlsp->ls_stack[fr] == oldlsp->ls_caller)
15827e1e3d94SStacey Son 					caller_in_stack = 1;
15837e1e3d94SStacey Son 				bcopy(oldlsp, lsp, LS_TIME);
15847e1e3d94SStacey Son 				lsp->ls_caller = oldlsp->ls_stack[fr];
15853142b376SMark Johnston #ifndef illumos
15863142b376SMark Johnston 				lsp->ls_lock = strdup(oldlsp->ls_lock);
15873142b376SMark Johnston #endif
15887e1e3d94SStacey Son 				/* LINTED - alignment */
15897e1e3d94SStacey Son 				lsp = (lsrec_t *)((char *)lsp + LS_TIME);
15907e1e3d94SStacey Son 			}
15917e1e3d94SStacey Son 			if (!caller_in_stack) {
15927e1e3d94SStacey Son 				bcopy(oldlsp, lsp, LS_TIME);
15937e1e3d94SStacey Son 				/* LINTED - alignment */
15947e1e3d94SStacey Son 				lsp = (lsrec_t *)((char *)lsp + LS_TIME);
15957e1e3d94SStacey Son 			}
15963142b376SMark Johnston #ifndef illumos
15973142b376SMark Johnston 			free(oldlsp->ls_lock);
15983142b376SMark Johnston #endif
15997e1e3d94SStacey Son 		}
16007e1e3d94SStacey Son 		g_nrecs = g_nrecs_used =
16017e1e3d94SStacey Son 		    ((uintptr_t)lsp - (uintptr_t)newlsp) / LS_TIME;
16027e1e3d94SStacey Son 		g_recsize = LS_TIME;
16037e1e3d94SStacey Son 		g_stkdepth = 0;
16047e1e3d94SStacey Son 		free(data_buf);
16057e1e3d94SStacey Son 		data_buf = (char *)newlsp;
16067e1e3d94SStacey Son 	}
16077e1e3d94SStacey Son 
16087e1e3d94SStacey Son 	if ((sort_buf = calloc(2 * (g_nrecs + 1),
16097e1e3d94SStacey Son 	    sizeof (void *))) == NULL)
16107e1e3d94SStacey Son 		fail(1, "Sort buffer allocation failed");
16117e1e3d94SStacey Son 	merge_buf = sort_buf + (g_nrecs + 1);
16127e1e3d94SStacey Son 
16137e1e3d94SStacey Son 	/*
16147e1e3d94SStacey Son 	 * Build the sort buffer, discarding zero-count records along the way.
16157e1e3d94SStacey Son 	 */
16167e1e3d94SStacey Son 	/* LINTED - alignment */
16177e1e3d94SStacey Son 	for (i = 0, lsp = (lsrec_t *)data_buf; i < g_nrecs_used; i++,
16187e1e3d94SStacey Son 	    /* LINTED - alignment */
16197e1e3d94SStacey Son 	    lsp = (lsrec_t *)((char *)lsp + g_recsize)) {
16207e1e3d94SStacey Son 		if (lsp->ls_count == 0)
16217e1e3d94SStacey Son 			lsp->ls_event = LS_MAX_EVENTS;
16227e1e3d94SStacey Son 		sort_buf[i] = lsp;
16237e1e3d94SStacey Son 	}
16247e1e3d94SStacey Son 
16257e1e3d94SStacey Son 	if (g_nrecs_used == 0)
16267e1e3d94SStacey Son 		exit(0);
16277e1e3d94SStacey Son 
16287e1e3d94SStacey Son 	/*
16297e1e3d94SStacey Son 	 * Add a sentinel after the last record
16307e1e3d94SStacey Son 	 */
16317e1e3d94SStacey Son 	sort_buf[i] = lsp;
16327e1e3d94SStacey Son 	lsp->ls_event = LS_MAX_EVENTS;
16337e1e3d94SStacey Son 
16347e1e3d94SStacey Son 	if (g_tracing) {
16357e1e3d94SStacey Son 		report_trace(out, sort_buf);
16367e1e3d94SStacey Son 		return (0);
16377e1e3d94SStacey Son 	}
16387e1e3d94SStacey Son 
16397e1e3d94SStacey Son 	/*
16407e1e3d94SStacey Son 	 * Application of -g may have resulted in multiple records
16417e1e3d94SStacey Son 	 * with the same signature; coalesce them.
16427e1e3d94SStacey Son 	 */
16437e1e3d94SStacey Son 	if (g_gflag) {
16447e1e3d94SStacey Son 		mergesort(lockcmp, sort_buf, merge_buf, g_nrecs_used);
16457e1e3d94SStacey Son 		coalesce(lockcmp, sort_buf, g_nrecs_used);
16467e1e3d94SStacey Son 	}
16477e1e3d94SStacey Son 
16487e1e3d94SStacey Son 	/*
16497e1e3d94SStacey Son 	 * Coalesce locks within the same symbol if -c option specified.
16507e1e3d94SStacey Son 	 * Coalesce PCs within the same function if -k option specified.
16517e1e3d94SStacey Son 	 */
16527e1e3d94SStacey Son 	if (g_cflag || g_kflag) {
16537e1e3d94SStacey Son 		for (i = 0; i < g_nrecs_used; i++) {
16547e1e3d94SStacey Son 			int fr;
16557e1e3d94SStacey Son 			lsp = sort_buf[i];
16563142b376SMark Johnston #ifdef illumos
16577e1e3d94SStacey Son 			if (g_cflag)
16587e1e3d94SStacey Son 				coalesce_symbol(&lsp->ls_lock);
16593142b376SMark Johnston #endif
16607e1e3d94SStacey Son 			if (g_kflag) {
16617e1e3d94SStacey Son 				for (fr = 0; fr < g_stkdepth; fr++)
16627e1e3d94SStacey Son 					coalesce_symbol(&lsp->ls_stack[fr]);
16637e1e3d94SStacey Son 				coalesce_symbol(&lsp->ls_caller);
16647e1e3d94SStacey Son 			}
16657e1e3d94SStacey Son 		}
16667e1e3d94SStacey Son 		mergesort(lockcmp, sort_buf, merge_buf, g_nrecs_used);
16677e1e3d94SStacey Son 		coalesce(lockcmp, sort_buf, g_nrecs_used);
16687e1e3d94SStacey Son 	}
16697e1e3d94SStacey Son 
16707e1e3d94SStacey Son 	/*
16717e1e3d94SStacey Son 	 * Coalesce callers if -w option specified
16727e1e3d94SStacey Son 	 */
16737e1e3d94SStacey Son 	if (g_wflag) {
16747e1e3d94SStacey Son 		mergesort(lock_and_count_cmp_anywhere,
16757e1e3d94SStacey Son 		    sort_buf, merge_buf, g_nrecs_used);
16767e1e3d94SStacey Son 		coalesce(lockcmp_anywhere, sort_buf, g_nrecs_used);
16777e1e3d94SStacey Son 	}
16787e1e3d94SStacey Son 
16797e1e3d94SStacey Son 	/*
16807e1e3d94SStacey Son 	 * Coalesce locks if -W option specified
16817e1e3d94SStacey Son 	 */
16827e1e3d94SStacey Son 	if (g_Wflag) {
16837e1e3d94SStacey Son 		mergesort(site_and_count_cmp_anylock,
16847e1e3d94SStacey Son 		    sort_buf, merge_buf, g_nrecs_used);
16857e1e3d94SStacey Son 		coalesce(sitecmp_anylock, sort_buf, g_nrecs_used);
16867e1e3d94SStacey Son 	}
16877e1e3d94SStacey Son 
16887e1e3d94SStacey Son 	/*
16897e1e3d94SStacey Son 	 * Sort data by contention count (ls_count) or total time (ls_time),
16907e1e3d94SStacey Son 	 * depending on g_Pflag.  Override g_Pflag if time wasn't measured.
16917e1e3d94SStacey Son 	 */
16927e1e3d94SStacey Son 	if (g_recsize < LS_TIME)
16937e1e3d94SStacey Son 		g_Pflag = 0;
16947e1e3d94SStacey Son 
16957e1e3d94SStacey Son 	if (g_Pflag)
16967e1e3d94SStacey Son 		mergesort(timecmp, sort_buf, merge_buf, g_nrecs_used);
16977e1e3d94SStacey Son 	else
16987e1e3d94SStacey Son 		mergesort(countcmp, sort_buf, merge_buf, g_nrecs_used);
16997e1e3d94SStacey Son 
17007e1e3d94SStacey Son 	/*
17017e1e3d94SStacey Son 	 * Display data by event type
17027e1e3d94SStacey Son 	 */
17037e1e3d94SStacey Son 	first = &sort_buf[0];
17047e1e3d94SStacey Son 	while ((event = (*first)->ls_event) < LS_MAX_EVENTS) {
17057e1e3d94SStacey Son 		current = first;
17067e1e3d94SStacey Son 		while ((lsp = *current)->ls_event == event)
17077e1e3d94SStacey Son 			current++;
17087e1e3d94SStacey Son 		report_stats(out, first, current - first, ev_count[event],
17097e1e3d94SStacey Son 		    ev_time[event]);
17107e1e3d94SStacey Son 		first = current;
17117e1e3d94SStacey Son 	}
17127e1e3d94SStacey Son 
17133142b376SMark Johnston #ifndef illumos
17143142b376SMark Johnston 	/*
17153142b376SMark Johnston 	 * Free lock name buffers
17163142b376SMark Johnston 	 */
17173142b376SMark Johnston 	for (i = 0, lsp = (lsrec_t *)data_buf; i < g_nrecs_used; i++,
17183142b376SMark Johnston 	    lsp = (lsrec_t *)((char *)lsp + g_recsize))
17193142b376SMark Johnston 		free(lsp->ls_lock);
17203142b376SMark Johnston #endif
17213142b376SMark Johnston 
17227e1e3d94SStacey Son 	return (0);
17237e1e3d94SStacey Son }
17247e1e3d94SStacey Son 
17257e1e3d94SStacey Son static char *
format_symbol(char * buf,uintptr_t addr,int show_size)17267e1e3d94SStacey Son format_symbol(char *buf, uintptr_t addr, int show_size)
17277e1e3d94SStacey Son {
17287e1e3d94SStacey Son 	uintptr_t symoff;
17297e1e3d94SStacey Son 	char *symname;
17307e1e3d94SStacey Son 	size_t symsize;
17317e1e3d94SStacey Son 
17327e1e3d94SStacey Son 	symname = addr_to_sym(addr, &symoff, &symsize);
17337e1e3d94SStacey Son 
17347e1e3d94SStacey Son 	if (show_size && symoff == 0)
17357e1e3d94SStacey Son 		(void) sprintf(buf, "%s[%ld]", symname, (long)symsize);
17367e1e3d94SStacey Son 	else if (symoff == 0)
17377e1e3d94SStacey Son 		(void) sprintf(buf, "%s", symname);
17387e1e3d94SStacey Son 	else if (symoff < 16 && bcmp(symname, "cpu[", 4) == 0)	/* CPU+PIL */
1739bc96366cSSteven Hartland #ifdef illumos
17407e1e3d94SStacey Son 		(void) sprintf(buf, "%s+%ld", symname, (long)symoff);
17417e1e3d94SStacey Son #else
17427e1e3d94SStacey Son 		(void) sprintf(buf, "%s+%s", symname, g_pri_class[(int)symoff]);
17437e1e3d94SStacey Son #endif
17447e1e3d94SStacey Son 	else if (symoff <= symsize || (symoff < 256 && addr != symoff))
17457e1e3d94SStacey Son 		(void) sprintf(buf, "%s+0x%llx", symname,
17467e1e3d94SStacey Son 		    (unsigned long long)symoff);
17477e1e3d94SStacey Son 	else
17487e1e3d94SStacey Son 		(void) sprintf(buf, "0x%llx", (unsigned long long)addr);
17497e1e3d94SStacey Son 	return (buf);
17507e1e3d94SStacey Son }
17517e1e3d94SStacey Son 
17527e1e3d94SStacey Son static void
report_stats(FILE * out,lsrec_t ** sort_buf,size_t nrecs,uint64_t total_count,uint64_t total_time)17537e1e3d94SStacey Son report_stats(FILE *out, lsrec_t **sort_buf, size_t nrecs, uint64_t total_count,
17547e1e3d94SStacey Son 	uint64_t total_time)
17557e1e3d94SStacey Son {
17567e1e3d94SStacey Son 	uint32_t event = sort_buf[0]->ls_event;
17577e1e3d94SStacey Son 	lsrec_t *lsp;
17587e1e3d94SStacey Son 	double ptotal = 0.0;
17597e1e3d94SStacey Son 	double percent;
17607e1e3d94SStacey Son 	int i, j, fr;
17617e1e3d94SStacey Son 	int displayed;
17627e1e3d94SStacey Son 	int first_bin, last_bin, max_bin_count, total_bin_count;
17637e1e3d94SStacey Son 	int rectype;
17647e1e3d94SStacey Son 	char buf[256];
17657e1e3d94SStacey Son 	char lhdr[80], chdr[80];
17667e1e3d94SStacey Son 
17677e1e3d94SStacey Son 	rectype = g_recsize;
17687e1e3d94SStacey Son 
17697e1e3d94SStacey Son 	if (g_topn == 0) {
17707e1e3d94SStacey Son 		(void) fprintf(out, "%20llu %s\n",
17717e1e3d94SStacey Son 		    g_rates == 0 ? total_count :
17727e1e3d94SStacey Son 		    ((unsigned long long)total_count * NANOSEC) / g_elapsed,
17737e1e3d94SStacey Son 		    g_event_info[event].ev_desc);
17747e1e3d94SStacey Son 		return;
17757e1e3d94SStacey Son 	}
17767e1e3d94SStacey Son 
17777e1e3d94SStacey Son 	(void) sprintf(lhdr, "%s%s",
17787e1e3d94SStacey Son 	    g_Wflag ? "Hottest " : "", g_event_info[event].ev_lhdr);
17797e1e3d94SStacey Son 	(void) sprintf(chdr, "%s%s",
17807e1e3d94SStacey Son 	    g_wflag ? "Hottest " : "", "Caller");
17817e1e3d94SStacey Son 
17827e1e3d94SStacey Son 	if (!g_pflag)
17837e1e3d94SStacey Son 		(void) fprintf(out,
17847e1e3d94SStacey Son 		    "\n%s: %.0f events in %.3f seconds (%.0f events/sec)\n\n",
17857e1e3d94SStacey Son 		    g_event_info[event].ev_desc, (double)total_count,
17867e1e3d94SStacey Son 		    (double)g_elapsed / NANOSEC,
17877e1e3d94SStacey Son 		    (double)total_count * NANOSEC / g_elapsed);
17887e1e3d94SStacey Son 
17897e1e3d94SStacey Son 	if (!g_pflag && rectype < LS_HIST) {
17907e1e3d94SStacey Son 		(void) sprintf(buf, "%s", g_event_info[event].ev_units);
17917e1e3d94SStacey Son 		(void) fprintf(out, "%5s %4s %4s %4s %8s %-22s %-24s\n",
17927e1e3d94SStacey Son 		    g_rates ? "ops/s" : "Count",
17937e1e3d94SStacey Son 		    g_gflag ? "genr" : "indv",
17947e1e3d94SStacey Son 		    "cuml", "rcnt", rectype >= LS_TIME ? buf : "", lhdr, chdr);
17957e1e3d94SStacey Son 		(void) fprintf(out, "---------------------------------"
17967e1e3d94SStacey Son 		    "----------------------------------------------\n");
17977e1e3d94SStacey Son 	}
17987e1e3d94SStacey Son 
17997e1e3d94SStacey Son 	displayed = 0;
18007e1e3d94SStacey Son 	for (i = 0; i < nrecs; i++) {
18017e1e3d94SStacey Son 		lsp = sort_buf[i];
18027e1e3d94SStacey Son 
18037e1e3d94SStacey Son 		if (displayed++ >= g_topn)
18047e1e3d94SStacey Son 			break;
18057e1e3d94SStacey Son 
18067e1e3d94SStacey Son 		if (g_pflag) {
18077e1e3d94SStacey Son 			int j;
18087e1e3d94SStacey Son 
18097e1e3d94SStacey Son 			(void) fprintf(out, "%u %u",
18107e1e3d94SStacey Son 			    lsp->ls_event, lsp->ls_count);
18113142b376SMark Johnston #ifdef illumos
18127e1e3d94SStacey Son 			(void) fprintf(out, " %s",
18137e1e3d94SStacey Son 			    format_symbol(buf, lsp->ls_lock, g_cflag));
18143142b376SMark Johnston #else
18153142b376SMark Johnston 			(void) fprintf(out, " %s", lsp->ls_lock);
18163142b376SMark Johnston #endif
18177e1e3d94SStacey Son 			(void) fprintf(out, " %s",
18187e1e3d94SStacey Son 			    format_symbol(buf, lsp->ls_caller, 0));
18197e1e3d94SStacey Son 			(void) fprintf(out, " %f",
18207e1e3d94SStacey Son 			    (double)lsp->ls_refcnt / lsp->ls_count);
18217e1e3d94SStacey Son 			if (rectype >= LS_TIME)
18227e1e3d94SStacey Son 				(void) fprintf(out, " %llu",
18237e1e3d94SStacey Son 				    (unsigned long long)lsp->ls_time);
18247e1e3d94SStacey Son 			if (rectype >= LS_HIST) {
18257e1e3d94SStacey Son 				for (j = 0; j < 64; j++)
18267e1e3d94SStacey Son 					(void) fprintf(out, " %u",
18277e1e3d94SStacey Son 					    lsp->ls_hist[j]);
18287e1e3d94SStacey Son 			}
18297e1e3d94SStacey Son 			for (j = 0; j < LS_MAX_STACK_DEPTH; j++) {
18307e1e3d94SStacey Son 				if (rectype <= LS_STACK(j) ||
18317e1e3d94SStacey Son 				    lsp->ls_stack[j] == 0)
18327e1e3d94SStacey Son 					break;
18337e1e3d94SStacey Son 				(void) fprintf(out, " %s",
18347e1e3d94SStacey Son 				    format_symbol(buf, lsp->ls_stack[j], 0));
18357e1e3d94SStacey Son 			}
18367e1e3d94SStacey Son 			(void) fprintf(out, "\n");
18377e1e3d94SStacey Son 			continue;
18387e1e3d94SStacey Son 		}
18397e1e3d94SStacey Son 
18407e1e3d94SStacey Son 		if (rectype >= LS_HIST) {
18417e1e3d94SStacey Son 			(void) fprintf(out, "---------------------------------"
18427e1e3d94SStacey Son 			    "----------------------------------------------\n");
18437e1e3d94SStacey Son 			(void) sprintf(buf, "%s",
18447e1e3d94SStacey Son 			    g_event_info[event].ev_units);
18457e1e3d94SStacey Son 			(void) fprintf(out, "%5s %4s %4s %4s %8s %-22s %-24s\n",
18467e1e3d94SStacey Son 			    g_rates ? "ops/s" : "Count",
18477e1e3d94SStacey Son 			    g_gflag ? "genr" : "indv",
18487e1e3d94SStacey Son 			    "cuml", "rcnt", buf, lhdr, chdr);
18497e1e3d94SStacey Son 		}
18507e1e3d94SStacey Son 
18517e1e3d94SStacey Son 		if (g_Pflag && total_time != 0)
18527e1e3d94SStacey Son 			percent = (lsp->ls_time * 100.00) / total_time;
18537e1e3d94SStacey Son 		else
18547e1e3d94SStacey Son 			percent = (lsp->ls_count * 100.00) / total_count;
18557e1e3d94SStacey Son 
18567e1e3d94SStacey Son 		ptotal += percent;
18577e1e3d94SStacey Son 
18587e1e3d94SStacey Son 		if (rectype >= LS_TIME)
18597e1e3d94SStacey Son 			(void) sprintf(buf, "%llu",
18607e1e3d94SStacey Son 			    (unsigned long long)(lsp->ls_time / lsp->ls_count));
18617e1e3d94SStacey Son 		else
18627e1e3d94SStacey Son 			buf[0] = '\0';
18637e1e3d94SStacey Son 
18647e1e3d94SStacey Son 		(void) fprintf(out, "%5llu ",
18657e1e3d94SStacey Son 		    g_rates == 0 ? lsp->ls_count :
18667e1e3d94SStacey Son 		    ((uint64_t)lsp->ls_count * NANOSEC) / g_elapsed);
18677e1e3d94SStacey Son 
18687e1e3d94SStacey Son 		(void) fprintf(out, "%3.0f%% ", percent);
18697e1e3d94SStacey Son 
18707e1e3d94SStacey Son 		if (g_gflag)
18717e1e3d94SStacey Son 			(void) fprintf(out, "---- ");
18727e1e3d94SStacey Son 		else
18737e1e3d94SStacey Son 			(void) fprintf(out, "%3.0f%% ", ptotal);
18747e1e3d94SStacey Son 
18757e1e3d94SStacey Son 		(void) fprintf(out, "%4.2f %8s ",
18767e1e3d94SStacey Son 		    (double)lsp->ls_refcnt / lsp->ls_count, buf);
18777e1e3d94SStacey Son 
18783142b376SMark Johnston #ifdef illumos
18797e1e3d94SStacey Son 		(void) fprintf(out, "%-22s ",
18807e1e3d94SStacey Son 		    format_symbol(buf, lsp->ls_lock, g_cflag));
18813142b376SMark Johnston #else
18823142b376SMark Johnston 		(void) fprintf(out, "%-22s ", lsp->ls_lock);
18833142b376SMark Johnston #endif
18847e1e3d94SStacey Son 
18857e1e3d94SStacey Son 		(void) fprintf(out, "%-24s\n",
18867e1e3d94SStacey Son 		    format_symbol(buf, lsp->ls_caller, 0));
18877e1e3d94SStacey Son 
18887e1e3d94SStacey Son 		if (rectype < LS_HIST)
18897e1e3d94SStacey Son 			continue;
18907e1e3d94SStacey Son 
18917e1e3d94SStacey Son 		(void) fprintf(out, "\n");
18927e1e3d94SStacey Son 		(void) fprintf(out, "%10s %31s %-9s %-24s\n",
18937e1e3d94SStacey Son 		    g_event_info[event].ev_units,
18947e1e3d94SStacey Son 		    "------ Time Distribution ------",
18957e1e3d94SStacey Son 		    g_rates ? "ops/s" : "count",
18967e1e3d94SStacey Son 		    rectype > LS_STACK(0) ? "Stack" : "");
18977e1e3d94SStacey Son 
18987e1e3d94SStacey Son 		first_bin = 0;
18997e1e3d94SStacey Son 		while (lsp->ls_hist[first_bin] == 0)
19007e1e3d94SStacey Son 			first_bin++;
19017e1e3d94SStacey Son 
19027e1e3d94SStacey Son 		last_bin = 63;
19037e1e3d94SStacey Son 		while (lsp->ls_hist[last_bin] == 0)
19047e1e3d94SStacey Son 			last_bin--;
19057e1e3d94SStacey Son 
19067e1e3d94SStacey Son 		max_bin_count = 0;
19077e1e3d94SStacey Son 		total_bin_count = 0;
19087e1e3d94SStacey Son 		for (j = first_bin; j <= last_bin; j++) {
19097e1e3d94SStacey Son 			total_bin_count += lsp->ls_hist[j];
19107e1e3d94SStacey Son 			if (lsp->ls_hist[j] > max_bin_count)
19117e1e3d94SStacey Son 				max_bin_count = lsp->ls_hist[j];
19127e1e3d94SStacey Son 		}
19137e1e3d94SStacey Son 
19147e1e3d94SStacey Son 		/*
19157e1e3d94SStacey Son 		 * If we went a few frames below the caller, ignore them
19167e1e3d94SStacey Son 		 */
19177e1e3d94SStacey Son 		for (fr = 3; fr > 0; fr--)
19187e1e3d94SStacey Son 			if (lsp->ls_stack[fr] == lsp->ls_caller)
19197e1e3d94SStacey Son 				break;
19207e1e3d94SStacey Son 
19217e1e3d94SStacey Son 		for (j = first_bin; j <= last_bin; j++) {
19227e1e3d94SStacey Son 			uint_t depth = (lsp->ls_hist[j] * 30) / total_bin_count;
19237e1e3d94SStacey Son 			(void) fprintf(out, "%10llu |%s%s %-9u ",
19247e1e3d94SStacey Son 			    1ULL << j,
19257e1e3d94SStacey Son 			    "@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@" + 30 - depth,
19267e1e3d94SStacey Son 			    "                              " + depth,
19277e1e3d94SStacey Son 			    g_rates == 0 ? lsp->ls_hist[j] :
19287e1e3d94SStacey Son 			    (uint_t)(((uint64_t)lsp->ls_hist[j] * NANOSEC) /
19297e1e3d94SStacey Son 			    g_elapsed));
19307e1e3d94SStacey Son 			if (rectype <= LS_STACK(fr) || lsp->ls_stack[fr] == 0) {
19317e1e3d94SStacey Son 				(void) fprintf(out, "\n");
19327e1e3d94SStacey Son 				continue;
19337e1e3d94SStacey Son 			}
19347e1e3d94SStacey Son 			(void) fprintf(out, "%-24s\n",
19357e1e3d94SStacey Son 			    format_symbol(buf, lsp->ls_stack[fr], 0));
19367e1e3d94SStacey Son 			fr++;
19377e1e3d94SStacey Son 		}
19387e1e3d94SStacey Son 		while (rectype > LS_STACK(fr) && lsp->ls_stack[fr] != 0) {
19397e1e3d94SStacey Son 			(void) fprintf(out, "%15s %-36s %-24s\n", "", "",
19407e1e3d94SStacey Son 			    format_symbol(buf, lsp->ls_stack[fr], 0));
19417e1e3d94SStacey Son 			fr++;
19427e1e3d94SStacey Son 		}
19437e1e3d94SStacey Son 	}
19447e1e3d94SStacey Son 
19457e1e3d94SStacey Son 	if (!g_pflag)
19467e1e3d94SStacey Son 		(void) fprintf(out, "---------------------------------"
19477e1e3d94SStacey Son 		    "----------------------------------------------\n");
19487e1e3d94SStacey Son 
19497e1e3d94SStacey Son 	(void) fflush(out);
19507e1e3d94SStacey Son }
19517e1e3d94SStacey Son 
19527e1e3d94SStacey Son static void
report_trace(FILE * out,lsrec_t ** sort_buf)19537e1e3d94SStacey Son report_trace(FILE *out, lsrec_t **sort_buf)
19547e1e3d94SStacey Son {
19557e1e3d94SStacey Son 	lsrec_t *lsp;
19567e1e3d94SStacey Son 	int i, fr;
19577e1e3d94SStacey Son 	int rectype;
19587e1e3d94SStacey Son 	char buf[256], buf2[256];
19597e1e3d94SStacey Son 
19607e1e3d94SStacey Son 	rectype = g_recsize;
19617e1e3d94SStacey Son 
19627e1e3d94SStacey Son 	if (!g_pflag) {
19637e1e3d94SStacey Son 		(void) fprintf(out, "%5s  %7s  %11s  %-24s  %-24s\n",
19647e1e3d94SStacey Son 		    "Event", "Time", "Owner", "Lock", "Caller");
19657e1e3d94SStacey Son 		(void) fprintf(out, "---------------------------------"
19667e1e3d94SStacey Son 		    "----------------------------------------------\n");
19677e1e3d94SStacey Son 	}
19687e1e3d94SStacey Son 
19697e1e3d94SStacey Son 	for (i = 0; i < g_nrecs_used; i++) {
19707e1e3d94SStacey Son 
19717e1e3d94SStacey Son 		lsp = sort_buf[i];
19727e1e3d94SStacey Son 
19737e1e3d94SStacey Son 		if (lsp->ls_event >= LS_MAX_EVENTS || lsp->ls_count == 0)
19747e1e3d94SStacey Son 			continue;
19757e1e3d94SStacey Son 
19767e1e3d94SStacey Son 		(void) fprintf(out, "%2d  %10llu  %11p  %-24s  %-24s\n",
19777e1e3d94SStacey Son 		    lsp->ls_event, (unsigned long long)lsp->ls_time,
19787e1e3d94SStacey Son 		    (void *)lsp->ls_next,
19793142b376SMark Johnston #ifdef illumos
19807e1e3d94SStacey Son 		    format_symbol(buf, lsp->ls_lock, 0),
19813142b376SMark Johnston #else
19823142b376SMark Johnston 		    lsp->ls_lock,
19833142b376SMark Johnston #endif
19847e1e3d94SStacey Son 		    format_symbol(buf2, lsp->ls_caller, 0));
19857e1e3d94SStacey Son 
19867e1e3d94SStacey Son 		if (rectype <= LS_STACK(0))
19877e1e3d94SStacey Son 			continue;
19887e1e3d94SStacey Son 
19897e1e3d94SStacey Son 		/*
19907e1e3d94SStacey Son 		 * If we went a few frames below the caller, ignore them
19917e1e3d94SStacey Son 		 */
19927e1e3d94SStacey Son 		for (fr = 3; fr > 0; fr--)
19937e1e3d94SStacey Son 			if (lsp->ls_stack[fr] == lsp->ls_caller)
19947e1e3d94SStacey Son 				break;
19957e1e3d94SStacey Son 
19967e1e3d94SStacey Son 		while (rectype > LS_STACK(fr) && lsp->ls_stack[fr] != 0) {
19977e1e3d94SStacey Son 			(void) fprintf(out, "%53s  %-24s\n", "",
19987e1e3d94SStacey Son 			    format_symbol(buf, lsp->ls_stack[fr], 0));
19997e1e3d94SStacey Son 			fr++;
20007e1e3d94SStacey Son 		}
20017e1e3d94SStacey Son 		(void) fprintf(out, "\n");
20027e1e3d94SStacey Son 	}
20037e1e3d94SStacey Son 
20047e1e3d94SStacey Son 	(void) fflush(out);
20057e1e3d94SStacey Son }
2006