/* $NetBSD: pmc.c,v 1.2 2001/02/20 23:55:12 cgd Exp $ */

/*
 * Copyright 2000 Wasabi Systems, Inc.
 * All rights reserved.
 *
 * Written by Frank van der Linden for Wasabi Systems, Inc.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. All advertising materials mentioning features or use of this software
 *    must display the following acknowledgement:
 *      This product includes software developed for the NetBSD Project by
 *      Wasabi Systems, Inc.
 * 4. The name of Wasabi Systems, Inc. may not be used to endorse
 *    or promote products derived from this software without specific prior
 *    written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY WASABI SYSTEMS, INC. ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
 * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL WASABI SYSTEMS, INC
 * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */
|
|
|
|
#include <sys/types.h>
#include <sys/wait.h>

#include <machine/sysarch.h>
#include <machine/specialreg.h>

#include <err.h>
#include <errno.h>
#include <signal.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <unistd.h>
|
|
|
|
const struct pmc_name2val {
|
|
const char *name;
|
|
int val;
|
|
int unit;
|
|
} pmc_names[] = {
|
|
{ "mem-refs", PMC6_DATA_MEM_REFS, 0 },
|
|
{ "l1cache-lines", PMC6_DCU_LINES_IN, 0 },
|
|
{ "l1cache-mlines", PMC6_DCU_M_LINES_IN, 0 },
|
|
{ "l1cache-mlines-evict", PMC6_DCU_M_LINES_OUT, 0 },
|
|
{ "l1cache-miss-wait", PMC6_DCU_MISS_OUTSTANDING, 0 },
|
|
{ "ins-fetch", PMC6_IFU_IFETCH, 0 },
|
|
{ "ins-fetch-misses", PMC6_IFU_IFETCH_MISS, 0 },
|
|
{ "itlb-misses", PMC6_IFU_IFETCH_MISS, 0 },
|
|
{ "insfetch-mem-stall", PMC6_IFU_MEM_STALL, 0 },
|
|
{ "insfetch-decode-stall", PMC6_ILD_STALL, 0 },
|
|
|
|
{ "l2cache-insfetch", PMC6_L2_IFETCH, 0x0f },
|
|
{ "l2cache-data-loads", PMC6_L2_LD, 0x0f },
|
|
{ "l2cache-data-stores", PMC6_L2_ST, 0x0f },
|
|
{ "l2cache-lines", PMC6_L2_LINES_IN, 0 },
|
|
{ "l2cache-lines-evict", PMC6_L2_LINES_OUT, 0 },
|
|
{ "l2cache-mlines", PMC6_L2_M_LINES_INM, 0 },
|
|
{ "l2cache-mlines-evict", PMC6_L2_M_LINES_OUTM, 0x0f },
|
|
{ "l2cache-reqs", PMC6_L2_RQSTS, 0 },
|
|
{ "l2cache-addr-strobes", PMC6_L2_ADS, 0 },
|
|
{ "l2cache-data-busy", PMC6_L2_DBUS_BUSY, 0 },
|
|
{ "l2cache-data-busy-read", PMC6_L2_DBUS_BUSY_RD },
|
|
|
|
{ "bus-drdy-clocks-self", PMC6_BUS_DRDY_CLOCKS, 0x00 },
|
|
{ "bus-drdy-clocks-any", PMC6_BUS_DRDY_CLOCKS, 0x20 },
|
|
{ "bus-lock-clocks-self", PMC6_BUS_LOCK_CLOCKS, 0x00 },
|
|
{ "bus-lock-clocks-any", PMC6_BUS_LOCK_CLOCKS, 0x20 },
|
|
{ "bus-req-outstanding-self", PMC6_BUS_REQ_OUTSTANDING, 0x00 },
|
|
{ "bus-req-outstanding-any", PMC6_BUS_REQ_OUTSTANDING, 0x20 },
|
|
{ "bus-burst-reads-self", PMC6_BUS_TRAN_BRD, 0x00 },
|
|
{ "bus-burst-reads-any", PMC6_BUS_TRAN_BRD, 0x20 },
|
|
{ "bus-read-for-ownership-self",PMC6_BUS_TRAN_RFO, 0x00 },
|
|
{ "bus-read-for-ownership-any", PMC6_BUS_TRAN_RFO, 0x20 },
|
|
{ "bus-write-back-self", PMC6_BUS_TRANS_WB, 0x00 },
|
|
{ "bus-write-back-any", PMC6_BUS_TRANS_WB, 0x20 },
|
|
{ "bus-ins-fetches-self", PMC6_BUS_TRAN_IFETCH, 0x00 },
|
|
{ "bus-ins-fetches-any", PMC6_BUS_TRAN_IFETCH, 0x20 },
|
|
{ "bus-invalidates-self", PMC6_BUS_TRAN_INVAL, 0x00 },
|
|
{ "bus-invalidates-any", PMC6_BUS_TRAN_INVAL, 0x20 },
|
|
{ "bus-partial-writes-self", PMC6_BUS_TRAN_PWR, 0x00 },
|
|
{ "bus-partial-writes-any", PMC6_BUS_TRAN_PWR, 0x20 },
|
|
{ "bus-partial-trans-self", PMC6_BUS_TRANS_P, 0x00 },
|
|
{ "bus-partial-trans-any", PMC6_BUS_TRANS_P, 0x20 },
|
|
{ "bus-io-trans-self", PMC6_BUS_TRANS_IO, 0x00 },
|
|
{ "bus-io-trans-any", PMC6_BUS_TRANS_IO, 0x20 },
|
|
{ "bus-deferred-trans-self", PMC6_BUS_TRAN_DEF, 0x00 },
|
|
{ "bus-deferred-trans-any", PMC6_BUS_TRAN_DEF, 0x20 },
|
|
{ "bus-burst-trans-self", PMC6_BUS_TRAN_BURST, 0x00 },
|
|
{ "bus-burst-trans-any", PMC6_BUS_TRAN_BURST, 0x20 },
|
|
{ "bus-total-trans-self", PMC6_BUS_TRAN_ANY, 0x00 },
|
|
{ "bus-total-trans-any", PMC6_BUS_TRAN_ANY, 0x20 },
|
|
{ "bus-mem-trans-self", PMC6_BUS_TRAN_MEM, 0x00 },
|
|
{ "bus-mem-trans-any", PMC6_BUS_TRAN_MEM, 0x20 },
|
|
{ "bus-recv-cycles", PMC6_BUS_DATA_RCV, 0 },
|
|
{ "bus-bnr-cycles", PMC6_BUS_BNR_DRV, 0 },
|
|
{ "bus-hit-cycles", PMC6_BUS_HIT_DRV, 0 },
|
|
{ "bus-hitm-cycles", PMC6_BUS_HITM_DRDV, 0 },
|
|
{ "bus-snoop-stall", PMC6_BUS_SNOOP_STALL, 0 },
|
|
|
|
{ "fpu-flops", PMC6_FLOPS, 0 },
|
|
{ "fpu-comp-ops", PMC6_FP_COMP_OPS_EXE, 0 },
|
|
{ "fpu-except-assist", PMC6_FP_ASSIST, 0 },
|
|
{ "fpu-mul", PMC6_MUL, 0 },
|
|
{ "fpu-div", PMC6_DIV, 0 },
|
|
{ "fpu-div-busy", PMC6_CYCLES_DIV_BUSY, 0 },
|
|
|
|
{ "mem-sb-blocks", PMC6_LD_BLOCKS, 0 },
|
|
{ "mem-sb-drains", PMC6_SB_DRAINS, 0 },
|
|
{ "mem-misalign-ref", PMC6_MISALIGN_MEM_REF, 0 },
|
|
{ "ins-pref-dispatch-nta", PMC6_EMON_KNI_PREF_DISPATCHED, 0x01 },
|
|
{ "ins-pref-dispatch-t1", PMC6_EMON_KNI_PREF_DISPATCHED, 0x01 },
|
|
{ "ins-pref-dispatch-t2", PMC6_EMON_KNI_PREF_DISPATCHED, 0x02 },
|
|
{ "ins-pref-dispatch-weak", PMC6_EMON_KNI_PREF_DISPATCHED, 0x03 },
|
|
{ "ins-pref-miss-nta", PMC6_EMON_KNI_PREF_MISS, 0x01 },
|
|
{ "ins-pref-miss-t1", PMC6_EMON_KNI_PREF_MISS, 0x01 },
|
|
{ "ins-pref-miss-t2", PMC6_EMON_KNI_PREF_MISS, 0x02 },
|
|
{ "ins-pref-miss-weak", PMC6_EMON_KNI_PREF_MISS, 0x03 },
|
|
|
|
{ "ins-retired", PMC6_INST_RETIRED, 0 },
|
|
{ "uops-retired", PMC6_UOPS_RETIRED, 0 },
|
|
{ "ins-decoded", PMC6_INST_DECODED, 0 },
|
|
{ "ins-stream-retired-packed-scalar",
|
|
PMC6_EMON_KNI_INST_RETIRED, 0x00 },
|
|
{ "ins-stream-retired-scalar",
|
|
PMC6_EMON_KNI_INST_RETIRED, 0x01 },
|
|
{ "ins-stream-comp-retired-packed-scalar",
|
|
PMC6_EMON_KNI_COMP_INST_RET, 0x00 },
|
|
{ "ins-stream-comp-retired--scalar",
|
|
PMC6_EMON_KNI_COMP_INST_RET, 0x01 },
|
|
|
|
|
|
{ "int-hw", PMC6_HW_INT_RX, 0 },
|
|
{ "int-cycles-masked", PMC6_CYCLES_INT_MASKED, 0 },
|
|
{ "int-cycles-masked-pending", PMC6_CYCLES_INT_PENDING_AND_MASKED, 0 },
|
|
|
|
{ "branch-retired", PMC6_BR_INST_RETIRED, 0 },
|
|
{ "branch-miss-retired", PMC6_BR_MISS_PRED_RETIRED, 0 },
|
|
{ "branch-taken-retired", PMC6_BR_TAKEN_RETIRED, 0 },
|
|
{ "branch-taken-mispred-retired", PMC6_BR_MISS_PRED_TAKEN_RET, 0 },
|
|
{ "branch-decoded", PMC6_BR_INST_DECODED, 0 },
|
|
{ "branch-btb-miss", PMC6_BTB_MISSES, 0 },
|
|
{ "branch-bogus", PMC6_BR_BOGUS, 0 },
|
|
{ "branch-baclear", PMC6_BACLEARS, 0 },
|
|
|
|
{ "stall-resource", PMC6_RESOURCE_STALLS, 0 },
|
|
{ "stall-partial", PMC6_PARTIAL_RAT_STALLS, 0 },
|
|
|
|
{ "seg-loads", PMC6_SEGMENT_REG_LOADS, 0 },
|
|
|
|
{ "unhalted-cycles", PMC6_CPU_CLK_UNHALTED, 0 },
|
|
|
|
{ "mmx-exec", PMC6_MMX_INSTR_EXEC, 0 },
|
|
{ "mmx-sat-exec", PMC6_MMX_SAT_INSTR_EXEC, 0 },
|
|
{ "mmx-uops-exec", PMC6_MMX_UOPS_EXEC, 0x0f },
|
|
{ "mmx-exec-packed-mul", PMC6_MMX_INSTR_TYPE_EXEC, 0x01 },
|
|
{ "mmx-exec-packed-shift", PMC6_MMX_INSTR_TYPE_EXEC, 0x02 },
|
|
{ "mmx-exec-pack-ops", PMC6_MMX_INSTR_TYPE_EXEC, 0x04 },
|
|
{ "mmx-exec-unpack-ops", PMC6_MMX_INSTR_TYPE_EXEC, 0x08 },
|
|
{ "mmx-exec-packed-logical", PMC6_MMX_INSTR_TYPE_EXEC, 0x10 },
|
|
{ "mmx-exec-packed-arith", PMC6_MMX_INSTR_TYPE_EXEC, 0x20 },
|
|
{ "mmx-trans-mmx-float", PMC6_FP_MMX_TRANS, 0x00 },
|
|
{ "mmx-trans-float-mmx", PMC6_FP_MMX_TRANS, 0x01 },
|
|
{ "mmx-assist", PMC6_MMX_ASSIST, 0 },
|
|
{ "mmx-retire", PMC6_MMX_INSTR_RET, 0 },
|
|
|
|
{ "seg-rename-stalls-es", PMC6_SEG_RENAME_STALLS, 0x01 },
|
|
{ "seg-rename-stalls-ds", PMC6_SEG_RENAME_STALLS, 0x02 },
|
|
{ "seg-rename-stalls-fs", PMC6_SEG_RENAME_STALLS, 0x04 },
|
|
{ "seg-rename-stalls-gs", PMC6_SEG_RENAME_STALLS, 0x08 },
|
|
{ "seg-rename-stalls-all", PMC6_SEG_RENAME_STALLS, 0x0f },
|
|
{ "seg-rename-es", PMC6_SEG_REG_RENAMES, 0x01 },
|
|
{ "seg-rename-ds", PMC6_SEG_REG_RENAMES, 0x02 },
|
|
{ "seg-rename-fs", PMC6_SEG_REG_RENAMES, 0x04 },
|
|
{ "seg-rename-gs", PMC6_SEG_REG_RENAMES, 0x08 },
|
|
{ "seg-rename-all", PMC6_SEG_REG_RENAMES, 0x0f },
|
|
{ "seg-rename-retire", PMC6_RET_SEG_RENAMES, 0 },
|
|
};
|
|
|
|
static const struct pmc_name2val *
|
|
find_pmc_name(const char *name)
|
|
{
|
|
int i;
|
|
const struct pmc_name2val *pnp = NULL;
|
|
|
|
for (i = 0; i < sizeof (pmc_names) / (sizeof (struct pmc_name2val));
|
|
i++) {
|
|
if (strcmp(pmc_names[i].name, name) == 0) {
|
|
pnp = &pmc_names[i];
|
|
break;
|
|
}
|
|
}
|
|
|
|
return pnp;
|
|
}
|
|
|
|
static void
|
|
list_pmc_names(void)
|
|
{
|
|
int i, n, left, pairs;
|
|
|
|
printf("Supported performance counter events:\n");
|
|
n = sizeof (pmc_names) / sizeof (struct pmc_name2val);
|
|
pairs = n / 2;
|
|
left = n % 2;
|
|
|
|
for (i = 0; i < pairs; i++)
|
|
printf(" %37s %37s\n", pmc_names[i * 2].name,
|
|
pmc_names[i * 2 + 1].name);
|
|
if (left != 0)
|
|
printf("\t%37s\n", pmc_names[n - 1].name);
|
|
}
|
|
|
|
/*
 * Write the three supported invocation forms to stderr and terminate the
 * process with exit status 1.  Never returns.
 */
static void
usage(void)
{
	const char *prog = getprogname();

	fprintf(stderr,
	    "Usage: %s -h\n"
	    " %s -C\n"
	    " %s -c <event> command [options] ...\n",
	    prog, prog, prog);
	exit(1);
}
|
|
|
|
int
|
|
main(int argc, char **argv)
|
|
{
|
|
int c, status, ret0, ret1, errn0, errn1;
|
|
char *event;
|
|
const struct pmc_name2val *pnp;
|
|
struct i386_pmc_info_args pi;
|
|
struct i386_pmc_startstop_args pss0, pss1;
|
|
struct i386_pmc_read_args pr0, pr1;
|
|
pid_t pid;
|
|
|
|
pnp = NULL;
|
|
while ((c = getopt(argc, argv, "Cc:h")) != -1) {
|
|
switch (c) {
|
|
case 'C':
|
|
if (argc != 2)
|
|
usage();
|
|
/*
|
|
* Just clear both counters. Useful if
|
|
* a previous run got killed and did not
|
|
* clean up.
|
|
*/
|
|
memset(&pss0, 0, sizeof pss0);
|
|
i386_pmc_startstop(&pss0);
|
|
pss0.counter = 1;
|
|
i386_pmc_startstop(&pss0);
|
|
exit(0);
|
|
case 'c':
|
|
event = optarg;
|
|
pnp = find_pmc_name(event);
|
|
break;
|
|
case 'h':
|
|
if (argc == 2) {
|
|
list_pmc_names();
|
|
exit(0);
|
|
}
|
|
default:
|
|
usage();
|
|
}
|
|
}
|
|
|
|
if (pnp == NULL)
|
|
usage();
|
|
|
|
if (i386_pmc_info(&pi) < 0)
|
|
err(2, "pmc_info");
|
|
if (pi.type != PMC_TYPE_I686)
|
|
errx(3, "only 686 counters are supported");
|
|
|
|
memset(&pss0, 0, sizeof pss0);
|
|
memset(&pss1, 0, sizeof pss1);
|
|
pss0.event = pss1.event = pnp->val;
|
|
pss0.unit = pss1.unit = pnp->unit;
|
|
pss0.flags = PMC_SETUP_USER;
|
|
pss0.counter = 0;
|
|
pss1.flags = PMC_SETUP_KERNEL;
|
|
pss0.counter = 1;
|
|
|
|
/*
|
|
* XXX should catch signals and tidy up in the parent.
|
|
*/
|
|
if (i386_pmc_startstop(&pss0) < 0)
|
|
err(4, "pmc_start user");
|
|
pss0.flags = 0;
|
|
if (i386_pmc_startstop(&pss1) < 0)
|
|
err(5, "pmc_start kernel");
|
|
pss1.flags = 0;
|
|
|
|
pid = vfork();
|
|
|
|
switch(pid) {
|
|
case -1:
|
|
errx(5, "vfork");
|
|
case 0:
|
|
execvp(argv[optind], &argv[optind]);
|
|
errx(6, "execvp");
|
|
}
|
|
|
|
(void)signal(SIGINT, SIG_IGN);
|
|
(void)signal(SIGQUIT, SIG_IGN);
|
|
|
|
waitpid(pid, &status, 0);
|
|
if (!WIFEXITED(status))
|
|
return 0;
|
|
|
|
/*
|
|
* Do not immediately exit on errors below. The counters
|
|
* must be stopped first, or subsequent runs will get
|
|
* EBUSY.
|
|
*/
|
|
pr0.counter = 0;
|
|
ret0 = i386_pmc_read(&pr0);
|
|
if (ret0 < 0)
|
|
errn0 = errno;
|
|
pr1.counter = 1;
|
|
ret1 = i386_pmc_read(&pr1);
|
|
if (ret1 < 0)
|
|
errn1 = errno;
|
|
|
|
if (i386_pmc_startstop(&pss0) < 0)
|
|
warn("pmc_stop user");
|
|
if (i386_pmc_startstop(&pss1) < 0)
|
|
warn("pmc_stop kernel");
|
|
|
|
if (ret0 < 0) {
|
|
errno = errn0;
|
|
errx(6, "pmc_read");
|
|
}
|
|
if (ret1 < 0) {
|
|
errno = errn1;
|
|
errx(7, "pmc_read");
|
|
}
|
|
|
|
printf("%s: user %llu kernel %llu\n", event, pr0.val, pr1.val);
|
|
|
|
return 0;
|
|
}
|