[BACK]Return to pctrctl.c CVS log [TXT][DIR] Up to [local] / src / usr.bin / pctrctl

Diff for /src/usr.bin/pctrctl/Attic/pctrctl.c between version 1.2 and 1.3

version 1.2, 1996/08/14 03:02:52 version 1.3, 1996/08/14 22:03:17
Line 1 
Line 1 
 /*      $OpenBSD$       */  /*      $OpenBSD$       */
   
 /*  /*
  * Pentium performance counter driver for OpenBSD.   * Pentium performance counter control program for OpenBSD.
  * Author: David Mazieres <dm@lcs.mit.edu>   * Copyright 1996 David Mazieres <dm@lcs.mit.edu>.
    *
    * Modification and redistribution in source and binary forms is
    * permitted provided that due credit is given to the author and the
    * OpenBSD project (for instance by leaving this copyright notice
    * intact).
  */   */
   
 #include <stdio.h>  #include <stdio.h>
Line 15 
Line 21 
 #include <machine/pctr.h>  #include <machine/pctr.h>
   
 char *progname;  char *progname;
   int cpufamily;
   
 char *pctr_name[] = {  #define CFL_MESI 0x1   /* Unit mask accepts MESI encoding */
   "Data read", /* 0 */  #define CFL_SA   0x2   /* Unit mask accepts Self/Any bit */
   "Data write",  #define CFL_C0   0x4   /* Counter 0 only */
   "Data TLB miss",  #define CFL_C1   0x8   /* Counter 1 only */
   "Data read miss",  
   "Data write miss",  struct ctrfn {
   "Write (hit) to M or E state lines",    u_int fn;
   "Data cache lines written back",    int flags;
   "Data cache snoops",    char *name;
   "Data cache snoop hits", /* 8 */    char *desc;
   "Memory accesses in both pipes",  
   "Bank conflicts",  
   "Misaligned data memory references",  
   "Code read",  
   "Code TLB miss",  
   "Code cache miss",  
   "Any segment register load",  
   NULL, /* 0x10 */  
   NULL,  
   "Branches",  
   "BTB hits",  
   "Taken branch or BTB hit",  
   "Pipeline flushes",  
   "Instructions executed",  
   "Instructions executed in the V-pipe",  
   "Bus utilization (clocks)", /* 0x18 */  
   "Pipeline stalled by write backup",  
   "Pipeline stalled by data memory read",  
   "Pipeline stalled by write to E or M line",  
   "Locked bus cycle",  
   "I/O read or write cycle",  
   "Noncacheable memory references",  
   "AGI (Address Generation Interlock)",  
   NULL, /* 0x20 */  
   NULL,  
   "Floating-point operations",  
   "Breakpoint 0 match",  
   "Breakpoint 1 match",  
   "Breakpoint 2 match",  
   "Breakpoint 3 match",  
   "Hardware interupts",  
   "Data read or data write", /* 0x28 */  
   "Data read miss or data write miss",  
 };  };
   
 static const int pctr_name_size =  (sizeof (pctr_name) / sizeof (char *));  struct ctrfn p5fn[] = {
     {0x00, 0, "Data read", NULL},
     {0x01, 0, "Data write", NULL},
     {0x02, 0, "Data TLB miss", NULL},
     {0x03, 0, "Data read miss", NULL},
     {0x04, 0, "Data write miss", NULL},
     {0x05, 0, "Write (hit) to M or E state lines", NULL},
     {0x06, 0, "Data cache lines written back", NULL},
     {0x07, 0, "Data cache snoops", NULL},
     {0x08, 0, "Data cache snoop hits", NULL},
     {0x09, 0, "Memory accesses in both pipes", NULL},
     {0x0a, 0, "Bank conflicts", NULL},
     {0x0b, 0, "Misaligned data memory references", NULL},
     {0x0c, 0, "Code read", NULL},
     {0x0d, 0, "Code TLB miss", NULL},
     {0x0e, 0, "Code cache miss", NULL},
     {0x0f, 0, "Any segment register load", NULL},
     {0x12, 0, "Branches", NULL},
     {0x13, 0, "BTB hits", NULL},
     {0x14, 0, "Taken branch or BTB hit", NULL},
     {0x15, 0, "Pipeline flushes", NULL},
     {0x16, 0, "Instructions executed", NULL},
     {0x17, 0, "Instructions executed in the V-pipe", NULL},
     {0x18, 0, "Bus utilization (clocks)", NULL},
     {0x19, 0, "Pipeline stalled by write backup", NULL},
     {0x1a, 0, "Pipeline stalled by data memory read", NULL},
     {0x1b, 0, "Pipeline stalled by write to E or M line", NULL},
     {0x1c, 0, "Locked bus cycle", NULL},
     {0x1d, 0, "I/O read or write cycle", NULL},
     {0x1e, 0, "Noncacheable memory references", NULL},
     {0x1f, 0, "AGI (Address Generation Interlock)", NULL},
     {0x22, 0, "Floating-point operations", NULL},
     {0x23, 0, "Breakpoint 0 match", NULL},
     {0x24, 0, "Breakpoint 1 match", NULL},
     {0x25, 0, "Breakpoint 2 match", NULL},
     {0x26, 0, "Breakpoint 3 match", NULL},
     {0x27, 0, "Hardware interupts", NULL},
     {0x28, 0, "Data read or data write", NULL},
     {0x29, 0, "Data read miss or data write miss", NULL},
     {0x0, 0, NULL, NULL},
   };
   
   struct ctrfn p6fn[] = {
     {0x03, 0, "LD_BLOCKS",
      "Number of store buffer blocks."},
     {0x04, 0, "SB_DRAINS",
      "Number of store buffer drain cycles."},
     {0x04, 0, "MISALIGN_MEM_REF",
      "Number of misaligned data memory references."},
     {0x06, 0, "SEGMENT_REG_LOADS",
      "Number of segment register loads."},
     {0x10, CFL_C0, "FP_COMP_OPS_EXE",
      "Number of computational floating-point operations executed."},
     {0x11, CFL_C1, "FP_ASSIST",
      "Number of floating-point exception cases handled by microcode."},
     {0x12, CFL_C1, "MUL",
      "Number of multiplies."},
     {0x13, CFL_C1, "DIV",
      "Number of divides."},
     {0x14, CFL_C0, "CYCLES_DIV_BUSY",
      "Number of cycles during which the divider is busy."},
     {0x21, 0, "L2_ADS",
      "Number of L2 address strobes."},
     {0x22, 0, "L2_DBUS_BUSY",
      "Number of cycles durring which the data bus was busy."},
     {0x23, 0, "L2_DBUS_BUSY_RD",
      "Number of cycles during which the data bus was busy transferring "
      "data from L2 to the processor."},
     {0x24, 0, "L2_LINES_IN",
      "Number of lines allocated in the L2."},
     {0x25, 0, "L2_M_LINES_INM",
      "Number of modified lines allocated in the L2."},
     {0x26, 0, "L2_LINES_OUT",
      "Number of lines removed from the L2 for any reason."},
     {0x27, 0, "L2_M_LINES_OUTM",
      "Number of modified lines removed from the L2 for any reason."},
     {0x28, CFL_MESI, "L2_IFETCH",
      "Number of L2 instruction fetches."},
     {0x29, CFL_MESI, "L2_LD",
      "Number of L2 data loads."},
     {0x2a, CFL_MESI, "L2_ST",
      "Number of L2 data stores."},
     {0x2e, CFL_MESI, "L2_RQSTS",
      "Number of L2 requests."},
     {0x43, 0, "DATA_MEM_REFS",
      "All memory references, both cacheable and non-cacheable."},
     {0x45, 0, "DCU_LINES_IN",
      "Total lines allocated in the DCU."},
     {0x46, 0, "DCU_M_LINES_IN",
      "Number of M state lines allocated in the DCU."},
     {0x47, 0, "DCU_M_LINES_OUT",
      "Number of M state lines evicted from the DCU.  "
      "This includes evictions via snoop HITM, interfention or replacement"},
     {0x48, 0, "DCU_MISS_OUTSTANDING",
      "Weighted number of cycles while a DCU miss is outstanding."},
     {0x60, 0, "BUS_REQ_OUTSTANDING",
      "Number of bus requests outstanding."},
     {0x61, 0, "BUS_BNR_DRV",
      "Number of bus clock cycles during which the processor is "
      "driving the BNR pin."},
     {0x62, CFL_SA, "BUS_DRDY_CLOCKS",
      "Number of clocks during which DRDY is asserted."},
     {0x63, CFL_SA, "BUS_LOCK_CLOCKS",
      "Number of clocks during which LOCK is asserted."},
     {0x64, 0, "BUS_DATA_RCV",
      "Number of bus clock cycles during which the processor is "
      "receiving data."},
     {0x65, CFL_SA, "BUS_TRAN_BRD",
      "Number of burst read transactions."},
     {0x66, CFL_SA, "BUS_TRAN_RFO",
      "Number of read for ownership transactions."},
     {0x67, CFL_SA, "BUS_TRANS_WB",
      "Number of write back transactions."},
     {0x68, CFL_SA, "BUS_TRAN_IFETCH",
      "Number of instruction fetch transactions."},
     {0x69, CFL_SA, "BUS_TRAN_INVAL",
      "Number of invalidate transactions."},
     {0x6a, CFL_SA, "BUS_TRAN_PWR",
      "Number of partial write transactions."},
     {0x6b, CFL_SA, "BUS_TRANS_P",
      "Number of partial transactions."},
     {0x6c, CFL_SA, "BUS_TRANS_IO",
      "Number of I/O transactions."},
     {0x6d, CFL_SA, "BUS_TRAN_DEF",
      "Number of deferred transactions."},
     {0x6e, CFL_SA, "BUS_TRAN_BURST",
      "Number of burst transactions."},
     {0x6f, CFL_SA, "BUS_TRAN_MEM",
      "Number of memory transactions."},
     {0x70, CFL_SA, "BUS_TRAN_ANY",
      "Number of all transactions."},
     {0x79, 0, "CPU_CLK_UNHALTED",
      "Number of cycles during which the processor is not halted."},
     {0x7a, 0, "BUS_HIT_DRV",
      "Number of bus clock cycles during which the processor is "
      "driving the HIT pin."},
     {0x7b, 0, "BUS_HITM_DRV",
      "Number of bus clock cycles during which the processor is "
      "driving the HITM pin."},
     {0x7e, 0, "BUS_SNOOP_STALL",
      "Number of clock cycles during which the bus is snoop stalled."},
     {0x80, 0, "IFU_IFETCH",
      "Number of instruction fetches, both cacheable and non-cacheable."},
     {0x81, 0, "IFU_IFETCH_MISS",
      "Number of instruction fetch misses."},
     {0x85, 0, "ITLB_MISS",
      "Number of ITLB misses."},
     {0x86, 0, "IFU_MEM_STALL",
      "Number of cycles that the instruction fetch pipe stage is stalled, "
      "including cache mises, ITLB misses, ITLB faults, "
      "and victim cache evictions"},
     {0x87, 0, "ILD_STALL",
      "Number of cycles that the instruction length decoder is stalled"},
     {0xa2, 0, "RESOURCE_STALLS",
      "Number of cycles during which there are resource-related stalls."},
     {0xc0, 0, "INST_RETIRED",
      "Number of instructions retired."},
     {0xc1, CFL_C0, "FLOPS",
      "Number of computational floating-point operations retired."},
     {0xc2, 0, "UOPS_RETIRED",
      "Number of UOPs retired."},
     {0xc4, 0, "BR_INST_RETIRED",
      "Number of branch instructions retired."},
     {0xc5, 0, "BR_MISS_PRED_RETIRED",
      "Number of mispredicted branches retired."},
     {0xc6, 0, "CYCLES_INT_MASKED",
      "Number of processor cycles for which interrupts are disabled."},
     {0xc7, 0, "CYCLES_INT_PENDING_AND_MASKED",
      "Number of processor cycles for which interrupts are disabled "
      "and interrupts are pending."},
     {0xc8, 0, "HW_INT_RX",
      "Number of hardware interrupts received."},
     {0xc9, 0, "BR_TAKEN_RETIRED",
      "Number of taken branches retired."},
     {0xca, 0, "BR_MISS_PRED_TAKEN_RET",
      "Number of taken mispredictioned branches retired."},
     {0xd0, 0, "INST_DECODER",
      "Number of instructions decoded."},
     {0xd2, 0, "PARTIAL_RAT_STALLS",
      "Number of cycles or events for partial stalls."},
     {0xe0, 0, "BR_INST_DECODED",
      "Number of branch instructions decoded."},
     {0xe2, 0, "BTB_MISSES",
      "Number of branches that miss the BTB."},
     {0xe4, 0, "BR_BOGUS",
      "Number of bogus branches."},
     {0xe6, 0, "BACLEARS",
      "Number of times BACLEAR is asserted."},
     {0x0, 0, NULL, NULL},
   };
   
   static void
   printdesc (char *desc)
   {
     char *p;
   
     for (;;) {
       while (*desc == ' ')
         desc++;
       if (strlen (desc) < 70) {
         if (*desc)
           printf ("      %s\n", desc);
         return;
       }
       p = desc + 72;
       while (*--p != ' ')
         ;
       while (*--p == ' ')
         ;
       p++;
       printf ("      %.*s\n", p - desc, desc);
       desc = p;
     }
   
   }
   
 /* Print all possible counter functions */  /* Print all possible counter functions */
 static void  static void
 list (void)  list (int fam)
 {  {
   int i;    struct ctrfn *cfnp;
   
   printf ("Hardware counter event types:\n");    if (fam == 5)
   for (i = 0; i < pctr_name_size; i++)      cfnp = p5fn;
     printf ("  %02x  %s\n", i, pctr_name[i] ? pctr_name[i] : "invalid");    else if (fam == 6)
       cfnp = p6fn;
     else {
       fprintf (stderr, "Unknown CPU family %d\n", fam);
       exit (1);
     }
     printf ("Hardware counter functions for the %s:\n\n",
             fam == 5 ? "Pentium" : "Pentium Pro");
     for (; cfnp->name; cfnp++) {
       printf ("%02x  %s", cfnp->fn, cfnp->name);
       if (cfnp->flags & CFL_MESI)
         printf ("/mesi");
       else if (cfnp->flags & CFL_SA)
         printf ("/a");
       if (cfnp->flags & CFL_C0)
         printf ("  (ctr0 only)");
       if (cfnp->flags & CFL_C1)
         printf ("  (ctr1 only)");
       printf ("\n");
       if (cfnp->desc)
         printdesc (cfnp->desc);
     }
 }  }
   
   struct ctrfn *
   fn2cfnp (u_int family, u_int sel)
   {
     struct ctrfn *cfnp;
   
     if (family == 6) {
       cfnp = p6fn;
       sel &= 0xff;
     }
     else {
       cfnp = p5fn;
       sel &= 0x3f;
     }
     for (; cfnp->name; cfnp++)
       if (cfnp->fn == sel)
         return (cfnp);
     return (NULL);
   }
   
   static char *
   fn2str (int family, u_int sel)
   {
     static char buf[128];
     char um[9] = "";
     char cm[6] = "";
     struct ctrfn *cfnp;
     u_int fn;
   
     if (family == 5) {
       fn = sel & 0x3f;
       cfnp = fn2cfnp (family, fn);
       sprintf (buf, "%c%c%c %02x %s",
                sel & P5CTR_C ? 'c' : '-',
                sel & P5CTR_U ? 'u' : '-',
                sel & P5CTR_K ? 'k' : '-',
                fn, cfnp ? cfnp->name : "unknown function");
     }
     else if (family == 6) {
       fn = sel & 0xff;
       cfnp = fn2cfnp (family, fn);
       if (cfnp && cfnp->flags & CFL_MESI)
         sprintf (um, "/%c%c%c%c",
                  sel & P6CTR_UM_M ? 'm' : '-',
                  sel & P6CTR_UM_E ? 'e' : '-',
                  sel & P6CTR_UM_S ? 's' : '-',
                  sel & P6CTR_UM_I ? 'i' : '-');
       else if (cfnp && cfnp->flags & CFL_SA)
         sprintf (um, "/%c", sel & P6CTR_UM_A ? 'a' : '-');
       if (sel >> 24)
         sprintf (cm, "+%d", sel >> 24);
       sprintf (buf, "%c%c%c%c %02x%s%s%*s %s",
                sel & P6CTR_I ? 'i' : '-',
                sel & P6CTR_E ? 'e' : '-',
                sel & P6CTR_K ? 'k' : '-',
                sel & P6CTR_U ? 'u' : '-',
                fn, cm, um, 7 - (strlen (cm) + strlen (um)), "",
                cfnp ? cfnp->name : "unknown function");
     }
     else
       return (NULL);
     return (buf);
   }
   
 /* Print status of counters */  /* Print status of counters */
 static void  static void
 readst (void)  readst (void)
Line 92 
Line 364 
   }    }
   close (fd);    close (fd);
   
     if (cpufamily == 6) {
       st.pctr_hwc[0] = rdpmc (0);
       st.pctr_hwc[1] = rdpmc (1);
     }
   for (i = 0; i < PCTR_NUM; i++)    for (i = 0; i < PCTR_NUM; i++)
     printf (" ctr%d = %16qd  [%c%c%c %02x (%s)]\n", i, st.pctr_hwc[i],      printf (" ctr%d = %16qd  [%s]\n", i, st.pctr_hwc[i],
             (st.pctr_fn[i] & P5CTR_C) ? 'c' : 'e',              fn2str (cpufamily, st.pctr_fn[i]));
             (st.pctr_fn[i] & P5CTR_U) ? 'u' : '-',  
             (st.pctr_fn[i] & P5CTR_K) ? 'k' : '-',  
             (st.pctr_fn[i] & 0x3f),  
             (((st.pctr_fn[i] & 0x3f) < pctr_name_size  
               && pctr_name[st.pctr_fn[i] & 0x3f])  
              ? pctr_name[st.pctr_fn[i] & 0x3f] : "invalid"));  
   printf ("  tsc = %16qd\n  idl = %16qd\n", st.pctr_tsc, st.pctr_idl);    printf ("  tsc = %16qd\n  idl = %16qd\n", st.pctr_tsc, st.pctr_idl);
 }  }
   
Line 125 
Line 395 
 usage (void)  usage (void)
 {  {
   fprintf (stderr,    fprintf (stderr,
            "usage: %s [-l | -s ctr [selstr] evtype]\n"             "usage:\n"
            "     -l  list event types\n"             "  %s\n"
            "     -s  set counter <ctr> to monitor events of type <evtype>\n"             "    Read the counters.\n"
            "           <selstr> = [e|c][u][k]  (default euk)\n"             "  %s -l [5|6]\n"
            "              e - count number of events\n"             "    List all possible counter functions for P5/P6.\n",
            "              c - count number of cycles\n"             progname, progname);
            "              u - count events in user mode (ring 3)\n"    if (cpufamily == 5)
            "              k - count events in kernel mode (rings 0-2)\n",      fprintf (stderr,
            progname);               "  %s -s {0|1} [-[c][u][k]] function\n"
                "    Configure counter.\n"
                "      0/1 - counter to configure\n"
                "        c - count cycles not events\n"
                "        u - count events in user mode (ring 3)\n"
                "        k - count events in kernel mode (rings 0-2)\n",
                progname);
     else if (cpufamily == 6)
       fprintf (stderr,
                "  %s -s {0|1} [-[i][e][k][u]] "
                "function[+cm][/{[m][e][s][i]|[a]}]\n"
                "    Configure counter.\n"
                "       0/1 - counter number to configure\n"
                "         i - invert cm\n"
                "         e - edge detect\n"
                "         k - count events in kernel mode (rings 0-2)\n"
                "         u - count events in user mode (ring 3)\n"
                "        cm - # events/cycle required to bump ctr\n"
                "      mesi - Modified/Exclusive/Shared/Invalid in cache\n"
                "       s/a - self generated/all events\n", progname);
   exit (1);    exit (1);
 }  }
   
Line 144 
Line 433 
   int fd;    int fd;
   u_int ctr;    u_int ctr;
   char *cp;    char *cp;
   u_short fn;    u_int fn, fl = 0;
   pctrval id = __cpuid ();    pctrval id = __cpuid ();
     char **ap;
     int ac;
     struct ctrfn *cfnp;
   
   if (__hasp6ctr (id)) {    cpufamily = (id >> 8) & 0xf;
     fprintf (stderr, "Pentium Pro not supported\n");  
     exit (1);  
   }  
   
   if (progname = strrchr (argv[0], '/'))    if (progname = strrchr (argv[0], '/'))
     progname++;      progname++;
Line 160 
Line 449 
   if (argc <= 1)    if (argc <= 1)
     readst ();      readst ();
   else if (argc == 2 && !strcmp (argv[1], "-l"))    else if (argc == 2 && !strcmp (argv[1], "-l"))
     list ();      list (cpufamily);
     else if (argc == 3 && !strcmp (argv[1], "-l"))
       list (atoi (argv[2]));
   else if (!strcmp (argv[1], "-s") && argc >= 4) {    else if (!strcmp (argv[1], "-s") && argc >= 4) {
     if (argc > 5)  
       usage ();  
     ctr = atoi (argv[2]);      ctr = atoi (argv[2]);
     if (ctr >= PCTR_NUM)      if (ctr >= PCTR_NUM)
       usage ();        usage ();
     if (argc == 5) {      ap = &argv[3];
       fn = strtoul (argv[4], NULL, 16);      ac = argc - 3;
       if (fn & ~0x3f)  
         usage ();      if (cpufamily == 6)
       for (cp = argv[3]; *cp; cp++) {        fl |= P6CTR_EN;
         switch (*cp) {      if (**ap == '-') {
         case 'c':        cp = *ap;
           fn |= P5CTR_C;        if (cpufamily == 6)
           break;          while (*++cp)
         case 'e':            switch (*cp) {
           fn &= ~P5CTR_C;            case 'i':
           break;              fl |= P6CTR_I;
         case 'k':              break;
           fn |= P5CTR_K;            case 'e':
           break;              fl |= P6CTR_E;
         case 'u':              break;
           fn |= P5CTR_U;            case 'k':
           break;              fl |= P6CTR_K;
         default:              break;
           usage ();            case 'u':
         }              fl |= P6CTR_U;
       }              break;
             default:
               usage ();
             }
         else
           while (*++cp)
             switch (*cp) {
             case 'c':
               fl |= P5CTR_C;
               break;
             case 'k':
               fl |= P5CTR_K;
               break;
             case 'u':
               fl |= P5CTR_U;
               break;
             default:
               usage ();
             }
         ap++;
         ac--;
     }      }
     else {      else {
       fn = strtoul (argv[3], NULL, 16);        if (cpufamily == 6)
       if (fn & ~0x3f)          fl |= P6CTR_U|P6CTR_K;
         else
           fl |= P5CTR_U|P5CTR_K;
       }
   
       if (!ac)
         usage ();
   
       fn = strtoul (*ap, NULL, 16);
       if (cpufamily == 6 && (fn & ~0xff) || cpufamily != 6 && (fn & ~0x3f))
         usage ();
       fl |= fn;
       if (cpufamily == 6 && (cp = strchr (*ap, '+'))) {
         cp++;
         fn = strtol (cp, NULL, 0);
         if (fn & ~0xff)
         usage ();          usage ();
       fn |= P5CTR_K | P5CTR_U;        fl |= (fn << 24);
     }      }
     setctr (ctr, fn);      cfnp = fn2cfnp (6, fl);
       if (cpufamily == 6 && cfnp && (cp = strchr (*ap, '/'))) {
         if (cfnp->flags & CFL_MESI)
           while (*++cp)
             switch (*cp) {
             case 'm':
               fl |= P6CTR_UM_M;
               break;
             case 'e':
               fl |= P6CTR_UM_E;
               break;
             case 's':
               fl |= P6CTR_UM_S;
               break;
             case 'i':
               fl |= P6CTR_UM_I;
               break;
             default:
               usage ();
             }
         else if (cfnp->flags & CFL_SA)
           while (*++cp)
             switch (*cp) {
             case 'a':
               fl |= P6CTR_UM_A;
               break;
             default:
               usage ();
             }
         else
           usage ();
       }
       else if (cfnp && (cfnp->flags & CFL_MESI))
         fl |= P6CTR_UM_MESI;
       ap++;
       ac--;
   
       if (ac)
         usage ();
   
       if (cpufamily == 6 && ! (fl & 0xff))
         fl = 0;
       setctr (ctr, fl);
   }    }
   else    else
     usage ();      usage ();

Legend:
Removed from v.1.2  
changed lines
  Added in v.1.3