Make start address of `osReserveHeapMemory` tunable via command line -xb
[ghc.git] / rts / Ticky.c
index c874d1a..44d49b6 100644 (file)
@@ -6,12 +6,29 @@
  * Ticky-ticky profiling
  *-------------------------------------------------------------------------- */
 
-#if defined(TICKY_TICKY)
-
-#define TICKY_C                        /* define those variables */
+#define TICKY_C                 /* define those variables */
 #include "PosixSource.h"
 #include "Rts.h"
 
+/* Catch-all top-level counter struct.  Allocations from CAFs will go
+ * here.
+ */
+StgEntCounter top_ct
+        = { 0, 0, 0,
+            "TOP", "",
+            0, 0, NULL };
+
+/* Data structure used in ``registering'' one of these counters. */
+
+StgEntCounter *ticky_entry_ctrs = NULL; /* root of list of them */
+
+/* We want Haskell code compiled with -ticky to be linkable with any
+ * version of the RTS, so we have to make sure all the symbols that
+ * ticky-compiled code may refer to are defined by every RTS. (#3439)
+ * Hence the #ifdef is here, rather than up above.
+ */
+#if defined(TICKY_TICKY)
+
 #include "Ticky.h"
 
 /* -----------------------------------------------------------------------------
 static void printRegisteredCounterInfo (FILE *); /* fwd decl */
 
 #define INTAVG(a,b) ((b == 0) ? 0.0 : ((double) (a) / (double) (b)))
-#define PC(a)      (100.0 * a)
+#define PC(a)       (100.0 * a)
 
 #define AVG(thing) \
-       StgDouble avg##thing  = INTAVG(tot##thing,ctr##thing)
+        StgDouble avg##thing  = INTAVG(tot##thing,ctr##thing)
 
 void
 PrintTickyInfo(void)
 {
-  // XXX This is only used in commented out or #if FALSE'd out code currently:
-  // unsigned long i;
-
-/* XXX These are used only in an #if FALSE block below */
-#if FALSE
-  unsigned long tot_allocs = /* total number of things allocated */
-       ALLOC_FUN_ctr + ALLOC_SE_THK_ctr + ALLOC_UP_THK_ctr + ALLOC_CON_ctr + ALLOC_TUP_ctr +
-       + ALLOC_TSO_ctr + ALLOC_BH_ctr  + ALLOC_PAP_ctr + ALLOC_PRIM_ctr
-      ;        
-
-  unsigned long tot_adm_wds = /* total number of admin words allocated */
-       ALLOC_FUN_adm + ALLOC_THK_adm + ALLOC_CON_adm + ALLOC_TUP_adm
-       + ALLOC_TSO_adm + ALLOC_BH_adm  + ALLOC_PAP_adm + ALLOC_PRIM_adm
-      ;
-
-  unsigned long tot_gds_wds = /* total number of words of ``good stuff'' allocated */
-       ALLOC_FUN_gds + ALLOC_THK_gds + ALLOC_CON_gds + ALLOC_TUP_gds
-       + ALLOC_TSO_gds + ALLOC_BH_gds  + ALLOC_PAP_gds + ALLOC_PRIM_gds
-      ;
-
-  unsigned long tot_slp_wds = /* total number of ``slop'' words allocated */
-       ALLOC_FUN_slp + ALLOC_THK_slp + ALLOC_CON_slp + ALLOC_TUP_slp
-       + ALLOC_TSO_slp + ALLOC_BH_slp  + ALLOC_PAP_slp + ALLOC_PRIM_slp
-      ;
-
-  unsigned long tot_wds = /* total words */
-       tot_adm_wds + tot_gds_wds + tot_slp_wds;
-#endif
-
-  unsigned long tot_thk_enters = ENT_STATIC_THK_ctr + ENT_DYN_THK_ctr;
+  unsigned long i;
+
+  unsigned long tot_thk_enters = ENT_STATIC_THK_MANY_ctr + ENT_DYN_THK_MANY_ctr
+                               + ENT_STATIC_THK_SINGLE_ctr + ENT_DYN_THK_SINGLE_ctr;
   unsigned long tot_con_enters = ENT_STATIC_CON_ctr + ENT_DYN_CON_ctr;
 
   unsigned long tot_fun_direct_enters = ENT_STATIC_FUN_DIRECT_ctr + ENT_DYN_FUN_DIRECT_ctr;
   unsigned long tot_ind_enters = ENT_STATIC_IND_ctr + ENT_DYN_IND_ctr;
-  
-  // This is the number of times we entered a function via some kind
-  // of slow call.  It amounts to all the slow applications, not
-  // counting those that were to too few arguments.
-  /*
-  XXX This us unused - can we delete it? -- IGL 2008-04-25
-  unsigned long tot_fun_slow_enters = 
-      SLOW_CALL_ctr - 
-      SLOW_CALL_FUN_TOO_FEW_ctr -
-      SLOW_CALL_PAP_TOO_FEW_ctr;
-  */
 
   unsigned long tot_known_calls =
-      KNOWN_CALL_ctr + KNOWN_CALL_TOO_FEW_ARGS_ctr + 
+      KNOWN_CALL_ctr + KNOWN_CALL_TOO_FEW_ARGS_ctr +
       + KNOWN_CALL_EXTRA_ARGS_ctr;
   unsigned long tot_tail_calls =
       UNKNOWN_CALL_ctr + tot_known_calls;
 
-  unsigned long tot_enters = 
+  unsigned long tot_enters =
       tot_con_enters + tot_fun_direct_enters +
-       tot_ind_enters + ENT_PERM_IND_ctr + ENT_PAP_ctr + tot_thk_enters;
+        tot_ind_enters + ENT_PERM_IND_ctr + ENT_PAP_ctr + tot_thk_enters;
   unsigned long jump_direct_enters =
-       tot_enters - ENT_VIA_NODE_ctr;
+        tot_enters - ENT_VIA_NODE_ctr;
 
 
   unsigned long tot_returns =
@@ -105,194 +85,111 @@ PrintTickyInfo(void)
   FILE *tf = RtsFlags.TickyFlags.tickyFile;
 
   /* If tf = NULL, that means the user passed in stderr for the ticky stats
-     file. According to a comment in RtsFlags.c, this means to use 
+     file. According to a comment in RtsFlags.c, this means to use
      debugBelch to print out messages. But this function prints out a lot
      of stuff so in order to avoid changing a lot of code, we just dump
      the same output to stderr (for now). */
   if( tf == NULL )
     tf = stderr;
 
-  /* krc: avoid dealing with this just now */
-#if FALSE
-  fprintf(tf,"\n\nALLOCATIONS: %ld (%ld words total: %ld admin, %ld goods, %ld slop)\n",
-         tot_allocs, tot_wds, tot_adm_wds, tot_gds_wds, tot_slp_wds);
-  fprintf(tf,"\t\t\t\ttotal words:\t    2     3     4     5    6+\n");
-
-#define ALLOC_HISTO_MAGIC(categ) \
-       (PC(INTAVG(ALLOC_##categ##_hst[0], ALLOC_##categ##_ctr))), \
-       (PC(INTAVG(ALLOC_##categ##_hst[1], ALLOC_##categ##_ctr))), \
-       (PC(INTAVG(ALLOC_##categ##_hst[2], ALLOC_##categ##_ctr))), \
-       (PC(INTAVG(ALLOC_##categ##_hst[3], ALLOC_##categ##_ctr))), \
-       (PC(INTAVG(ALLOC_##categ##_hst[4], ALLOC_##categ##_ctr)))
-
-  fprintf(tf,"%7ld (%5.1f%%) function values",
-       ALLOC_FUN_ctr,
-       PC(INTAVG(ALLOC_FUN_ctr, tot_allocs)));
-  if (ALLOC_FUN_ctr != 0)
-      fprintf(tf,"\t\t%5.1f %5.1f %5.1f %5.1f %5.1f", ALLOC_HISTO_MAGIC(FUN));
-
-  fprintf(tf,"\n%7ld (%5.1f%%) thunks",
-       ALLOC_SE_THK_ctr + ALLOC_UP_THK_ctr,
-       PC(INTAVG(ALLOC_SE_THK_ctr + ALLOC_UP_THK_ctr, tot_allocs)));
-
-#define ALLOC_THK_ctr (ALLOC_UP_THK_ctr + ALLOC_SE_THK_ctr)
-  /* hack to make ALLOC_HISTO_MAGIC still work for THK */
-  if ((ALLOC_SE_THK_ctr + ALLOC_UP_THK_ctr) != 0)
-      fprintf(tf,"\t\t\t\t%5.1f %5.1f %5.1f %5.1f %5.1f", ALLOC_HISTO_MAGIC(THK));
-#undef ALLOC_THK_ctr
-
-  fprintf(tf,"\n%7ld (%5.1f%%) data values",
-       ALLOC_CON_ctr,
-       PC(INTAVG(ALLOC_CON_ctr, tot_allocs)));
-  if (ALLOC_CON_ctr != 0)
-      fprintf(tf,"\t\t\t%5.1f %5.1f %5.1f %5.1f %5.1f", ALLOC_HISTO_MAGIC(CON));
-
-  fprintf(tf,"\n%7ld (%5.1f%%) big tuples",
-       ALLOC_TUP_ctr,
-       PC(INTAVG(ALLOC_TUP_ctr, tot_allocs)));
-  if (ALLOC_TUP_ctr != 0)
-      fprintf(tf,"\t\t\t%5.1f %5.1f %5.1f %5.1f %5.1f", ALLOC_HISTO_MAGIC(TUP));
-
-  fprintf(tf,"\n%7ld (%5.1f%%) black holes",
-       ALLOC_BH_ctr,
-       PC(INTAVG(ALLOC_BH_ctr, tot_allocs)));
-  if (ALLOC_BH_ctr != 0)
-      fprintf(tf,"\t\t\t%5.1f %5.1f %5.1f %5.1f %5.1f", ALLOC_HISTO_MAGIC(BH));
-
-  fprintf(tf,"\n%7ld (%5.1f%%) prim things",
-       ALLOC_PRIM_ctr,
-       PC(INTAVG(ALLOC_PRIM_ctr, tot_allocs)));
-  if (ALLOC_PRIM_ctr != 0)
-      fprintf(tf,"\t\t\t%5.1f %5.1f %5.1f %5.1f %5.1f", ALLOC_HISTO_MAGIC(PRIM));
-
-  fprintf(tf,"\n%7ld (%5.1f%%) partial applications",
-       ALLOC_PAP_ctr,
-       PC(INTAVG(ALLOC_PAP_ctr, tot_allocs)));
-  if (ALLOC_PAP_ctr != 0)
-      fprintf(tf,"\t\t%5.1f %5.1f %5.1f %5.1f %5.1f", ALLOC_HISTO_MAGIC(PAP));
-
-  fprintf(tf,"\n%7ld (%5.1f%%) thread state objects",
-       ALLOC_TSO_ctr,
-       PC(INTAVG(ALLOC_TSO_ctr, tot_allocs)));
-  if (ALLOC_TSO_ctr != 0)
-      fprintf(tf,"\t\t%5.1f %5.1f %5.1f %5.1f %5.1f", ALLOC_HISTO_MAGIC(TSO));
-
-  fprintf(tf,"\n");
-
-  fprintf(tf,"\nTotal storage-manager allocations: %ld (%ld words)\n\t[%ld words lost to speculative heap-checks]\n", ALLOC_HEAP_ctr, ALLOC_HEAP_tot, ALLOC_HEAP_tot - tot_wds);
-#endif /* FALSE */
-
-
   fprintf(tf,"\nSTACK USAGE:\n"); /* NB: some bits are direction sensitive */
 
 
-  fprintf(tf,"\nENTERS: %ld  of which %ld (%.1f%%) direct to the entry code\n\t\t  [the rest indirected via Node's info ptr]\n",
-       tot_enters,
-       jump_direct_enters,
-       PC(INTAVG(jump_direct_enters,tot_enters)));
-  fprintf(tf,"%7ld (%5.1f%%) thunks\n",
-       tot_thk_enters,
-       PC(INTAVG(tot_thk_enters,tot_enters)));
-  fprintf(tf,"%7ld (%5.1f%%) data values\n",
-       tot_con_enters,
-       PC(INTAVG(tot_con_enters,tot_enters)));
-  fprintf(tf,"%7ld (%5.1f%%) normal indirections\n",
-       tot_ind_enters,
-       PC(INTAVG(tot_ind_enters,tot_enters)));
-  fprintf(tf,"%7ld (%5.1f%%) permanent indirections\n",
-       ENT_PERM_IND_ctr,
-       PC(INTAVG(ENT_PERM_IND_ctr,tot_enters)));
-
-
-  fprintf(tf,"\nFUNCTION ENTRIES: %ld\n", tot_fun_direct_enters);
-
-  fprintf(tf, "\nTAIL CALLS: %ld, of which %ld (%.lf%%) were to known functions\n", 
-         tot_tail_calls, tot_known_calls,
-         PC(INTAVG(tot_known_calls,tot_tail_calls)));
-
-  fprintf(tf, "\nSLOW APPLICATIONS: %ld evaluated, %ld unevaluated\n",
-         SLOW_CALL_ctr, SLOW_CALL_UNEVALD_ctr);
+  fprintf(tf,"\nENTERS: %lu  of which %lu (%.1f%%) direct to the entry code\n\t\t  [the rest indirected via Node's info ptr]\n",
+        tot_enters,
+        jump_direct_enters,
+        PC(INTAVG(jump_direct_enters,tot_enters)));
+  fprintf(tf,"%11lu (%5.1f%%) thunks\n",
+        tot_thk_enters,
+        PC(INTAVG(tot_thk_enters,tot_enters)));
+  fprintf(tf, "%11lu (%5.1f%%) data values\n",
+        tot_con_enters,
+        PC(INTAVG(tot_con_enters,tot_enters)));
+  fprintf(tf, "%11lu (%5.1f%%) normal indirections\n",
+        tot_ind_enters,
+        PC(INTAVG(tot_ind_enters,tot_enters)));
+  fprintf(tf,"%11" FMT_Int " (%5.1f%%) permanent indirections\n",
+        ENT_PERM_IND_ctr,
+        PC(INTAVG(ENT_PERM_IND_ctr,tot_enters)));
+
+
+  fprintf(tf, "\nFUNCTION ENTRIES: %lu\n", tot_fun_direct_enters);
+
+  fprintf(tf, "\nTAIL CALLS: %lu, of which %lu (%.1f%%) were to known functions\n",
+          tot_tail_calls, tot_known_calls,
+          PC(INTAVG(tot_known_calls,tot_tail_calls))); /* %.1f: one decimal, like every other percentage here (was "%.lf", i.e. zero precision) */
+
+  fprintf(tf, "\nSLOW APPLICATIONS: %" FMT_Int " evaluated, %" FMT_Int " unevaluated\n",
+          SLOW_CALL_ctr, SLOW_CALL_UNEVALD_ctr);
   fprintf(tf, "\n");
   fprintf(tf, "         Too few args   Correct args   Too many args\n");
-  fprintf(tf, "   FUN     %8ld       %8ld        %8ld\n", 
-         SLOW_CALL_FUN_TOO_FEW_ctr, SLOW_CALL_FUN_CORRECT_ctr, SLOW_CALL_FUN_TOO_MANY_ctr);
-  fprintf(tf, "   PAP     %8ld       %8ld        %8ld\n", 
-         SLOW_CALL_PAP_TOO_FEW_ctr, SLOW_CALL_PAP_CORRECT_ctr, SLOW_CALL_PAP_TOO_MANY_ctr);
+  fprintf(tf, "   FUN     %8" FMT_Int "       %8" FMT_Int "        %8" FMT_Int "\n",
+          SLOW_CALL_FUN_TOO_FEW_ctr, SLOW_CALL_FUN_CORRECT_ctr, SLOW_CALL_FUN_TOO_MANY_ctr);
+  fprintf(tf, "   PAP     %8" FMT_Int "       %8" FMT_Int "        %8" FMT_Int "\n",
+          SLOW_CALL_PAP_TOO_FEW_ctr, SLOW_CALL_PAP_CORRECT_ctr, SLOW_CALL_PAP_TOO_MANY_ctr);
   fprintf(tf, "\n");
 
-  fprintf(tf,"\nRETURNS: %ld\n", tot_returns);
-  fprintf(tf,"%7ld (%5.1f%%) from entering a new constructor\n\t\t  [the rest from entering an existing constructor]\n",
-       tot_returns_of_new,
-       PC(INTAVG(tot_returns_of_new,tot_returns)));
+  fprintf(tf, "\nRETURNS: %lu\n", tot_returns);
+  fprintf(tf, "%11lu (%5.1f%%) from entering a new constructor\n\t\t  [the rest from entering an existing constructor]\n",
+        tot_returns_of_new,
+        PC(INTAVG(tot_returns_of_new,tot_returns)));
 
-  /* krc: comment out some of this stuff temporarily */
 
-  /*
-  fprintf(tf, "\nRET_NEW:         %7ld: ", RET_NEW_ctr);
-  for (i = 0; i < 9; i++) { fprintf(tf, "%5.1f%%",
-                               PC(INTAVG(RET_NEW_hst[i],RET_NEW_ctr))); }
+  fprintf(tf, "\nRET_NEW:         %11" FMT_Int ": ", RET_NEW_ctr);
+  for (i = 0; i < TICKY_BIN_COUNT; i++) {
+    fprintf(tf, "%5.1f%%", PC(INTAVG(RET_NEW_hst[i], RET_NEW_ctr)));
+  }
   fprintf(tf, "\n");
-  fprintf(tf, "RET_OLD:         %7ld: ", RET_OLD_ctr);
-  for (i = 0; i < 9; i++) { fprintf(tf, "%5.1f%%",
-                               PC(INTAVG(RET_OLD_hst[i],RET_OLD_ctr))); }
+
+  fprintf(tf, "RET_OLD:         %11" FMT_Int ": ", RET_OLD_ctr);
+  for (i = 0; i < TICKY_BIN_COUNT; i++) {
+    fprintf(tf, "%5.1f%%", PC(INTAVG(RET_OLD_hst[i], RET_OLD_ctr)));
+  }
   fprintf(tf, "\n");
-  fprintf(tf, "RET_UNBOXED_TUP: %7ld: ", RET_UNBOXED_TUP_ctr);
-  for (i = 0; i < 9; i++) { fprintf(tf, "%5.1f%%",
-                                   PC(INTAVG(RET_UNBOXED_TUP_hst[i],
-                                             RET_UNBOXED_TUP_ctr))); }
+
+  fprintf(tf, "RET_UNBOXED_TUP: %11" FMT_Int ": ", RET_UNBOXED_TUP_ctr);
+  for (i = 0; i < TICKY_BIN_COUNT; i++) {
+    fprintf(tf, "%5.1f%%", PC(INTAVG(RET_UNBOXED_TUP_hst[i],
+                           RET_UNBOXED_TUP_ctr)));
+  }
   fprintf(tf, "\n");
-  */
 
-  fprintf(tf,"\nUPDATE FRAMES: %ld (%ld omitted from thunks)",
-       UPDF_PUSHED_ctr,
-       UPDF_OMITTED_ctr);
+  fprintf(tf,"\nUPDATE FRAMES: %" FMT_Int " (%" FMT_Int " omitted from thunks)",
+        UPDF_PUSHED_ctr,
+        UPDF_OMITTED_ctr);
 
-  fprintf(tf,"\nCATCH FRAMES:  %ld", CATCHF_PUSHED_ctr);
+  fprintf(tf,"\nCATCH FRAMES:  %" FMT_Int "", CATCHF_PUSHED_ctr);
 
-  if (UPDF_RCC_PUSHED_ctr != 0)
-     fprintf(tf,"%7ld restore cost centre frames (%ld omitted)\n",
-       UPDF_RCC_PUSHED_ctr,
-       UPDF_RCC_OMITTED_ctr);
+  if (UPDF_RCC_PUSHED_ctr != 0) {
+     fprintf(tf,"%11" FMT_Int " restore cost centre frames (%" FMT_Int " omitted)\n",
+        UPDF_RCC_PUSHED_ctr,
+        UPDF_RCC_OMITTED_ctr);
+  }
 
   fprintf(tf,"\nUPDATES: %ld\n", tot_updates);
-  fprintf(tf,"%7ld (%5.1f%%) data values\n\t\t  [%ld in place, %ld allocated new space]\n",
-       con_updates,
-       PC(INTAVG(con_updates,tot_updates)),
-       UPD_CON_IN_PLACE_ctr, UPD_CON_IN_NEW_ctr);
-  fprintf(tf,"%7ld (%5.1f%%) partial applications\n\t\t  [%ld in place, %ld allocated new space]\n",
-       pap_updates,
-       PC(INTAVG(pap_updates,tot_updates)),
-       UPD_PAP_IN_PLACE_ctr, UPD_PAP_IN_NEW_ctr);
-  fprintf(tf,"%7ld (%5.1f%%) updates by squeezing\n",
-       UPD_SQUEEZED_ctr,
-       PC(INTAVG(UPD_SQUEEZED_ctr, tot_updates)));
-
-  /* krc: also avoid dealing with this for now */
-#if FALSE
-  fprintf(tf, "\nUPD_CON_IN_NEW:   %7ld: ", UPD_CON_IN_NEW_ctr);
-  for (i = 0; i < 9; i++) { fprintf(tf, "%7ld", UPD_CON_IN_NEW_hst[i]); }
-  fprintf(tf, "\n");
-  fprintf(tf, "UPD_CON_IN_PLACE: %7ld: ", UPD_CON_IN_PLACE_ctr);
-  for (i = 0; i < 9; i++) { fprintf(tf, "%7ld", UPD_CON_IN_PLACE_hst[i]); }
-  fprintf(tf, "\n");
-  fprintf(tf, "UPD_PAP_IN_NEW:   %7ld: ", UPD_PAP_IN_NEW_ctr);
-  for (i = 0; i < 9; i++) { fprintf(tf, "%7ld", UPD_PAP_IN_NEW_hst[i]); }
-  fprintf(tf, "\n");
-#endif
+  fprintf(tf, "%11lu (%5.1f%%) data values\n\t\t  [%" FMT_Int " in place, %" FMT_Int " allocated new space]\n",
+        con_updates,
+        PC(INTAVG(con_updates,tot_updates)),
+        UPD_CON_IN_PLACE_ctr, UPD_CON_IN_NEW_ctr);
+
+  fprintf(tf, "%11lu (%5.1f%%) partial applications\n\t\t  [%" FMT_Int " in place, %" FMT_Int " allocated new space]\n",
+        pap_updates,
+        PC(INTAVG(pap_updates,tot_updates)),
+        UPD_PAP_IN_PLACE_ctr, UPD_PAP_IN_NEW_ctr);
+
+  fprintf(tf,"%11" FMT_Int " (%5.1f%%) updates by squeezing\n",
+        UPD_SQUEEZED_ctr,
+        PC(INTAVG(UPD_SQUEEZED_ctr, tot_updates)));
 
   if (tot_gengc_updates != 0) {
-      fprintf(tf,"\nNEW GEN UPDATES: %9ld (%5.1f%%)\n",
-             tot_new_updates,
-             PC(INTAVG(tot_new_updates,tot_gengc_updates)));
-      fprintf(tf,"OLD GEN UPDATES: %9ld (%5.1f%%)\n",
-             tot_old_updates,
-             PC(INTAVG(tot_old_updates,tot_gengc_updates)));
+      fprintf(tf, "\nNEW GEN UPDATES: %9lu (%5.1f%%)\n",
+              tot_new_updates,
+              PC(INTAVG(tot_new_updates,tot_gengc_updates)));
+      fprintf(tf, "OLD GEN UPDATES: %9lu (%5.1f%%)\n",
+              tot_old_updates,
+              PC(INTAVG(tot_old_updates,tot_gengc_updates)));
   }
 
-  fprintf(tf,"\nTotal bytes copied during GC: %ld\n",
-         GC_WORDS_COPIED_ctr * sizeof(W_));
-
   printRegisteredCounterInfo(tf);
 
   fprintf(tf,"\n**************************************************\n");
@@ -303,99 +200,51 @@ PrintTickyInfo(void)
   */
 
 #define PR_CTR(ctr) \
-  do { fprintf(tf,"%7ld " #ctr "\n", ctr); } while(0)
+  do { fprintf(tf,"%11" FMT_Int " " #ctr "\n", ctr); } while(0)
+
 /* COND_PR_CTR takes a boolean; if false then msg is the printname rather than ctr */
 #define COND_PR_CTR(ctr,b,msg) \
-    if (b) { fprintf(tf,"%7ld " #ctr "\n", ctr); } else { fprintf(tf,"%7ld " msg "\n", ctr); }
+    if (b) { fprintf(tf,"%11" FMT_Int " " #ctr "\n", ctr); } else { fprintf(tf,"%11" FMT_Int " " msg "\n", ctr); }
+
 #define PR_HST(hst,i) \
-  do { fprintf(tf,"%7ld " #hst "_" #i "\n", hst[i]); } while(0)
+  do { fprintf(tf,"%11" FMT_Int " " #hst "_" #i "\n", hst[i]); } while(0)
+
+  ALLOC_HEAP_ctr = (StgInt)ALLOC_HEAP_ctr + (StgInt)ALLOC_RTS_ctr;
+  ALLOC_HEAP_tot = (StgInt)ALLOC_HEAP_tot + (StgInt)ALLOC_RTS_tot;
 
   PR_CTR(ALLOC_HEAP_ctr);
   PR_CTR(ALLOC_HEAP_tot);
 
+  PR_CTR(HEAP_CHK_ctr);
+  PR_CTR(STK_CHK_ctr);
+
+  PR_CTR(ALLOC_RTS_ctr);
+  PR_CTR(ALLOC_RTS_tot);
+
   PR_CTR(ALLOC_FUN_ctr);
-  PR_CTR(ALLOC_FUN_adm);
   PR_CTR(ALLOC_FUN_gds);
-  PR_CTR(ALLOC_FUN_slp);
-
-  /* krc: comment out some of this stuff temporarily
-  PR_HST(ALLOC_FUN_hst,0);
-  PR_HST(ALLOC_FUN_hst,1);
-  PR_HST(ALLOC_FUN_hst,2);
-  PR_HST(ALLOC_FUN_hst,3);
-  PR_HST(ALLOC_FUN_hst,4);
+
+  PR_CTR(ALLOC_PAP_ctr);
+  PR_CTR(ALLOC_PAP_adm);
+  PR_CTR(ALLOC_PAP_gds);
+
   PR_CTR(ALLOC_UP_THK_ctr);
   PR_CTR(ALLOC_SE_THK_ctr);
-  PR_CTR(ALLOC_THK_adm);
   PR_CTR(ALLOC_THK_gds);
-  PR_CTR(ALLOC_THK_slp);
-  PR_HST(ALLOC_THK_hst,0);
-  PR_HST(ALLOC_THK_hst,1);
-  PR_HST(ALLOC_THK_hst,2);
-  PR_HST(ALLOC_THK_hst,3);
-  PR_HST(ALLOC_THK_hst,4);
+
   PR_CTR(ALLOC_CON_ctr);
-  PR_CTR(ALLOC_CON_adm);
   PR_CTR(ALLOC_CON_gds);
-  PR_CTR(ALLOC_CON_slp);
-  PR_HST(ALLOC_CON_hst,0);
-  PR_HST(ALLOC_CON_hst,1);
-  PR_HST(ALLOC_CON_hst,2);
-  PR_HST(ALLOC_CON_hst,3);
-  PR_HST(ALLOC_CON_hst,4);
-  PR_CTR(ALLOC_TUP_ctr);
-  PR_CTR(ALLOC_TUP_adm);
-  PR_CTR(ALLOC_TUP_gds);
-  PR_CTR(ALLOC_TUP_slp);
-  PR_HST(ALLOC_TUP_hst,0);
-  PR_HST(ALLOC_TUP_hst,1);
-  PR_HST(ALLOC_TUP_hst,2);
-  PR_HST(ALLOC_TUP_hst,3);
-  PR_HST(ALLOC_TUP_hst,4);
-  PR_CTR(ALLOC_BH_ctr);
-  PR_CTR(ALLOC_BH_adm);
-  PR_CTR(ALLOC_BH_gds);
-  PR_CTR(ALLOC_BH_slp);
-  PR_HST(ALLOC_BH_hst,0);
-  PR_HST(ALLOC_BH_hst,1);
-  PR_HST(ALLOC_BH_hst,2);
-  PR_HST(ALLOC_BH_hst,3);
-  PR_HST(ALLOC_BH_hst,4);
+
   PR_CTR(ALLOC_PRIM_ctr);
-  PR_CTR(ALLOC_PRIM_adm);
   PR_CTR(ALLOC_PRIM_gds);
   PR_CTR(ALLOC_PRIM_slp);
-  PR_HST(ALLOC_PRIM_hst,0);
-  PR_HST(ALLOC_PRIM_hst,1);
-  PR_HST(ALLOC_PRIM_hst,2);
-  PR_HST(ALLOC_PRIM_hst,3);
-  PR_HST(ALLOC_PRIM_hst,4);
-  PR_CTR(ALLOC_PAP_ctr);
-  PR_CTR(ALLOC_PAP_adm);
-  PR_CTR(ALLOC_PAP_gds);
-  PR_CTR(ALLOC_PAP_slp);
-  PR_HST(ALLOC_PAP_hst,0);
-  PR_HST(ALLOC_PAP_hst,1);
-  PR_HST(ALLOC_PAP_hst,2);
-  PR_HST(ALLOC_PAP_hst,3);
-  PR_HST(ALLOC_PAP_hst,4);
-
-  PR_CTR(ALLOC_TSO_ctr);
-  PR_CTR(ALLOC_TSO_adm);
-  PR_CTR(ALLOC_TSO_gds);
-  PR_CTR(ALLOC_TSO_slp);
-  PR_HST(ALLOC_TSO_hst,0);
-  PR_HST(ALLOC_TSO_hst,1);
-  PR_HST(ALLOC_TSO_hst,2);
-  PR_HST(ALLOC_TSO_hst,3);
-  PR_HST(ALLOC_TSO_hst,4);
-  */
 
   PR_CTR(ENT_VIA_NODE_ctr);
   PR_CTR(ENT_STATIC_CON_ctr);
   PR_CTR(ENT_DYN_CON_ctr);
   PR_CTR(ENT_STATIC_FUN_DIRECT_ctr);
   PR_CTR(ENT_DYN_FUN_DIRECT_ctr);
+  PR_CTR(ENT_LNE_ctr);
   PR_CTR(ENT_STATIC_IND_ctr);
   PR_CTR(ENT_DYN_IND_ctr);
 
@@ -408,8 +257,8 @@ PrintTickyInfo(void)
  * the ENT_PERM_IND, but we then enter the PERM_IND that was built for
  * the next update frame below, and so on down the chain until we
  * finally reach the value.  Thus we count many new ENT_PERM_INDs too
- * early.  
- * 
+ * early.
+ *
  * This of course refers to the -ticky version that uses PERM_INDs to
  * determine the number of closures entered 0/1/>1.  KSW 1999-04.  */
   COND_PR_CTR(ENT_PERM_IND_ctr,RtsFlags.GcFlags.squeezeUpdFrames == rtsFalse,"E!NT_PERM_IND_ctr requires +RTS -Z");
@@ -418,24 +267,29 @@ PrintTickyInfo(void)
   PR_CTR(ENT_PAP_ctr);
   PR_CTR(ENT_AP_STACK_ctr);
   PR_CTR(ENT_BH_ctr);
-  PR_CTR(ENT_STATIC_THK_ctr);
-  PR_CTR(ENT_DYN_THK_ctr);
-
-  PR_CTR(SLOW_CALL_v_ctr);
-  PR_CTR(SLOW_CALL_f_ctr);
-  PR_CTR(SLOW_CALL_d_ctr);
-  PR_CTR(SLOW_CALL_l_ctr);
-  PR_CTR(SLOW_CALL_n_ctr);
-  PR_CTR(SLOW_CALL_p_ctr);
-  PR_CTR(SLOW_CALL_pv_ctr);
-  PR_CTR(SLOW_CALL_pp_ctr);
-  PR_CTR(SLOW_CALL_ppv_ctr);
-  PR_CTR(SLOW_CALL_ppp_ctr);
-  PR_CTR(SLOW_CALL_pppv_ctr);
-  PR_CTR(SLOW_CALL_pppp_ctr);
-  PR_CTR(SLOW_CALL_ppppp_ctr);
-  PR_CTR(SLOW_CALL_pppppp_ctr);
-  PR_CTR(SLOW_CALL_OTHER_ctr);
+  PR_CTR(ENT_STATIC_THK_SINGLE_ctr);
+  PR_CTR(ENT_STATIC_THK_MANY_ctr);
+  PR_CTR(ENT_DYN_THK_SINGLE_ctr);
+  PR_CTR(ENT_DYN_THK_MANY_ctr);
+  PR_CTR(UPD_CAF_BH_UPDATABLE_ctr);
+  PR_CTR(UPD_CAF_BH_SINGLE_ENTRY_ctr);
+
+  PR_CTR(SLOW_CALL_fast_v16_ctr);
+  PR_CTR(SLOW_CALL_fast_v_ctr);
+  PR_CTR(SLOW_CALL_fast_f_ctr);
+  PR_CTR(SLOW_CALL_fast_d_ctr);
+  PR_CTR(SLOW_CALL_fast_l_ctr);
+  PR_CTR(SLOW_CALL_fast_n_ctr);
+  PR_CTR(SLOW_CALL_fast_p_ctr);
+  PR_CTR(SLOW_CALL_fast_pv_ctr);
+  PR_CTR(SLOW_CALL_fast_pp_ctr);
+  PR_CTR(SLOW_CALL_fast_ppv_ctr);
+  PR_CTR(SLOW_CALL_fast_ppp_ctr);
+  PR_CTR(SLOW_CALL_fast_pppv_ctr);
+  PR_CTR(SLOW_CALL_fast_pppp_ctr);
+  PR_CTR(SLOW_CALL_fast_ppppp_ctr);
+  PR_CTR(SLOW_CALL_fast_pppppp_ctr);
+  PR_CTR(VERY_SLOW_CALL_ctr);
 
   PR_CTR(UNKNOWN_CALL_ctr);
   PR_CTR(KNOWN_CALL_ctr);
@@ -452,52 +306,18 @@ PrintTickyInfo(void)
   PR_CTR(SLOW_CALL_PAP_TOO_MANY_ctr);
   PR_CTR(SLOW_CALL_UNEVALD_ctr);
 
-  /* krc: put off till later... */
-#if FALSE
-  PR_HST(SLOW_CALL_hst,0);
-  PR_HST(SLOW_CALL_hst,1);
-  PR_HST(SLOW_CALL_hst,2);
-  PR_HST(SLOW_CALL_hst,3);
-  PR_HST(SLOW_CALL_hst,4);
-  PR_HST(SLOW_CALL_hst,5);
-  PR_HST(SLOW_CALL_hst,6);
-  PR_HST(SLOW_CALL_hst,7);
-#endif
-
   PR_CTR(RET_NEW_ctr);
   PR_CTR(RET_OLD_ctr);
   PR_CTR(RET_UNBOXED_TUP_ctr);
 
-  /* krc: put off till later... */
-#if FALSE
-  PR_HST(RET_NEW_hst,0);
-  PR_HST(RET_NEW_hst,1);
-  PR_HST(RET_NEW_hst,2);
-  PR_HST(RET_NEW_hst,3);
-  PR_HST(RET_NEW_hst,4);
-  PR_HST(RET_NEW_hst,5);
-  PR_HST(RET_NEW_hst,6);
-  PR_HST(RET_NEW_hst,7);
-  PR_HST(RET_NEW_hst,8);
-  PR_HST(RET_OLD_hst,0);
-  PR_HST(RET_OLD_hst,1);
-  PR_HST(RET_OLD_hst,2);
-  PR_HST(RET_OLD_hst,3);
-  PR_HST(RET_OLD_hst,4);
-  PR_HST(RET_OLD_hst,5);
-  PR_HST(RET_OLD_hst,6);
-  PR_HST(RET_OLD_hst,7);
-  PR_HST(RET_OLD_hst,8);
-  PR_HST(RET_UNBOXED_TUP_hst,0);
-  PR_HST(RET_UNBOXED_TUP_hst,1);
-  PR_HST(RET_UNBOXED_TUP_hst,2);
-  PR_HST(RET_UNBOXED_TUP_hst,3);
-  PR_HST(RET_UNBOXED_TUP_hst,4);
-  PR_HST(RET_UNBOXED_TUP_hst,5);
-  PR_HST(RET_UNBOXED_TUP_hst,6);
-  PR_HST(RET_UNBOXED_TUP_hst,7);
-  PR_HST(RET_UNBOXED_TUP_hst,8);
-#endif /* FALSE */
+#define PR_HST_BINS(hst) for (i = 0; i < TICKY_BIN_COUNT; i++) \
+  { fprintf(tf,"%11" FMT_Int " " #hst "_%lu\n", hst[i], i); }
+
+  PR_HST_BINS(RET_NEW_hst);
+  PR_HST_BINS(RET_OLD_hst);
+  PR_HST_BINS(RET_UNBOXED_TUP_hst);
+
+#undef PR_HST_BINS
 
   PR_CTR(UPDF_OMITTED_ctr);
   PR_CTR(UPDF_PUSHED_ctr);
@@ -512,33 +332,6 @@ PrintTickyInfo(void)
   PR_CTR(UPD_PAP_IN_NEW_ctr);
   PR_CTR(UPD_PAP_IN_PLACE_ctr);
 
-  PR_CTR(UPD_BH_UPDATABLE_ctr);
-  PR_CTR(UPD_BH_SINGLE_ENTRY_ctr);
-  PR_CTR(UPD_CAF_BH_UPDATABLE_ctr);
-  PR_CTR(UPD_CAF_BH_SINGLE_ENTRY_ctr);
-
-  /* krc: put off till later...*/
-#if FALSE
-  PR_HST(UPD_CON_IN_NEW_hst,0);
-  PR_HST(UPD_CON_IN_NEW_hst,1);
-  PR_HST(UPD_CON_IN_NEW_hst,2);
-  PR_HST(UPD_CON_IN_NEW_hst,3);
-  PR_HST(UPD_CON_IN_NEW_hst,4);
-  PR_HST(UPD_CON_IN_NEW_hst,5);
-  PR_HST(UPD_CON_IN_NEW_hst,6);
-  PR_HST(UPD_CON_IN_NEW_hst,7);
-  PR_HST(UPD_CON_IN_NEW_hst,8);
-  PR_HST(UPD_PAP_IN_NEW_hst,0);
-  PR_HST(UPD_PAP_IN_NEW_hst,1);
-  PR_HST(UPD_PAP_IN_NEW_hst,2);
-  PR_HST(UPD_PAP_IN_NEW_hst,3);
-  PR_HST(UPD_PAP_IN_NEW_hst,4);
-  PR_HST(UPD_PAP_IN_NEW_hst,5);
-  PR_HST(UPD_PAP_IN_NEW_hst,6);
-  PR_HST(UPD_PAP_IN_NEW_hst,7);
-  PR_HST(UPD_PAP_IN_NEW_hst,8);
-#endif /* FALSE */
-
   PR_CTR(UPD_NEW_IND_ctr);
   /* see comment on ENT_PERM_IND_ctr */
   COND_PR_CTR(UPD_NEW_PERM_IND_ctr,RtsFlags.GcFlags.squeezeUpdFrames == rtsFalse,"U!PD_NEW_PERM_IND_ctr requires +RTS -Z");
@@ -550,13 +343,8 @@ PrintTickyInfo(void)
   PR_CTR(GC_SEL_MINOR_ctr);
   PR_CTR(GC_SEL_MAJOR_ctr);
   PR_CTR(GC_FAILED_PROMOTION_ctr);
-  PR_CTR(GC_WORDS_COPIED_ctr);
 }
 
-/* Data structure used in ``registering'' one of these counters. */
-
-StgEntCounter *ticky_entry_ctrs = NULL; /* root of list of them */
-
 /* To print out all the registered-counter info: */
 
 static void
@@ -565,34 +353,25 @@ printRegisteredCounterInfo (FILE *tf)
     StgEntCounter *p;
 
     if ( ticky_entry_ctrs != NULL ) {
+      fprintf(tf,"\nThe following table is explained by http://ghc.haskell.org/trac/ghc/wiki/Debugging/TickyTicky\nAll allocation numbers are in bytes.\n");
       fprintf(tf,"\n**************************************************\n\n");
     }
-    fprintf(tf, "%11s%11s %6s%6s    %-11s%-30s\n",
-           "Entries", "Allocs", "Arity", "Stack", "Kinds", "Function");
+    fprintf(tf, "%11s%11s%11s  %-23s %s\n",
+            "Entries", "Alloc", "Alloc'd", "Non-void Arguments", "STG Name");
     fprintf(tf, "--------------------------------------------------------------------------------\n");
     /* Function name at the end so it doesn't mess up the tabulation */
 
     for (p = ticky_entry_ctrs; p != NULL; p = p->link) {
-       fprintf(tf, "%11ld%11ld %6zu%6zu    %-11s%-30s",
-               p->entry_count,
-               p->allocs,
-               p->arity,
-               p->stk_args,
-               p->arg_kinds,
-               p->str);
+        fprintf(tf, "%11" FMT_Int "%11" FMT_Int "%11" FMT_Int " %3lu %-20.20s %s",
+                p->entry_count,
+                p->allocs,
+                p->allocd,
+                (unsigned long)p->arity,
+                p->arg_kinds,
+                p->str);
 
-       fprintf(tf, "\n");
+        fprintf(tf, "\n");
 
     }
 }
-
-/* Catch-all top-level counter struct.  Allocations from CAFs will go
- * here.
- */
-StgEntCounter top_ct
-        = { 0, 0, 0,
-           "TOP", "",
-           0, 0, NULL };
-
 #endif /* TICKY_TICKY */
-