/* -----------------------------------------------------------------------------
- * $Id: Stats.c,v 1.14 1999/09/15 13:45:20 simonmar Exp $
*
- * (c) The GHC Team, 1998-1999
+ * (c) The GHC Team, 1998-2005
*
* Statistics and timing-related functions.
*
* ---------------------------------------------------------------------------*/
-#define NON_POSIX_SOURCE
-
#include "Rts.h"
#include "RtsFlags.h"
#include "RtsUtils.h"
-#include "StoragePriv.h"
#include "MBlock.h"
-
-/**
- * Ian: For the moment we just want to ignore
- * these on Nemesis
- **/
-#ifdef _NEMESIS_OS_
-#ifdef HAVE_SYS_TIMES_H
-#undef HAVE_SYS_TIMES_H /* <sys/times.h> */
-#endif
-#ifdef HAVE_SYS_RESOURCE_H /* <sys/resource.h> */
-#undef HAVE_SYS_RESOURCE_H
-#endif
-#ifdef HAVE_SYS_TIME_H /* <sys/time.h> */
-#undef HAVE_SYS_TIME_H
-#endif
-#ifdef HAVE_SYS_TIMEB_H
-#undef HAVE_SYS_TIMEB_H /* <sys/timeb.h> */
-#endif
-#ifdef HAVE_UNISTD_H
-#undef HAVE_UNISTD_H /* <unistd.h> */
-#endif
-#ifdef HAVE_TIMES
-#undef HAVE_TIMES
-#endif
-#ifdef HAVE_FTIME
-#undef HAVE_FTIME
-#endif
-#ifdef HAVE_GETRUSAGE
-#undef HAVE_GETRUSAGE
-#endif
-#ifdef HAVE_SYSCONF
-#undef HAVE_SYSCONF
-#endif
-#endif /* _NEMESIS_OS_ */
-
+#include "Schedule.h"
#include "Stats.h"
-
-#ifdef HAVE_UNISTD_H
-#include <unistd.h>
-#endif
-
-#ifndef __MINGW32__
-# ifdef HAVE_SYS_TIMES_H
-# include <sys/times.h>
-# endif
-#endif
-
-#ifdef HAVE_SYS_TIME_H
-#include <sys/time.h>
-#endif
-
-#ifdef __CYGWIN32__
-# ifdef HAVE_TIME_H
-# include <time.h>
-# endif
-#endif
-
-#if ! irix_TARGET_OS && ! defined(__MINGW32__)
-# if defined(HAVE_SYS_RESOURCE_H)
-# include <sys/resource.h>
-# endif
-#endif
-
-#ifdef HAVE_SYS_TIMEB_H
-#include <sys/timeb.h>
-#endif
-
-#if HAVE_STDLIB_H
-#include <stdlib.h>
-#endif
-
-#if HAVE_WINDOWS_H
-#include <windows.h>
-#endif
+#include "ParTicky.h" /* ToDo: move into Rts.h */
+#include "Profiling.h"
+#include "Storage.h"
+#include "GetTime.h"
/* huh? */
#define BIG_STRING_LEN 512
-static double ElapsedTimeStart = 0.0;
-static double TicksPerSecond = 0.0;
-
-static double InitUserTime = 0.0;
-static double InitElapsedTime = 0.0;
+#define TICK_TO_DBL(t) ((double)(t) / TICKS_PER_SECOND)
-static ullong GC_tot_alloc = 0;
-static ullong GC_tot_copied = 0;
+static Ticks ElapsedTimeStart = 0;
-static double GC_start_time, GC_tot_time = 0; /* User GC Time */
-static double GCe_start_time, GCe_tot_time = 0; /* Elapsed GC time */
+static Ticks InitUserTime = 0;
+static Ticks InitElapsedTime = 0;
+static Ticks InitElapsedStamp = 0;
-lnat MaxResidency = 0; /* in words; for stats only */
-lnat ResidencySamples = 0; /* for stats only */
+static Ticks MutUserTime = 0;
+static Ticks MutElapsedTime = 0;
+static Ticks MutElapsedStamp = 0;
-static lnat GC_start_faults = 0, GC_end_faults = 0;
+static Ticks ExitUserTime = 0;
+static Ticks ExitElapsedTime = 0;
-static double *GC_coll_times;
+static ullong GC_tot_alloc = 0;
+static ullong GC_tot_copied = 0;
+static ullong GC_tot_scavd_copied = 0;
-/* ToDo: convert this to use integers? --SDM */
+static Ticks GC_start_time = 0, GC_tot_time = 0; /* User GC Time */
+static Ticks GCe_start_time = 0, GCe_tot_time = 0; /* Elapsed GC time */
-/* elapsedtime() -- The current elapsed time in seconds */
+#ifdef PROFILING
+static Ticks RP_start_time = 0, RP_tot_time = 0; /* retainer prof user time */
+static Ticks RPe_start_time = 0, RPe_tot_time = 0; /* retainer prof elap time */
-#ifdef _WIN32
-#define NS_PER_SEC 10000000LL
-/* Convert FILETIMEs into secs since the Epoch (Jan1-1970) */
-#define FT2longlong(ll,ft) \
- (ll)=(ft).dwHighDateTime; \
- (ll) <<= 32; \
- (ll) |= (ft).dwLowDateTime; \
- (ll) /= (unsigned long long) (NS_PER_SEC / CLOCKS_PER_SEC)
+static Ticks HC_start_time, HC_tot_time = 0; // heap census prof user time
+static Ticks HCe_start_time, HCe_tot_time = 0; // heap census prof elap time
#endif
-#ifdef _WIN32
-/* cygwin32 or mingw32 version */
-double
-elapsedtime(void)
-{
- FILETIME creationTime, exitTime, kernelTime, userTime;
- long long int kT, uT;
-
-
- /* ToDo: pin down elapsed times to just the OS thread(s) that
- are evaluating/managing Haskell code.
- */
- if (!GetProcessTimes (GetCurrentProcess(), &creationTime,
- &exitTime, &kernelTime, &userTime)) {
- /* Probably on a Win95 box..*/
- return 0;
- }
-
- FT2longlong(kT,kernelTime);
- FT2longlong(uT,userTime);
- return (((StgDouble)(uT + kT))/TicksPerSecond - ElapsedTimeStart);
-}
-
-#else
-
-double
-elapsedtime(void)
-{
-# if ! (defined(HAVE_TIMES) || defined(HAVE_FTIME))
- /* We will #ifdef around the fprintf for machines
- we *know* are unsupported. (WDP 94/05)
- */
- fprintf(stderr, "NOTE: `elapsedtime' does nothing!\n");
- return 0.0;
+#ifdef PROFILING
+#define PROF_VAL(x) (x)
+#else
+#define PROF_VAL(x) 0
+#endif
-# else /* not stumped */
+static lnat MaxResidency = 0; // in words; for stats only
+static lnat AvgResidency = 0;
+static lnat ResidencySamples = 0; // for stats only
-/* "ftime" may be nicer, but "times" is more standard;
- but, on a Sun, if you do not get the SysV one, you are *hosed*...
- */
-
-# if defined(HAVE_TIMES) && ! sunos4_TARGET_OS
- struct tms t;
- clock_t r = times(&t);
+static lnat GC_start_faults = 0, GC_end_faults = 0;
- return (((double)r)/TicksPerSecond - ElapsedTimeStart);
+static Ticks *GC_coll_times;
-# else /* HAVE_FTIME */
- struct timeb t;
+static void statsPrintf( char *s, ... )
+ GNUC3_ATTRIBUTE(format (printf, 1, 2));
- ftime(&t);
- return (fabs(t.time + 1e-3*t.millitm - ElapsedTimeStart));
+static void statsFlush( void );
+static void statsClose( void );
-# endif /* HAVE_FTIME */
-# endif /* not stumped */
+/* Returns GCe_tot_time, the running total of elapsed GC time in Ticks.
+ * stat_endGC() adds to that total only when GC stats are enabled
+ * (giveStats != NO_GC_STATS). */
+Ticks stat_getElapsedGCTime(void)
+{
+    return GCe_tot_time;
}
-#endif /* !_WIN32 */
/* mut_user_time_during_GC() and mut_user_time()
*
- * This function can be used to get the current mutator time *during*
- * a GC, i.e. between stat_startGC and stat_endGC. This is used in
- * the heap profiler for accurately time stamping the heap sample.
+ * The former function can be used to get the current mutator time
+ * *during* a GC, i.e. between stat_startGC and stat_endGC. This is
+ * used in the heap profiler for accurately time stamping the heap
+ * sample.
+ *
+ * ATTENTION: mut_user_time_during_GC() relies on GC_start_time being
+ * defined in stat_startGC() - to minimise system calls,
+ * GC_start_time is, however, only defined when really needed (check
+ * stat_startGC() for details)
*/
double
-mut_user_time_during_GC(void)
+mut_user_time_during_GC( void )
{
- return (GC_start_time - GC_tot_time);
+ return TICK_TO_DBL(GC_start_time - GC_tot_time - PROF_VAL(RP_tot_time + HC_tot_time));
}
double
-mut_user_time(void)
+mut_user_time( void )
{
- return (usertime() - GC_tot_time);
+ Ticks user;
+ user = getProcessCPUTime();
+ return TICK_TO_DBL(user - GC_tot_time - PROF_VAL(RP_tot_time + HC_tot_time));
}
-
-static nat
-pagefaults(void)
+#ifdef PROFILING
+/*
+ mut_user_time_during_RP() is similar to mut_user_time_during_GC();
+ it returns the MUT time during retainer profiling.
+ The same holds for mut_user_time_during_heap_census().
+ */
+double
+mut_user_time_during_RP( void )
{
- /* ToDo (on NT): better, get this via the performance data
- that's stored in the registry. */
-# if !defined(HAVE_GETRUSAGE) || irix_TARGET_OS || defined(_WIN32)
- return 0;
-# else
- struct rusage t;
-
- getrusage(RUSAGE_SELF, &t);
- return(t.ru_majflt);
-# endif
+ return TICK_TO_DBL(RP_start_time - GC_tot_time - RP_tot_time - HC_tot_time);
}
-/* ToDo: use gettimeofday on systems that support it (u-sec accuracy) */
-
-void
-start_time(void)
+double
+mut_user_time_during_heap_census( void )
{
-#ifdef HAVE_SYSCONF
- long ticks;
- /* Determine TicksPerSecond ... */
-
- ticks = sysconf(_SC_CLK_TCK);
- if ( ticks == -1 ) {
- fprintf(stderr, "stat_init: bad call to 'sysconf'!\n");
- stg_exit(EXIT_FAILURE);
- }
- TicksPerSecond = (double) ticks;
-
-/* no "sysconf"; had better guess */
-#elif defined(HZ)
- TicksPerSecond = (StgDouble) (HZ);
-
-#elif defined(CLOCKS_PER_SEC)
- TicksPerSecond = (StgDouble) (CLOCKS_PER_SEC);
-#else /* had better guess wildly */
- /* We will #ifdef around the fprintf for machines
- we *know* are unsupported. (WDP 94/05)
- */
- fprintf(stderr, "NOTE: Guessing `TicksPerSecond = 60'!\n");
- TicksPerSecond = 60.0;
-#endif
-
- ElapsedTimeStart = elapsedtime();
+ return TICK_TO_DBL(HC_start_time - GC_tot_time - RP_tot_time - HC_tot_time);
}
-
+#endif /* PROFILING */
void
initStats(void)
{
- nat i;
- FILE *sf = RtsFlags.GcFlags.statsFile;
+ nat i;
- if (RtsFlags.GcFlags.giveStats >= VERBOSE_GC_STATS) {
- fprintf(sf, " Alloc Collect Live GC GC TOT TOT Page Flts\n");
- fprintf(sf, " bytes bytes bytes user elap user elap\n");
- }
- GC_coll_times =
- (double *)stgMallocBytes(sizeof(double) * RtsFlags.GcFlags.generations,
- "initStats");
- for (i = 0; i < RtsFlags.GcFlags.generations; i++) {
- GC_coll_times[i] = 0.0;
- }
+ if (RtsFlags.GcFlags.giveStats >= VERBOSE_GC_STATS) {
+ statsPrintf(" Alloc Copied Live GC GC TOT TOT Page Flts\n");
+ statsPrintf(" bytes bytes bytes user elap user elap\n");
+ }
+ GC_coll_times =
+ (Ticks *)stgMallocBytes(
+ sizeof(Ticks)*RtsFlags.GcFlags.generations,
+ "initStats");
+ for (i = 0; i < RtsFlags.GcFlags.generations; i++) {
+ GC_coll_times[i] = 0;
+ }
}
-#ifdef _WIN32
-double
-usertime(void)
-{
- FILETIME creationTime, exitTime, kernelTime, userTime;
- long long int uT;
-
- /* Convert FILETIMEs into long longs */
+/* -----------------------------------------------------------------------------
+ Initialisation time...
+ -------------------------------------------------------------------------- */
- if (!GetProcessTimes (GetCurrentProcess(), &creationTime,
- &exitTime, &kernelTime, &userTime)) {
- /* Probably exec'ing this on a Win95 box..*/
- return 0;
- }
+void
+stat_startInit(void)
+{
+ Ticks elapsed;
- FT2longlong(uT,userTime);
- return (((StgDouble)uT)/TicksPerSecond);
+ elapsed = getProcessElapsedTime();
+ ElapsedTimeStart = elapsed;
}
-#else
-double
-usertime(void)
+void
+stat_endInit(void)
{
-# if ! (defined(HAVE_GETRUSAGE) || defined(HAVE_TIMES))
- /* We will #ifdef around the fprintf for machines
- we *know* are unsupported. (WDP 94/05)
- */
- fprintf(stderr, "NOTE: `usertime' does nothing!\n");
- return 0.0;
+ Ticks user, elapsed;
-# else /* not stumped */
+ getProcessTimes(&user, &elapsed);
-# if defined(HAVE_TIMES)
- struct tms t;
+ InitUserTime = user;
+ InitElapsedStamp = elapsed;
+ if (ElapsedTimeStart > elapsed) {
+ InitElapsedTime = 0;
+ } else {
+ InitElapsedTime = elapsed - ElapsedTimeStart;
+ }
+}
+
+/* -----------------------------------------------------------------------------
+ stat_startExit and stat_endExit
+
+ These two measure the time taken in shutdownHaskell().
+ -------------------------------------------------------------------------- */
- times(&t);
- return(((double)(t.tms_utime))/TicksPerSecond);
+void
+stat_startExit(void)
+{
+ Ticks user, elapsed;
-# else /* HAVE_GETRUSAGE */
- struct rusage t;
+ getProcessTimes(&user, &elapsed);
- getrusage(RUSAGE_SELF, &t);
- return(t.ru_utime.tv_sec + 1e-6*t.ru_utime.tv_usec);
+ MutElapsedStamp = elapsed;
+ MutElapsedTime = elapsed - GCe_tot_time -
+ PROF_VAL(RPe_tot_time + HCe_tot_time) - InitElapsedStamp;
+ if (MutElapsedTime < 0) { MutElapsedTime = 0; } /* sometimes -0.00 */
-# endif /* HAVE_GETRUSAGE */
-# endif /* not stumped */
+ MutUserTime = user - GC_tot_time - PROF_VAL(RP_tot_time + HC_tot_time) - InitUserTime;
+ if (MutUserTime < 0) { MutUserTime = 0; }
}
-#endif /* ! _WIN32 */
-void
-end_init(void)
+void
+stat_endExit(void)
{
- InitUserTime = usertime();
- InitElapsedTime = elapsedtime();
- if (InitElapsedTime < 0.0) {
- InitElapsedTime = 0.0;
- }
+ Ticks user, elapsed;
+
+ getProcessTimes(&user, &elapsed);
+
+ ExitUserTime = user - MutUserTime - GC_tot_time - PROF_VAL(RP_tot_time + HC_tot_time) - InitUserTime;
+ ExitElapsedTime = elapsed - MutElapsedStamp;
+ if (ExitUserTime < 0) {
+ ExitUserTime = 0;
+ }
+ if (ExitElapsedTime < 0) {
+ ExitElapsedTime = 0;
+ }
}
/* -----------------------------------------------------------------------------
static nat rub_bell = 0;
+/* initialise global variables needed during GC
+ *
+ * * GC_start_time is read in mut_user_time_during_GC(), which in turn is
+ * needed if either PROFILING or DEBUGing is enabled
+ */
void
stat_startGC(void)
{
- FILE *sf = RtsFlags.GcFlags.statsFile;
-
nat bell = RtsFlags.GcFlags.ringBell;
if (bell) {
if (bell > 1) {
- fprintf(stderr, " GC ");
+ debugBelch(" GC ");
rub_bell = 1;
} else {
- fprintf(stderr, "\007");
+ debugBelch("\007");
}
}
- if (sf != NULL) {
- GC_start_time = usertime();
- GCe_start_time = elapsedtime();
+#if defined(PROFILING) || defined(DEBUG)
+ GC_start_time = getProcessCPUTime(); // needed in mut_user_time_during_GC()
+#endif
+
+ if (RtsFlags.GcFlags.giveStats != NO_GC_STATS) {
+#if !defined(PROFILING) && !defined(DEBUG)
+ GC_start_time = getProcessCPUTime();
+#endif
+ GCe_start_time = getProcessElapsedTime();
if (RtsFlags.GcFlags.giveStats) {
- GC_start_faults = pagefaults();
+ GC_start_faults = getPageFaults();
}
}
}
-------------------------------------------------------------------------- */
void
-stat_endGC(lnat alloc, lnat collect, lnat live, lnat copied, lnat gen)
+stat_endGC (lnat alloc, lnat live, lnat copied,
+ lnat scavd_copied, lnat gen)
{
- FILE *sf = RtsFlags.GcFlags.statsFile;
-
- if (sf != NULL) {
- double time = usertime();
- double etime = elapsedtime();
-
- if (RtsFlags.GcFlags.giveStats >= VERBOSE_GC_STATS) {
- nat faults = pagefaults();
-
- fprintf(sf, "%9ld %9ld %9ld",
- alloc*sizeof(W_), collect*sizeof(W_), live*sizeof(W_));
- fprintf(sf, " %5.2f %5.2f %7.2f %7.2f %4ld %4ld (Gen: %2ld)\n",
- (time-GC_start_time),
- (etime-GCe_start_time),
- time,
- etime,
+ if (RtsFlags.GcFlags.giveStats != NO_GC_STATS) {
+ Ticks time, etime, gc_time, gc_etime;
+
+ getProcessTimes(&time, &etime);
+ gc_time = time - GC_start_time;
+ gc_etime = etime - GCe_start_time;
+
+ if (RtsFlags.GcFlags.giveStats == VERBOSE_GC_STATS) {
+ nat faults = getPageFaults();
+
+ statsPrintf("%9ld %9ld %9ld",
+ alloc*sizeof(W_), (copied+scavd_copied)*sizeof(W_),
+ live*sizeof(W_));
+ statsPrintf(" %5.2f %5.2f %7.2f %7.2f %4ld %4ld (Gen: %2ld)\n",
+ TICK_TO_DBL(gc_time),
+ TICK_TO_DBL(gc_etime),
+ TICK_TO_DBL(time),
+ TICK_TO_DBL(etime - ElapsedTimeStart),
faults - GC_start_faults,
GC_start_faults - GC_end_faults,
gen);
GC_end_faults = faults;
- fflush(sf);
+ statsFlush();
}
- GC_coll_times[gen] += time-GC_start_time;
+ GC_coll_times[gen] += gc_time;
GC_tot_copied += (ullong) copied;
+ GC_tot_scavd_copied += (ullong) scavd_copied;
GC_tot_alloc += (ullong) alloc;
- GC_tot_time += time-GC_start_time;
- GCe_tot_time += etime-GCe_start_time;
+ GC_tot_time += gc_time;
+ GCe_tot_time += gc_etime;
+
+#if defined(THREADED_RTS)
+ {
+ Task *task;
+ if ((task = myTask()) != NULL) {
+ task->gc_time += gc_time;
+ task->gc_etime += gc_etime;
+ }
+ }
+#endif
if (gen == RtsFlags.GcFlags.generations-1) { /* major GC? */
- if (live > MaxResidency) {
- MaxResidency = live;
- }
- ResidencySamples++;
+ if (live > MaxResidency) {
+ MaxResidency = live;
+ }
+ ResidencySamples++;
+ AvgResidency += live;
}
}
if (rub_bell) {
- fprintf(stderr, "\b\b\b \b\b\b");
+ debugBelch("\b\b\b \b\b\b");
rub_bell = 0;
}
}
/* -----------------------------------------------------------------------------
+ Called at the beginning of each Retainer Profiling
+ -------------------------------------------------------------------------- */
+#ifdef PROFILING
+/* Snapshot the user and elapsed times at the start of a retainer
+ * profiling pass; stat_endRP() subtracts these snapshots to obtain the
+ * cost of the pass. */
+void
+stat_startRP(void)
+{
+    Ticks user_now, elapsed_now;
+
+    getProcessTimes(&user_now, &elapsed_now);
+    RPe_start_time = elapsed_now;
+    RP_start_time  = user_now;
+}
+#endif /* PROFILING */
+
+/* -----------------------------------------------------------------------------
+ Called at the end of each Retainer Profiling
+ -------------------------------------------------------------------------- */
+
+#ifdef PROFILING
+/* Close a retainer profiling pass: add the user and elapsed time spent
+ * since stat_startRP() to RP_tot_time / RPe_tot_time, then write a short
+ * summary of the pass to prof_file.
+ *
+ *   retainerGeneration  printed as the pass number
+ *   maxCStackSize       (DEBUG_RETAINER only) printed as "Max C stack size"
+ *   maxStackSize        (DEBUG_RETAINER only) printed as
+ *                       "Max auxiliary stack size"
+ *   averageNumVisit     printed as the average number of visits per object
+ */
+void
+stat_endRP(
+  nat retainerGeneration,
+#ifdef DEBUG_RETAINER
+  nat maxCStackSize,
+  int maxStackSize,
+#endif
+  double averageNumVisit)
+{
+    Ticks user, elapsed;
+    getProcessTimes( &user, &elapsed );
+
+    RP_tot_time  += user - RP_start_time;
+    RPe_tot_time += elapsed - RPe_start_time;
+
+    /* NOTE(review): mut_user_time_during_RP() is evaluated after
+     * RP_tot_time has been updated above, so the printed timestamp
+     * already has this pass's own cost subtracted - confirm intended. */
+    fprintf(prof_file, "Retainer Profiling: %d, at %f seconds\n",
+            retainerGeneration, mut_user_time_during_RP());
+#ifdef DEBUG_RETAINER
+    fprintf(prof_file, "\tMax C stack size = %u\n", maxCStackSize);
+    /* maxStackSize is a signed int, so it must be printed with %d, not %u */
+    fprintf(prof_file, "\tMax auxiliary stack size = %d\n", maxStackSize);
+#endif
+    fprintf(prof_file, "\tAverage number of visits per object = %f\n", averageNumVisit);
+}
+#endif /* PROFILING */
+
+/* -----------------------------------------------------------------------------
+ Called at the beginning of each heap census
+ -------------------------------------------------------------------------- */
+#ifdef PROFILING
+/* Snapshot the user and elapsed times at the start of a heap census;
+ * stat_endHeapCensus() subtracts these snapshots to obtain the cost of
+ * the census. */
+void
+stat_startHeapCensus(void)
+{
+    Ticks user_now, elapsed_now;
+
+    getProcessTimes(&user_now, &elapsed_now);
+    HCe_start_time = elapsed_now;
+    HC_start_time  = user_now;
+}
+#endif /* PROFILING */
+
+/* -----------------------------------------------------------------------------
+ Called at the end of each heap census
+ -------------------------------------------------------------------------- */
+#ifdef PROFILING
+/* Add the user and elapsed time spent since stat_startHeapCensus() to
+ * the running heap-census totals HC_tot_time / HCe_tot_time. */
+void
+stat_endHeapCensus(void)
+{
+    Ticks user_now, elapsed_now;
+    Ticks user_spent, elapsed_spent;
+
+    getProcessTimes(&user_now, &elapsed_now);
+    user_spent    = user_now    - HC_start_time;
+    elapsed_spent = elapsed_now - HCe_start_time;
+
+    HC_tot_time  = HC_tot_time  + user_spent;
+    HCe_tot_time = HCe_tot_time + elapsed_spent;
+}
+#endif /* PROFILING */
+
+/* -----------------------------------------------------------------------------
Called at the end of execution
NOTE: number of allocations is not entirely accurate: it doesn't
void
stat_exit(int alloc)
{
- FILE *sf = RtsFlags.GcFlags.statsFile;
+ if (RtsFlags.GcFlags.giveStats != NO_GC_STATS) {
- if (sf != NULL){
char temp[BIG_STRING_LEN];
- double time = usertime();
- double etime = elapsedtime();
- double MutTime, MutElapsedTime;
+ Ticks time;
+ Ticks etime;
+ nat g, total_collections = 0;
+
+ getProcessTimes( &time, &etime );
+ etime -= ElapsedTimeStart;
+
+ GC_tot_alloc += alloc;
+
+ /* Count total garbage collections */
+ for (g = 0; g < RtsFlags.GcFlags.generations; g++)
+ total_collections += generations[g].collections;
/* avoid divide by zero if time is measured as 0.00 seconds -- SDM */
- if (time == 0.0) time = 0.0001;
- if (etime == 0.0) etime = 0.0001;
+ if (time == 0.0) time = 1;
+ if (etime == 0.0) etime = 1;
+ if (RtsFlags.GcFlags.giveStats >= VERBOSE_GC_STATS) {
+ statsPrintf("%9ld %9.9s %9.9s", (lnat)alloc*sizeof(W_), "", "");
+ statsPrintf(" %5.2f %5.2f\n\n", 0.0, 0.0);
+ }
- fprintf(sf, "%9ld %9.9s %9.9s",
- (lnat)alloc*sizeof(W_), "", "");
- fprintf(sf, " %5.2f %5.2f\n\n", 0.0, 0.0);
-
- GC_tot_alloc += alloc;
+ if (RtsFlags.GcFlags.giveStats >= SUMMARY_GC_STATS) {
+ ullong_format_string(GC_tot_alloc*sizeof(W_),
+ temp, rtsTrue/*commas*/);
+ statsPrintf("%11s bytes allocated in the heap\n", temp);
- ullong_format_string(GC_tot_alloc*sizeof(W_), temp, rtsTrue/*commas*/);
- fprintf(sf, "%11s bytes allocated in the heap\n", temp);
+ ullong_format_string(GC_tot_copied*sizeof(W_),
+ temp, rtsTrue/*commas*/);
+ statsPrintf("%11s bytes copied during GC (scavenged)\n", temp);
- ullong_format_string(GC_tot_copied*sizeof(W_), temp, rtsTrue/*commas*/);
- fprintf(sf, "%11s bytes copied during GC\n", temp);
+ ullong_format_string(GC_tot_scavd_copied*sizeof(W_),
+ temp, rtsTrue/*commas*/);
+ statsPrintf("%11s bytes copied during GC (not scavenged)\n", temp);
+
+ if ( ResidencySamples > 0 ) {
+ ullong_format_string(MaxResidency*sizeof(W_),
+ temp, rtsTrue/*commas*/);
+ statsPrintf("%11s bytes maximum residency (%ld sample(s))\n",
+ temp, ResidencySamples);
+ }
+ statsPrintf("\n");
+
+ /* Print garbage collections in each gen */
+ for (g = 0; g < RtsFlags.GcFlags.generations; g++) {
+ statsPrintf("%11d collections in generation %d (%6.2fs)\n",
+ generations[g].collections, g,
+ TICK_TO_DBL(GC_coll_times[g]));
+ }
+
+ statsPrintf("\n%11ld Mb total memory in use\n\n",
+ mblocks_allocated * MBLOCK_SIZE / (1024 * 1024));
+
+#if defined(THREADED_RTS)
+ {
+ nat i;
+ Task *task;
+ for (i = 0, task = all_tasks;
+ task != NULL;
+ i++, task = task->all_link) {
+ statsPrintf(" Task %2d %-8s : MUT time: %6.2fs (%6.2fs elapsed)\n"
+ " GC time: %6.2fs (%6.2fs elapsed)\n\n",
+ i,
+ (task->tso == NULL) ? "(worker)" : "(bound)",
+ TICK_TO_DBL(task->mut_time),
+ TICK_TO_DBL(task->mut_etime),
+ TICK_TO_DBL(task->gc_time),
+ TICK_TO_DBL(task->gc_etime));
+ }
+ }
+#endif
- if ( ResidencySamples > 0 ) {
- ullong_format_string(MaxResidency*sizeof(W_), temp, rtsTrue/*commas*/);
- fprintf(sf, "%11s bytes maximum residency (%ld sample(s))\n",
- temp,
- ResidencySamples);
- }
- fprintf(sf,"\n");
-
- { /* Count garbage collections */
- nat g;
- for (g = 0; g < RtsFlags.GcFlags.generations; g++) {
- fprintf(sf, "%11d collections in generation %d (%6.2fs)\n",
- generations[g].collections, g, GC_coll_times[g]);
- }
- }
- fprintf(sf,"\n%11ld Mb total memory in use\n\n",
- mblocks_allocated * MBLOCK_SIZE / (1024 * 1024));
-
- MutTime = time - GC_tot_time - InitUserTime;
- if (MutTime < 0) { MutTime = 0; }
- MutElapsedTime = etime - GCe_tot_time - InitElapsedTime;
- if (MutElapsedTime < 0) { MutElapsedTime = 0; } /* sometimes -0.00 */
-
- fprintf(sf, " INIT time %6.2fs (%6.2fs elapsed)\n",
- InitUserTime, InitElapsedTime);
- fprintf(sf, " MUT time %6.2fs (%6.2fs elapsed)\n",
- MutTime, MutElapsedTime);
- fprintf(sf, " GC time %6.2fs (%6.2fs elapsed)\n",
- GC_tot_time, GCe_tot_time);
- fprintf(sf, " Total time %6.2fs (%6.2fs elapsed)\n\n",
- time, etime);
-
- fprintf(sf, " %%GC time %5.1f%% (%.1f%% elapsed)\n\n",
- GC_tot_time*100./time, GCe_tot_time*100./etime);
-
- if (time - GC_tot_time == 0.0)
+ statsPrintf(" INIT time %6.2fs (%6.2fs elapsed)\n",
+ TICK_TO_DBL(InitUserTime), TICK_TO_DBL(InitElapsedTime));
+ statsPrintf(" MUT time %6.2fs (%6.2fs elapsed)\n",
+ TICK_TO_DBL(MutUserTime), TICK_TO_DBL(MutElapsedTime));
+ statsPrintf(" GC time %6.2fs (%6.2fs elapsed)\n",
+ TICK_TO_DBL(GC_tot_time), TICK_TO_DBL(GCe_tot_time));
+#ifdef PROFILING
+ statsPrintf(" RP time %6.2fs (%6.2fs elapsed)\n",
+ TICK_TO_DBL(RP_tot_time), TICK_TO_DBL(RPe_tot_time));
+ statsPrintf(" PROF time %6.2fs (%6.2fs elapsed)\n",
+ TICK_TO_DBL(HC_tot_time), TICK_TO_DBL(HCe_tot_time));
+#endif
+ statsPrintf(" EXIT time %6.2fs (%6.2fs elapsed)\n",
+ TICK_TO_DBL(ExitUserTime), TICK_TO_DBL(ExitElapsedTime));
+ statsPrintf(" Total time %6.2fs (%6.2fs elapsed)\n\n",
+ TICK_TO_DBL(time), TICK_TO_DBL(etime));
+ statsPrintf(" %%GC time %5.1f%% (%.1f%% elapsed)\n\n",
+ TICK_TO_DBL(GC_tot_time)*100/TICK_TO_DBL(time),
+ TICK_TO_DBL(GCe_tot_time)*100/TICK_TO_DBL(etime));
+
+ if (time - GC_tot_time - PROF_VAL(RP_tot_time + HC_tot_time) == 0)
ullong_format_string(0, temp, rtsTrue/*commas*/);
- else
- ullong_format_string((ullong)(GC_tot_alloc*sizeof(W_)/
- (time - GC_tot_time)),
- temp, rtsTrue/*commas*/);
+ else
+ ullong_format_string(
+ (ullong)((GC_tot_alloc*sizeof(W_))/
+ TICK_TO_DBL(time - GC_tot_time -
+ PROF_VAL(RP_tot_time + HC_tot_time))),
+ temp, rtsTrue/*commas*/);
+
+ statsPrintf(" Alloc rate %s bytes per MUT second\n\n", temp);
+
+ statsPrintf(" Productivity %5.1f%% of total user, %.1f%% of total elapsed\n\n",
+ TICK_TO_DBL(time - GC_tot_time -
+ PROF_VAL(RP_tot_time + HC_tot_time) - InitUserTime) * 100
+ / TICK_TO_DBL(time),
+ TICK_TO_DBL(time - GC_tot_time -
+ PROF_VAL(RP_tot_time + HC_tot_time) - InitUserTime) * 100
+ / TICK_TO_DBL(etime));
+ }
- fprintf(sf, " Alloc rate %s bytes per MUT second\n\n", temp);
+ if (RtsFlags.GcFlags.giveStats == ONELINE_GC_STATS) {
+ /* print the long long separately to avoid bugginess on mingwin (2001-07-02, mingw-0.5) */
+ statsPrintf("<<ghc: %llu bytes, ", GC_tot_alloc*(ullong)sizeof(W_));
+ statsPrintf("%d GCs, %ld/%ld avg/max bytes residency (%ld samples), %luM in use, %.2f INIT (%.2f elapsed), %.2f MUT (%.2f elapsed), %.2f GC (%.2f elapsed) :ghc>>\n",
+ total_collections,
+ ResidencySamples == 0 ? 0 :
+ AvgResidency*sizeof(W_)/ResidencySamples,
+ MaxResidency*sizeof(W_),
+ ResidencySamples,
+ (unsigned long)(mblocks_allocated * MBLOCK_SIZE / (1024L * 1024L)),
+ TICK_TO_DBL(InitUserTime), TICK_TO_DBL(InitElapsedTime),
+ TICK_TO_DBL(MutUserTime), TICK_TO_DBL(MutElapsedTime),
+ TICK_TO_DBL(GC_tot_time), TICK_TO_DBL(GCe_tot_time));
+ }
- fprintf(sf, " Productivity %5.1f%% of total user, %.1f%% of total elapsed\n\n",
- (time - GC_tot_time - InitUserTime) * 100. / time,
- (time - GC_tot_time - InitUserTime) * 100. / etime);
- fflush(sf);
- fclose(sf);
+ statsFlush();
+ statsClose();
}
}
Produce some detailed info on the state of the generational GC.
-------------------------------------------------------------------------- */
+#ifdef DEBUG
void
-stat_describe_gens(void)
+statDescribeGens(void)
{
- nat g, s, mut, mut_once, lge, live;
- StgMutClosure *m;
+ nat g, s, mut, lge;
+ lnat live;
bdescr *bd;
step *step;
- fprintf(stderr, " Gen Steps Max Mutable Mut-Once Step Blocks Live Large\n Blocks Closures Closures Objects\n");
+ debugBelch(
+" Gen Steps Max Mutable Step Blocks Live Large\n"
+" Blocks Closures Objects\n");
+ mut = 0;
for (g = 0; g < RtsFlags.GcFlags.generations; g++) {
- for (m = generations[g].mut_list, mut = 0; m != END_MUT_LIST;
- m = m->mut_link)
- mut++;
- for (m = generations[g].mut_once_list, mut_once = 0; m != END_MUT_LIST;
- m = m->mut_link)
- mut_once++;
- fprintf(stderr, "%8d %8d %8d %9d %9d", g, generations[g].n_steps,
- generations[g].max_blocks, mut, mut_once);
+ for (bd = generations[g].mut_list; bd != NULL; bd = bd->link) {
+ mut += bd->free - bd->start;
+ }
+
+ debugBelch("%8d %8d %8d %9d", g, generations[g].n_steps,
+ generations[g].max_blocks, mut);
for (s = 0; s < generations[g].n_steps; s++) {
step = &generations[g].steps[s];
- for (bd = step->large_objects, lge = 0; bd; bd = bd->link)
- lge++;
live = 0;
- if (RtsFlags.GcFlags.generations == 1) {
- bd = step->to_space;
- } else {
- bd = step->blocks;
+ for (bd = step->large_objects, lge = 0; bd; bd = bd->link) {
+ lge++;
}
+ live = step->n_large_blocks * BLOCK_SIZE;
+ bd = step->blocks;
+ // This live figure will be slightly less than the "live" figure
+ // given by +RTS -Sstderr, because we don't count the
+ // slop at the end of each block.
for (; bd; bd = bd->link) {
live += (bd->free - bd->start) * sizeof(W_);
}
if (s != 0) {
- fprintf(stderr,"%46s","");
+ debugBelch("%36s","");
}
- fprintf(stderr,"%6d %8d %8d %8d\n", s, step->n_blocks,
+ debugBelch("%6d %8d %8d %8d\n", s, step->n_blocks,
live, lge);
}
}
- fprintf(stderr,"\n");
+ debugBelch("\n");
+}
+#endif
+
+/* -----------------------------------------------------------------------------
+ Stats available via a programmatic interface, so eg. GHCi can time
+ each compilation and expression evaluation.
+ -------------------------------------------------------------------------- */
+
+/* Returns total_allocated multiplied by sizeof(W_), as an HsInt64. */
+extern HsInt64 getAllocations( void )
+{
+    HsInt64 scaled = (HsInt64)total_allocated * sizeof(W_);
+    return scaled;
+}
+
+/* -----------------------------------------------------------------------------
+ Dumping stuff in the stats file, or via the debug message interface
+ -------------------------------------------------------------------------- */
+
+/* printf-style output for statistics: written to the configured stats
+ * file when RtsFlags.GcFlags.statsFile is set, otherwise passed to
+ * vdebugBelch(). */
+static void
+statsPrintf( char *s, ... )
+{
+    va_list args;
+    FILE *out = RtsFlags.GcFlags.statsFile;
+
+    va_start(args, s);
+    if (out != NULL) {
+        vfprintf(out, s, args);
+    } else {
+        vdebugBelch(s, args);
+    }
+    va_end(args);
+}
+
+/* Flush the stats file; does nothing when no stats file is configured. */
+static void
+statsFlush( void )
+{
+    FILE *out = RtsFlags.GcFlags.statsFile;
+
+    if (out == NULL) {
+        return;
+    }
+    fflush(out);
+}
+
+/* Close the stats file; does nothing when no stats file is configured. */
+static void
+statsClose( void )
+{
+    FILE *out = RtsFlags.GcFlags.statsFile;
+
+    if (out == NULL) {
+        return;
+    }
+    fclose(out);
}