#include "Profiling.h"
#include "GetTime.h"
#include "GC.h"
-#include "GCUtils.h"
-#include "Evac.h"
#if USE_PAPI
#include "Papi.h"
static lnat MaxResidency = 0; // in words; for stats only
static lnat AvgResidency = 0;
static lnat ResidencySamples = 0; // for stats only
+static lnat MaxSlop = 0;
static lnat GC_start_faults = 0, GC_end_faults = 0;
}
#endif /* PROFILING */
+/* initStats0() has no dependencies, so it can be called right at the
+ * beginning: it only assigns zero to a set of statistics variables and
+ * calls no other function.
+ */
void
-initStats(void)
+initStats0(void)
+{
+ ElapsedTimeStart = 0;
+ // Init* time and stamp variables.
+ InitUserTime = 0;
+ InitElapsedTime = 0;
+ InitElapsedStamp = 0;
+ // Mut* time and stamp variables.
+ MutUserTime = 0;
+ MutElapsedTime = 0;
+ MutElapsedStamp = 0;
+ // Exit* time variables.
+ ExitUserTime = 0;
+ ExitElapsedTime = 0;
+ // GC totals, followed by the GC_* / GCe_* start and total times.
+ GC_tot_alloc = 0;
+ GC_tot_copied = 0;
+ GC_par_max_copied = 0;
+ GC_par_avg_copied = 0;
+ GC_start_time = 0;
+ GC_tot_time = 0;
+ GCe_start_time = 0;
+ GCe_tot_time = 0;
+ // The RP* and HC* timers below are only reset in PROFILING builds.
+#ifdef PROFILING
+ RP_start_time = 0;
+ RP_tot_time = 0;
+ RPe_start_time = 0;
+ RPe_tot_time = 0;
+ // HC_* / HCe_* timers.
+ HC_start_time = 0;
+ HC_tot_time = 0;
+ HCe_start_time = 0;
+ HCe_tot_time = 0;
+#endif
+ // Residency and slop figures; stat_endGC() raises MaxSlop when it sees a larger slop.
+ MaxResidency = 0;
+ AvgResidency = 0;
+ ResidencySamples = 0;
+ MaxSlop = 0;
+ // GC start/end fault counters.
+ GC_start_faults = 0;
+ GC_end_faults = 0;
+}
+
+// initStats1() can be called after setupRtsFlags()
+void
+initStats1 (void)
{
nat i;
GC_coll_times[i] = 0;
GC_coll_etimes[i] = 0;
}
-}
+}
/* -----------------------------------------------------------------------------
Initialisation time...
void
stat_endGC (lnat alloc, lnat live, lnat copied, lnat gen,
- lnat max_copied, lnat avg_copied)
+ lnat max_copied, lnat avg_copied, lnat slop)
{
if (RtsFlags.GcFlags.giveStats != NO_GC_STATS) {
Ticks time, etime, gc_time, gc_etime;
ResidencySamples++;
AvgResidency += live;
}
+
+ if (slop > MaxSlop) MaxSlop = slop;
}
if (rub_bell) {
statsPrintf(" (SLOW_CALLS_" #arity ") %% of (TOTAL_CALLS) : %.1f%%\n", \
SLOW_CALLS_##arity * 100.0/TOTAL_CALLS)
+extern lnat hw_alloc_blocks;
void
stat_exit(int alloc)
statsPrintf("%16s bytes maximum residency (%ld sample(s))\n",
temp, ResidencySamples);
}
- statsPrintf("%16ld MB total memory in use\n\n",
- mblocks_allocated * MBLOCK_SIZE / (1024 * 1024));
+
+ ullong_format_string(MaxSlop*sizeof(W_), temp, rtsTrue/*commas*/);
+ statsPrintf("%16s bytes maximum slop\n", temp);
+
+ statsPrintf("%16ld MB total memory in use (%ld MB lost due to fragmentation)\n\n",
+ mblocks_allocated * MBLOCK_SIZE_W / (1024 * 1024 / sizeof(W_)),
+ (mblocks_allocated * MBLOCK_SIZE_W - hw_alloc_blocks * BLOCK_SIZE_W) / (1024 * 1024 / sizeof(W_)));
/* Print garbage collections in each gen */
for (g = 0; g < RtsFlags.GcFlags.generations; g++) {
}
#if defined(THREADED_RTS)
- if (RtsFlags.ParFlags.gcThreads > 1) {
+ if (RtsFlags.ParFlags.parGcEnabled) {
statsPrintf("\n Parallel GC work balance: %.2f (%ld / %ld, ideal %d)\n",
(double)GC_par_avg_copied / (double)GC_par_max_copied,
(lnat)GC_par_avg_copied, (lnat)GC_par_max_copied,
- RtsFlags.ParFlags.gcThreads
+ RtsFlags.ParFlags.nNodes
);
}
#endif
TICK_TO_DBL(task->gc_etime));
}
}
+
+ { // Add up the three spark counters of every capability and print the totals.
+ nat i;
+ lnat sparks_created = 0;
+ lnat sparks_converted = 0;
+ lnat sparks_pruned = 0;
+ for (i = 0; i < n_capabilities; i++) {
+ sparks_created += capabilities[i].sparks_created;
+ sparks_converted += capabilities[i].sparks_converted;
+ sparks_pruned += capabilities[i].sparks_pruned;
+ }
+ // NOTE(review): the totals are lnat but are printed with %ld; if lnat is an unsigned type this should be %lu -- confirm against the lnat typedef.
+ statsPrintf(" SPARKS: %ld (%ld converted, %ld pruned)\n\n",
+ sparks_created, sparks_converted, sparks_pruned);
+ }
#endif
statsPrintf(" INIT time %6.2fs (%6.2fs elapsed)\n",
#if USE_PAPI
papi_stats_report();
#endif
+#if defined(THREADED_RTS) && defined(PROF_SPIN)
+ { // Print the .spin fields of the sync objects; compiled only when both macros above are defined.
+ nat g, s; // NOTE(review): printed with %d below; if nat is unsigned, %u would be the matching conversion -- confirm.
+ // Three global counters first, then two per-step counters for every generation.
+ statsPrintf("recordMutableGen_sync: %"FMT_Word64"\n", recordMutableGen_sync.spin);
+ statsPrintf("gc_alloc_block_sync: %"FMT_Word64"\n", gc_alloc_block_sync.spin);
+ statsPrintf("whitehole_spin: %"FMT_Word64"\n", whitehole_spin);
+ for (g = 0; g < RtsFlags.GcFlags.generations; g++) {
+ for (s = 0; s < generations[g].n_steps; s++) {
+ statsPrintf("gen[%d].steps[%d].sync_todo: %"FMT_Word64"\n", g, s, generations[g].steps[s].sync_todo.spin);
+ statsPrintf("gen[%d].steps[%d].sync_large_objects: %"FMT_Word64"\n", g, s, generations[g].steps[s].sync_large_objects.spin);
+ }
+ }
+ }
+#endif
}
if (RtsFlags.GcFlags.giveStats == ONELINE_GC_STATS) {
+ char *fmt1, *fmt2; /* fmt1 formats the "bytes allocated" figure, fmt2 all remaining figures.
+                     * The two variants of each string must use the same conversion
+                     * specifiers in the same order, because the statsPrintf() calls
+                     * that follow pass one argument list to whichever variant was
+                     * selected here. */
+ if (RtsFlags.MiscFlags.machineReadable) { // bracketed list of ("key", "value") pairs, one per line
+ fmt1 = " [(\"bytes allocated\", \"%llu\")\n";
+ fmt2 = " ,(\"num_GCs\", \"%d\")\n"
+ " ,(\"average_bytes_used\", \"%ld\")\n"
+ " ,(\"max_bytes_used\", \"%ld\")\n"
+ " ,(\"num_byte_usage_samples\", \"%ld\")\n"
+ " ,(\"peak_megabytes_allocated\", \"%lu\")\n"
+ " ,(\"init_cpu_seconds\", \"%.2f\")\n"
+ " ,(\"init_wall_seconds\", \"%.2f\")\n"
+ " ,(\"mutator_cpu_seconds\", \"%.2f\")\n"
+ " ,(\"mutator_wall_seconds\", \"%.2f\")\n"
+ " ,(\"GC_cpu_seconds\", \"%.2f\")\n"
+ " ,(\"GC_wall_seconds\", \"%.2f\")\n"
+ " ]\n";
+ }
+ else { // single-line summary delimited by "<<ghc:" and ":ghc>>"
+ fmt1 = "<<ghc: %llu bytes, ";
+ fmt2 = "%d GCs, %ld/%ld avg/max bytes residency (%ld samples), %luM in use, %.2f INIT (%.2f elapsed), %.2f MUT (%.2f elapsed), %.2f GC (%.2f elapsed) :ghc>>\n";
+ }
/* print the long long separately to avoid bugginess on mingwin (2001-07-02, mingw-0.5) */
- statsPrintf("<<ghc: %llu bytes, ", GC_tot_alloc*(ullong)sizeof(W_));
- statsPrintf("%d GCs, %ld/%ld avg/max bytes residency (%ld samples), %luM in use, %.2f INIT (%.2f elapsed), %.2f MUT (%.2f elapsed), %.2f GC (%.2f elapsed) :ghc>>\n",
+ statsPrintf(fmt1, GC_tot_alloc*(ullong)sizeof(W_));
+ statsPrintf(fmt2,
total_collections,
ResidencySamples == 0 ? 0 :
AvgResidency*sizeof(W_)/ResidencySamples,
TICK_TO_DBL(GC_tot_time), TICK_TO_DBL(GCe_tot_time));
}
-#if defined(THREADED_RTS) && defined(PROF_SPIN)
- {
- nat g, s;
-
- statsPrintf("recordMutableGen_sync: %"FMT_Word64"\n", recordMutableGen_sync.spin);
- statsPrintf("gc_alloc_block_sync: %"FMT_Word64"\n", gc_alloc_block_sync.spin);
- statsPrintf("whitehole_spin: %"FMT_Word64"\n", whitehole_spin);
- for (g = 0; g < RtsFlags.GcFlags.generations; g++) {
- for (s = 0; s < generations[g].n_steps; s++) {
- statsPrintf("gen[%d].steps[%d].sync_todo: %"FMT_Word64"\n", g, s, generations[g].steps[s].sync_todo.spin);
- statsPrintf("gen[%d].steps[%d].sync_large_objects: %"FMT_Word64"\n", g, s, generations[g].steps[s].sync_large_objects.spin);
- }
- }
- }
-#endif
-
statsFlush();
statsClose();
}