From 32adda2d3dabcd582238f9cd4ac9bcd1d6c908d7 Mon Sep 17 00:00:00 2001 From: sumeerbhola Date: Thu, 28 Sep 2023 15:24:02 -0400 Subject: [PATCH] goschedstats: reduce underloadedRunnablePerProcThreshold By reducing this threshold, we more often sample the stats at 1ms intervals, which is desirable for admission control slot adjustment. Fixes #111125 Epic: none Release note: None --- pkg/util/goschedstats/runnable.go | 13 ++++++++++--- 1 file changed, 10 insertions(+), 3 deletions(-) diff --git a/pkg/util/goschedstats/runnable.go b/pkg/util/goschedstats/runnable.go index 3f1a60fed778..ed3238bae273 100644 --- a/pkg/util/goschedstats/runnable.go +++ b/pkg/util/goschedstats/runnable.go @@ -67,9 +67,16 @@ var _ = numRunnableGoroutines const samplePeriodShort = time.Millisecond const samplePeriodLong = 250 * time.Millisecond -// The system is underloaded if the number of runnable goroutines per proc -// is below this threshold. -const underloadedRunnablePerProcThreshold = 1 * toFixedPoint +// The system is underloaded if the number of runnable goroutines per proc is +// below this threshold. We have observed that steady workloads (like kv0), +// can have 50% cpu utilization and < 0.2 runnable goroutines per proc. We +// want to err on the side of a lower threshold since the samplePeriodShort +// regime allows admission control to react faster to fluctuations in runnable +// goroutines -- real world workloads sometimes have very spiky CPU +// utilization (see the graphs in +// https://github.com/cockroachdb/cockroach/issues/111125). So we set this to +// 0.1 runnable goroutine per proc. +const underloadedRunnablePerProcThreshold = 1 * toFixedPoint / 10 // We "report" the average value every reportingPeriod. // Note: if this is changed from 1s, CumulativeNormalizedRunnableGoroutines()