Add a randomized start before running CheckMonitors.

This commit is contained in:
Ryan Breen 2014-12-17 21:44:12 -05:00
parent c728cb7cde
commit 60dacecb39
1 changed files with 23 additions and 1 deletions

View File

@ -5,6 +5,7 @@ import (
"github.com/armon/circbuf" "github.com/armon/circbuf"
"github.com/hashicorp/consul/consul/structs" "github.com/hashicorp/consul/consul/structs"
"log" "log"
"math/rand"
"os/exec" "os/exec"
"sync" "sync"
"syscall" "syscall"
@ -91,9 +92,30 @@ func (c *CheckMonitor) Stop() {
} }
} }
// getInitialPauseTime returns the random duration we should wait before starting this CheckMonitor,
// preventing potentially large numbers of checks from firing concurrently by staggering their starts.
func (c *CheckMonitor) getInitialPauseTime() time.Duration {
var initialPauseTime time.Duration
intervalSeconds := int(c.Interval.Seconds())
if intervalSeconds > 0 {
// If the check interval is greater than 500ms, as it will be in all real-world cases due to the
// application of MinInterval, start after some random number of seconds between 0 and c.Interval
initialPauseTime = time.Duration(rand.Intn(intervalSeconds)) * time.Second
} else {
// Test cases may use sub-second intervals. In this case, return 0 as the pause duration.
initialPauseTime = time.Duration(0)
}
return initialPauseTime
}
// run is invoked by a goroutine to run until Stop() is called // run is invoked by a goroutine to run until Stop() is called
func (c *CheckMonitor) run() { func (c *CheckMonitor) run() {
next := time.After(0)
// Get the randomized initial pause time
initialPauseTime := c.getInitialPauseTime()
c.Logger.Printf("[DEBUG] agent: pausing %ds before first invocation of %s", initialPauseTime, c.Script)
next := time.After(initialPauseTime)
for { for {
select { select {
case <-next: case <-next: