From 867d20ede8c9193f437d8f2ed7385d9e983d8f3e Mon Sep 17 00:00:00 2001 From: Nish Krishnan Date: Tue, 18 May 2021 15:17:21 -0700 Subject: [PATCH] [ORCA-782] Add some more metrics and logic to delete 30 days old pulls. (#75) --- .../events/events_controller_e2e_test.go | 9 ++-- server/events/event_parser.go | 2 + server/events/models/models.go | 2 + server/events/pull_closed_executor.go | 24 +++++++--- server/events/pull_closed_executor_test.go | 26 ++++++----- server/scheduled_executor_service.go | 44 ++++++++++++++++--- server/server.go | 21 ++++++--- 7 files changed, 96 insertions(+), 32 deletions(-) diff --git a/server/controllers/events/events_controller_e2e_test.go b/server/controllers/events/events_controller_e2e_test.go index 65e37c9411..e8fb8e8cbb 100644 --- a/server/controllers/events/events_controller_e2e_test.go +++ b/server/controllers/events/events_controller_e2e_test.go @@ -1063,10 +1063,11 @@ func setupE2E(t *testing.T, repoDir string) (events_controllers.VCSEventsControl TestingMode: true, CommandRunner: commandRunner, PullCleaner: &events.PullClosedExecutor{ - Locker: lockingClient, - VCSClient: e2eVCSClient, - WorkingDir: workingDir, - DB: boltdb, + Locker: lockingClient, + VCSClient: e2eVCSClient, + WorkingDir: workingDir, + DB: boltdb, + PullClosedTemplate: &events.PullClosedEventTemplate{}, }, Logger: logger, Parser: eventParser, diff --git a/server/events/event_parser.go b/server/events/event_parser.go index 029b08c2eb..ef663ec64f 100644 --- a/server/events/event_parser.go +++ b/server/events/event_parser.go @@ -514,6 +514,7 @@ func (e *EventParser) ParseGithubPull(pull *github.PullRequest) (pullModel model pullState := models.ClosedPullState closedAt := pull.GetClosedAt() + updatedAt := pull.GetUpdatedAt() if pull.GetState() == "open" { pullState = models.OpenPullState } @@ -528,6 +529,7 @@ func (e *EventParser) ParseGithubPull(pull *github.PullRequest) (pullModel model BaseRepo: baseRepo, BaseBranch: baseBranch, ClosedAt: closedAt, + UpdatedAt: updatedAt, } return } diff --git a/server/events/models/models.go b/server/events/models/models.go index 11947153be..072274b151 100644 --- a/server/events/models/models.go +++ b/server/events/models/models.go @@ -171,6 +171,8 @@ type PullRequest struct { State PullRequestState // BaseRepo is the repository that the pull request will be merged into. BaseRepo Repo + // UpdatedAt is the time the PR was last updated. + UpdatedAt time.Time // ClosedAt is the time the PR was closed. This is nil if the PR is open ClosedAt time.Time } diff --git a/server/events/pull_closed_executor.go b/server/events/pull_closed_executor.go index 2ecaebe042..3e6521a18d 100644 --- a/server/events/pull_closed_executor.go +++ b/server/events/pull_closed_executor.go @@ -16,6 +16,7 @@ package events import ( "bytes" "fmt" + "io" "sort" "strings" "text/template" @@ -42,11 +43,12 @@ type PullCleaner interface { // PullClosedExecutor executes the tasks required to clean up a closed pull // request. type PullClosedExecutor struct { - Locker locking.Locker - VCSClient vcs.Client - WorkingDir WorkingDir - Logger logging.SimpleLogging - DB *db.BoltDB + Locker locking.Locker + VCSClient vcs.Client + WorkingDir WorkingDir + Logger logging.SimpleLogging + DB *db.BoltDB + PullClosedTemplate PullCleanupTemplate } type templatedProject struct { @@ -54,6 +56,16 @@ type templatedProject struct { Workspaces string } +type PullCleanupTemplate interface { + Execute(wr io.Writer, data interface{}) error +} + +type PullClosedEventTemplate struct{} + +func (t *PullClosedEventTemplate) Execute(wr io.Writer, data interface{}) error { + return pullClosedTemplate.Execute(wr, data) +} + var pullClosedTemplate = template.Must(template.New("").Parse( "Locks and plans deleted for the projects and workspaces modified in this pull request:\n" + "{{ range . }}\n" + @@ -85,7 +97,7 @@ func (p *PullClosedExecutor) CleanUpPull(repo models.Repo, pull models.PullReque templateData := p.buildTemplateData(locks) var buf bytes.Buffer - if err = pullClosedTemplate.Execute(&buf, templateData); err != nil { + if err = p.PullClosedTemplate.Execute(&buf, templateData); err != nil { return errors.Wrap(err, "rendering template for comment") } return p.VCSClient.CreateComment(repo, pull.Num, buf.String(), "") diff --git a/server/events/pull_closed_executor_test.go b/server/events/pull_closed_executor_test.go index e5d5953bbf..d692ce4ae0 100644 --- a/server/events/pull_closed_executor_test.go +++ b/server/events/pull_closed_executor_test.go @@ -35,7 +35,8 @@ func TestCleanUpPullWorkspaceErr(t *testing.T) { RegisterMockTestingT(t) w := mocks.NewMockWorkingDir() pce := events.PullClosedExecutor{ - WorkingDir: w, + WorkingDir: w, + PullClosedTemplate: &events.PullClosedEventTemplate{}, } err := errors.New("err") When(w.Delete(fixtures.GithubRepo, fixtures.Pull)).ThenReturn(err) @@ -49,8 +50,9 @@ func TestCleanUpPullUnlockErr(t *testing.T) { w := mocks.NewMockWorkingDir() l := lockmocks.NewMockLocker() pce := events.PullClosedExecutor{ - Locker: l, - WorkingDir: w, + Locker: l, + WorkingDir: w, + PullClosedTemplate: &events.PullClosedEventTemplate{}, } err := errors.New("err") When(l.UnlockByPull(fixtures.GithubRepo.FullName, fixtures.Pull.Num)).ThenReturn(nil, err) @@ -69,10 +71,11 @@ func TestCleanUpPullNoLocks(t *testing.T) { db, err := db.New(tmp) Ok(t, err) pce := events.PullClosedExecutor{ - Locker: l, - VCSClient: cp, - WorkingDir: w, - DB: db, + Locker: l, + VCSClient: cp, + WorkingDir: w, + DB: db, + PullClosedTemplate: &events.PullClosedEventTemplate{}, } When(l.UnlockByPull(fixtures.GithubRepo.FullName, fixtures.Pull.Num)).ThenReturn(nil, nil) err = pce.CleanUpPull(fixtures.GithubRepo, fixtures.Pull) @@ -155,10 +158,11 @@ func TestCleanUpPullComments(t *testing.T) { db, err := db.New(tmp) Ok(t, err) pce := events.PullClosedExecutor{ - Locker: l, - VCSClient: cp, - WorkingDir: w, - DB: db, + Locker: l, + VCSClient: cp, + WorkingDir: w, + DB: db, + PullClosedTemplate: &events.PullClosedEventTemplate{}, } t.Log("testing: " + c.Description) When(l.UnlockByPull(fixtures.GithubRepo.FullName, fixtures.Pull.Num)).ThenReturn(c.Locks, nil) diff --git a/server/scheduled_executor_service.go b/server/scheduled_executor_service.go index eb868110cc..7a7ad1b2d7 100644 --- a/server/scheduled_executor_service.go +++ b/server/scheduled_executor_service.go @@ -1,14 +1,17 @@ package server import ( + "io" "os" "os/signal" "strconv" "syscall" + "text/template" "time" stats "github.com/lyft/gostats" "github.com/runatlantis/atlantis/server/events" + "github.com/runatlantis/atlantis/server/events/metrics" "github.com/runatlantis/atlantis/server/events/models" "github.com/runatlantis/atlantis/server/logging" ) @@ -24,11 +27,13 @@ func NewScheduledExecutorService( workingDirIterator events.WorkDirIterator, statsScope stats.Scope, log logging.SimpleLogging, + pullCleaner events.PullCleaner, ) *ScheduledExecutorService { garbageCollector := &GarbageCollector{ workingDirIterator: workingDirIterator, stats: statsScope.Scope("scheduled.garbagecollector"), log: log, + cleaner: pullCleaner, } garbageCollectorCron := CronDefinition{ @@ -76,20 +81,36 @@ type Job interface { Run() } +var gcStaleClosedPullTemplate = template.Must(template.New("").Parse( + "Pull Request has been closed for 30 days. Atlantis GC has deleted the locks and plans for the following projects and workspaces:\n" + + "{{ range . }}\n" + + "- dir: `{{ .RepoRelDir }}` {{ .Workspaces }}{{ end }}")) + +type GCStalePullTemplate struct{} + +func (t *GCStalePullTemplate) Execute(wr io.Writer, data interface{}) error { + return gcStaleClosedPullTemplate.Execute(wr, data) +} + type GarbageCollector struct { workingDirIterator events.WorkDirIterator stats stats.Scope log logging.SimpleLogging + cleaner events.PullCleaner } func (g *GarbageCollector) Run() { + errCounter := g.stats.NewCounter(metrics.ExecutionErrorMetric) + pulls, err := g.workingDirIterator.ListCurrentWorkingDirPulls() if err != nil { g.log.Err("error listing pulls %s", err) + errCounter.Inc() } openPullsCounter := g.stats.NewCounter("pulls.open") + updatedthirtyDaysAgoOpenPullsCounter := g.stats.NewCounter("pulls.open.updated.thirtydaysago") closedPullsCounter := g.stats.NewCounter("pulls.closed") thirtyDaysAgoClosedPullsCounter := g.stats.NewCounter("pulls.closed.thirtydaysago") fiveMinutesAgoClosedPullsCounter := g.stats.NewCounter("pulls.closed.fiveminutesago") @@ -101,29 +122,40 @@ func (g *GarbageCollector) Run() { for _, pull := range pulls { logger := g.log.With(fmtLogSrc(pull.BaseRepo, pull.Num)...) + if pull.State == models.OpenPullState { - logger.Debug("pull #%d is open", pull.Num) openPullsCounter.Inc() + + if pull.UpdatedAt.Before(thirtyDaysAgo) { + updatedthirtyDaysAgoOpenPullsCounter.Inc() + + logger.Warn("Pull hasn't been updated for more than 30 days.") + } continue } // assume only other state is closed closedPullsCounter.Inc() - logger.Debug("pull #%d is closed but data still on disk", pull.Num) - - // TODO: update this to actually go ahead and delete things if pull.ClosedAt.Before(thirtyDaysAgo) { thirtyDaysAgoClosedPullsCounter.Inc() - logger.Info("Pull closed for more than 30 days but data still on disk") + logger.Warn("Pull closed for more than 30 days but data still on disk") + + err := g.cleaner.CleanUpPull(pull.BaseRepo, pull) + + if err != nil { + logger.Err("Error cleaning up 30 days old closed pulls %s", err) + errCounter.Inc() + return + } } // This will allow us to catch leaks as soon as they happen (hopefully) if pull.ClosedAt.Before(fiveMinutesAgo) { fiveMinutesAgoClosedPullsCounter.Inc() - logger.Info("Pull closed for more than 5 minutes but data still on disk") + logger.Warn("Pull closed for more than 5 minutes but data still on disk") } } } diff --git a/server/server.go b/server/server.go index dc48d17b26..fdcbb68a4b 100644 --- a/server/server.go +++ b/server/server.go @@ -401,11 +401,12 @@ func NewServer(userConfig UserConfig, config Config) (*Server, error) { statsScope, logger, &events.PullClosedExecutor{ - VCSClient: vcsClient, - Locker: lockingClient, - WorkingDir: workingDir, - Logger: logger, - DB: boltdb, + VCSClient: vcsClient, + Locker: lockingClient, + WorkingDir: workingDir, + Logger: logger, + DB: boltdb, + PullClosedTemplate: &events.PullClosedEventTemplate{}, }, ) eventParser := &events.EventParser{ @@ -685,6 +686,16 @@ func NewServer(userConfig UserConfig, config Config) (*Server, error) { ), statsScope, logger, + &events.PullClosedExecutor{ + VCSClient: vcsClient, + Locker: lockingClient, + WorkingDir: workingDir, + Logger: logger, + DB: boltdb, + + // using a specific template to signal that this is from an async process + PullClosedTemplate: &GCStalePullTemplate{}, + }, ) return &Server{