Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Only read the commit log once during bootstrapping #2645

Merged
merged 6 commits into from
Sep 17, 2020
Merged
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
148 changes: 97 additions & 51 deletions src/dbnode/storage/bootstrap/bootstrapper/commitlog/source.go
Original file line number Diff line number Diff line change
Expand Up @@ -46,6 +46,7 @@ import (
"github.com/m3db/m3/src/x/pool"
xtime "github.com/m3db/m3/src/x/time"

"github.com/opentracing/opentracing-go"
"github.com/uber-go/tally"
"go.uber.org/zap"
)
Expand All @@ -72,6 +73,11 @@ type commitLogSource struct {
newReaderFn newReaderFn

metrics commitLogSourceMetrics
// Cache the results of reading the commit log between passes. The commit log is not sharded by time range, so the
// entire log needs to be read irrespective of the configured time ranges for the pass. The commit log only needs
// to be read once (during the first pass) and the results can be subsequently cached and returned on future passes.
// Since the bootstrapper is single threaded this does not need to be guarded with a mutex.
commitLogResult commitLogResult
}

type bootstrapNamespace struct {
Expand Down Expand Up @@ -177,14 +183,10 @@ func (s *commitLogSource) Read(

var (
// Emit bootstrapping gauge for duration of ReadData.
doneReadingData = s.metrics.emitBootstrapping()
encounteredCorruptData = false
fsOpts = s.opts.CommitLogOptions().FilesystemOptions()
filePathPrefix = fsOpts.FilePathPrefix()
namespaceIter = namespaces.Namespaces.Iter()
namespaceResults = make(map[string]*readNamespaceResult, len(namespaceIter))
setInitialTopologyState bool
initialTopologyState *topology.StateSnapshot
doneReadingData = s.metrics.emitBootstrapping()
fsOpts = s.opts.CommitLogOptions().FilesystemOptions()
filePathPrefix = fsOpts.FilePathPrefix()
namespaceIter = namespaces.Namespaces.Iter()
)
defer doneReadingData()

Expand All @@ -206,17 +208,6 @@ func (s *commitLogSource) Read(
shardTimeRanges.AddRanges(ns.IndexRunOptions.TargetShardTimeRanges)
}

namespaceResults[ns.Metadata.ID().String()] = &readNamespaceResult{
namespace: ns,
dataAndIndexShardRanges: shardTimeRanges,
}

// Make the initial topology state available.
if !setInitialTopologyState {
setInitialTopologyState = true
initialTopologyState = ns.DataRunOptions.RunOptions.InitialTopologyState()
}

// Determine which snapshot files are available.
snapshotFilesByShard, err := s.snapshotFilesByShard(
ns.Metadata.ID(), filePathPrefix, shardTimeRanges)
Expand Down Expand Up @@ -246,10 +237,56 @@ func (s *commitLogSource) Read(
zap.Duration("took", s.nowFn().Sub(startSnapshotsRead)))
span.LogEvent("read_snapshots_done")

commitLogResult, err := s.readCommitLog(namespaces, span)
Copy link
Collaborator Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Unfortunately the diff is not great. I essentially moved all of the commit log reading logic into a new method, readCommitLog. Additionally, I changed the for loop below to iterate over the provided namespaces rather than the namespace results from the commit log. It didn't seem necessary to use the results in the for loop, and this allowed the results to remain private to the new method.

if err != nil {
return bootstrap.NamespaceResults{}, err
}

bootstrapResult := bootstrap.NamespaceResults{
Results: bootstrap.NewNamespaceResultsMap(bootstrap.NamespaceResultsMapOptions{}),
}
for _, elem := range namespaceIter {
ns := elem.Value()
id := ns.Metadata.ID()
dataResult := result.NewDataBootstrapResult()
if commitLogResult.shouldReturnUnfulfilled {
shardTimeRanges := ns.DataRunOptions.ShardTimeRanges
dataResult = shardTimeRanges.ToUnfulfilledDataResult()
}
var indexResult result.IndexBootstrapResult
if ns.Metadata.Options().IndexOptions().Enabled() {
indexResult = result.NewIndexBootstrapResult()
if commitLogResult.shouldReturnUnfulfilled {
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

nit: we could move up the nesting of this logic so we don't need to perform the same check twice.

Copy link
Collaborator Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I don't think we can, since you're already inside a conditional branch for IndexOptions.

shardTimeRanges := ns.IndexRunOptions.ShardTimeRanges
indexResult = shardTimeRanges.ToUnfulfilledIndexResult()
}
}
bootstrapResult.Results.Set(id, bootstrap.NamespaceResult{
Metadata: ns.Metadata,
Shards: ns.Shards,
DataResult: dataResult,
IndexResult: indexResult,
})
}

return bootstrapResult, nil
}

// commitLogResult is the cached outcome of a single read of the commit log,
// stored on commitLogSource so subsequent bootstrap passes can reuse it
// instead of re-reading the entire commit log.
type commitLogResult struct {
	// shouldReturnUnfulfilled indicates whether the bootstrap results built
	// from this read should mark their shard time ranges as unfulfilled
	// (e.g. after encountering corrupt data).
	shouldReturnUnfulfilled bool
	// read is true once the commit log has been read; readCommitLog checks
	// this to skip the read and return the cached result on later passes.
	read bool
}

func (s *commitLogSource) readCommitLog(namespaces bootstrap.Namespaces, span opentracing.Span) (commitLogResult, error) {
if s.commitLogResult.read {
s.log.Debug("commit log already read in a previous pass. skipping and returning previous result. ")
return s.commitLogResult, nil
}

// Setup the series accumulator pipeline.
var (
numWorkers = s.opts.AccumulateConcurrency()
workers = make([]*accumulateWorker, 0, numWorkers)
numWorkers = s.opts.AccumulateConcurrency()
workers = make([]*accumulateWorker, 0, numWorkers)
)
for i := 0; i < numWorkers; i++ {
worker := &accumulateWorker{
Expand All @@ -270,6 +307,37 @@ func (s *commitLogSource) Read(
// NB(r): Ensure that channels always get closed.
defer closeWorkerChannels()

var(
namespaceIter = namespaces.Namespaces.Iter()
namespaceResults = make(map[string]*readNamespaceResult, len(namespaceIter))
setInitialTopologyState bool
initialTopologyState *topology.StateSnapshot
)
for _, elem := range namespaceIter {
ns := elem.Value()

// NB(r): Combine all shard time ranges across data and index
// so we can do in one go.
shardTimeRanges := result.NewShardTimeRanges()
// NB(bodu): Use TargetShardTimeRanges which covers the entire original target shard range
// since the commitlog bootstrapper should run for the entire bootstrappable range per shard.
shardTimeRanges.AddRanges(ns.DataRunOptions.TargetShardTimeRanges)
if ns.Metadata.Options().IndexOptions().Enabled() {
shardTimeRanges.AddRanges(ns.IndexRunOptions.TargetShardTimeRanges)
}

namespaceResults[ns.Metadata.ID().String()] = &readNamespaceResult{
namespace: ns,
dataAndIndexShardRanges: shardTimeRanges,
}

// Make the initial topology state available.
if !setInitialTopologyState {
setInitialTopologyState = true
initialTopologyState = ns.DataRunOptions.RunOptions.InitialTopologyState()
}
}

// Setup the commit log iterator.
var (
iterOpts = commitlog.IteratorOpts{
Expand All @@ -285,6 +353,7 @@ func (s *commitLogSource) Read(
datapointsSkippedNotBootstrappingShard = 0
datapointsSkippedShardNoLongerOwned = 0
startCommitLogsRead = s.nowFn()
encounteredCorruptData = false
)
s.log.Info("read commit logs start")
span.LogEvent("read_commitlogs_start")
Expand All @@ -305,7 +374,7 @@ func (s *commitLogSource) Read(
iter, corruptFiles, err := s.newIteratorFn(iterOpts)
if err != nil {
err = fmt.Errorf("unable to create commit log iterator: %v", err)
return bootstrap.NamespaceResults{}, err
return commitLogResult{}, err
}

if len(corruptFiles) > 0 {
Expand Down Expand Up @@ -446,7 +515,7 @@ func (s *commitLogSource) Read(
commitLogSeries[seriesKey] = seriesMapEntry{shardNoLongerOwned: true}
continue
}
return bootstrap.NamespaceResults{}, err
return commitLogResult{}, err
}

seriesEntry = seriesMapEntry{
Expand Down Expand Up @@ -518,36 +587,13 @@ func (s *commitLogSource) Read(
shouldReturnUnfulfilled, err := s.shouldReturnUnfulfilled(
workers, encounteredCorruptData, initialTopologyState)
if err != nil {
return bootstrap.NamespaceResults{}, err
return commitLogResult{}, err
}

bootstrapResult := bootstrap.NamespaceResults{
Results: bootstrap.NewNamespaceResultsMap(bootstrap.NamespaceResultsMapOptions{}),
}
for _, ns := range namespaceResults {
id := ns.namespace.Metadata.ID()
dataResult := result.NewDataBootstrapResult()
if shouldReturnUnfulfilled {
shardTimeRanges := ns.namespace.DataRunOptions.ShardTimeRanges
dataResult = shardTimeRanges.ToUnfulfilledDataResult()
}
var indexResult result.IndexBootstrapResult
if ns.namespace.Metadata.Options().IndexOptions().Enabled() {
indexResult = result.NewIndexBootstrapResult()
if shouldReturnUnfulfilled {
shardTimeRanges := ns.namespace.IndexRunOptions.ShardTimeRanges
indexResult = shardTimeRanges.ToUnfulfilledIndexResult()
}
}
bootstrapResult.Results.Set(id, bootstrap.NamespaceResult{
Metadata: ns.namespace.Metadata,
Shards: ns.namespace.Shards,
DataResult: dataResult,
IndexResult: indexResult,
})
s.commitLogResult = commitLogResult{
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

nit: It's a little awkward to set it here and use the set value as the return value. We also use the return value after the function call. Maybe it's better to either have no return or return the value and let the caller do the setting?

Copy link
Collaborator Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Yeah, I don't have a strong opinion about this since it's all private local state anyway. I'll just update it so the main function controls the caching logic and decides whether it should actually call readCommitLog.

shouldReturnUnfulfilled: shouldReturnUnfulfilled,
read: true,
}

return bootstrapResult, nil
return s.commitLogResult, nil
}

func (s *commitLogSource) snapshotFilesByShard(
Expand Down