[dbnode] Cross-block series reader #2481

Merged: 27 commits, Aug 11, 2020
Commits:

cf04c4b  [dbnode] Add OrderedByIndex option for DataFileSetReader.Open (linasm, Jul 14, 2020)
c55c21c  Merge branch 'large-tiles-aggregation' into linas/sorted-read (linasm, Jul 23, 2020)
76f5379  [dbnode] Cross block series reader (linasm, Jul 22, 2020)
6499aca  Assert on OrderedByIndex (linasm, Jul 22, 2020)
92d7758  Tests (linasm, Jul 23, 2020)
1211434  Mocks (linasm, Jul 23, 2020)
f3dead9  Dont test just the happy path (linasm, Jul 23, 2020)
3bddd14  Addressed review feedback (linasm, Jul 25, 2020)
8f68dd5  Legal stuff (linasm, Jul 25, 2020)
a456c95  Group Read() results by id (linasm, Aug 4, 2020)
cb60730  Remodel CrossBlockReader as an Iterator (linasm, Aug 4, 2020)
4a2749d  Mockgen (linasm, Aug 4, 2020)
83845d2  Erase slice contents before draining them (linasm, Aug 5, 2020)
0f41464  Merge branch 'large-tiles-aggregation' into linas/sorted-read (linasm, Aug 5, 2020)
367551a  Align with master (linasm, Aug 5, 2020)
f1402cf  Merge branch 'linas/sorted-read' into linasm/cross-block-series-reader (linasm, Aug 5, 2020)
3f3b493  Make a defensive copy of dataFileSetReaders (linasm, Aug 5, 2020)
6a1912f  Fuse else / if (linasm, Aug 10, 2020)
bbf26f9  Merge remote-tracking branch 'origin/linas/sorted-read' into linasm/c… (linasm, Aug 10, 2020)
8081417  Address feedback (linasm, Aug 10, 2020)
dd207d1  Mockgen (linasm, Aug 10, 2020)
21e4b13  Fix test (linasm, Aug 10, 2020)
a766cf4  Better conversion to string (linasm, Aug 10, 2020)
29f3b25  Address review feedback (linasm, Aug 11, 2020)
28c0cab  Check for duplicate ids (linasm, Aug 11, 2020)
79ee91b  Further feedback (linasm, Aug 11, 2020)
e19830b  Duplicate id is an invariant violation (linasm, Aug 11, 2020)
67 changes: 45 additions & 22 deletions src/dbnode/persist/fs/cross_block_reader.go
@@ -34,13 +34,16 @@ import (
 )

 var (
-	errReaderNotOrderedByIndex = errors.New("CrossBlockReader can only use DataFileSetReaders ordered by index")
-	_ heap.Interface = (*minHeap)(nil)
+	errReaderNotOrderedByIndex = errors.New("CrossBlockReader can only use DataFileSetReaders ordered by index")
+	errEmptyReader             = errors.New("trying to read from empty reader")
+	_ heap.Interface = (*minHeap)(nil)
 )

 type crossBlockReader struct {
 	dataFileSetReaders []DataFileSetReader
-	activeReadersCount int
+	id                 ident.ID
+	tags               ident.TagIterator
+	records            []BlockRecord
 	initialized        bool
 	minHeap            minHeap
 	err                error
@@ -63,51 +66,66 @@ func NewCrossBlockReader(dataFileSetReaders []DataFileSetReader) (CrossBlockReader, error) {
 		previousStart = currentStart
 	}

-	return &crossBlockReader{dataFileSetReaders: dataFileSetReaders, activeReadersCount: len(dataFileSetReaders)}, nil
+	return &crossBlockReader{
+		dataFileSetReaders: dataFileSetReaders,
+		records:            make([]BlockRecord, 0, len(dataFileSetReaders)),
+	}, nil
 }

-func (r *crossBlockReader) Read() (id ident.ID, tags ident.TagIterator, datas []checked.Bytes, checksums []uint32, err error) {
+func (r *crossBlockReader) Next() bool {
 	if !r.initialized {
-		r.initialized = true
 		err := r.init()
 		if err != nil {
-			return nil, nil, nil, nil, err
+			r.err = err
+			return false
 		}
 	}

+	if len(r.minHeap) == 0 {
+		return false
+	}
+
 	firstEntry, err := r.readOne()
 	if err != nil {
-		return nil, nil, nil, nil, err
+		r.err = err
+		return false
 	}

-	datas = make([]checked.Bytes, 0, r.activeReadersCount)
-	checksums = make([]uint32, 0, r.activeReadersCount)
+	r.id = firstEntry.id
+	r.tags = firstEntry.tags

-	datas = append(datas, firstEntry.data)
-	checksums = append(checksums, firstEntry.checksum)
+	r.records = r.records[:0]
+	r.records = append(r.records, BlockRecord{firstEntry.data, firstEntry.checksum})

 	for len(r.minHeap) > 0 && r.minHeap[0].id.Equal(firstEntry.id) {
 		nextEntry, err := r.readOne()
 		if err != nil {
-			// Finalize what was already read:
-			for _, data := range datas {
-				data.DecRef()
-				data.Finalize()
+			// Close the resources that were already read but not returned to the consumer:
+			r.id.Finalize()
+			r.tags.Close()
+			for _, record := range r.records {
+				record.Data.DecRef()
+				record.Data.Finalize()
 			}
-			return nil, nil, nil, nil, err
+			r.records = r.records[:0]
+			r.err = err
+			return false
 		}
 		nextEntry.id.Finalize()
 		nextEntry.tags.Close()
-		datas = append(datas, nextEntry.data)
-		checksums = append(checksums, nextEntry.checksum)
+		r.records = append(r.records, BlockRecord{nextEntry.data, nextEntry.checksum})
Review thread (resolved):

Collaborator: nit: is it worth having a sanity check to see that len(r.records) <= len(dataFileSetReaders)? Otherwise we necessarily have a duplicate ID in one of the readers.

Author (linasm): Good point, except that len(dataFileSetReaders) is not the best indicator of duplicate ids, because I invalidate (set to nil) already-exhausted dataFileSetReaders and don't track the number of still-valid ones. Instead, I implemented a more direct check for duplicate ids in readOne (and pushed it as a separate commit for clarity). I'm just not completely sure whether, for our use case, it would make more sense to return an error and fail the whole process, or to skip the duplicate. What do you think?

Author (linasm): As per our conversation, keeping the error approach, and reporting it as an invariant violation.
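For illustration, a sketch of what that readOne-level check could look like; it is hedged against the diff above, not the merged code, and fmt.Errorf stands in for whatever invariant-reporting helper the final commit actually uses:

// Illustrative only: after popping the smallest entry in readOne, peek at the
// next entry from the same reader. Each DataFileSetReader is ordered by id,
// so a duplicate id within one fileset must surface as the very next entry.
nextEntry, err := r.readFromDataFileSet(entry.dataFileSetReaderIndex)
if err == io.EOF {
	// This reader is exhausted; stop reading from it.
	r.dataFileSetReaders[entry.dataFileSetReaderIndex] = nil
} else if err != nil {
	return nil, err
} else if nextEntry.id.Equal(entry.id) {
	// Assumed error construction; reported as an invariant violation.
	return nil, fmt.Errorf("invariant violation: duplicate id %s in reader %d",
		entry.id, entry.dataFileSetReaderIndex)
} else {
	heap.Push(&r.minHeap, nextEntry)
}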

 	}

-	return firstEntry.id, firstEntry.tags, datas, checksums, nil
+	return true
 }

+func (r *crossBlockReader) Current() (ident.ID, ident.TagIterator, []BlockRecord) {
+	return r.id, r.tags, r.records
+}
+
 func (r *crossBlockReader) readOne() (*minHeapEntry, error) {
 	if len(r.minHeap) == 0 {
-		return nil, io.EOF
+		return nil, errEmptyReader
 	}

 	entry := heap.Pop(&r.minHeap).(*minHeapEntry)
@@ -116,7 +134,6 @@ func (r *crossBlockReader) readOne() (*minHeapEntry, error) {
 	if err == io.EOF {
 		// will no longer read from this one
 		r.dataFileSetReaders[entry.dataFileSetReaderIndex] = nil
-		r.activeReadersCount--
 	} else if err != nil {
 		return nil, err
 	} else {
@@ -128,6 +145,7 @@ func (r *crossBlockReader) readOne() (*minHeapEntry, error) {
 }

 func (r *crossBlockReader) init() error {
+	r.initialized = true
 	r.minHeap = make([]*minHeapEntry, 0, len(r.dataFileSetReaders))

 	for i := range r.dataFileSetReaders {
@@ -169,7 +187,12 @@ func (r *crossBlockReader) readFromDataFileSet(index int) (*minHeapEntry, error) {
 	}, nil
 }

+func (r *crossBlockReader) Err() error {
+	return r.err
+}
+
 func (r *crossBlockReader) Close() error {
+	// Close the resources that were buffered in minHeap:
 	for _, entry := range r.minHeap {
 		entry.id.Finalize()
 		entry.tags.Close()
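The core of the reader is a k-way merge over per-block filesets via container/heap, ordered by series id first and block start next (the guarantee CrossBlockReader documents in types.go below). A self-contained sketch of that comparator pattern follows; the entry type is a simplification assumed for illustration, not the actual minHeapEntry:

package main

import (
	"bytes"
	"container/heap"
	"fmt"
)

// entry is a simplified stand-in for the reader's heap entries.
type entry struct {
	id         []byte
	blockStart int64
}

// entryHeap orders entries by series id first, block start time next.
type entryHeap []entry

func (h entryHeap) Len() int      { return len(h) }
func (h entryHeap) Swap(i, j int) { h[i], h[j] = h[j], h[i] }
func (h entryHeap) Less(i, j int) bool {
	if c := bytes.Compare(h[i].id, h[j].id); c != 0 {
		return c < 0
	}
	return h[i].blockStart < h[j].blockStart
}
func (h *entryHeap) Push(x interface{}) { *h = append(*h, x.(entry)) }
func (h *entryHeap) Pop() interface{} {
	old := *h
	e := old[len(old)-1]
	*h = old[:len(old)-1]
	return e
}

func main() {
	// One pending entry per fileset reader; popping always yields the
	// globally smallest (id, blockStart) pair.
	h := &entryHeap{{[]byte("id2"), 1}, {[]byte("id1"), 2}, {[]byte("id1"), 1}}
	heap.Init(h)
	for h.Len() > 0 {
		e := heap.Pop(h).(entry)
		fmt.Printf("%s @ %d\n", e.id, e.blockStart) // id1 @ 1, id1 @ 2, id2 @ 1
	}
}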
36 changes: 13 additions & 23 deletions src/dbnode/persist/fs/cross_block_reader_test.go
@@ -83,7 +83,8 @@ func TestCrossBlockReader(t *testing.T) {
 		{"many readers with different series", [][]string{{"id1"}, {"id2"}, {"id3"}}},
 		{"many readers with unordered series", [][]string{{"id3"}, {"id1"}, {"id2"}}},
 		{"complex case", [][]string{{"id2", "id3", "id5"}, {"id1", "id2", "id4"}, {"id1", "id4"}}},
-		{"reader error", [][]string{{"id1", "id2"}, {"id1", "error"}}},
+		{"immediate reader error", [][]string{{"error"}}},
+		{"reader error later", [][]string{{"id1", "id2"}, {"id1", "error"}}},
 	}

 	for _, tt := range tests {
@@ -131,19 +132,10 @@ func testCrossBlockReader(t *testing.T, blockSeriesIds [][]string) {
 	require.NoError(t, err)
 	defer cbReader.Close()

-	hadError := false
 	actualCount := 0
 	previousId := ""
-	for {
-		id, tags, datas, checksums, err := cbReader.Read()
-		if err == io.EOF {
-			break
-		}
-		if err != nil && err.Error() == expectedError.Error() {
-			hadError = true
-			break
-		}
-		require.NoError(t, err)
+	for cbReader.Next() {
+		id, tags, records := cbReader.Current()

 		strId := id.String()
 		id.Finalize()
@@ -152,25 +144,23 @@ func testCrossBlockReader(t *testing.T, blockSeriesIds [][]string) {
 		assert.NotNil(t, tags)
 		tags.Close()

-		assert.Equal(t, len(datas), len(checksums))
-
 		var previousBlockIndex uint32
-		for _, blockIndex := range checksums { // see the comment above
+		for _, record := range records {
+			blockIndex := record.Checksum // see the comment above
 			assert.True(t, blockIndex >= previousBlockIndex, "same id blocks must be read in temporal order")
 			previousBlockIndex = blockIndex
-		}
-
-		for _, data := range datas {
-			assert.NotNil(t, data)
-			data.DecRef()
-			data.Finalize()
+			assert.NotNil(t, record.Data)
+			record.Data.DecRef()
+			record.Data.Finalize()
 		}

 		previousId = strId
-		actualCount += len(datas)
+		actualCount += len(records)
 	}

-	if !hadError {
+	err = cbReader.Err()
+	if err == nil || err.Error() != expectedError.Error() {
+		require.NoError(t, cbReader.Err())
 		assert.Equal(t, expectedCount, actualCount, "count of series read")
 	}
 }
16 changes: 13 additions & 3 deletions src/dbnode/persist/fs/types.go
@@ -590,15 +590,25 @@ type Segments interface {
 	BlockStart() time.Time
 }

+// BlockRecord wraps together M3TSZ data bytes with their checksum.
+type BlockRecord struct {
+	Data     checked.Bytes
+	Checksum uint32
+}
+
 // CrossBlockReader allows reading data (encoded bytes) from multiple DataFileSetReaders of the same shard,
 // ordered by series id first, and block start time next.
 type CrossBlockReader interface {
 	io.Closer

-	// Read returns the next distinct id and tags, plus slices with data and checksums from all blocks corresponding to
-	// the id returned. Returns io.EOF after all DataFileSetReaders exhausted.
-	Read() (id ident.ID, tags ident.TagIterator, datas []checked.Bytes, checksums []uint32, err error)
+	Next() bool
+
+	Err() error
+
+	// Current returns distinct series id and tags, plus a slice with data and checksums from all blocks corresponding
+	// to that series (in temporal order).
+	// Note: make sure to finalize the ID, close the Tags and finalize the Data when done with
+	// them so they can be returned to their respective pools.
+	Current() (ident.ID, ident.TagIterator, []BlockRecord)
 }
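With this remodel, consumption follows Go's iterator idiom. A hedged usage sketch; the construction of dataFileSetReaders and the process function are assumed placeholders rather than part of this PR:

// Sketch: iterate series across all blocks of a shard, honoring the
// resource-ownership contract documented on Current.
cbReader, err := fs.NewCrossBlockReader(dataFileSetReaders) // readers assumed opened with OrderedByIndex
if err != nil {
	return err
}
defer cbReader.Close()

for cbReader.Next() {
	id, tags, records := cbReader.Current()
	for _, record := range records {
		process(record.Data, record.Checksum) // process is a hypothetical consumer
		record.Data.DecRef()
		record.Data.Finalize()
	}
	tags.Close()
	id.Finalize()
}
// Err reports any error that terminated iteration early.
return cbReader.Err()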