Skip to content

Commit

Permalink
Browse files Browse the repository at this point in the history
78251: backupccl: SHOW BACKUP FILES IN (on collection) returns the full SST path r=dt a=msbutler

 backupccl: SHOW BACKUP FILES IN (on collection) returns the full SST path
    
Previously, SHOW BACKUP FILES on a backup collection would return the SST
file path relative to the manifest directory. Given that the incremental backup
and full backup manifests are stored in different directories, the file paths
that SHOW BACKUP FILES returns should reflect that.

This patch changes the path `SHOW BACKUP FILES IN` returns to the backup
path relative to the collection root. As an example:

Previously, the command `SHOW BACKUP FILES LATEST IN s3://mybackups` would
return:
```
data/001.SST // from a full backup
data/002.SST  // from an incremental backup
```
Now, the command will return (assuming the full and incremental backups live in the same subdir):
```
/2020/12/25-060000.00/data/001.SST
/2020/12/25-060000.00/20201225/070000.00/data/002.SST
```
Note: when a user passes the incremental_location parameter, the output
will be slightly misleading because the incrementals will have a different
collection root. To reduce this confusion, I added a backup_type column
equal to 'incremental' or 'full'.

I plan to test this change in the PR for cockroachdb#77694

Release note: None

Co-authored-by: Michael Butler <[email protected]>
  • Loading branch information
craig[bot] and msbutler committed Mar 24, 2022
2 parents 8b36717 + 72c970d commit d51cd4f
Showing 1 changed file with 82 additions and 25 deletions.
107 changes: 82 additions & 25 deletions pkg/ccl/backupccl/show.go
Original file line number Diff line number Diff line change
Expand Up @@ -11,6 +11,7 @@ package backupccl
import (
"context"
"net/url"
"path"
"strings"
"time"

Expand Down Expand Up @@ -73,6 +74,7 @@ type backupInfoReader interface {
cloud.ExternalStorage,
*jobspb.BackupEncryptionOptions,
[]string,
[]string,
chan<- tree.Datums,
) error
header() colinfo.ResultColumns
Expand All @@ -91,13 +93,17 @@ func (m manifestInfoReader) header() colinfo.ResultColumns {
// showBackup reads backup info from the manifest, populates the manifestInfoReader,
// calls the backupShower to process the manifest info into datums,
// and pipes the information to the user's sql console via the results channel.

// TODO(msbutler): during the old backup syntax purge, remove store, incStore, incPaths,
// and pass only `stores []cloud.ExternalStorage` object in signature
func (m manifestInfoReader) showBackup(
ctx context.Context,
mem *mon.BoundAccount,
store cloud.ExternalStorage,
incStore cloud.ExternalStorage,
enc *jobspb.BackupEncryptionOptions,
incPaths []string,
manifestDirs []string,
resultsCh chan<- tree.Datums,
) error {
var memSize int64
Expand Down Expand Up @@ -148,7 +154,7 @@ func (m manifestInfoReader) showBackup(
return err
}

datums, err := m.shower.fn(manifests)
datums, err := m.shower.fn(manifests, manifestDirs)
if err != nil {
return err
}
Expand Down Expand Up @@ -182,6 +188,7 @@ func (m metadataSSTInfoReader) showBackup(
incStore cloud.ExternalStorage,
enc *jobspb.BackupEncryptionOptions,
incPaths []string,
manifestDirs []string,
resultsCh chan<- tree.Datums,
) error {
filename := metadataSSTName
Expand Down Expand Up @@ -269,13 +276,13 @@ func showBackupPlanHook(
case tree.BackupRangeDetails:
shower = backupShowerRanges
case tree.BackupFileDetails:
shower = backupShowerFiles
shower = backupShowerFileSetup(backup.InCollection)
case tree.BackupManifestAsJSON:
shower = jsonShower
default:
shower = backupShowerDefault(ctx, p, backup.ShouldIncludeSchemas, opts)
}
infoReader = manifestInfoReader{shower}
infoReader = manifestInfoReader{shower: shower}
}

fn := func(ctx context.Context, _ []sql.PlanNode, resultsCh chan<- tree.Datums) error {
Expand Down Expand Up @@ -395,6 +402,7 @@ you must pass the 'encryption_info_dir' parameter that points to the directory o
computedSubdir,
)
var incPaths []string
var manifestDirs []string
var incStore cloud.ExternalStorage
if err != nil {
if errors.Is(err, cloud.ErrListingUnsupported) {
Expand All @@ -419,23 +427,57 @@ you must pass the 'encryption_info_dir' parameter that points to the directory o
if err != nil {
return errors.Wrapf(err, "make incremental storage")
}
manifestDirs = getManifestDirs(computedSubdir, incLocations[0], incPaths, explicitIncPaths)
}
mem := p.ExecCfg().RootMemoryMonitor.MakeBoundAccount()
defer mem.Close(ctx)

return infoReader.showBackup(ctx, &mem, store, incStore, encryption, incPaths, resultsCh)
return infoReader.showBackup(ctx, &mem, store, incStore, encryption, incPaths,
manifestDirs, resultsCh)
}

return fn, infoReader.header(), nil, false, nil
}

// getManifestDirs returns one directory per backup manifest in the chain, each
// expressed relative to the collection root: element 0 belongs to the full
// backup and element i+1 belongs to incPaths[i]. Joining the destination with
// manifestDirs[i] (path.Join(dest, manifestDirs[i])) gives the resolved
// manifest path. When the user supplied incremental_location, the incremental
// entries resolve against that location instead, i.e.
// path.Join(explicitIncPath, manifestDirs[i]).
func getManifestDirs(
	fullSubdir string, incLocation string, incPaths []string, explicitIncPaths []string,
) []string {
	// Incrementals may sit in the full backup's own subdirectory, in the default
	// incrementals directory, or in a user-chosen incremental_location. Strip
	// the first occurrence of fullSubdir from incLocation and inspect the final
	// "/"-separated segment of what is left: the default incrementals prefix
	// applies only when that segment is DefaultIncrementalsSubdir and no
	// explicit incremental paths were passed.
	incRoot := strings.Replace(incLocation, fullSubdir, "", 1)
	lastSegment := incRoot[strings.LastIndex(incRoot, "/")+1:]
	incPrefix := ""
	if len(explicitIncPaths) == 0 && lastSegment == DefaultIncrementalsSubdir {
		incPrefix = "/" + DefaultIncrementalsSubdir
	}

	dirs := make([]string, 0, len(incPaths)+1)

	// The full backup's manifest always lives directly in fullSubdir.
	dirs = append(dirs, fullSubdir)

	for _, manifestPath := range incPaths {
		// Remove the manifest file name so only the containing directory remains.
		incDir := strings.Replace(manifestPath, backupManifestName, "", 1)
		dirs = append(dirs, path.Join(incPrefix, fullSubdir, incDir))
	}
	return dirs
}

type backupShower struct {
// header defines the columns of the table printed as output of the show command.
header colinfo.ResultColumns

// fn is the specific implementation of the shower that can either be a default, ranges, files,
// or JSON shower.
fn func([]BackupManifest) ([]tree.Datums, error)
fn func(manifests []BackupManifest, manifestDirs []string) ([]tree.Datums, error)
}

// backupShowerHeaders defines the schema for the table presented to the user.
Expand Down Expand Up @@ -481,7 +523,7 @@ func backupShowerDefault(
) backupShower {
return backupShower{
header: backupShowerHeaders(showSchemas, opts),
fn: func(manifests []BackupManifest) ([]tree.Datums, error) {
fn: func(manifests []BackupManifest, manifestDirs []string) ([]tree.Datums, error) {
var rows []tree.Datums
for _, manifest := range manifests {
// Map database ID to descriptor name.
Expand Down Expand Up @@ -733,7 +775,7 @@ var backupShowerRanges = backupShower{
{Name: "end_key", Typ: types.Bytes},
},

fn: func(manifests []BackupManifest) (rows []tree.Datums, err error) {
fn: func(manifests []BackupManifest, manifestDirs []string) (rows []tree.Datums, err error) {
for _, manifest := range manifests {
for _, span := range manifest.Spans {
rows = append(rows, tree.Datums{
Expand All @@ -748,9 +790,10 @@ var backupShowerRanges = backupShower{
},
}

var backupShowerFiles = backupShower{
header: colinfo.ResultColumns{
func backupShowerFileSetup(inCol tree.Expr) backupShower {
return backupShower{header: colinfo.ResultColumns{
{Name: "path", Typ: types.String},
{Name: "backup_type", Typ: types.String},
{Name: "start_pretty", Typ: types.String},
{Name: "end_pretty", Typ: types.String},
{Name: "start_key", Typ: types.Bytes},
Expand All @@ -759,30 +802,44 @@ var backupShowerFiles = backupShower{
{Name: "rows", Typ: types.Int},
},

fn: func(manifests []BackupManifest) (rows []tree.Datums, err error) {
for _, manifest := range manifests {
for _, file := range manifest.Files {
rows = append(rows, tree.Datums{
tree.NewDString(file.Path),
tree.NewDString(file.Span.Key.String()),
tree.NewDString(file.Span.EndKey.String()),
tree.NewDBytes(tree.DBytes(file.Span.Key)),
tree.NewDBytes(tree.DBytes(file.Span.EndKey)),
tree.NewDInt(tree.DInt(file.EntryCounts.DataSize)),
tree.NewDInt(tree.DInt(file.EntryCounts.Rows)),
})
fn: func(manifests []BackupManifest, manifestDirs []string) (rows []tree.Datums, err error) {
if (inCol != nil) && len(manifestDirs) == 0 {
return nil, errors.AssertionFailedf(
"manifestDirs empty even though backup is in collection")
}
}
return rows, nil
},
for i, manifest := range manifests {
backupType := "full"
if manifest.isIncremental() {
backupType = "incremental"
}
for _, file := range manifest.Files {
filePath := file.Path
if inCol != nil {
filePath = path.Join(manifestDirs[i], filePath)
}
rows = append(rows, tree.Datums{
tree.NewDString(filePath),
tree.NewDString(backupType),
tree.NewDString(file.Span.Key.String()),
tree.NewDString(file.Span.EndKey.String()),
tree.NewDBytes(tree.DBytes(file.Span.Key)),
tree.NewDBytes(tree.DBytes(file.Span.EndKey)),
tree.NewDInt(tree.DInt(file.EntryCounts.DataSize)),
tree.NewDInt(tree.DInt(file.EntryCounts.Rows)),
})
}
}
return rows, nil
},
}
}

var jsonShower = backupShower{
header: colinfo.ResultColumns{
{Name: "manifest", Typ: types.Jsonb},
},

fn: func(manifests []BackupManifest) ([]tree.Datums, error) {
fn: func(manifests []BackupManifest, manifestDirs []string) ([]tree.Datums, error) {
rows := make([]tree.Datums, len(manifests))
for i, manifest := range manifests {
j, err := protoreflect.MessageToJSON(
Expand Down

0 comments on commit d51cd4f

Please sign in to comment.