-
Notifications
You must be signed in to change notification settings - Fork 502
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
exp/lighthorizon: Add a set of tools to aide in index inspection. (#4561
- Loading branch information
Showing
5 changed files
with
328 additions
and
6 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,259 @@ | ||
package main | ||
|
||
import ( | ||
"context" | ||
"io" | ||
"os" | ||
"os/signal" | ||
"strings" | ||
"syscall" | ||
"time" | ||
|
||
"github.com/spf13/cobra" | ||
|
||
"github.com/stellar/go/exp/lighthorizon/index" | ||
"github.com/stellar/go/historyarchive" | ||
"github.com/stellar/go/strkey" | ||
"github.com/stellar/go/support/collections/maps" | ||
"github.com/stellar/go/support/collections/set" | ||
"github.com/stellar/go/support/log" | ||
"github.com/stellar/go/support/ordered" | ||
) | ||
|
||
var ( | ||
checkpointMgr = historyarchive.NewCheckpointManager(0) | ||
) | ||
|
||
func addIndexCommands(parent *cobra.Command) *cobra.Command { | ||
cmd := &cobra.Command{ | ||
Use: "index", | ||
Long: "Lets you view details about an index source.", | ||
Example: ` | ||
index view file:///tmp/indices | ||
index view file:///tmp/indices GAGJZWQ5QT34VK3U6W6YKRYFIK6YSAXQC6BHIIYLG6X3CE5QW2KAYNJR | ||
index stats file:///tmp/indices`, | ||
RunE: func(cmd *cobra.Command, args []string) error { | ||
// require a subcommand - this is just a "category" | ||
return cmd.Help() | ||
}, | ||
} | ||
|
||
stats := &cobra.Command{ | ||
Use: "stats <index path>", | ||
Long: "Summarize the statistics (like the # of active checkpoints " + | ||
"or accounts). Note that this is a very read-heavy operation and " + | ||
"will incur download bandwidth costs if reading from remote, " + | ||
"billable sources.", | ||
Example: `stats s3://indices`, | ||
RunE: func(cmd *cobra.Command, args []string) error { | ||
if len(args) != 1 { | ||
return cmd.Usage() | ||
} | ||
|
||
path := args[0] | ||
start := time.Now() | ||
log.Infof("Analyzing indices at %s", path) | ||
|
||
allCheckpoints := set.Set[uint32]{} | ||
allIndexNames := set.Set[string]{} | ||
accounts := showAccounts(path, 0) | ||
log.Infof("Analyzing indices for %d accounts.", len(accounts)) | ||
|
||
// We want to summarize as much as possible on a Ctrl+C event, so | ||
// this handles that by setting up a context that gets cancelled on | ||
// SIGINT. A second Ctrl+C will kill the process as usual. | ||
// | ||
// https://millhouse.dev/posts/graceful-shutdowns-in-golang-with-signal-notify-context | ||
ctx, stop := signal.NotifyContext(context.Background(), os.Interrupt, syscall.SIGTERM, syscall.SIGINT) | ||
defer stop() | ||
go func() { | ||
<-ctx.Done() | ||
stop() | ||
log.WithField("error", ctx.Err()). | ||
Warn("Received interrupt, shutting down gracefully & summarizing findings...") | ||
log.Warn("Press Ctrl+C again to abort.") | ||
}() | ||
|
||
mostActiveAccountChk := 0 | ||
mostActiveAccount := "" | ||
for _, account := range accounts { | ||
if ctx.Err() != nil { | ||
break | ||
} | ||
|
||
activity := getIndex(path, account, "", 0) | ||
allCheckpoints.AddSlice(maps.Keys(activity)) | ||
for _, names := range activity { | ||
allIndexNames.AddSlice(names) | ||
} | ||
|
||
if len(activity) > mostActiveAccountChk { | ||
mostActiveAccount = account | ||
mostActiveAccountChk = len(activity) | ||
} | ||
} | ||
|
||
ledgerCount := len(allCheckpoints) * int(checkpointMgr.GetCheckpointFrequency()) | ||
|
||
log.Info("Done analyzing indices, summarizing...") | ||
log.Infof("") | ||
log.Infof("=== Final Summary ===") | ||
log.Infof("Analysis took %s.", time.Since(start)) | ||
log.Infof("Path: %s", path) | ||
log.Infof("Accounts: %d", len(accounts)) | ||
log.Infof("Smallest checkpoint: %d", ordered.MinSlice(allCheckpoints.Slice())) | ||
log.Infof("Largest checkpoint: %d", ordered.MaxSlice(allCheckpoints.Slice())) | ||
log.Infof("Checkpoint count: %d (%d possible ledgers, ~%0.2f days)", | ||
len(allCheckpoints), ledgerCount, | ||
float64(ledgerCount)/(float64(60*60*24)/6.0) /* approx. ledgers per day */) | ||
log.Infof("Index names: %s", strings.Join(allIndexNames.Slice(), ", ")) | ||
log.Infof("Most active account: %s (%d checkpoints)", | ||
mostActiveAccount, mostActiveAccountChk) | ||
|
||
return nil | ||
}, | ||
} | ||
|
||
view := &cobra.Command{ | ||
Use: "view <index path> [accounts?]", | ||
Long: "View the accounts in an index source or view the " + | ||
"checkpoints specific account(s) are active in.", | ||
Example: `view s3://indices | ||
view s3:///indices GAXLQGKIUAIIUHAX4GJO3J7HFGLBCNF6ZCZSTLJE7EKO5IUHGLQLMXZO | ||
view file:///tmp/indices --limit=0 GAXLQGKIUAIIUHAX4GJO3J7HFGLBCNF6ZCZSTLJE7EKO5IUHGLQLMXZO | ||
view gcs://indices --limit=10 GAXLQGKIUAIIUHAX4GJO3J7HFGLBCNF6ZCZSTLJE7EKO5IUHGLQLMXZO,GBUUWQDVEEXBJCUF5UL24YGXKJIP5EMM7KFWIAR33KQRJR34GN6HEDPV,GBYETUYNBK2ZO5MSYBJKSLDEA2ZHIXLCFL3MMWU6RHFVAUBKEWQORYKS`, | ||
RunE: func(cmd *cobra.Command, args []string) error { | ||
if len(args) > 2 { | ||
return cmd.Usage() | ||
} | ||
|
||
path := args[0] | ||
log.Infof("Analyzing indices at %s", path) | ||
|
||
accounts := []string{} | ||
if len(args) == 2 { | ||
accounts = strings.Split(args[1], ",") | ||
} | ||
|
||
limit, err := cmd.Flags().GetUint("limit") | ||
if err != nil { | ||
return cmd.Usage() | ||
} | ||
|
||
if len(accounts) > 0 { | ||
indexName, err := cmd.Flags().GetString("index-name") | ||
if err != nil { | ||
return cmd.Usage() | ||
} | ||
|
||
for _, account := range accounts { | ||
if !strkey.IsValidEd25519PublicKey(account) && | ||
!strkey.IsValidMuxedAccountEd25519PublicKey(account) { | ||
log.Errorf("Invalid account ID: '%s'", account) | ||
continue | ||
} | ||
|
||
getIndex(path, account, indexName, limit) | ||
} | ||
} else { | ||
showAccounts(path, limit) | ||
} | ||
|
||
return nil | ||
}, | ||
} | ||
|
||
view.Flags().Uint("limit", 10, "a maximum number of accounts or checkpoints to show") | ||
view.Flags().String("index-name", "", "filter for a particular index") | ||
cmd.AddCommand(stats, view) | ||
|
||
if parent == nil { | ||
return cmd | ||
} | ||
parent.AddCommand(cmd) | ||
return parent | ||
} | ||
|
||
func getIndex(path, account, indexName string, limit uint) map[uint32][]string { | ||
freq := checkpointMgr.GetCheckpointFrequency() | ||
|
||
store, err := index.Connect(path) | ||
if err != nil { | ||
log.Fatal(err) | ||
} | ||
|
||
indices, err := store.Read(account) | ||
if err != nil { | ||
log.Fatal(err) | ||
} | ||
|
||
// It's better to summarize activity and then group it by index rather than | ||
// just show activity in each index, because there's likely a ton of overlap | ||
// across indices. | ||
activity := map[uint32][]string{} | ||
indexNames := []string{} | ||
|
||
for name, idx := range indices { | ||
log.Infof("Index found: '%s'", name) | ||
if indexName != "" && name != indexName { | ||
continue | ||
} | ||
|
||
indexNames = append(indexNames, name) | ||
|
||
checkpoint, err := idx.NextActiveBit(0) | ||
for err != io.EOF { | ||
activity[checkpoint] = append(activity[checkpoint], name) | ||
checkpoint, err = idx.NextActiveBit(checkpoint + 1) | ||
|
||
if limit > 0 && limit <= uint(len(activity)) { | ||
break | ||
} | ||
} | ||
} | ||
|
||
log.WithField("account", account).WithField("limit", limit). | ||
Infof("Activity for account:") | ||
|
||
for checkpoint, names := range activity { | ||
first := (checkpoint - 1) * freq | ||
last := first + freq | ||
|
||
nameStr := strings.Join(names, ", ") | ||
log.WithField("indices", nameStr). | ||
Infof(" - checkpoint %d, ledgers [%d, %d)", checkpoint, first, last) | ||
} | ||
|
||
log.Infof("Summary: %d active checkpoints, %d possible active ledgers", | ||
len(activity), len(activity)*int(freq)) | ||
log.Infof("Checkpoint range: [%d, %d]", | ||
ordered.MinSlice(maps.Keys(activity)), | ||
ordered.MaxSlice(maps.Keys(activity))) | ||
log.Infof("All discovered indices: %s", strings.Join(indexNames, ", ")) | ||
|
||
return activity | ||
} | ||
|
||
func showAccounts(path string, limit uint) []string { | ||
store, err := index.Connect(path) | ||
if err != nil { | ||
log.Fatalf("Failed to connect to index store at %s: %v", path, err) | ||
return nil | ||
} | ||
|
||
accounts, err := store.ReadAccounts() | ||
if err != nil { | ||
log.Fatalf("Failed read accounts from index store at %s: %v", path, err) | ||
return nil | ||
} | ||
|
||
if limit == 0 { | ||
limit = uint(len(accounts)) | ||
} | ||
|
||
for i := uint(0); i < limit; i++ { | ||
log.Info(accounts[i]) | ||
} | ||
|
||
return accounts | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,25 @@ | ||
package main | ||
|
||
import ( | ||
"github.com/spf13/cobra" | ||
|
||
"github.com/stellar/go/support/log" | ||
) | ||
|
||
func main() { | ||
log.SetLevel(log.InfoLevel) | ||
|
||
cmd := &cobra.Command{ | ||
Use: "tools", | ||
Long: "Please specify a subcommand to use this toolset.", | ||
Example: "", | ||
RunE: func(cmd *cobra.Command, args []string) error { | ||
// require a subcommand - this is just a "category" | ||
return cmd.Help() | ||
}, | ||
} | ||
|
||
cmd = addCacheCommands(cmd) | ||
cmd = addIndexCommands(cmd) | ||
cmd.Execute() | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters