Skip to content

Commit

Permalink
cli/demo: prevent a call to os.Exit in the license goroutine
Browse files Browse the repository at this point in the history
Prior to this patch, the async goroutine responsible for license
acquisition was also taking over the responsibility to call os.Exit.

This was sad because it meant that in case license acquisition failed,
the temporary files created for the demo cluster were not cleaned up.

This patch repairs that by bringing error handling back into the main
goroutine.

(It's still possible for demo to leave stray files behind - see
cockroachdb#46988 - and that will
need a separate patch.)

Release note (bug fix): `cockroach demo` now properly cleans up its
temporary files if the background license acquisition fails.
  • Loading branch information
knz committed Apr 3, 2020
1 parent c19b385 commit 121ac01
Show file tree
Hide file tree
Showing 3 changed files with 39 additions and 21 deletions.
4 changes: 1 addition & 3 deletions pkg/cli/cli.go
Original file line number Diff line number Diff line change
Expand Up @@ -65,10 +65,7 @@ func Main() {
defer log.RecoverAndReportPanic(context.Background(), &serverCfg.Settings.SV)

err := Run(os.Args[1:])
exitWithError(cmdName, err)
}

func exitWithError(cmdName string, err error) {
errCode := 0
if err != nil {
// Display the error and its details/hints.
Expand All @@ -85,6 +82,7 @@ func exitWithError(cmdName string, err error) {
errCode = cliErr.exitCode
}
}

os.Exit(errCode)
}

Expand Down
53 changes: 37 additions & 16 deletions pkg/cli/demo.go
Original file line number Diff line number Diff line change
Expand Up @@ -623,7 +623,7 @@ func setupTransientCluster(
}

func (c *transientCluster) setupWorkload(
ctx context.Context, gen workload.Generator, licenseDone chan struct{},
ctx context.Context, gen workload.Generator, licenseDone <-chan error,
) error {
// If there is a load generator, create its database and load its
// fixture.
Expand Down Expand Up @@ -652,7 +652,9 @@ func (c *transientCluster) setupWorkload(
if cliCtx.isInteractive {
fmt.Println("#\n# Waiting for license acquisition to complete...")
}
<-licenseDone
if err := waitForLicense(licenseDone); err != nil {
return err
}
if cliCtx.isInteractive {
fmt.Println("#\n# Partitioning the demo database, please wait...")
}
Expand Down Expand Up @@ -822,8 +824,9 @@ func checkDemoConfiguration(
demoCtx.disableTelemetry || (GetAndApplyLicense == nil) || demoCtx.disableLicenseAcquisition

if demoCtx.geoPartitionedReplicas {
geoFlag := "--" + cliflags.DemoGeoPartitionedReplicas.Name
if demoCtx.disableLicenseAcquisition {
return nil, errors.New("enterprise features are needed for this demo (--geo-partitioned-replicas)")
return nil, errors.Newf("enterprise features are needed for this demo (%s)", geoFlag)
}

// Make sure that the user didn't request to have a topology and an empty database.
Expand All @@ -833,18 +836,18 @@ func checkDemoConfiguration(

// Make sure that the Movr database is selected when automatically partitioning.
if gen == nil || gen.Meta().Name != "movr" {
return nil, errors.New("--geo-partitioned-replicas must be used with the Movr dataset")
return nil, errors.Newf("%s must be used with the Movr dataset", geoFlag)
}

// If the geo-partitioned replicas flag was given and the demo localities have changed, throw an error.
if demoCtx.localities != nil {
return nil, errors.New("--demo-locality cannot be used with --geo-partitioned-replicas")
return nil, errors.Newf("--demo-locality cannot be used with %s", geoFlag)
}

// If the geo-partitioned replicas flag was given and the nodes have changed, throw an error.
if flagSetForCmd(cmd).Lookup(cliflags.DemoNodes.Name).Changed {
if demoCtx.nodes != 9 {
return nil, errors.New("--nodes with a value different from 9 cannot be used with --geo-partitioned-replicas")
return nil, errors.Newf("--nodes with a value different from 9 cannot be used with %s", geoFlag)
}
} else {
const msg = `#
Expand Down Expand Up @@ -872,10 +875,10 @@ func checkDemoConfiguration(
// temporary demo license from the Cockroach Labs website. It returns
// a channel that can be waited on if it is needed to wait on the
// license acquisition.
func (c *transientCluster) acquireDemoLicense(ctx context.Context) (chan struct{}, error) {
func (c *transientCluster) acquireDemoLicense(ctx context.Context) (chan error, error) {
// Communicate information about license acquisition to services
// that depend on it.
licenseDone := make(chan struct{})
licenseDone := make(chan error)
if demoCtx.disableLicenseAcquisition {
// If we are not supposed to acquire a license, close the channel
// immediately so that future waiters don't hang.
Expand All @@ -892,17 +895,17 @@ func (c *transientCluster) acquireDemoLicense(ctx context.Context) (chan struct{

success, err := GetAndApplyLicense(db, c.s.ClusterID(), demoOrg)
if err != nil {
exitWithError("demo", err)
licenseDone <- err
return
}
if !success {
if demoCtx.geoPartitionedReplicas {
log.Shout(ctx, log.Severity_ERROR,
"license acquisition was unsuccessful.\nNote: enterprise features are needed for --geo-partitioned-replicas.")
exitWithError("demo", errors.New("unable to acquire a license for this demo"))
licenseDone <- errors.WithDetailf(
errors.New("unable to acquire a license for this demo"),
"Enterprise features are needed for this demo (--%s).",
cliflags.DemoGeoPartitionedReplicas.Name)
return
}

const msg = "\nwarning: unable to acquire demo license - enterprise features are not enabled."
fmt.Fprintln(stderr, msg)
}
close(licenseDone)
}()
Expand Down Expand Up @@ -989,11 +992,24 @@ func runDemo(cmd *cobra.Command, gen workload.Generator) (err error) {
defaultRootPassword,
)
}
// If we didn't launch a workload, we still need to inform the
// user if the license check fails. Do this asynchronously and print
// the final error if any.
//
// It's ok to do this twice (if workload setup already waited) because
// then the error return is guaranteed to be nil.
go func() {
if err := waitForLicense(licenseDone); err != nil {
_ = checkAndMaybeShout(err)
}
}()
} else {
// If we are not running an interactive shell, we need to wait to ensure
// that license acquisition is successful. If license acquisition is
// disabled, then a read on this channel will return immediately.
<-licenseDone
if err := waitForLicense(licenseDone); err != nil {
return checkAndMaybeShout(err)
}
}

conn := makeSQLConn(c.connURL)
Expand All @@ -1002,6 +1018,11 @@ func runDemo(cmd *cobra.Command, gen workload.Generator) (err error) {
return runClient(cmd, conn)
}

func waitForLicense(licenseDone <-chan error) error {
err := <-licenseDone
return err
}

// sockForServer generates the metadata for a unix socket for the given node.
// For example, node 1 gets socket /tmpdemodir/.s.PGSQL.26267,
// node 2 gets socket /tmpdemodir/.s.PGSQL.26268, etc.
Expand Down
3 changes: 1 addition & 2 deletions pkg/cli/interactive_tests/test_demo_partitioning.tcl
Original file line number Diff line number Diff line change
Expand Up @@ -100,8 +100,7 @@ start_test "Expect an error if geo-partitioning is requested and a license canno
set env(COCKROACH_DEMO_LICENSE_URL) "https://127.0.0.1:9999/"
spawn $argv demo --geo-partitioned-replicas
eexpect "error while contacting licensing server"
eexpect "dial tcp"
eexpect "ERROR: license acquisition was unsuccessful"
eexpect "Enterprise features are needed for this demo"
eexpect eof
end_test

Expand Down

0 comments on commit 121ac01

Please sign in to comment.