diff --git a/docs/generated/http/full.md b/docs/generated/http/full.md index a36ba2c8ca1a..0f73ea23fea7 100644 --- a/docs/generated/http/full.md +++ b/docs/generated/http/full.md @@ -2140,6 +2140,7 @@ ActiveQuery represents a query in flight on some Session. | is_full_scan | [bool](#cockroach.server.serverpb.ListSessionsResponse-bool) | | True if the query contains a full table or index scan. Note that this field is only valid if the query is in the EXECUTING phase. | [reserved](#support-status) | | elapsed_time | [google.protobuf.Duration](#cockroach.server.serverpb.ListSessionsResponse-google.protobuf.Duration) | | Time elapsed since this query started execution. | [reserved](#support-status) | | plan_gist | [string](#cockroach.server.serverpb.ListSessionsResponse-string) | | The compressed plan that can be converted back into the statement's logical plan. Empty if the statement is in the PREPARING state. | [reserved](#support-status) | +| placeholders | [string](#cockroach.server.serverpb.ListSessionsResponse-string) | repeated | The placeholders if any. | [reserved](#support-status) | @@ -2283,6 +2284,7 @@ ActiveQuery represents a query in flight on some Session. | is_full_scan | [bool](#cockroach.server.serverpb.ListSessionsResponse-bool) | | True if the query contains a full table or index scan. Note that this field is only valid if the query is in the EXECUTING phase. | [reserved](#support-status) | | elapsed_time | [google.protobuf.Duration](#cockroach.server.serverpb.ListSessionsResponse-google.protobuf.Duration) | | Time elapsed since this query started execution. | [reserved](#support-status) | | plan_gist | [string](#cockroach.server.serverpb.ListSessionsResponse-string) | | The compressed plan that can be converted back into the statement's logical plan. Empty if the statement is in the PREPARING state. | [reserved](#support-status) | +| placeholders | [string](#cockroach.server.serverpb.ListSessionsResponse-string) | repeated | The placeholders if any. | [reserved](#support-status) | diff --git a/pkg/server/serverpb/status.proto b/pkg/server/serverpb/status.proto index 453f0cb201a5..de9ec82df7a8 100644 --- a/pkg/server/serverpb/status.proto +++ b/pkg/server/serverpb/status.proto @@ -916,6 +916,10 @@ message ActiveQuery { // The compressed plan that can be converted back into the statement's logical plan. // Empty if the statement is in the PREPARING state. string plan_gist = 12; + + // The placeholders if any. + repeated string placeholders = 13; + } // Request object for ListSessions and ListLocalSessions. diff --git a/pkg/sql/conn_executor.go b/pkg/sql/conn_executor.go index c7f6e526a782..85553cb1e44d 100644 --- a/pkg/sql/conn_executor.go +++ b/pkg/sql/conn_executor.go @@ -3177,12 +3177,16 @@ func (ex *connExecutor) serialize() serverpb.Session { if query.hidden { continue } - ast, err := query.getStatement() - if err != nil { - continue + sqlNoConstants := truncateSQL(formatStatementHideConstants(query.stmt.AST)) + nPlaceholders := 0 + if query.placeholders != nil { + nPlaceholders = len(query.placeholders.Values) + } + placeholders := make([]string, nPlaceholders) + for i := range placeholders { + placeholders[i] = tree.AsStringWithFlags(query.placeholders.Values[i], tree.FmtSimple) } - sqlNoConstants := truncateSQL(formatStatementHideConstants(ast)) - sql := truncateSQL(ast.String()) + sql := truncateSQL(query.stmt.SQL) progress := math.Float64frombits(atomic.LoadUint64(&query.progressAtomic)) queryStart := query.start.UTC() activeQueries = append(activeQueries, serverpb.ActiveQuery{ @@ -3192,7 +3196,8 @@ func (ex *connExecutor) serialize() serverpb.Session { ElapsedTime: timeNow.Sub(queryStart), Sql: sql, SqlNoConstants: sqlNoConstants, - SqlSummary: formatStatementSummary(ast), + SqlSummary: formatStatementSummary(query.stmt.AST), + Placeholders: placeholders, IsDistributed: query.isDistributed, Phase: (serverpb.ActiveQuery_Phase)(query.phase), Progress: float32(progress), diff --git a/pkg/sql/conn_executor_exec.go b/pkg/sql/conn_executor_exec.go index efd9fc98aae0..f6d904bfc02a 100644 --- a/pkg/sql/conn_executor_exec.go +++ b/pkg/sql/conn_executor_exec.go @@ -307,15 +307,9 @@ func (ex *connExecutor) execStmtInOpenState( var queryDoneAfterFunc chan struct{} var txnDoneAfterFunc chan struct{} - // Early-associate placeholder info with the eval context, - // so that we can fill in placeholder values in our call to addActiveQuery, below. - if !ex.planner.EvalContext().HasPlaceholders() { - ex.planner.EvalContext().Placeholders = pinfo - } - var cancelQuery context.CancelFunc ctx, cancelQuery = contextutil.WithCancel(ctx) - ex.addActiveQuery(ast, formatWithPlaceholders(ctx, ast, ex.planner.EvalContext()), queryID, cancelQuery) + ex.addActiveQuery(parserStmt, pinfo, queryID, cancelQuery) // Make sure that we always unregister the query. It also deals with // overwriting res.Error to a more user-friendly message in case of query @@ -547,7 +541,7 @@ func (ex *connExecutor) execStmtInOpenState( if perr, ok := retPayload.(payloadWithError); ok { execErr = perr.errorCause() } - filter(ctx, ex.sessionData(), ast.String(), execErr) + filter(ctx, ex.sessionData(), stmt.AST.String(), execErr) } // Do the auto-commit, if necessary. In the extended protocol, the @@ -2106,13 +2100,17 @@ func (ex *connExecutor) enableTracing(modes []string) error { // addActiveQuery adds a running query to the list of running queries. func (ex *connExecutor) addActiveQuery( - ast tree.Statement, rawStmt string, queryID clusterunique.ID, cancelQuery context.CancelFunc, + stmt parser.Statement, + placeholders *tree.PlaceholderInfo, + queryID clusterunique.ID, + cancelQuery context.CancelFunc, ) { - _, hidden := ast.(tree.HiddenFromShowQueries) + _, hidden := stmt.AST.(tree.HiddenFromShowQueries) qm := &queryMeta{ txnID: ex.state.mu.txn.ID(), start: ex.phaseTimes.GetSessionPhaseTime(sessionphase.SessionQueryReceived), - rawStmt: rawStmt, + stmt: stmt, + placeholders: placeholders, phase: preparing, isDistributed: false, isFullScan: false, diff --git a/pkg/sql/crdb_internal.go b/pkg/sql/crdb_internal.go index 97f551c12846..0dfc53395a9c 100644 --- a/pkg/sql/crdb_internal.go +++ b/pkg/sql/crdb_internal.go @@ -53,6 +53,7 @@ import ( "github.com/cockroachdb/cockroach/pkg/sql/catalog/tabledesc" "github.com/cockroachdb/cockroach/pkg/sql/clusterunique" "github.com/cockroachdb/cockroach/pkg/sql/idxusage" + "github.com/cockroachdb/cockroach/pkg/sql/parser" "github.com/cockroachdb/cockroach/pkg/sql/pgwire/pgcode" "github.com/cockroachdb/cockroach/pkg/sql/pgwire/pgerror" "github.com/cockroachdb/cockroach/pkg/sql/privilege" @@ -1891,6 +1892,8 @@ func populateQueriesTable( planGistDatum = tree.NewDString(query.PlanGist) } + // Interpolate placeholders into the SQL statement. + sql := formatActiveQuery(query) if err := addRow( tree.NewDString(query.ID), txnID, @@ -1898,7 +1901,7 @@ func populateQueriesTable( sessionID, tree.NewDString(session.Username), ts, - tree.NewDString(query.Sql), + tree.NewDString(sql), tree.NewDString(session.ClientAddress), tree.NewDString(session.ApplicationName), isDistributedDatum, @@ -1938,6 +1941,33 @@ func populateQueriesTable( return nil } +// formatActiveQuery formats a serverpb.ActiveQuery by interpolating its +// placeholders within the string. +func formatActiveQuery(query serverpb.ActiveQuery) string { + parsed, parseErr := parser.ParseOne(query.Sql) + if parseErr != nil { + // If we failed to interpolate, rather than give up just send out the + // SQL without interpolated placeholders. Hallelujah! + return query.Sql + } + var sb strings.Builder + sql := tree.AsStringWithFlags(parsed.AST, tree.FmtSimple, + tree.FmtPlaceholderFormat(func(ctx *tree.FmtCtx, p *tree.Placeholder) { + if int(p.Idx) > len(query.Placeholders) { + ctx.Printf("$%d", p.Idx+1) + return + } + ctx.Printf(query.Placeholders[p.Idx]) + }), + ) + sb.WriteString(sql) + for i := range parsed.Comments { + sb.WriteString(" ") + sb.WriteString(parsed.Comments[i]) + } + return sb.String() +} + const sessionsSchemaPattern = ` CREATE TABLE crdb_internal.%s ( node_id INT NOT NULL, -- the node on which the query is running @@ -2008,7 +2038,8 @@ func populateSessionsTable( // The array is leftover from a time when we allowed multiple // queries to be executed at once in a session. activeQueryStart = query.Start - activeQueries.WriteString(query.Sql) + sql := formatActiveQuery(query) + activeQueries.WriteString(sql) } var err error diff --git a/pkg/sql/exec_util.go b/pkg/sql/exec_util.go index b6a5c42aad6b..7c805ff6bde4 100644 --- a/pkg/sql/exec_util.go +++ b/pkg/sql/exec_util.go @@ -1928,10 +1928,11 @@ type queryMeta struct { // The timestamp when this query began execution. start time.Time - // The string of the SQL statement being executed. This string may - // contain sensitive information, so it must be converted back into - // an AST and dumped before use in logging. - rawStmt string + // The SQL statement being executed. + stmt parser.Statement + + // The placeholders that the query was executed with if any. + placeholders *tree.PlaceholderInfo // States whether this query is distributed. Note that all queries, // including those that are distributed, have this field set to false until @@ -1970,16 +1971,6 @@ func (q *queryMeta) cancel() { q.cancelQuery() } -// getStatement returns a cleaned version of the query associated -// with this queryMeta. -func (q *queryMeta) getStatement() (tree.Statement, error) { - parsed, err := parser.ParseOne(q.rawStmt) - if err != nil { - return nil, err - } - return parsed.AST, nil -} - // SessionDefaults mirrors fields in Session, for restoring default // configuration values in SET ... TO DEFAULT (or RESET ...) statements. type SessionDefaults map[string]string diff --git a/pkg/sql/parser/parse.go b/pkg/sql/parser/parse.go index c38e99444fcb..16f48a6adc85 100644 --- a/pkg/sql/parser/parse.go +++ b/pkg/sql/parser/parse.go @@ -43,6 +43,9 @@ type Statement struct { // AST is the root of the AST tree for the parsed statement. AST tree.Statement + // Comments is the list of parsed SQL comments. + Comments []string + // SQL is the original SQL from which the statement was parsed. Note that this // is not appropriate for use in logging, as it may contain passwords and // other sensitive data. @@ -182,7 +185,6 @@ func (p *Parser) scanOneStmt() (sql string, tokens []sqlSymType, done bool) { return p.scanner.In()[startPos:], tokens, true } preValID = lval.id - posBeforeScan := p.scanner.Pos() tokens = append(tokens, sqlSymType{}) lval = &tokens[len(tokens)-1] p.scanner.Scan(lval) @@ -194,8 +196,13 @@ func (p *Parser) scanOneStmt() (sql string, tokens []sqlSymType, done bool) { curFuncBodyCnt-- } if lval.id == 0 || (curFuncBodyCnt == 0 && lval.id == ';') { + endPos := p.scanner.Pos() + if lval.id == ';' { + // Don't include the ending semicolon, if there is one, in the raw SQL. + endPos-- + } tokens = tokens[:len(tokens)-1] - return p.scanner.In()[startPos:posBeforeScan], tokens, (lval.id == 0) + return p.scanner.In()[startPos:endPos], tokens, (lval.id == 0) } lval.pos -= startPos } @@ -253,6 +260,7 @@ func (p *Parser) parse( return Statement{ AST: p.lexer.stmt, SQL: sql, + Comments: p.scanner.Comments, NumPlaceholders: p.lexer.numPlaceholders, NumAnnotations: p.lexer.numAnnotations, }, nil diff --git a/pkg/sql/parser/parse_internal_test.go b/pkg/sql/parser/parse_internal_test.go index e878bdf0673e..6a077e90f6d3 100644 --- a/pkg/sql/parser/parse_internal_test.go +++ b/pkg/sql/parser/parse_internal_test.go @@ -44,7 +44,7 @@ func TestScanOneStmt(t *testing.T) { { sql: `SELECT 1 /* comment */ ; /* comment */ ; /* comment */ `, exp: []stmt{{ - sql: `SELECT 1`, + sql: `SELECT 1 /* comment */ `, tok: []int{SELECT, ICONST}, }}, }, @@ -73,11 +73,11 @@ func TestScanOneStmt(t *testing.T) { sql: ` ; /* x */ SELECT 1 ; SET /* y */ ; ; INSERT INTO table; ;`, exp: []stmt{ { - sql: `SELECT 1`, + sql: `SELECT 1 `, tok: []int{SELECT, ICONST}, }, { - sql: `SET`, + sql: `SET /* y */ `, tok: []int{SET}, }, { diff --git a/pkg/sql/parser/parse_test.go b/pkg/sql/parser/parse_test.go index f9042c7dbeb3..bf4186553cc2 100644 --- a/pkg/sql/parser/parse_test.go +++ b/pkg/sql/parser/parse_test.go @@ -639,10 +639,12 @@ func TestParseSQL(t *testing.T) { {in: ``, exp: nil}, {in: `SELECT 1`, exp: []string{`SELECT 1`}}, {in: `SELECT 1;`, exp: []string{`SELECT 1`}}, - {in: `SELECT 1 /* comment */`, exp: []string{`SELECT 1`}}, + // We currently chop off beginning-of-line comments. + {in: `/* comment */ SELECT 1`, exp: []string{`SELECT 1`}}, + {in: `SELECT 1 /* comment */`, exp: []string{`SELECT 1 /* comment */`}}, {in: `SELECT 1;SELECT 2`, exp: []string{`SELECT 1`, `SELECT 2`}}, - {in: `SELECT 1 /* comment */ ;SELECT 2`, exp: []string{`SELECT 1`, `SELECT 2`}}, - {in: `SELECT 1 /* comment */ ; /* comment */ SELECT 2`, exp: []string{`SELECT 1`, `SELECT 2`}}, + {in: `SELECT 1 /* comment */ ;SELECT 2`, exp: []string{`SELECT 1 /* comment */ `, `SELECT 2`}}, + {in: `SELECT 1 /* comment */ ; SELECT 2`, exp: []string{`SELECT 1 /* comment */ `, `SELECT 2`}}, } var p parser.Parser // Verify that the same parser can be reused. for _, d := range testData { @@ -656,7 +658,7 @@ func TestParseSQL(t *testing.T) { res = append(res, stmts[i].SQL) } if !reflect.DeepEqual(res, d.exp) { - t.Errorf("expected \n%v\n, but found %v", res, d.exp) + t.Errorf("expected \n%v\n, but found %v", d.exp, res) } }) } diff --git a/pkg/sql/scanner/scan.go b/pkg/sql/scanner/scan.go index ff5d06a0ef67..87a27dd10c2c 100644 --- a/pkg/sql/scanner/scan.go +++ b/pkg/sql/scanner/scan.go @@ -57,6 +57,9 @@ type Scanner struct { in string pos int bytesPrealloc []byte + + // Comments is the list of parsed comments from the SQL statement. + Comments []string } // In returns the input string. @@ -453,6 +456,7 @@ func (s *Scanner) next() int { func (s *Scanner) skipWhitespace(lval ScanSymType, allowComments bool) (newline, ok bool) { newline = false for { + startPos := s.pos ch := s.peek() if ch == '\n' { s.pos++ @@ -467,6 +471,8 @@ func (s *Scanner) skipWhitespace(lval ScanSymType, allowComments bool) (newline, if present, cok := s.ScanComment(lval); !cok { return false, false } else if present { + // Mark down the comments that we found. + s.Comments = append(s.Comments, s.in[startPos:s.pos]) continue } } diff --git a/pkg/sql/show_test.go b/pkg/sql/show_test.go index b4115f7272dc..19dc44dd0821 100644 --- a/pkg/sql/show_test.go +++ b/pkg/sql/show_test.go @@ -726,6 +726,21 @@ func TestShowQueriesFillsInValuesForPlaceholders(t *testing.T) { []interface{}{"hello"}, "SELECT upper('hello')", }, + { + "SELECT /* test */ upper($1)", + []interface{}{"hello"}, + "SELECT upper('hello') /* test */", + }, + { + "SELECT /* test */ 'hi'::string", + []interface{}{}, + "SELECT 'hi'::STRING /* test */", + }, + { + "SELECT /* test */ 'hi'::string /* fnord */", + []interface{}{}, + "SELECT 'hi'::STRING /* test */ /* fnord */", + }, } // Perform both as a simple execution and as a prepared statement, @@ -761,7 +776,14 @@ func TestShowQueriesFillsInValuesForPlaceholders(t *testing.T) { t.Fatal(err) } - require.Equal(t, test.expected, recordedQueries[test.statement]) + // parse and stringify the statement so that it matches the key in the + // recordedQueries map. + stmt, err := parser.ParseOne(test.statement) + if err != nil { + t.Fatal(err) + } + sql := stmt.AST.String() + require.Equal(t, test.expected, recordedQueries[sql]) }) } }