Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Implement new pganalyze.explain_analyze() helper #655

Merged
merged 3 commits into from
Jan 6, 2025
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
9 changes: 9 additions & 0 deletions .github/workflows/ci.yml
Original file line number Diff line number Diff line change
Expand Up @@ -13,6 +13,15 @@ jobs:
build:
# Use new enough OS that has CGroupsv2 enabled (required by the integration tests)
runs-on: ubuntu-22.04
env:
TEST_DATABASE_URL: postgresql://postgres:postgres@localhost:5432/postgres?sslmode=disable
services:
postgres:
image: postgres:14
Copy link
Member Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Using 14 as a minimum here since the EXPLAIN ANALYZE tests rely on being able to turn off compute_query_id in the output (and that was added in 14).

env:
POSTGRES_PASSWORD: postgres
ports:
- 5432:5432

steps:

Expand Down
2 changes: 0 additions & 2 deletions input/postgres/establish_connection.go
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,6 @@ import (
"context"
"database/sql"
"fmt"
"time"

"github.com/aws/aws-sdk-go/service/rds/rdsutils"
"github.com/pganalyze/collector/config"
Expand Down Expand Up @@ -78,7 +77,6 @@ func connectToDb(ctx context.Context, config config.ServerConfig, logger *util.L
}

db.SetMaxOpenConns(1)
db.SetConnMaxLifetime(30 * time.Second)

err = db.PingContext(ctx)
if err != nil {
Expand Down
68 changes: 68 additions & 0 deletions input/postgres/explain_analyze.go
Original file line number Diff line number Diff line change
@@ -0,0 +1,68 @@
package postgres

import (
"context"
"database/sql"
"fmt"
"strings"

"github.com/guregu/null"
"github.com/lib/pq"
"github.com/pganalyze/collector/util"
)

// RunExplainAnalyzeForQueryRun validates query and then collects an EXPLAIN
// plan for it through runExplainAnalyze.
//
// The sequence is:
//  1. Reject the query if validateQuery does not permit it.
//  2. Run up to two warm-up passes with ANALYZE and TIMING OFF, discarding
//     their output. A second pass only happens when the first one failed
//     with an error whose text contains "statement timeout".
//  3. If both warm-up passes hit a statement timeout, return a plain
//     (non-ANALYZE) EXPLAIN instead.
//  4. Otherwise return the output of a final ANALYZE + BUFFERS run.
//
// Any warm-up error that is not a statement timeout is returned as-is with an
// empty result.
func RunExplainAnalyzeForQueryRun(ctx context.Context, db *sql.DB, query string, parameters []null.String, parameterTypes []string, marker string) (result string, err error) {
	if err = validateQuery(query); err != nil {
		return "", err
	}

	// explain runs the query through the helper with the given EXPLAIN flags.
	explain := func(flags []string) (string, error) {
		return runExplainAnalyze(ctx, db, query, parameters, parameterTypes, flags, marker)
	}

	// Warm-up passes skip timing collection (slightly faster). A pass that
	// times out is repeated once so the caches get warmed up all the way.
	const maxWarmupPasses = 2
	for pass := 1; ; pass++ {
		_, err = explain([]string{"ANALYZE", "TIMING OFF"})
		if err == nil {
			break
		}

		switch {
		case !strings.Contains(err.Error(), "statement timeout"):
			return "", err
		case pass == maxWarmupPasses:
			// Timed out again: capture a non-ANALYZE EXPLAIN instead.
			// The empty (non-nil) slice is intentional.
			return explain([]string{})
		}
	}

	// Caches are warm now; this run produces the result handed to the caller.
	return explain([]string{"ANALYZE", "BUFFERS"})
}

// runExplainAnalyze calls the pganalyze.explain_analyze() SQL function inside
// a read-only transaction and returns the single value it yields.
//
// marker is prepended both to the outer SELECT statement and to the query text
// passed as the first argument (presumably a comment tag identifying the
// statement; confirm with callers). parameters, parameterTypes and
// analyzeFlags are passed through as Postgres arrays. The transaction is
// always rolled back when the function returns.
func runExplainAnalyze(ctx context.Context, db *sql.DB, query string, parameters []null.String, parameterTypes []string, analyzeFlags []string, marker string) (explainOutput string, err error) {
	readOnly := &sql.TxOptions{ReadOnly: true}
	tx, beginErr := db.BeginTx(ctx, readOnly)
	if beginErr != nil {
		return "", beginErr
	}
	// Nothing is ever committed; the rollback just ends the transaction.
	defer tx.Rollback()

	helperCall := marker + "SELECT pganalyze.explain_analyze($1, $2, $3, $4)"
	row := tx.QueryRowContext(
		ctx,
		helperCall,
		marker+query,
		pq.Array(parameters),
		pq.Array(parameterTypes),
		pq.Array(analyzeFlags),
	)
	err = row.Scan(&explainOutput)

	return explainOutput, err
}

// validateQuery reports whether query may be passed to EXPLAIN. It returns nil
// when the query is permitted and a generic error otherwise.
//
// To be on the safe side, a query is rejected when util.IsUtilityStmt fails on
// it, when the result does not have exactly one entry (treated as a
// multi-statement input, which could lead to accidental execution), or when
// that single entry is flagged as a utility statement.
func validateQuery(query string) error {
	stmtIsUtility, parseErr := util.IsUtilityStmt(query)

	// Short-circuit order matters: the index is only read once the length
	// has been confirmed to be exactly one.
	permitted := parseErr == nil && len(stmtIsUtility) == 1 && !stmtIsUtility[0]
	if !permitted {
		return fmt.Errorf("query is not permitted to run (multi-statement or utility command?)")
	}

	// TODO: Consider adding additional checks here (e.g. blocking known bad function calls)

	return nil
}
Loading
Loading